Create README.md
Browse files
README.md
ADDED
@@ -0,0 +1,94 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
base_model: unsloth/Llama-3.3-70B-Instruct-bnb-4bit
|
3 |
+
tags:
|
4 |
+
- text-generation-inference
|
5 |
+
- transformers
|
6 |
+
- unsloth
|
7 |
+
- llama
|
8 |
+
- trl
|
9 |
+
- sft
|
10 |
+
license: apache-2.0
|
11 |
+
language:
|
12 |
+
- en
|
13 |
+
---
|
14 |
+
|
15 |
+
# Uploaded model
|
16 |
+
|
17 |
+
- **Developed by:** ykarout
|
18 |
+
- **License:** apache-2.0
|
19 |
+
- **Finetuned from model:** unsloth/Llama-3.3-70B-Instruct-bnb-4bit
|
20 |
+
|
21 |
+
This Llama model was trained 2x faster with [Unsloth](https://github.com/unslothai/unsloth) and Hugging Face's TRL library.
|
22 |
+
|
23 |
+
[<img src="https://raw.githubusercontent.com/unslothai/unsloth/main/images/unsloth%20made%20with%20love.png" width="200"/>](https://github.com/unslothai/unsloth)
|
24 |
+
|
25 |
+
|
26 |
+
To use this model with Ollama, create a Modelfile based on the template below:
|
27 |
+
|
28 |
+
FROM {__FILE_LOCATION__} (replace {__FILE_LOCATION__} with the path to your GGUF file)
|
29 |
+
|
30 |
+
TEMPLATE """{{ if .Messages }}
|
31 |
+
{{- if or .System .Tools }}<|start_header_id|>system<|end_header_id|>
|
32 |
+
{{- if .System }}
|
33 |
+
|
34 |
+
{{ .System }}
|
35 |
+
{{- end }}
|
36 |
+
{{- if .Tools }}
|
37 |
+
|
38 |
+
You are a helpful assistant with tool calling capabilities. When you receive a tool call response, use the output to format an answer to the original user question.
|
39 |
+
{{- end }}
|
40 |
+
{{- end }}<|eot_id|>
|
41 |
+
{{- range $i, $_ := .Messages }}
|
42 |
+
{{- $last := eq (len (slice $.Messages $i)) 1 }}
|
43 |
+
{{- if eq .Role "user" }}<|start_header_id|>user<|end_header_id|>
|
44 |
+
{{- if and $.Tools $last }}
|
45 |
+
|
46 |
+
Given the following functions, please respond with a JSON for a function call with its proper arguments that best answers the given prompt.
|
47 |
+
|
48 |
+
Respond in the format {"name": function name, "parameters": dictionary of argument name and its value}. Do not use variables.
|
49 |
+
|
50 |
+
{{ $.Tools }}
|
51 |
+
{{- end }}
|
52 |
+
|
53 |
+
{{ .Content }}<|eot_id|>{{ if $last }}<|start_header_id|>assistant<|end_header_id|>
|
54 |
+
|
55 |
+
{{ end }}
|
56 |
+
{{- else if eq .Role "assistant" }}<|start_header_id|>assistant<|end_header_id|>
|
57 |
+
{{- if .ToolCalls }}
|
58 |
+
|
59 |
+
{{- range .ToolCalls }}{"name": "{{ .Function.Name }}", "parameters": {{ .Function.Arguments }}}{{ end }}
|
60 |
+
{{- else }}
|
61 |
+
|
62 |
+
{{ .Content }}{{ if not $last }}<|eot_id|>{{ end }}
|
63 |
+
{{- end }}
|
64 |
+
{{- else if eq .Role "tool" }}<|start_header_id|>ipython<|end_header_id|>
|
65 |
+
|
66 |
+
{{ .Content }}<|eot_id|>{{ if $last }}<|start_header_id|>assistant<|end_header_id|>
|
67 |
+
|
68 |
+
{{ end }}
|
69 |
+
{{- end }}
|
70 |
+
{{- end }}
|
71 |
+
{{- else }}
|
72 |
+
{{- if .System }}<|start_header_id|>system<|end_header_id|>
|
73 |
+
|
74 |
+
{{ .System }}<|eot_id|>{{ end }}{{ if .Prompt }}<|start_header_id|>user<|end_header_id|>
|
75 |
+
|
76 |
+
{{ .Prompt }}<|eot_id|>{{ end }}<|start_header_id|>assistant<|end_header_id|>
|
77 |
+
|
78 |
+
{{ end }}{{ .Response }}{{ if .Response }}<|eot_id|>{{ end }}"""
|
79 |
+
|
80 |
+
PARAMETER stop "<|start_header_id|>"
|
81 |
+
PARAMETER stop "<|end_header_id|>"
|
82 |
+
PARAMETER stop "<|eot_id|>"
|
83 |
+
PARAMETER stop "<|eom_id|>"
|
84 |
+
|
85 |
+
PARAMETER temperature 1.5 # can be changed to experiment with different generations
|
86 |
+
|
87 |
+
PARAMETER min_p 0.1 # can be changed to experiment with different generations
|
88 |
+
|
89 |
+
PARAMETER repeat_penalty 1.15 # can be changed to experiment with different generations
|
90 |
+
|
91 |
+
PARAMETER top_p 0.9 # can be changed to experiment with different generations
|
92 |
+
|
93 |
+
PARAMETER top_k 45 # can be changed to experiment with different generations
|
94 |
+
|