Update README.md
Browse files
README.md
CHANGED
@@ -156,6 +156,7 @@ from typing import Optional
|
|
156 |
from huggingface_hub import snapshot_download
|
157 |
from vllm import EngineArgs, LLMEngine, RequestOutput, SamplingParams
|
158 |
from vllm.lora.request import LoRARequest
|
|
|
159 |
|
160 |
SYS_MESSAGE = 'A conversation between User and Assistant. The user asks a question, and the Assistant solves it. The assistant first thinks about the reasoning process in the mind and then provides the user with the answer. The reasoning process and answer are enclosed within <think> </think> and <answer> </answer> tags, respectively, i.e., <think> reasoning process here </think> <answer> answer here </answer>.'
|
161 |
tokenizer = transformers.AutoTokenizer.from_pretrained("")
|
|
|
156 |
from huggingface_hub import snapshot_download
|
157 |
from vllm import EngineArgs, LLMEngine, RequestOutput, SamplingParams
|
158 |
from vllm.lora.request import LoRARequest
|
159 |
+
import transformers
|
160 |
|
161 |
SYS_MESSAGE = 'A conversation between User and Assistant. The user asks a question, and the Assistant solves it. The assistant first thinks about the reasoning process in the mind and then provides the user with the answer. The reasoning process and answer are enclosed within <think> </think> and <answer> </answer> tags, respectively, i.e., <think> reasoning process here </think> <answer> answer here </answer>.'
|
162 |
tokenizer = transformers.AutoTokenizer.from_pretrained("")
|