Quantised-models
Collection
23 items
•
Updated
from transformers import AutoModelForCausalLM, AutoTokenizer
from auto_round import AutoRoundConfig ## must import for auto-round format
# Repository id of the quantized checkpoint used for both model and tokenizer.
quantized_model_path = "Siddharth63/Qwen3-4B-Base-4bit-Autoround-GPTQ-sym"

# Prompt that the model will continue.
text = "There is a girl who likes adventure,"

# Let the library choose device placement and dtype on its own.
load_options = {"device_map": "auto", "torch_dtype": "auto"}
model = AutoModelForCausalLM.from_pretrained(quantized_model_path, **load_options)
tokenizer = AutoTokenizer.from_pretrained(quantized_model_path)

# Encode the prompt, then move the encoded batch to the model's device.
encoded_prompt = tokenizer(text, return_tensors="pt")
inputs = encoded_prompt.to(model.device)

# Generate at most 50 new tokens and print the first returned sequence.
generated_ids = model.generate(**inputs, max_new_tokens=50)
print(tokenizer.decode(generated_ids[0]))