"""Smoke test for two locally stored models.

Loads a GGUF language model through ``llama_cpp`` and asks it a single
question, then loads a sentence-embedding model through
``sentence_transformers`` and encodes a single string. Each result is
printed so the setup can be checked by eye.

Both model paths are relative to the current working directory, so run
the script from the directory that contains ``models/``.
"""

from llama_cpp import Llama
from sentence_transformers import SentenceTransformer

# --- Text generation check -------------------------------------------------
# n_ctx is passed through to llama_cpp as the context size for the model.
llm = Llama(model_path="./models/phi-2.Q4_0.gguf", n_ctx=2048)
response = llm("What is the capital of France?")
# Print the whole response object as returned, not just the generated text.
print(response)

# --- Embedding check -------------------------------------------------------
model = SentenceTransformer("./models/embeddinggemma-300m")
emb = model.encode("Test string")
# Printing the shape is a quick way to confirm the embedding's dimensions.
print(emb.shape)