# model_loader.py
from langchain_community.chat_models import ChatLlamaCpp
import os
# Module-level cache for the loaded model. Starts as None and is assigned by
# get_model() the first time the model is constructed.
_llm_instance = None
def get_model(callbacks=None):
    """Return the shared ChatLlamaCpp instance, loading it on first use.

    The model is constructed at most once per process and stored in the
    module-level ``_llm_instance``; later calls return that same object
    without building it again.

    Args:
        callbacks: Optional LangChain callbacks to attach to the model. They
            are handed to the ``ChatLlamaCpp`` constructor, so they only take
            effect on the call that actually builds the model. When an
            instance is already cached this argument is not applied.

    Returns:
        The cached ``ChatLlamaCpp`` instance.
    """
    global _llm_instance

    # Fast path: the model has already been built, reuse it.
    if _llm_instance is not None:
        return _llm_instance

    # The GGUF file is resolved relative to this module: one directory up,
    # then into "Model".
    model_path = os.path.abspath(
        os.path.join(
            os.path.dirname(__file__),
            os.pardir,
            "Model",
            "qwen2.5-0.5b-coding-assistant-q4_k_m.gguf",
        )
    )
    print(f"Loading ChatLlamaCpp model from local path: {model_path}")

    _llm_instance = ChatLlamaCpp(
        model_path=model_path,
        temperature=0.7,
        max_tokens=1000,
        n_ctx=4096,
        n_batch=512,
        n_threads=8,
        n_gpu_layers=0,
        verbose=False,
        # Previously the parameter was accepted but dropped; None (the
        # default) matches the constructor's own default.
        callbacks=callbacks,
    )
    print("Model loaded successfully!")
    return _llm_instance
|