Spaces:
Sleeping
Sleeping
| # model_loader.py | |
| from langchain_community.chat_models import ChatLlamaCpp | |
| import os | |
# Module-level cache holding the single ChatLlamaCpp instance once it exists.
_llm_instance = None


def get_model(callbacks=None):
    """Return the shared ``ChatLlamaCpp`` model, building it on first use.

    The first call constructs the model from the GGUF file located at
    ``<this module's directory>/../Model/`` and stores it in the
    module-level ``_llm_instance``; every later call returns that same
    object without reloading. No locking is performed around the
    first-time construction.

    Args:
        callbacks: Accepted for caller compatibility. NOTE(review): this
            argument is never read in the body, so it is not forwarded to
            the model -- confirm whether that is intended.

    Returns:
        The cached ``ChatLlamaCpp`` instance.
    """
    global _llm_instance

    # Fast path: an earlier call already loaded the model.
    if _llm_instance is not None:
        return _llm_instance

    # Resolve the model file relative to this module, not the working directory.
    module_dir = os.path.dirname(__file__)
    model_path = os.path.abspath(
        os.path.join(
            module_dir,
            os.pardir,
            "Model",
            "qwen2.5-0.5b-coding-assistant-q4_k_m.gguf",
        )
    )
    print(f"Loading ChatLlamaCpp model from local path: {model_path}")

    # Hard-coded generation and runtime settings passed to the constructor.
    llama_settings = {
        "model_path": model_path,
        "temperature": 0.7,
        "max_tokens": 1000,
        "n_ctx": 4096,
        "n_batch": 512,
        "n_threads": 8,
        "n_gpu_layers": 0,
        "verbose": False,
    }
    _llm_instance = ChatLlamaCpp(**llama_settings)
    print("Model loaded successfully!")
    return _llm_instance