Spaces:

junaid17
/

Cortex-Coder

Sleeping

Update scripts/load_model.py

e31573a verified 18 days ago

807 Bytes

	# model_loader.py
	from langchain_community.chat_models import ChatLlamaCpp
	import os

	_llm_instance = None

	def get_model(callbacks=None):
	global _llm_instance
	if _llm_instance is None:
	model_path = os.path.join(os.path.dirname(__file__), os.pardir, "Model", "qwen2.5-0.5b-coding-assistant-q4_k_m.gguf")
	model_path = os.path.abspath(model_path)
	print(f"Loading ChatLlamaCpp model from local path: {model_path}")
	_llm_instance = ChatLlamaCpp(
	model_path=model_path,
	temperature=0.7,
	max_tokens=1000,
	n_ctx=4096,
	n_batch=512,
	n_threads=8,
	n_gpu_layers=0,
	verbose=False,
	)
	print("Model loaded successfully!")
	return _llm_instance