sqfoo's picture
Update llm.py
ea4c290 verified
Raw
History Blame Contribute Delete
1.08 kB
from langchain_huggingface import ChatHuggingFace, HuggingFaceEndpoint
HUGGINGFACE = {
'type': 'huggingface',
'param':{
'repo_id': "Qwen/Qwen2.5-7B-Instruct",
'task': 'text-generation',
'max_new_tokens': 512,
'do_sample': False,
'repetition_penalty': 1.03,
'provider': 'auto',
},
'model': 'huggingface:Qwen2.5-7B-Instruct',
}
HUGGINGFACE_LITE = {
'type': 'huggingface-lite',
'param':{
'repo_id': "Qwen/Qwen2.5-1.5B-Instruct",
'task': 'text-generation',
'max_new_tokens': 512,
'do_sample': False,
'repetition_penalty': 1.03,
'provider': 'auto',
},
'model': 'huggingface:Qwen2.5-1.5B-Instruct',
}
valid_LLM = [HUGGINGFACE, HUGGINGFACE_LITE]
def setup_model(config: dict, API_KEY: str, callbacks=None):
if config['type'].startswith('huggingface'):
llm = HuggingFaceEndpoint(huggingfacehub_api_token=API_KEY, **config['param'])
model = ChatHuggingFace(llm=llm, callbacks=callbacks)
else:
model = None
return model