llm.py 3.1 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667
  1. # coding=utf-8
  2. from typing import Dict
  3. from django.utils.translation import gettext_lazy as _, gettext
  4. from langchain_core.messages import HumanMessage
  5. from common import forms
  6. from common.exception.app_exception import AppApiException
  7. from common.forms import BaseForm, TooltipLabel
  8. from models_provider.base_model_provider import BaseModelCredential, ValidCode
  class XinferenceLLMModelParams(BaseForm):
      """Form declaring the adjustable generation parameters of an Xinference LLM.

      Exposes two slider fields: ``temperature`` and ``max_tokens``.
      """

      # Slider from 0.1 to 1.0 in steps of 0.01 (two decimals), defaulting to 0.7.
      temperature = forms.SliderField(
          TooltipLabel(
              _('Temperature'),
              _('Higher values make the output more random, while lower values make it more focused and deterministic'),
          ),
          _min=0.1,
          _max=1.0,
          _step=0.01,
          precision=2,
          default_value=0.7,
          required=True,
      )

      # Integer slider from 1 to 100000 in steps of 1, defaulting to 800.
      max_tokens = forms.SliderField(
          TooltipLabel(
              _('Output the maximum Tokens'),
              _('Specify the maximum number of tokens that the model can generate'),
          ),
          _min=1,
          _max=100000,
          _step=1,
          precision=0,
          default_value=800,
          required=True,
      )
  class XinferenceLLMModelCredential(BaseForm, BaseModelCredential):
      """Credential form and validator for an Xinference LLM model.

      Declares the ``api_base`` and ``api_key`` form fields and provides the
      hooks used to validate, encrypt and load a stored credential.
      """

      def is_valid(self, model_type: str, model_name, model_credential: Dict[str, object], model_params, provider,
                   raise_exception=False):
          """Check the credential by querying the provider and invoking the model.

          Args:
              model_type: Model type value; it must equal the ``value`` of one
                  entry returned by ``provider.get_model_type_list()``.
              model_name: Name looked up in the provider's model list.
              model_credential: Mapping read for ``api_base`` and ``api_key``.
              model_params: Keyword arguments forwarded to ``provider.get_model``.
              provider: Object supplying the model type list, the base model
                  list, the name lookup and the model factory.
              raise_exception: Accepted for interface compatibility; this
                  implementation does not consult it and always raises on failure.

          Returns:
              ``True`` when every check passes and the test invocation completes.

          Raises:
              AppApiException: If the model type is not supported, the model
                  list cannot be fetched, or the model is not in that list.
              Exception: Any error raised while building or invoking the model
                  propagates unchanged.
          """
          # Test the match itself instead of the truthiness of the matched entries.
          is_supported = any(mt.get('value') == model_type for mt in provider.get_model_type_list())
          if not is_supported:
              raise AppApiException(ValidCode.valid_error.value,
                                    gettext('{model_type} Model type is not supported').format(model_type=model_type))
          try:
              model_list = provider.get_base_model_list(model_credential.get('api_base'),
                                                        model_credential.get('api_key'),
                                                        model_type)
          except Exception as e:
              # Chain the original failure so the root cause stays visible in tracebacks.
              raise AppApiException(ValidCode.valid_error.value, gettext('API domain name is invalid')) from e
          # An empty (or missing) lookup result means the model is not available.
          if not provider.get_model_info_by_name(model_list, model_name):
              raise AppApiException(ValidCode.valid_error.value,
                                    gettext('The model does not exist, please download the model first'))
          model = provider.get_model(model_type, model_name, model_credential, **model_params)
          # Send a short prompt as a final check; an error here propagates to the caller.
          model.invoke([HumanMessage(content=gettext('Hello'))])
          return True

      def encryption_dict(self, model_info: Dict[str, object]):
          """Return a copy of ``model_info`` whose ``api_key`` went through ``encryption``.

          A missing ``api_key`` is treated as the empty string.
          """
          return {**model_info, 'api_key': super().encryption(model_info.get('api_key', ''))}

      def build_model(self, model_info: Dict[str, object]):
          """Load ``api_key`` from ``model_info`` onto this instance and return ``self``.

          Raises:
              AppApiException: With code 500 if ``api_key`` or ``model`` is
                  missing from ``model_info``.
          """
          for key in ['api_key', 'model']:
              if key not in model_info:
                  raise AppApiException(500, gettext('{key} is required').format(key=key))
          self.api_key = model_info.get('api_key')
          return self

      # Form fields collected from the user for this credential.
      api_base = forms.TextInputField('API URL', required=True)
      api_key = forms.PasswordInputField('API Key', required=True)

      def get_model_params_setting_form(self, model_name):
          """Return a new ``XinferenceLLMModelParams`` form; ``model_name`` is not used."""
          return XinferenceLLMModelParams()