embedding.py 2.1 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465
  1. # coding=utf-8
  2. """
  3. @project: MaxKB
  4. @Author:虎
  5. @file: embedding.py
  6. @date:2024/10/17 16:48
  7. @desc:
  8. """
  9. from typing import Dict, List
  10. from langchain_community.embeddings import QianfanEmbeddingsEndpoint
  11. import openai
  12. from models_provider.base_model_provider import MaxKBBaseModel
  13. class QianfanV1Embeddings(MaxKBBaseModel, QianfanEmbeddingsEndpoint):
  14. @staticmethod
  15. def new_instance(model_type, model_name, model_credential: Dict[str, object], **model_kwargs):
  16. return QianfanV1Embeddings(
  17. model=model_name,
  18. qianfan_ak=model_credential.get('qianfan_ak'),
  19. qianfan_sk=model_credential.get('qianfan_sk'),
  20. )
  21. class QianfanV2EmbeddingModel(MaxKBBaseModel):
  22. model_name: str
  23. @staticmethod
  24. def is_cache_model():
  25. return False
  26. def __init__(self, api_key, base_url, model_name: str):
  27. self.client = openai.OpenAI(api_key=api_key, base_url=base_url).embeddings
  28. self.model_name = model_name
  29. @staticmethod
  30. def new_instance(model_type, model_name, model_credential: Dict[str, object], **model_kwargs):
  31. return QianfanV2EmbeddingModel(
  32. api_key=model_credential.get('qianfan_ak'),
  33. model_name=model_name,
  34. base_url=model_credential.get('api_base'),
  35. )
  36. def embed_query(self, text: str):
  37. res = self.embed_documents([text])
  38. return res[0]
  39. def embed_documents(
  40. self, texts: List[ str],
  41. ) -> List[List[float]]:
  42. res = self.client.create(input=texts, model=self.model_name, encoding_format="float")
  43. return [e.embedding for e in res.data]
  44. class QianfanEmbeddings(MaxKBBaseModel):
  45. @staticmethod
  46. def new_instance(model_type, model_name, model_credential: Dict[str, object], **model_kwargs):
  47. api_version = model_credential.get('api_version', 'v1')
  48. if api_version == "v1":
  49. return QianfanV1Embeddings.new_instance(model_type, model_name, model_credential, **model_kwargs)
  50. elif api_version == "v2":
  51. return QianfanV2EmbeddingModel.new_instance(model_type, model_name, model_credential, **model_kwargs)