blob: 2f41fe5df956b01a3c4fd61a9d52267d85eb8311 [file] [log] [blame]
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
from typing import Optional, List
import os
import qianfan
"""
"QianFan" platform can be understood as a unified LLM platform that encompasses the
WenXin large model along with other
common open-source models.
It enables the invocation and switching between WenXin and these open-source models.
"""
class QianFanEmbedding:
def __init__(
self,
model_name: str = "embedding-v1",
api_key: Optional[str] = None,
secret_key: Optional[str] = None
):
qianfan.get_config().AK = api_key or os.getenv("QIANFAN_ACCESS_KEY")
qianfan.get_config().SK = secret_key or os.getenv("QIANFAN_SECRET_KEY")
self.embedding_model_name = model_name
self.client = qianfan.Embedding()
def get_text_embedding(self, text: str) -> List[float]:
""" Usage refer: https://cloud.baidu.com/doc/WENXINWORKSHOP/s/hlmokk9qn"""
response = self.client.do(
model=self.embedding_model_name,
texts=[text]
)
return response["body"]["data"][0]["embedding"]
async def async_get_text_embedding(self, text: str) -> List[float]:
""" Usage refer: https://cloud.baidu.com/doc/WENXINWORKSHOP/s/hlmokk9qn"""
response = await self.client.ado(
model=self.embedding_model_name,
texts=[text]
)
return response["body"]["data"][0]["embedding"]