Skip to content

Commit d5db882

Browse files
Fix embedding issue with ArangoDB due to deprecated HuggingFace API (#1694)
Signed-off-by: lvliang-intel <[email protected]>
1 parent: bc1e498 · commit: d5db882

File tree

2 files changed

+9
-6
lines changed

2 files changed

+9
-6
lines changed

comps/dataprep/src/integrations/arangodb.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -10,12 +10,11 @@
1010
from fastapi import Body, File, Form, HTTPException, UploadFile
1111
from langchain.text_splitter import RecursiveCharacterTextSplitter
1212
from langchain_arangodb import ArangoGraph
13-
from langchain_community.embeddings import HuggingFaceHubEmbeddings
1413
from langchain_core.documents import Document
1514
from langchain_core.embeddings import Embeddings
1615
from langchain_core.prompts import ChatPromptTemplate
1716
from langchain_experimental.graph_transformers import LLMGraphTransformer
18-
from langchain_huggingface import HuggingFaceEmbeddings
17+
from langchain_huggingface import HuggingFaceEmbeddings, HuggingFaceEndpointEmbeddings
1918
from langchain_openai import ChatOpenAI, OpenAIEmbeddings
2019
from langchain_text_splitters import HTMLHeaderTextSplitter
2120

@@ -200,8 +199,9 @@ def _initialize_embeddings(self):
200199
"""Initialize the embeddings model."""
201200

202201
if TEI_EMBEDDING_ENDPOINT and HUGGINGFACEHUB_API_TOKEN:
203-
self.embeddings = HuggingFaceHubEmbeddings(
202+
self.embeddings = HuggingFaceEndpointEmbeddings(
204203
model=TEI_EMBEDDING_ENDPOINT,
204+
task="feature-extraction",
205205
huggingfacehub_api_token=HUGGINGFACEHUB_API_TOKEN,
206206
)
207207
elif TEI_EMBED_MODEL:

comps/retrievers/src/integrations/arangodb.py

Lines changed: 6 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -9,7 +9,8 @@
99
from arango.database import StandardDatabase
1010
from fastapi import HTTPException
1111
from langchain_arangodb import ArangoVector
12-
from langchain_community.embeddings import HuggingFaceBgeEmbeddings, HuggingFaceHubEmbeddings
12+
from langchain_community.embeddings import HuggingFaceBgeEmbeddings
13+
from langchain_huggingface import HuggingFaceEndpointEmbeddings
1314
from langchain_openai import ChatOpenAI, OpenAIEmbeddings
1415

1516
from comps import CustomLogger, EmbedDoc, OpeaComponent, OpeaComponentRegistry, ServiceType
@@ -421,8 +422,10 @@ async def invoke(
421422
if OPENAI_API_KEY and OPENAI_EMBED_MODEL and OPENAI_EMBED_ENABLED:
422423
embeddings = OpenAIEmbeddings(model=OPENAI_EMBED_MODEL, dimensions=dimension)
423424
elif TEI_EMBEDDING_ENDPOINT and HUGGINGFACEHUB_API_TOKEN:
424-
embeddings = HuggingFaceHubEmbeddings(
425-
model=TEI_EMBEDDING_ENDPOINT, huggingfacehub_api_token=HUGGINGFACEHUB_API_TOKEN
425+
embeddings = HuggingFaceEndpointEmbeddings(
426+
model=TEI_EMBEDDING_ENDPOINT,
427+
task="feature-extraction",
428+
huggingfacehub_api_token=HUGGINGFACEHUB_API_TOKEN,
426429
)
427430
else:
428431
embeddings = HuggingFaceBgeEmbeddings(model_name=TEI_EMBED_MODEL)

0 commit comments

Comments
 (0)