Spaces:

Zeri00
/

Cogni-Chat-document-reader-v2

Sleeping

riteshraut committed 25 days ago

Commit

57bb94b

1 Parent(s): 2c5dd57

upgraded embedding

Files changed (2) hide show

Dockerfile CHANGED Viewed

@@ -13,6 +13,12 @@ RUN apt-get update && apt-get install -y \
 # Create a non-root user early
 RUN useradd --create-home --shell /bin/bash --uid 1000 appuser
 # Copy and install Python requirements as root first
 COPY requirements.txt .
 RUN pip install --no-cache-dir --upgrade pip

 # Create a non-root user early
 RUN useradd --create-home --shell /bin/bash --uid 1000 appuser
+# Declare HF_TOKEN as a build argument so the Hugging Face token can be passed in at build time
+ARG HF_TOKEN
+# Log in to the Hugging Face Hub using the HF_TOKEN build argument
+RUN huggingface-cli login --token $HF_TOKEN
 # Copy and install Python requirements as root first
 COPY requirements.txt .
 RUN pip install --no-cache-dir --upgrade pip

app.py CHANGED Viewed

@@ -10,6 +10,7 @@ import re
 import io
 from gtts import gTTS
 from langchain_core.documents import Document
 from langchain_community.document_loaders import (
     TextLoader,
     Docx2txtLoader,
@@ -48,9 +49,11 @@ doc_stores = {} # To hold the InMemoryStore for each session
 print("Loading embedding model...")
 try:
     EMBEDDING_MODEL = HuggingFaceEmbeddings(
         model_name="google/embeddinggemma-300m",
-        model_kwargs={'device': 'cpu'}
     )
     print("Embedding model loaded successfully.")
 except Exception as e:

 import io
 from gtts import gTTS
 from langchain_core.documents import Document
 from langchain_community.document_loaders import (
     TextLoader,
     Docx2txtLoader,
 print("Loading embedding model...")
 try:
+    hf_token = os.getenv("HF_TOKEN")
     EMBEDDING_MODEL = HuggingFaceEmbeddings(
         model_name="google/embeddinggemma-300m",
+        model_kwargs={'device': 'cpu'},
+        encode_kwargs={'normalize_embeddings': True},
     )
     print("Embedding model loaded successfully.")
 except Exception as e: