Spaces:

HamidOmarov
/

FastAPI-RAG-API

Sleeping

App Files Community

HamidOmarov committed on Aug 10, 2025

Commit

a7ef914

1 Parent(s): 70b60a8

Clean Dockerfile; pre-translate paragraphs; add /debug/translate

Browse files

Files changed (3) hide show

Dockerfile +1 -1
app/api.py +13 -0
app/rag_system.py +6 -6

Dockerfile CHANGED Viewed

@@ -14,7 +14,7 @@ WORKDIR /app
 RUN apt-get update && apt-get install -y --no-install-recommends build-essential \
  && rm -rf /var/lib/apt/lists/*
-# Bust pip cache layer when requirements change
 ARG CACHEBUST=20250810
 COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt

 RUN apt-get update && apt-get install -y --no-install-recommends build-essential \
  && rm -rf /var/lib/apt/lists/*
+# Bust pip cache when requirements change
 ARG CACHEBUST=20250810
 COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt

app/api.py CHANGED Viewed

@@ -5,6 +5,19 @@ from fastapi.responses import JSONResponse, RedirectResponse
 from pathlib import Path
 import shutil
 import traceback
 from .rag_system import SimpleRAG, UPLOAD_DIR, synthesize_answer as summarize
 from .schemas import AskRequest, AskResponse, UploadResponse, HistoryResponse, HistoryItem

 from pathlib import Path
 import shutil
 import traceback
+# app/api.py (placed below the imports)
+from fastapi.responses import JSONResponse
+@app.get("/debug/translate")
+def debug_translate():
+    try:
+        from transformers import pipeline
+        tr = pipeline("translation", model="Helsinki-NLP/opus-mt-az-en", cache_dir=str(CACHE_DIR), device=-1)
+        out = tr("Sənəd təmiri və quraşdırılması ilə bağlı işlər görülüb.", max_length=80)[0]["translation_text"]
+        return {"ok": True, "example_in": "Sənəd təmiri və quraşdırılması ilə bağlı işlər görülüb.", "example_out": out}
+    except Exception as e:
+        return JSONResponse(status_code=500, content={"ok": False, "error": str(e)})
 from .rag_system import SimpleRAG, UPLOAD_DIR, synthesize_answer as summarize
 from .schemas import AskRequest, AskResponse, UploadResponse, HistoryResponse, HistoryItem

app/rag_system.py CHANGED Viewed

@@ -114,7 +114,7 @@ class SimpleRAG:
         chunks: List[str] = []
         for txt in pages:
             for i in range(0, len(txt), step):
-                part = txt[i:i+step].strip()
                 if part:
                     chunks.append(part)
         return chunks
@@ -162,20 +162,20 @@ class SimpleRAG:
         if not contexts:
             return "No relevant context found. Please upload a PDF or ask a more specific question."
-        # 1) Clean & keep top contexts
         cleaned_contexts = [_clean_for_summary(c) for c in contexts[:5]]
         cleaned_contexts = [c for c in cleaned_contexts if len(c) > 40]
         if not cleaned_contexts:
             return "The document appears largely tabular/numeric; couldn't extract readable sentences."
-        # 2) Pre-translate paragraphs to EN (if output language is EN)
         if OUTPUT_LANG == "en":
             try:
                 cleaned_contexts = self._translate_to_en(cleaned_contexts)
             except Exception:
                 pass
-        # 3) Split into candidate sentences and filter
         candidates: List[str] = []
         for para in cleaned_contexts:
             for s in _split_sentences(para):
@@ -189,13 +189,13 @@ class SimpleRAG:
         if not candidates:
             return "The document appears largely tabular/numeric; couldn't extract readable sentences."
-        # 4) Rank by similarity
         q_emb = self.model.encode([question], convert_to_numpy=True, normalize_embeddings=True).astype(np.float32)
         cand_emb = self.model.encode(candidates, convert_to_numpy=True, normalize_embeddings=True).astype(np.float32)
         scores = (cand_emb @ q_emb.T).ravel()
         order = np.argsort(-scores)
-        # 5) Aggressive near-duplicate removal
         selected: List[str] = []
         for i in order:
             s = candidates[i].strip()

         chunks: List[str] = []
         for txt in pages:
             for i in range(0, len(txt), step):
+                part = txt[i : i + step].strip()
                 if part:
                     chunks.append(part)
         return chunks
         if not contexts:
             return "No relevant context found. Please upload a PDF or ask a more specific question."
+        # 1) Clean top contexts
         cleaned_contexts = [_clean_for_summary(c) for c in contexts[:5]]
         cleaned_contexts = [c for c in cleaned_contexts if len(c) > 40]
         if not cleaned_contexts:
             return "The document appears largely tabular/numeric; couldn't extract readable sentences."
+        # 2) Pre-translate paragraphs to EN (if target is EN)
         if OUTPUT_LANG == "en":
             try:
                 cleaned_contexts = self._translate_to_en(cleaned_contexts)
             except Exception:
                 pass
+        # 3) Split into sentence candidates & filter
         candidates: List[str] = []
         for para in cleaned_contexts:
             for s in _split_sentences(para):
         if not candidates:
             return "The document appears largely tabular/numeric; couldn't extract readable sentences."
+        # 4) Rank by similarity to question
         q_emb = self.model.encode([question], convert_to_numpy=True, normalize_embeddings=True).astype(np.float32)
         cand_emb = self.model.encode(candidates, convert_to_numpy=True, normalize_embeddings=True).astype(np.float32)
         scores = (cand_emb @ q_emb.T).ravel()
         order = np.argsort(-scores)
+        # 5) Aggressive near-duplicate removal (Jaccard >= 0.90)
         selected: List[str] = []
         for i in order:
             s = candidates[i].strip()