Spaces:

viswadarshan06
/

Thirukkural_AI_Backend

Running

App Files Community

viswadarshan06 committed on Jul 13

Commit

1ba33db

verified ·

1 Parent(s): 6e1dfb9

Update app.py

Browse files

Files changed (1) hide show

app.py +11 -41

app.py CHANGED Viewed

@@ -4,36 +4,18 @@ from pydantic import BaseModel
 import faiss
 import pickle
 import numpy as np
-from transformers import AutoTokenizer, AutoModel
 import torch
-# Set cache to custom dir to avoid /.cache issues
 os.environ["HF_HOME"] = "/app/hf_cache"
 os.environ["TRANSFORMERS_CACHE"] = "/app/hf_cache"
-# Get Hugging Face token from environment (must be set in HF Space secrets)
-hf_token = os.getenv("HF_TOKEN")
-# Initialize FastAPI
 app = FastAPI()
-import shutil
-model_cache_path = "/app/hf_cache/models--viswadarshan06--paraphrase-multilingual-MiniLM-L12-v2-local"
-if os.path.exists(model_cache_path):
-    shutil.rmtree(model_cache_path)
-# ✅ Load your private model
-tokenizer = AutoTokenizer.from_pretrained(
-    "viswadarshan06/paraphrase-multilingual-MiniLM-L12-v2-local",
-    cache_dir="/app/hf_cache",
-    token=hf_token
-)
-model = AutoModel.from_pretrained(
-    "viswadarshan06/paraphrase-multilingual-MiniLM-L12-v2-local",
-    cache_dir="/app/hf_cache",
-    token=hf_token
-)
 # Load Thirukkural data
 with open("thirukkural_data.pkl", "rb") as f:
@@ -43,35 +25,23 @@ with open("thirukkural_data.pkl", "rb") as f:
 english_index = faiss.read_index("thirukkural_english_index.faiss")
 tamil_index = faiss.read_index("thirukkural_tamil_index.faiss")
-# Request schema
 class QueryRequest(BaseModel):
     query: str
     lang: str  # "en" or "ta"
     top_k: int = 3
-# Mean pooling (same as SentenceTransformer style)
-def mean_pooling(model_output, attention_mask):
-    token_embeddings = model_output[0]
-    input_mask_expanded = attention_mask.unsqueeze(-1).expand(token_embeddings.size()).float()
-    return torch.sum(token_embeddings * input_mask_expanded, 1) / torch.clamp(input_mask_expanded.sum(1), min=1e-9)
-# POST endpoint
 @app.post("/search/")
 def search_kural(req: QueryRequest):
-    encoded_input = tokenizer(req.query, padding=True, truncation=True, return_tensors="pt")
-    with torch.no_grad():
-        model_output = model(**encoded_input)
-        query_embedding = mean_pooling(model_output, encoded_input["attention_mask"])
-    query_embedding = query_embedding.detach().cpu().numpy()
     index = tamil_index if req.lang == "ta" else english_index
-    D, I = index.search(query_embedding.astype("float32"), req.top_k)
     results = [kural_data[i] for i in I[0]]
     return {"results": results}
-# Health check
 @app.get("/")
 def root():
-    return {"message": "Thirukkural FastAPI RAG is running with private model."}

 import faiss
 import pickle
 import numpy as np
+from sentence_transformers import SentenceTransformer
 import torch
+# Optional: set dummy cache paths if needed by other internal libs
 os.environ["HF_HOME"] = "/app/hf_cache"
 os.environ["TRANSFORMERS_CACHE"] = "/app/hf_cache"
+# Initialize FastAPI app
 app = FastAPI()
+# ✅ Load your locally uploaded SentenceTransformer model
+model = SentenceTransformer("/app/model")
 # Load Thirukkural data
 with open("thirukkural_data.pkl", "rb") as f:
 english_index = faiss.read_index("thirukkural_english_index.faiss")
 tamil_index = faiss.read_index("thirukkural_tamil_index.faiss")
+# Define request schema
 class QueryRequest(BaseModel):
     query: str
     lang: str  # "en" or "ta"
     top_k: int = 3
+# Search endpoint
 @app.post("/search/")
 def search_kural(req: QueryRequest):
+    query_embedding = model.encode([req.query])
     index = tamil_index if req.lang == "ta" else english_index
+    D, I = index.search(np.array(query_embedding).astype("float32"), req.top_k)
     results = [kural_data[i] for i in I[0]]
     return {"results": results}
+# Health check endpoint
 @app.get("/")
 def root():
+    return {"message": "Thirukkural FastAPI RAG is running with local model."}