thecuong committed on
Commit 2da3321 · 1 Parent(s): 606b7eb

feat: fastAPI

Files changed (3)
  1. Dockerfile +1 -1
  2. app.py +68 -1
  3. requirements.txt +4 -2
Dockerfile CHANGED
@@ -1,7 +1,7 @@
  # read the doc: https://huggingface.co/docs/hub/spaces-sdks-docker
  # you will also find guides on how best to write your Dockerfile

- FROM python:3.9
+ FROM python:3.10

  RUN useradd -m -u 1000 user
  USER user
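The hunk above only covers the first seven lines of the Dockerfile; the rest of the file is unchanged and not shown in this diff. For orientation, the Docker Spaces guide linked in the file header builds FastAPI images roughly along these lines (a sketch of the usual pattern, not the repository's actual file; the paths and the port-7860 CMD are assumptions):

    # Sketch only: typical continuation of a FastAPI Docker Space (not part of this diff)
    ENV PATH="/home/user/.local/bin:$PATH"
    WORKDIR /app
    COPY --chown=user ./requirements.txt requirements.txt
    RUN pip install --no-cache-dir --upgrade -r requirements.txt
    COPY --chown=user . /app
    # Spaces route traffic to port 7860 by default
    CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]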
app.py CHANGED
@@ -1,7 +1,74 @@
+ import os
+ from typing import List
  from fastapi import FastAPI
+ from pydantic import BaseModel
+ from llama_index.vector_stores.milvus import MilvusVectorStore
+ from llama_index.embeddings.huggingface import HuggingFaceEmbedding
+ # from llama_index.core.postprocessor import SentenceTransformerRerank
+ from llama_index.core import VectorStoreIndex
+ from llama_index.core import Settings

  app = FastAPI()

+ # rerank = SentenceTransformerRerank(
+ #     model="cross-encoder/ms-marco-MiniLM-L-2-v2", top_n=3
+ # )
+ Settings.embed_model = HuggingFaceEmbedding(model_name="BAAI/bge-small-en-v1.5",
+                                             cache_folder=".cache")
+
+ vector_store = MilvusVectorStore(
+     overwrite=False,
+     uri=os.getenv('MILVUS_CLOUD_URI'),
+     token=os.getenv('MILVUS_CLOUD_TOKEN'),
+     collection_name=os.getenv('COLLECTION_NAME'),
+     dim=384,
+ )
+
  @app.get("/")
  def greet_json():
-     return {"Hello": "World!"}
+     return {"Hello": "World!"}
+
+ class SearchRequest(BaseModel):
+     query: str
+     limit: int = 10
+
+ class Metadata(BaseModel):
+     window: str
+     original_text: str
+
+ class MyNodeWithScore(BaseModel):
+     node: Metadata
+     relationships: List[Metadata]
+     score: float
+
+ class MyResult(BaseModel):
+     results: List[MyNodeWithScore]
+
+
+ @app.post("/search/")
+ def search(search_request: SearchRequest):
+     sentence_index = VectorStoreIndex.from_vector_store(vector_store=vector_store)
+
+     retriever = sentence_index.as_retriever(
+         include_text=True,  # include source chunk with matching paths
+         similarity_top_k=search_request.limit,
+         # node_postprocessors=[rerank]
+     )
+
+     result_retriever_engine = retriever.retrieve(search_request.query)
+
+     node_with_score_list = MyResult(results=[MyNodeWithScore(
+         node=Metadata(window=result.metadata['window'],
+                       original_text=result.metadata['original_text']),
+         relationships=[
+             Metadata(window=relationship.metadata.get('window', " "),
+                      original_text=relationship.metadata.get('original_text', " ")
+                      ) for key, relationship in result.node.relationships.items()
+         ],
+         score=result.get_score()) for result in result_retriever_engine])
+
+     # node_with_score_list = [json.loads(result.json()) for result in query_engine]
+
+     return node_with_score_list
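With the Space running, the new POST /search/ route can be exercised from any HTTP client. A minimal Python sketch (the base URL is a placeholder; the JSON body mirrors SearchRequest and the response mirrors MyResult as defined above):

    # Client-side sketch: query the /search/ endpoint added in this commit.
    import requests  # client-only dependency, not part of requirements.txt

    BASE_URL = "http://localhost:7860"  # placeholder for the deployed Space URL

    resp = requests.post(
        f"{BASE_URL}/search/",
        json={"query": "what does the corpus say about embeddings?", "limit": 5},
    )
    resp.raise_for_status()

    # MyResult shape: {"results": [{"node": {...}, "relationships": [...], "score": ...}, ...]}
    for hit in resp.json()["results"]:
        print(round(hit["score"], 3), hit["node"]["original_text"][:80])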
requirements.txt CHANGED
@@ -1,2 +1,4 @@
- fastapi
- uvicorn[standard]
+ fastapi==0.111.0
+ uvicorn[standard]==0.30.1
+ llama-index-vector-stores-milvus==0.1.20
+ llama-index-embeddings-huggingface==0.2.2
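The pins make the Milvus and HuggingFace embedding integrations explicit alongside FastAPI and uvicorn. To try the app outside Docker, the same pins can be installed and the server launched directly; the three environment variables read in app.py must be set before the module is imported. A sketch with placeholder values (port 7860 is only the Spaces default, any free port works locally):

    # Local-run sketch: values below are placeholders, not the project's real settings.
    import os
    import uvicorn

    os.environ.setdefault("MILVUS_CLOUD_URI", "https://<your-milvus-endpoint>")
    os.environ.setdefault("MILVUS_CLOUD_TOKEN", "<your-token>")
    os.environ.setdefault("COLLECTION_NAME", "<your-collection>")

    # uvicorn imports app.py after the environment is populated above
    uvicorn.run("app:app", host="0.0.0.0", port=7860)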