Spaces:

Subhadip007
/

researchpilot-api

Running

App Files Community

Subhadip007 committed 9 days ago

Commit

99e045a

1 Parent(s): 88b90e7

fix(backend): bust docker cache + fix async streaming generator to not block event loop

Browse files

Files changed (2) hide show

Dockerfile +4 -0
src/api/main.py +40 -7

Dockerfile CHANGED Viewed

@@ -13,6 +13,10 @@ RUN apt-get update && apt-get install -y \
 COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
 # Copy source code
 COPY src/ ./src/
 COPY config/ ./config/

 COPY requirements.txt .
 RUN pip install --no-cache-dir -r requirements.txt
+# Cache-bust: forces Docker to re-copy source code on every build
+# This ensures HuggingFace always gets the latest code from git
+ARG CACHEBUST=20260411_1
 # Copy source code
 COPY src/ ./src/
 COPY config/ ./config/

src/api/main.py CHANGED Viewed

@@ -170,15 +170,48 @@ async def stream_query_papers(
     request:     Request,
     query_input: QueryRequest,
 ):
     pipeline = request.app.state.rag_pipeline
     return StreamingResponse(
-        pipeline.stream_query(
-            question        = query_input.question,
-            top_k           = query_input.top_k,
-            filter_category = query_input.filter_category,
-            filter_year_gte = query_input.filter_year_gte,
-        ),
-        media_type="text/event-stream"
     )
 @app.post(

     request:     Request,
     query_input: QueryRequest,
 ):
+    import asyncio
     pipeline = request.app.state.rag_pipeline
+    async def async_generator():
+        """
+        Wraps the synchronous pipeline.stream_query() generator in an
+        async-friendly way using a thread + asyncio.Queue so we never
+        block the FastAPI event loop.
+        """
+        loop = asyncio.get_event_loop()
+        queue: asyncio.Queue = asyncio.Queue()
+        SENTINEL = object()
+        def run_sync():
+            try:
+                for chunk in pipeline.stream_query(
+                    question        = query_input.question,
+                    top_k           = query_input.top_k,
+                    filter_category = query_input.filter_category,
+                    filter_year_gte = query_input.filter_year_gte,
+                ):
+                    loop.call_soon_threadsafe(queue.put_nowait, chunk)
+            finally:
+                loop.call_soon_threadsafe(queue.put_nowait, SENTINEL)
+        import threading
+        thread = threading.Thread(target=run_sync, daemon=True)
+        thread.start()
+        while True:
+            item = await queue.get()
+            if item is SENTINEL:
+                break
+            yield item
     return StreamingResponse(
+        async_generator(),
+        media_type="text/event-stream",
+        headers={
+            "Cache-Control": "no-cache",
+            "X-Accel-Buffering": "no",
+        }
     )
 @app.post(