vision

Sleeping

App Files Files Community

abdullahalioo committed on Apr 28

Commit

6e02eb7

verified ·

1 Parent(s): 9373610

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -8

app.py CHANGED Viewed

@@ -3,7 +3,6 @@ from fastapi import FastAPI, HTTPException
 from fastapi.responses import StreamingResponse
 from openai import AsyncOpenAI
 from pydantic import BaseModel
-import asyncio
 # Initialize FastAPI app
 app = FastAPI()
@@ -16,9 +15,18 @@ class PromptRequest(BaseModel):
 token = os.getenv("GITHUB_TOKEN")
 if not token:
     raise ValueError("GITHUB_TOKEN environment variable not set")
-endpoint = "https://models.github.ai/inference"
-model = "openai/gpt-4.1-mini"
-client = AsyncOpenAI(base_url=endpoint, api_key=token)
 # Async generator to stream chunks
 async def stream_response(prompt: str):
@@ -39,10 +47,11 @@ async def stream_response(prompt: str):
         async for chunk in stream:
             if chunk.choices and len(chunk.choices) > 0:
                 content = chunk.choices[0].delta.content or ""
-                yield content
     except Exception as err:
-        yield f"Error: {err}"
 # Endpoint to handle prompt and stream response
 @app.post("/generate")
@@ -51,8 +60,12 @@ async def generate_response(request: PromptRequest):
         # Return a StreamingResponse with the async generator
         return StreamingResponse(
             stream_response(request.prompt),
-            media_type="text/plain"
         )
     except Exception as err:
-        raise HTTPException(status_code=500, detail=f"Server error: {err}")

 from fastapi.responses import StreamingResponse
 from openai import AsyncOpenAI
 from pydantic import BaseModel
 # Initialize FastAPI app
 app = FastAPI()
 token = os.getenv("GITHUB_TOKEN")
 if not token:
     raise ValueError("GITHUB_TOKEN environment variable not set")
+# Endpoint and model name come from the API_ENDPOINT / MODEL_NAME environment variables, falling back to the defaults below
+endpoint = os.getenv("API_ENDPOINT", "https://api.github.com/models")  # NOTE(review): this commit replaces "https://models.github.ai/inference" — confirm the default against the GitHub Models documentation
+model = os.getenv("MODEL_NAME", "gpt-4o-mini")  # NOTE(review): this commit replaces "openai/gpt-4.1-mini" — confirm the model id format the endpoint expects
+# Build the module-level AsyncOpenAI client for the configured endpoint, authenticated with the GITHUB_TOKEN value
+client = AsyncOpenAI(
+    base_url=endpoint,
+    api_key=token,
+    # Author's intent: avoid a proxies-related TypeError by not supplying a custom HTTP client
+    http_client=None  # NOTE(review): presumably the same as omitting the argument — confirm it is needed
+)
 # Async generator to stream chunks
 async def stream_response(prompt: str):
         async for chunk in stream:
             if chunk.choices and len(chunk.choices) > 0:
                 content = chunk.choices[0].delta.content or ""
+                if content:  # Only yield non-empty content
+                    yield content
     except Exception as err:
+        yield f"Error: {str(err)}"
 # Endpoint to handle prompt and stream response
 @app.post("/generate")
         # Return a StreamingResponse with the async generator
         return StreamingResponse(
             stream_response(request.prompt),
+            media_type="text/event-stream"  # Use text/event-stream for streaming
         )
     except Exception as err:
+        raise HTTPException(status_code=500, detail=f"Server error: {str(err)}")
+# Health check endpoint for Hugging Face Spaces: GET / always returns the fixed payload below
+@app.get("/")
+async def health_check():
+    return {"status": "healthy"}  # static body; no call to the model endpoint is made here