# main.py — FastAPI chat frontend that proxies requests to a local Ollama instance.
  1. import json
  2. import logging
  3. import httpx
  4. from fastapi import FastAPI, HTTPException
  5. from fastapi.responses import HTMLResponse, StreamingResponse
  6. from fastapi.staticfiles import StaticFiles
  7. from pydantic import BaseModel
  8. from typing import List, Generator
  9. logging.basicConfig(level=logging.INFO)
  10. logger = logging.getLogger(__name__)
  11. app = FastAPI(title="LocalFoodAI Chat")
  12. OLLAMA_URL = "http://localhost:11434/api/chat"
  13. MODEL_NAME = "llama3.1:8b"
  14. # Mount static files to serve the frontend
  15. app.mount("/static", StaticFiles(directory="static"), name="static")
  16. class ChatMessage(BaseModel):
  17. role: str
  18. content: str
  19. class ChatRequest(BaseModel):
  20. messages: List[ChatMessage]
  21. @app.get("/", response_class=HTMLResponse)
  22. async def read_root():
  23. """Serve the chat interface HTML"""
  24. try:
  25. with open("static/index.html", "r", encoding="utf-8") as f:
  26. return HTMLResponse(content=f.read())
  27. except FileNotFoundError:
  28. return HTMLResponse(content="<h1>Welcome to LocalFoodAI</h1><p>static/index.html not found. Please create the frontend.</p>")
  29. @app.post("/chat")
  30. async def chat_endpoint(request: ChatRequest):
  31. """Proxy chat requests to the local Ollama instance with streaming support"""
  32. payload = {
  33. "model": MODEL_NAME,
  34. "messages": [msg.model_dump() for msg in request.messages],
  35. "stream": True # Enable streaming for a better UI experience
  36. }
  37. async def generate_response():
  38. try:
  39. async with httpx.AsyncClient() as client:
  40. async with client.stream("POST", OLLAMA_URL, json=payload, timeout=120.0) as response:
  41. if response.status_code != 200:
  42. error_detail = await response.aread()
  43. logger.error(f"Error communicating with Ollama: {error_detail}")
  44. yield f"data: {json.dumps({'error': 'Error communicating with local LLM.'})}\n\n"
  45. return
  46. async for line in response.aiter_lines():
  47. if line:
  48. data = json.loads(line)
  49. if "message" in data and "content" in data["message"]:
  50. content = data["message"]["content"]
  51. yield f"data: {json.dumps({'content': content})}\n\n"
  52. if data.get("done"):
  53. break
  54. except Exception as e:
  55. logger.error(f"Unexpected error during stream: {e}")
  56. yield f"data: {json.dumps({'error': str(e)})}\n\n"
  57. return StreamingResponse(generate_response(), media_type="text/event-stream")
  58. if __name__ == "__main__":
  59. import uvicorn
  60. uvicorn.run("main:app", host="127.0.0.1", port=8000, reload=True)