Spaces:

ProfessorCEO
/

coolshot-ai-backend

Running

App Files Files Community

Local AI Assistant committed 17 days ago

Commit

7b9724a

1 Parent(s): a016784

Split services: Remove Auth/DB/Image from main API, proxy image requests

Browse files

Files changed (2) hide show

Dockerfile +25 -14
api.py +27 -105

Dockerfile CHANGED Viewed

@@ -1,23 +1,34 @@
-# Use Python 3.10
-FROM python:3.10
 # Set working directory
 WORKDIR /app
-# Copy requirements and install dependencies
 COPY requirements.txt .
-RUN pip install --no-cache-dir -r requirements.txt
-# Copy the rest of the application
-COPY . .
-# Create a writable directory for cache (Hugging Face requirement)
-RUN mkdir -p /app/cache
-ENV XDG_CACHE_HOME=/app/cache
-RUN chmod -R 777 /app/cache
-# Expose port 7860 (Hugging Face default)
-EXPOSE 7860
-# Run the application
-CMD ["uvicorn", "api:app", "--host", "0.0.0.0", "--port", "7860"]

+# Use a lightweight Python base image
+FROM python:3.10-slim
+# Set environment variables
+ENV PYTHONDONTWRITEBYTECODE=1 \
+    PYTHONUNBUFFERED=1 \
+    PORT=8080
 # Set working directory
 WORKDIR /app
+# Install system dependencies
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    build-essential \
+    git \
+    && rm -rf /var/lib/apt/lists/*
+# Copy requirements file
 COPY requirements.txt .
+# Install Python dependencies
+# Note: We install the CPU-only version of torch to keep the image size smaller;
+# Cloud Run is CPU-only by default anyway.
+RUN pip install --no-cache-dir --upgrade pip && \
+    pip install --no-cache-dir -r requirements.txt
+# Copy application code
+COPY . .
+# Expose the port
+EXPOSE 8080
+# Command to run the application
+CMD ["uvicorn", "api:app", "--host", "0.0.0.0", "--port", "8080"]

api.py CHANGED Viewed

@@ -14,13 +14,13 @@ import os
 import base64
 from chat_engine import ChatEngine
-from image_engine import ImageEngine
 from rag_engine import RAGEngine
 import models
 import shutil
 import schemas
 import firebase_admin
 from firebase_admin import credentials, firestore, auth
 # Initialize FastAPI
 app = FastAPI()
@@ -34,32 +34,15 @@ app.add_middleware(
     allow_headers=["*"],
 )
-# Initialize Firebase Admin
 if not firebase_admin._apps:
-    if os.path.exists("serviceAccountKey.json"):
-        cred = credentials.Certificate("serviceAccountKey.json")
-    else:
-        # Try getting from env var (for Hugging Face)
-        key_json = os.environ.get("FIREBASE_SERVICE_ACCOUNT_KEY")
-        if key_json:
-            import json
-            cred_dict = json.loads(key_json)
-            cred = credentials.Certificate(cred_dict)
-        else:
-            print("Warning: No service account key found. Firebase features will fail.")
-            cred = None
-    if cred:
-        firebase_admin.initialize_app(cred)
-if firebase_admin._apps:
-    db = firestore.client()
-else:
-    db = None
 # Global engine instances (Lazy loaded)
 chat_engine = None
-image_engine = None
 rag_engine = None
 def get_chat_engine():
@@ -69,13 +52,6 @@ def get_chat_engine():
         chat_engine = ChatEngine()
     return chat_engine
-def get_image_engine():
-    global image_engine
-    if image_engine is None:
-        print("Lazy loading Image Engine...")
-        image_engine = ImageEngine()
-    return image_engine
 def get_rag_engine():
     global rag_engine
     if rag_engine is None:
@@ -237,60 +213,20 @@ def read_root():
     return {"status": "Backend is running", "message": "Go to /docs to see the API"}
 @app.post("/chat")
-async def chat(request: ChatRequest, current_user: dict = Depends(get_current_user)):
-    # ... (Keep existing /chat for backward compatibility if needed, or redirect logic)
-    # For now, let's keep /chat as blocking and add /chat/stream
     try:
         # Get engine (lazy load)
         engine = get_chat_engine()
         # Generate Response
         response = engine.generate_response(request.message, request.history)
-        # Save to Firestore if conversation_id is present
-        if request.conversation_id:
-            conv_ref = db.collection('conversations').document(request.conversation_id)
-            # User Msg
-            conv_ref.collection('messages').add({
-                "role": "user",
-                "content": request.message,
-                "timestamp": datetime.utcnow()
-            })
-            # AI Msg
-            conv_ref.collection('messages').add({
-                "role": "assistant",
-                "content": response,
-                "timestamp": datetime.utcnow()
-            })
-            conv_ref.update({"updated_at": datetime.utcnow()})
         return {"response": response}
     except Exception as e:
         import traceback
         traceback.print_exc()
         raise HTTPException(status_code=500, detail=str(e))
-# RAG Endpoints
-@app.post("/upload")
-async def upload_file(file: UploadFile = File(...), current_user: dict = Depends(get_current_user)):
-    try:
-        # Save file locally
-        upload_dir = "uploads"
-        os.makedirs(upload_dir, exist_ok=True)
-        file_path = os.path.join(upload_dir, file.filename)
-        with open(file_path, "wb") as buffer:
-            shutil.copyfileobj(file.file, buffer)
-        # Ingest into RAG
-        rag = get_rag_engine()
-        rag.ingest_file(file_path)
-        return {"filename": file.filename, "status": "ingested"}
-    except Exception as e:
-        raise HTTPException(status_code=500, detail=str(e))
 @app.post("/chat/stream")
-async def chat_stream(request: ChatRequest, current_user: dict = Depends(get_current_user)):
     try:
         # Check for RAG context
         context = ""
@@ -300,36 +236,13 @@ async def chat_stream(request: ChatRequest, current_user: dict = Depends(get_cur
             context = "\n\nRelevant Context:\n" + "\n".join(rag_docs) + "\n\n"
             print(f"Found {len(rag_docs)} relevant documents.")
-        # Save User Message
-        if request.conversation_id:
-            conv_ref = db.collection('conversations').document(request.conversation_id)
-            conv_ref.collection('messages').add({
-                "role": "user",
-                "content": request.message,
-                "timestamp": datetime.utcnow()
-            })
-            conv_ref.update({"updated_at": datetime.utcnow()})
         async def stream_generator():
-            full_response = ""
-            # Prepend context to the message sent to AI (but not saved in DB as user message)
             augmented_message = context + request.message if context else request.message
             engine = get_chat_engine()
             for token in engine.generate_stream(augmented_message, request.history, request.language):
-                full_response += token
                 yield token
-            # Save AI Message after generation
-            if request.conversation_id:
-                conv_ref = db.collection('conversations').document(request.conversation_id)
-                conv_ref.collection('messages').add({
-                    "role": "assistant",
-                    "content": full_response,
-                    "timestamp": datetime.utcnow()
-                })
-            print(f"Generated response for conv {request.conversation_id}")
         return StreamingResponse(stream_generator(), media_type="text/plain")
@@ -338,19 +251,28 @@ async def chat_stream(request: ChatRequest, current_user: dict = Depends(get_cur
         traceback.print_exc()
         raise HTTPException(status_code=500, detail=str(e))
 @app.post("/generate-image")
-async def generate_image(request: ImageRequest, current_user: dict = Depends(get_current_user)):
     try:
-        # Generate image to a temporary file
-        filename = "temp_generated.png"
-        engine = get_image_engine()
-        engine.generate_image(request.prompt, output_path=filename)
-        # Read and encode to base64 to send to frontend
-        with open(filename, "rb") as image_file:
-            encoded_string = base64.b64encode(image_file.read()).decode('utf-8')
-        return {"image_base64": encoded_string}
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))

 import base64
 from chat_engine import ChatEngine
 from rag_engine import RAGEngine
 import models
 import shutil
 import schemas
 import firebase_admin
 from firebase_admin import credentials, firestore, auth
+import requests
 # Initialize FastAPI
 app = FastAPI()
     allow_headers=["*"],
 )
+# Initialize Firebase Admin (Optional/Placeholder if needed later)
 if not firebase_admin._apps:
+    # ... (Keep existing logic or comment out if fully removing)
+    pass
+db = None # Placeholder
 # Global engine instances (Lazy loaded)
 chat_engine = None
 rag_engine = None
 def get_chat_engine():
         chat_engine = ChatEngine()
     return chat_engine
 def get_rag_engine():
     global rag_engine
     if rag_engine is None:
     return {"status": "Backend is running", "message": "Go to /docs to see the API"}
 @app.post("/chat")
+async def chat(request: ChatRequest):
     try:
         # Get engine (lazy load)
         engine = get_chat_engine()
         # Generate Response
         response = engine.generate_response(request.message, request.history)
         return {"response": response}
     except Exception as e:
         import traceback
         traceback.print_exc()
         raise HTTPException(status_code=500, detail=str(e))
 @app.post("/chat/stream")
+async def chat_stream(request: ChatRequest):
     try:
         # Check for RAG context
         context = ""
             context = "\n\nRelevant Context:\n" + "\n".join(rag_docs) + "\n\n"
             print(f"Found {len(rag_docs)} relevant documents.")
         async def stream_generator():
+            # Prepend context to the message sent to AI
             augmented_message = context + request.message if context else request.message
             engine = get_chat_engine()
             for token in engine.generate_stream(augmented_message, request.history, request.language):
                 yield token
         return StreamingResponse(stream_generator(), media_type="text/plain")
         traceback.print_exc()
         raise HTTPException(status_code=500, detail=str(e))
+    except Exception as e:
+        import traceback
+        traceback.print_exc()
+        raise HTTPException(status_code=500, detail=str(e))
+# ... (Imports)
+import requests
+# ... (Chat Engine setup)
+# Image Service URL (hardcoded for now; could be read from an environment variable instead)
+IMAGE_SERVICE_URL = "https://professorceo-cool-shot-ai-imagine.hf.space/generate-image"
 @app.post("/generate-image")
+async def generate_image(request: ImageRequest):
     try:
+        # Call external Image Service
+        response = requests.post(IMAGE_SERVICE_URL, json={"prompt": request.prompt})
+        if response.status_code != 200:
+            raise HTTPException(status_code=response.status_code, detail="Image Service Error")
+        return response.json()
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))