Commit c0da66d · remove groq
Parent(s): 9c28499
README.md CHANGED
@@ -12,8 +12,7 @@ RAG-based chatbot for answering questions about professional background and expe
 
 Set environment variables in Space secrets:
 
-- `LLM_PROVIDER` - Set to `local` (default)
-- `GROQ_API_KEY` - Required if using Groq
+- `LLM_PROVIDER` - Set to `local` (default) or `huggingface`
 - `HUGGINGFACE_API_KEY` - Required if using HuggingFace Inference API
 - `SESSION_TOKEN_SECRET` - Optional, for session auth
 - `CLIENT_APP_ORIGINS` - Optional, comma-separated allowed origins
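As an aside on the last secret: `CLIENT_APP_ORIGINS` is a comma-separated origin list. A minimal sketch of how such a value is commonly parsed and handed to FastAPI's CORSMiddleware (only the variable name comes from the README; the parsing and middleware settings below are illustrative assumptions, not this repo's code):

```python
# Hypothetical sketch: feeding a comma-separated CLIENT_APP_ORIGINS value
# into FastAPI's CORS middleware. Settings here are illustrative.
import os

from fastapi import FastAPI
from fastapi.middleware.cors import CORSMiddleware

app = FastAPI()

# e.g. CLIENT_APP_ORIGINS="https://example.com,https://app.example.com"
origins = [o.strip() for o in os.getenv("CLIENT_APP_ORIGINS", "").split(",") if o.strip()]

app.add_middleware(
    CORSMiddleware,
    allow_origins=origins,      # only the listed origins may call the API
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)
```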
app.py CHANGED
@@ -11,8 +11,6 @@ import time
 from typing import List, Dict, Optional, Tuple
 import numpy as np
 import torch
-import httpx
-import inspect
 from fastapi import Depends, FastAPI, HTTPException, Header
 from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
@@ -73,32 +71,9 @@ if not hasattr(huggingface_hub, "cached_download"):
 from sentence_transformers import SentenceTransformer
 import faiss
 
-# Patch httpx to gracefully ignore deprecated `proxies` argument used by groq client when running with httpx>=0.28.
-if "proxies" not in inspect.signature(httpx.Client.__init__).parameters:
-    _original_httpx_client_init = httpx.Client.__init__
-
-    def _httpx_client_init_with_proxies(self, *args, proxies=None, **kwargs):
-        return _original_httpx_client_init(self, *args, **kwargs)
-
-    httpx.Client.__init__ = _httpx_client_init_with_proxies  # type: ignore[assignment]
-
-if "proxies" not in inspect.signature(httpx.AsyncClient.__init__).parameters:
-    _original_httpx_async_client_init = httpx.AsyncClient.__init__
-
-    def _httpx_async_client_init_with_proxies(self, *args, proxies=None, **kwargs):
-        if proxies is not None and "proxy" not in kwargs:
-            kwargs["proxy"] = proxies
-        return _original_httpx_async_client_init(self, *args, **kwargs)
-
-    httpx.AsyncClient.__init__ = _httpx_async_client_init_with_proxies  # type: ignore[assignment]
-
-from groq import Groq
-
 # Import configuration
 from config import (
     LLM_PROVIDER,
-    GROQ_API_KEY,
-    GROQ_MODEL,
     HUGGINGFACE_API_KEY,
     HUGGINGFACE_MODEL,
     LOCAL_MODEL_REPO,
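The removed patch relied on a general compatibility-shim idiom: check a callable's signature with `inspect.signature` and only monkeypatch when the keyword is missing. A self-contained sketch of that idiom, using a toy function rather than `httpx` (illustrative only, not this repo's code):

```python
# Minimal sketch of the signature-inspection shim pattern from the removed
# block: wrap a callable so an obsolete keyword argument is silently dropped.
import inspect

def drop_obsolete_kwarg(func, kwarg: str):
    """Return func unchanged if it already accepts `kwarg`; otherwise wrap
    it so the keyword is accepted and discarded instead of raising TypeError."""
    if kwarg in inspect.signature(func).parameters:
        return func

    def wrapper(*args, **kwargs):
        kwargs.pop(kwarg, None)  # discard the unsupported keyword
        return func(*args, **kwargs)

    return wrapper

# Example: greet() predates the `color` option some callers still pass.
def greet(name: str) -> str:
    return f"hello {name}"

greet = drop_obsolete_kwarg(greet, "color")
print(greet("world", color="red"))  # -> "hello world"
```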
@@ -375,12 +350,7 @@ def initialize_llm():
     """Initialize LLM client based on provider"""
     global llm_client, local_model_path
 
-    if LLM_PROVIDER == "groq":
-        if not GROQ_API_KEY:
-            raise ValueError("GROQ_API_KEY not set in environment variables")
-        llm_client = Groq(api_key=GROQ_API_KEY)
-        print(f"Initialized Groq client with model: {GROQ_MODEL}")
-    elif LLM_PROVIDER == "huggingface":
+    if LLM_PROVIDER == "huggingface":
         # Will use requests for HF Inference API
         if not HUGGINGFACE_API_KEY:
             raise ValueError("HUGGINGFACE_API_KEY not set in environment variables")
@@ -453,23 +423,6 @@ def retrieve_relevant_chunks(query: str, top_k: int = TOP_K_RESULTS) -> List[str
     return relevant_chunks
 
 
-def generate_response_groq(prompt: str) -> str:
-    """Generate response using Groq API"""
-    try:
-        chat_completion = llm_client.chat.completions.create(
-            messages=[
-                {"role": "system", "content": SYSTEM_PROMPT},
-                {"role": "user", "content": prompt}
-            ],
-            model=GROQ_MODEL,
-            temperature=0.7,
-            max_tokens=500,
-        )
-        return chat_completion.choices[0].message.content
-    except Exception as e:
-        raise HTTPException(status_code=500, detail=f"Groq API error: {str(e)}")
-
-
 def generate_response_huggingface(prompt: str) -> str:
     """Generate response using HuggingFace Inference API (OpenAI-compatible endpoint)."""
     import requests
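The surviving `generate_response_huggingface` is described as calling an OpenAI-compatible HuggingFace Inference endpoint via `requests` (which explains the new `requests==2.31.0` pin below). Its body is not part of this diff; the following is a hedged sketch of what such a call typically looks like, where the endpoint URL, payload shape, and sampling values are assumptions rather than this repo's code:

```python
# Hypothetical sketch of an OpenAI-compatible chat-completions call to the
# HF Inference API using requests. URL and payload shape are assumptions.
import os
import requests

HUGGINGFACE_API_KEY = os.environ["HUGGINGFACE_API_KEY"]
HUGGINGFACE_MODEL = "google/gemma-2-2b-it"  # matches config.py

def generate(prompt: str) -> str:
    resp = requests.post(
        "https://router.huggingface.co/v1/chat/completions",  # assumed endpoint
        headers={"Authorization": f"Bearer {HUGGINGFACE_API_KEY}"},
        json={
            "model": HUGGINGFACE_MODEL,
            "messages": [{"role": "user", "content": prompt}],
            "max_tokens": 500,
            "temperature": 0.7,
        },
        timeout=60,
    )
    resp.raise_for_status()
    return resp.json()["choices"][0]["message"]["content"]
```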
@@ -586,9 +539,7 @@ Provide a concise, professional answer based only on the context above."""
 
     combined_prompt = f"{system_prompt}\n\n{user_prompt}"
 
-    if LLM_PROVIDER == "groq":
-        return generate_response_groq(combined_prompt)
-    elif LLM_PROVIDER == "huggingface":
+    if LLM_PROVIDER == "huggingface":
         return generate_response_huggingface(combined_prompt)
     elif LLM_PROVIDER == "local":
         return generate_response_local(system_prompt, user_prompt)
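With Groq gone, the provider chain reduces to a two-branch if/elif. When more providers accumulate, the same dispatch is sometimes written as a lookup table instead; a self-contained sketch with stub handlers (illustrative, not the repo's code):

```python
# Illustrative alternative: table-driven provider dispatch. The real
# handlers live in app.py; they are stubbed here so the sketch runs.
LLM_PROVIDER = "local"

def generate_response_huggingface(prompt: str) -> str:
    return f"[hf] {prompt}"  # stand-in for the real API call

def generate_response_local(system_prompt: str, user_prompt: str) -> str:
    return f"[local] {user_prompt}"  # stand-in for llama.cpp generation

HANDLERS = {
    "huggingface": lambda s, u: generate_response_huggingface(f"{s}\n\n{u}"),
    "local": generate_response_local,
}

def generate(system_prompt: str, user_prompt: str) -> str:
    try:
        handler = HANDLERS[LLM_PROVIDER]
    except KeyError:
        raise ValueError(f"Unsupported LLM_PROVIDER: {LLM_PROVIDER!r}")
    return handler(system_prompt, user_prompt)

print(generate("You are concise.", "Summarize RAG in one line."))
```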
config.py CHANGED
@@ -6,19 +6,13 @@ Change LLM_PROVIDER to switch between different models
 import os
 
 # Swappable LLM provider (environment configurable)
-LLM_PROVIDER = os.getenv("LLM_PROVIDER", "local")  # Options: "groq", "huggingface", "local"
+LLM_PROVIDER = os.getenv("LLM_PROVIDER", "local")  # Options: "huggingface", "local"
 
 # API Keys (set these as environment variables in HuggingFace Space secrets)
-GROQ_API_KEY = os.getenv("GROQ_API_KEY", "")
 HUGGINGFACE_API_KEY = os.getenv("HUGGINGFACE_API_KEY", "")
-OPENAI_API_KEY = os.getenv("OPENAI_API_KEY", "")
 
 # Model configurations
-GROQ_MODEL = "mixtral-8x7b-32768"  # Fast and good quality
-# GROQ_MODEL = "llama3-8b-8192"  # Alternative: faster but slightly lower quality
-
 HUGGINGFACE_MODEL = "google/gemma-2-2b-it"
-OPENAI_MODEL = "gpt-3.5-turbo"
 
 # Local model configuration (for quantized models hosted within the Space)
 LOCAL_MODEL_REPO = os.getenv("LOCAL_MODEL_REPO", "tensorblock/gemma-2-2b-it-GGUF")
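`LOCAL_MODEL_REPO` points at a GGUF quantization repo, and `requirements.txt` pins `llama-cpp-python`, which suggests the `local` provider downloads a quantized file from the Hub and runs it with llama.cpp. A hedged sketch of that flow, where the exact `.gguf` filename, context size, and sampling values are assumptions rather than this repo's code:

```python
# Hypothetical sketch: fetch a GGUF file from LOCAL_MODEL_REPO and load it
# with llama-cpp-python. The filename below is an assumption.
import os
from huggingface_hub import hf_hub_download
from llama_cpp import Llama

LOCAL_MODEL_REPO = os.getenv("LOCAL_MODEL_REPO", "tensorblock/gemma-2-2b-it-GGUF")

# Download one quantized weight file from the repo.
model_path = hf_hub_download(
    repo_id=LOCAL_MODEL_REPO,
    filename="gemma-2-2b-it-Q4_K_M.gguf",  # assumed quantization filename
)

llm = Llama(model_path=model_path, n_ctx=2048)

out = llm.create_chat_completion(
    messages=[{"role": "user", "content": "Say hello in one sentence."}],
    max_tokens=64,
)
print(out["choices"][0]["message"]["content"])
```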
requirements.txt CHANGED
@@ -3,9 +3,9 @@ uvicorn[standard]==0.24.0
 sentence-transformers==2.2.2
 huggingface-hub<0.19
 faiss-cpu==1.8.0
-httpx<0.28
 pydantic==2.5.0
 numpy>=1.26.4,<2
 python-multipart==0.0.6
 llama-cpp-python==0.2.82
 itsdangerous==2.2.0
+requests==2.31.0