Created using Colab

OneFineStarstuff · OneFineStarstuff · commit b2ec456160b2 · 2024-12-25T03:11:59.000+06:30
diff --git a/agi_pipeline.ipynb b/agi_pipeline.ipynb
@@ -5,7 +5,7 @@
     "colab": {
       "private_outputs": true,
       "provenance": [],
-      "authorship_tag": "ABX9TyPedi3hlUYgSbkDSkl23mSH",
+      "authorship_tag": "ABX9TyPoHH519BuqGSnR/HON75UP",
       "include_colab_link": true
     },
     "kernelspec": {
@@ -29,21 +29,18 @@
     },
     {
       "cell_type": "code",
-      "execution_count": null,
-      "metadata": {
-        "id": "TgxJtnG273_l"
-      },
-      "outputs": [],
       "source": [
         "# === Imports ===\n",
         "import os\n",
         "import asyncio\n",
+        "import time\n",
+        "from typing import List\n",
         "import torch\n",
         "from transformers import T5Tokenizer, T5ForConditionalGeneration\n",
         "from PIL import Image\n",
-        "from fastapi import FastAPI, UploadFile, Depends, HTTPException\n",
+        "from fastapi import FastAPI, UploadFile, Depends, HTTPException, Request\n",
         "from fastapi.security import OAuth2PasswordBearer\n",
-        "from pydantic import BaseModel\n",
+        "from pydantic import BaseModel, SecretStr\n",
         "import whisper\n",
         "from ultralytics import YOLO\n",
         "import pyttsx3\n",
@@ -54,101 +51,74 @@
         "\n",
         "# === Logging Setup ===\n",
         "logger.add(\"pipeline_{time}.log\", rotation=\"1 MB\", level=\"DEBUG\", enqueue=True, backtrace=True, diagnose=True)\n",
+        "logger.info(\"Application startup\")\n",
         "\n",
-        "# === Environment Variables and Authentication ===\n",
-        "SECURE_TOKEN = os.getenv(\"SECURE_TOKEN\", \"your_actual_secure_token\")\n",
+        "# === Security Enhancement: Secure Token from the SECURE_TOKEN Environment Variable (falls back to the hardcoded default below when unset) ===\n",
+        "SECURE_TOKEN = SecretStr(os.getenv(\"SECURE_TOKEN\", \"YvZz9Hni0hWJPh_UWW4dQYf9rhIe9nNYcC5ZQTTZz0Q\"))\n",
+        "\n",
+        "# === OAuth2PasswordBearer for Authentication ===\n",
         "oauth2_scheme = OAuth2PasswordBearer(tokenUrl=\"token\")\n",
         "\n",
+        "# === Authentication Function ===\n",
         "def authenticate_user(token: str = Depends(oauth2_scheme)):\n",
-        "    if token != SECURE_TOKEN:\n",
+        "    if token != SECURE_TOKEN.get_secret_value():\n",
         "        logger.warning(\"Authentication failed.\")\n",
         "        raise HTTPException(status_code=401, detail=\"Invalid token\")\n",
         "\n",
-        "# === Request and Response Models ===\n",
+        "# === Request and Response Models (Pydantic) ===\n",
         "class TextRequest(BaseModel):\n",
         "    text: str\n",
         "\n",
         "class TextResponse(BaseModel):\n",
         "    response: str\n",
         "\n",
-        "# === NLP Module ===\n",
+        "# === NLP Module (T5 Transformer) ===\n",
         "class NLPModule:\n",
         "    def __init__(self):\n",
         "        model_name = \"google/flan-t5-small\"\n",
-        "        try:\n",
-        "            self.tokenizer = T5Tokenizer.from_pretrained(model_name)\n",
-        "            self.model = T5ForConditionalGeneration.from_pretrained(model_name)\n",
-        "            logger.info(\"NLP model loaded successfully.\")\n",
-        "        except Exception as e:\n",
-        "            logger.error(f\"Failed to load NLP model: {e}\")\n",
-        "            raise RuntimeError(\"Failed to load NLP model.\")\n",
+        "        self.tokenizer = T5Tokenizer.from_pretrained(model_name)\n",
+        "        self.model = T5ForConditionalGeneration.from_pretrained(model_name)\n",
+        "        logger.info(\"NLP model loaded successfully.\")\n",
         "\n",
         "    def generate_text(self, prompt: str) -> str:\n",
         "        if not prompt.strip():\n",
         "            raise ValueError(\"Prompt cannot be empty.\")\n",
         "        logger.debug(f\"Generating text for prompt: {prompt}\")\n",
-        "        try:\n",
-        "            inputs = self.tokenizer(prompt, return_tensors=\"pt\")\n",
-        "            outputs = self.model.generate(inputs[\"input_ids\"], max_length=100)\n",
-        "            response = self.tokenizer.decode(outputs[0], skip_special_tokens=True)\n",
-        "            logger.info(f\"Generated response: {response}\")\n",
-        "            return response\n",
-        "        except Exception as e:\n",
-        "            logger.error(f\"Error in text generation: {e}\")\n",
-        "            raise RuntimeError(\"Text generation failed.\")\n",
-        "\n",
-        "# === CV Module with Object Detection ===\n",
+        "        inputs = self.tokenizer(prompt, return_tensors=\"pt\")\n",
+        "        outputs = self.model.generate(inputs[\"input_ids\"], max_length=100)\n",
+        "        response = self.tokenizer.decode(outputs[0], skip_special_tokens=True)\n",
+        "        logger.info(f\"Generated response: {response}\")\n",
+        "        return response\n",
+        "\n",
+        "# === CV Module (YOLOv8 for Object Detection) ===\n",
         "class CVModule:\n",
         "    def __init__(self):\n",
-        "        try:\n",
-        "            self.device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
-        "            self.model = YOLO('yolov5su.pt').to(self.device)\n",
-        "            logger.info(\"CV model loaded successfully.\")\n",
-        "        except Exception as e:\n",
-        "            logger.error(f\"Failed to load CV model: {e}\")\n",
-        "            raise RuntimeError(\"Failed to load CV model.\")\n",
+        "        self.device = torch.device(\"cuda\" if torch.cuda.is_available() else \"cpu\")\n",
+        "        self.model = YOLO('yolov8n.pt').to(self.device)\n",
+        "        logger.info(\"CV model loaded successfully.\")\n",
         "\n",
         "    def detect_objects(self, image: Image.Image) -> str:\n",
         "        logger.debug(\"Detecting objects in the image.\")\n",
-        "        try:\n",
-        "            results = self.model(image)\n",
-        "            return results.pandas().xyxy[0].to_json()\n",
-        "        except Exception as e:\n",
-        "            logger.error(f\"Object detection failed: {e}\")\n",
-        "            raise ValueError(\"Object detection error.\")\n",
-        "\n",
-        "# === Speech Processor ===\n",
+        "        results = self.model(image)\n",
+        "        return results.pandas().xyxy[0].to_json()\n",
+        "\n",
+        "# === Speech Processor (Whisper for Speech-to-Text, PyTTSX3 for Text-to-Speech) ===\n",
         "class SpeechProcessor:\n",
         "    def __init__(self):\n",
-        "        try:\n",
-        "            import whisper  # Import inside the class to ensure correct package\n",
-        "            self.whisper_model = whisper.load_model(\"base\")\n",
-        "            self.tts = pyttsx3.init()\n",
-        "            logger.info(\"Speech processor initialized successfully.\")\n",
-        "        except Exception as e:\n",
-        "            logger.error(f\"Failed to initialize speech processor: {e}\")\n",
-        "            raise RuntimeError(\"Failed to initialize speech processor.\")\n",
+        "        self.whisper_model = whisper.load_model(\"base\")\n",
+        "        self.tts = pyttsx3.init()\n",
+        "        logger.info(\"Speech processor initialized successfully.\")\n",
         "\n",
         "    def speech_to_text(self, audio_file: UploadFile) -> str:\n",
-        "        logger.debug(\"Processing speech-to-text.\")\n",
-        "        try:\n",
-        "            with audio_file.file as audio_data:\n",
-        "                result = self.whisper_model.transcribe(audio_data)\n",
+        "        with audio_file.file as audio_data:\n",
+        "            result = self.whisper_model.transcribe(audio_data)\n",
         "            return result['text']\n",
-        "        except Exception as e:\n",
-        "            logger.error(f\"Speech-to-text failed: {e}\")\n",
-        "            raise ValueError(\"Speech-to-text error.\")\n",
         "\n",
         "    def text_to_speech(self, text: str) -> None:\n",
         "        if not text.strip():\n",
         "            raise ValueError(\"Text cannot be empty.\")\n",
-        "        logger.debug(\"Processing text-to-speech.\")\n",
-        "        try:\n",
-        "            self.tts.say(text)\n",
-        "            self.tts.runAndWait()\n",
-        "        except Exception as e:\n",
-        "            logger.error(f\"Text-to-speech failed: {e}\")\n",
-        "            raise RuntimeError(\"Text-to-speech error.\")\n",
+        "        self.tts.say(text)\n",
+        "        self.tts.runAndWait()\n",
         "\n",
         "    def __del__(self):\n",
         "        self.tts.stop()\n",
@@ -161,7 +131,7 @@
         "        self.speech_processor = SpeechProcessor()\n",
         "\n",
         "    async def process_nlp(self, text: str) -> str:\n",
-        "        return self.nlp.generate_text(text)\n",
+        "        return await asyncio.to_thread(self.nlp.generate_text, text)\n",
         "\n",
         "    async def process_cv(self, image: Image.Image) -> str:\n",
         "        return await asyncio.to_thread(self.cv.detect_objects, image)\n",
@@ -174,56 +144,52 @@
         "\n",
         "# === FastAPI Application ===\n",
         "app = FastAPI()\n",
+        "\n",
         "pipeline = EnhancedAGIPipeline()\n",
         "\n",
+        "# === Endpoints ===\n",
         "@app.post(\"/process-nlp/\", response_model=TextResponse, dependencies=[Depends(authenticate_user)])\n",
         "async def process_nlp(request: TextRequest):\n",
-        "    try:\n",
-        "        response = await pipeline.process_nlp(request.text)\n",
-        "        logger.info(\"NLP processed successfully.\")\n",
-        "        return {\"response\": response}\n",
-        "    except Exception as e:\n",
-        "        logger.error(f\"NLP processing failed: {e}\")\n",
-        "        raise HTTPException(status_code=500, detail=\"NLP processing error.\")\n",
+        "    response = await pipeline.process_nlp(request.text)\n",
+        "    return {\"response\": response}\n",
         "\n",
         "@app.post(\"/process-cv-detection/\", dependencies=[Depends(authenticate_user)])\n",
         "async def process_cv_detection(file: UploadFile):\n",
-        "    try:\n",
+        "    image = Image.open(io.BytesIO(await file.read()))\n",
+        "    response = await pipeline.process_cv(image)\n",
+        "    return {\"detections\": response}\n",
+        "\n",
+        "@app.post(\"/batch-cv-detection/\", dependencies=[Depends(authenticate_user)])\n",
+        "async def batch_cv_detection(files: List[UploadFile]):\n",
+        "    responses = []\n",
+        "    for file in files:\n",
         "        image = Image.open(io.BytesIO(await file.read()))\n",
         "        response = await pipeline.process_cv(image)\n",
-        "        logger.info(\"Object detection processed successfully.\")\n",
-        "        return {\"detections\": response}\n",
-        "    except Exception as e:\n",
-        "        logger.error(f\"Object detection failed: {e}\")\n",
-        "        raise HTTPException(status_code=500, detail=\"Object detection error.\")\n",
+        "        responses.append(response)\n",
+        "    return {\"batch_detections\": responses}\n",
         "\n",
         "@app.post(\"/speech-to-text/\", response_model=TextResponse, dependencies=[Depends(authenticate_user)])\n",
         "async def speech_to_text(file: UploadFile):\n",
-        "    try:\n",
-        "        response = await pipeline.process_speech_to_text(file)\n",
-        "        logger.info(\"Speech-to-text processed successfully.\")\n",
-        "        return {\"response\": response}\n",
-        "    except Exception as e:\n",
-        "        logger.error(f\"Speech-to-text failed: {e}\")\n",
-        "        raise HTTPException(status_code=500, detail=\"Speech-to-text error.\")\n",
+        "    response = await pipeline.process_speech_to_text(file)\n",
+        "    return {\"response\": response}\n",
         "\n",
         "@app.post(\"/text-to-speech/\", dependencies=[Depends(authenticate_user)])\n",
         "async def text_to_speech(request: TextRequest):\n",
-        "    try:\n",
-        "        await pipeline.process_text_to_speech(request.text)\n",
-        "        logger.info(\"Text-to-speech processed successfully.\")\n",
-        "        return {\"response\": \"Speech synthesis complete.\"}\n",
-        "    except Exception as e:\n",
-        "        logger.error(f\"Text-to-speech failed: {e}\")\n",
-        "        raise HTTPException(status_code=500, detail=\"Text-to-speech error.\")\n",
-        "\n",
-        "# === Run the Application with HTTPS ===\n",
+        "    await pipeline.process_text_to_speech(request.text)\n",
+        "    return {\"response\": \"Speech synthesis complete.\"}\n",
+        "\n",
+        "# === Run the Application with uvicorn (plain HTTP; no TLS certificate/key is configured) ===\n",
         "if __name__ == \"__main__\":\n",
         "    nest_asyncio.apply()\n",
         "    config = uvicorn.Config(app, host=\"0.0.0.0\", port=8000)\n",
         "    server = uvicorn.Server(config)\n",
         "    asyncio.run(server.serve())"
-      ]
+      ],
+      "metadata": {
+        "id": "UgUAMujBWqGS"
+      },
+      "execution_count": null,
+      "outputs": []
     }
   ]
 }