WIP - Under maintenance - Web research working.

2024-02-05 15:15:07 +05:30
parent fd7053fb4b
commit 2a3315f211
96 changed files with 4320 additions and 565 deletions
--- a/lib/gpt_providers/gemini_image_details.py
+++ b/lib/gpt_providers/gemini_image_details.py
@@ -0,0 +1,79 @@
+"""
+"""
+import os
+import logging
+from pathlib import Path
+
+import google.generativeai as genai
+# Configure logging as soon as this module is imported: INFO level, with each
+# record formatted as timestamp-level-module-line number-message.
+logging.basicConfig(level=logging.INFO, format='%(asctime)s-%(levelname)s-%(module)s-%(lineno)d-%(message)s')
+from dotenv import load_dotenv
+# Load environment variables from a .env file addressed by a relative path.
+# NOTE(review): presumably this path is resolved against the current working
+# directory rather than this file's location - confirm against how the
+# program is launched.
+load_dotenv(Path('../../.env'))
+
+from tenacity import (
+    retry,
+    stop_after_attempt,
+    wait_random_exponential,
+) # for exponential backoff
+
+
+@retry(wait=wait_random_exponential(min=1, max=60), stop=stop_after_attempt(6))
+def gemini_get_img_info(prompt, img_path):
+    """ Get image details from arxiv papers. """
+    logging.info(f"Get image details from Gemini Pro.")
+    try:
+        genai.configure(api_key=os.getenv("GEMINI_API_KEY"))
+    except Exception as e:
+        logging.error(f"Could not load gemini API key: {e}")
+        raise e
+
+    # Set up the model
+    generation_config = {
+        "temperature": 0.9,
+        "top_p": 1,
+        "top_k": 1,
+        "max_output_tokens": 1096,
+    }
+
+    safety_settings = [{
+        "category": "HARM_CATEGORY_HARASSMENT",
+        "threshold": "BLOCK_NONE"
+    },
+    {
+        "category": "HARM_CATEGORY_HATE_SPEECH",
+        "threshold": "BLOCK_NONE"
+    },
+    {
+        "category": "HARM_CATEGORY_SEXUALLY_EXPLICIT",
+        "threshold": "BLOCK_NONE"
+    },
+    {
+        "category": "HARM_CATEGORY_DANGEROUS_CONTENT",
+        "threshold": "BLOCK_NONE"
+    },]
+
+    try:
+        model = genai.GenerativeModel(model_name="gemini-pro-vision",
+            generation_config=generation_config,
+            safety_settings=safety_settings)
+    except Exception as e:
+        logging.error(f"Could not create GenerativeModel: {e}")
+        raise e
+
+    # Validate that an image is present
+    if not (img := Path(img_path)).exists():
+        raise FileNotFoundError(f"Could not find image: {img}")
+
+    image_parts = [{
+        "mime_type": "image/png",
+        "data": Path(img_path).read_bytes()
+    },]
+
+    prompt_parts = [f"{prompt}", image_parts[0],]
+
+    try:
+        response = model.generate_content(prompt_parts)
+        return response.text
+    except Exception as e:
+        logging.error(f"Gemini is blocking this request: {response.prompt_feedback.block_reason}")
+        logging.error(f"Gemini Vision, Failed to give image Details: {e}\n{response.prompt_feedback}")
+        raise e