Soumik555 committed
Commit
a172af8
1 Parent(s): 5f8515f

added openai in orchestrator

Files changed (1)
  1. gemini_report_generator.py +1184 -316
gemini_report_generator.py CHANGED
@@ -1,366 +1,1234 @@
1
- import json
2
- import numpy as np
3
- import pandas as pd
4
- import re
5
- import os
6
- import uuid
7
- import logging
8
- from io import StringIO
9
- import sys
10
- import traceback
11
- from typing import Optional, Dict, Any, List
12
- from pydantic import BaseModel, Field
13
- from google.generativeai import GenerativeModel, configure
14
- from dotenv import load_dotenv
15
- import seaborn as sns
16
- import datetime as dt
17
 
18
- from supabase_service import upload_file_to_supabase
19
 
20
- pd.set_option('display.max_columns', None)
21
- pd.set_option('display.max_rows', None)
22
- pd.set_option('display.max_colwidth', None)
23
 
24
- load_dotenv()
25
 
26
 
27
- API_KEYS = os.getenv("GEMINI_API_KEYS", "").split(",")[::-1]
28
- MODEL_NAME = 'gemini-2.0-flash'
29
 
30
- class FileProps(BaseModel):
31
- fileName: str
32
- filePath: str
33
- fileType: str # 'csv' | 'image'
34
 
35
- class Files(BaseModel):
36
- csv_files: List[FileProps]
37
- image_files: List[FileProps]
38
 
39
- class FileBoxProps(BaseModel):
40
- files: Files
41
 
42
- os.environ['MPLBACKEND'] = 'agg'
43
- import matplotlib.pyplot as plt
44
- plt.show = lambda: None
45
 
46
- logging.basicConfig(
47
- level=logging.INFO,
48
- format='%(asctime)s - %(levelname)s - %(message)s'
49
- )
50
- logger = logging.getLogger(__name__)
51
 
52
- class GeminiKeyManager:
53
- """Manage multiple Gemini API keys with failover"""
54
 
55
- def __init__(self, api_keys: List[str]):
56
- self.original_keys = api_keys.copy()
57
- self.available_keys = api_keys.copy()
58
- self.active_key = None
59
- self.failed_keys = {}
60
 
61
- def configure(self) -> bool:
62
- while self.available_keys:
63
- key = self.available_keys.pop(0)
64
- try:
65
- configure(api_key=key)
66
- self.active_key = key
67
- logger.info(f"Configured with key: {self._mask_key(key)}")
68
- return True
69
- except Exception as e:
70
- self.failed_keys[key] = str(e)
71
- logger.error(f"Key failed: {self._mask_key(key)}. Error: {str(e)}")
72
- logger.critical("All API keys failed")
73
- return False
74
 
75
- def _mask_key(self, key: str) -> str:
76
- return f"{key[:8]}...{key[-4:]}" if key else ""
77
 
78
- class PythonREPL:
79
- """Secure Python REPL with file generation tracking"""
80
 
81
- def __init__(self, df: pd.DataFrame):
82
- self.df = df
83
- self.output_dir = os.path.abspath(f'generated_outputs/{uuid.uuid4()}')
84
- os.makedirs(self.output_dir, exist_ok=True)
85
- self.local_env = {
86
- "pd": pd,
87
- "df": self.df.copy(),
88
- "plt": plt,
89
- "os": os,
90
- "uuid": uuid,
91
- "sns": sns,
92
- "json": json,
93
- "dt": dt,
94
- "output_dir": self.output_dir
95
- }
96
 
97
- def execute(self, code: str) -> Dict[str, Any]:
98
- print('Executing code...', code)
99
- old_stdout = sys.stdout
100
- sys.stdout = mystdout = StringIO()
101
- file_tracker = {
102
- 'csv_files': set(),
103
- 'image_files': set()
104
- }
105
 
106
- try:
107
- code = f"""
108
- import matplotlib.pyplot as plt
109
- plt.switch_backend('agg')
110
- {code}
111
- plt.close('all')
112
- """
113
- exec(code, self.local_env)
114
- self.df = self.local_env.get('df', self.df)
115
 
116
- # Track generated files
117
- for fname in os.listdir(self.output_dir):
118
- if fname.endswith('.csv'):
119
- file_tracker['csv_files'].add(fname)
120
- elif fname.lower().endswith(('.png', '.jpg', '.jpeg')):
121
- file_tracker['image_files'].add(fname)
122
 
123
- error = False
124
- except Exception as e:
125
- error_msg = traceback.format_exc()
126
- error = True
127
- finally:
128
- sys.stdout = old_stdout
129
 
130
- return {
131
- "output": mystdout.getvalue(),
132
- "error": error,
133
- "error_message": error_msg if error else None,
134
- "df": self.local_env.get('df', self.df),
135
- "output_dir": self.output_dir,
136
- "files": {
137
- "csv": [os.path.join(self.output_dir, f) for f in file_tracker['csv_files']],
138
- "images": [os.path.join(self.output_dir, f) for f in file_tracker['image_files']]
139
- }
140
- }
141
-
142
- class RethinkAgent(BaseModel):
143
- df: pd.DataFrame
144
- max_retries: int = Field(default=5, ge=1)
145
- gemini_model: Optional[GenerativeModel] = None
146
- current_retry: int = Field(default=0, ge=0)
147
- repl: Optional[PythonREPL] = None
148
- key_manager: Optional[GeminiKeyManager] = None
149
 
150
- class Config:
151
- arbitrary_types_allowed = True
152
 
153
- def _extract_code(self, response: str) -> str:
154
- code_match = re.search(r'```python(.*?)```', response, re.DOTALL)
155
- return code_match.group(1).strip() if code_match else response.strip()
156
 
157
- def _generate_initial_prompt(self, query: str) -> str:
158
- return f"""Generate DIRECT EXECUTION CODE (no functions, no explanations) following STRICT RULES:
159
 
160
- MANDATORY REQUIREMENTS:
161
- 1. Operate directly on existing 'df' variable
162
- 2. Save ALL final DataFrames to CSV using: df.to_csv(f'{{output_dir}}/descriptive_name.csv')
163
- 3. For visualizations: plt.savefig(f'{{output_dir}}/chart_name.png')
164
- 4. Use EXACTLY this structure:
165
- # Data processing
166
- df_processed = df[...] # filtering/grouping
167
- # Save results
168
- df_processed.to_csv(f'{{output_dir}}/result.csv')
169
- # Visualizations (if needed)
170
- plt.figure()
171
- ... plotting code ...
172
- plt.savefig(f'{{output_dir}}/chart.png')
173
- plt.close()
174
-
175
- FORBIDDEN:
176
- - Function definitions
177
- - Dummy data creation
178
- - Any code blocks besides pandas operations and matplotlib
179
- - Print statements showing dataframes
180
-
181
- DATAFRAME COLUMNS: {', '.join(self.df.columns)}
182
- DATAFRAME'S FIRST FIVE ROWS: {self.df.head().to_dict('records')}
183
- USER QUERY: {query}
184
-
185
- EXAMPLE RESPONSE FOR "Sales by region":
186
- # Data processing
187
- sales_by_region = df.groupby('region')['sales'].sum().reset_index()
188
- # Save results
189
- sales_by_region.to_csv(f'{{output_dir}}/sales_by_region.csv')
190
- """
191
-
192
- def _generate_retry_prompt(self, query: str, error: str, code: str) -> str:
193
- return f"""FIX THIS CODE (failed with: {error}) by STRICTLY FOLLOWING:
194
 
195
- 1. REMOVE ALL FUNCTION DEFINITIONS
196
- 2. ENSURE DIRECT DF OPERATIONS
197
- 3. USE EXPLICIT output_dir PATHS
198
- 4. ADD NECESSARY IMPORTS IF MISSING
199
- 5. VALIDATE COLUMN NAMES EXIST
200
 
201
- BAD CODE:
202
- {code}
203
 
204
- CORRECTED CODE:"""
205
 
206
- def initialize_model(self, api_keys: List[str]) -> bool:
207
- self.key_manager = GeminiKeyManager(api_keys)
208
- if not self.key_manager.configure():
209
- raise RuntimeError("API key initialization failed")
210
- try:
211
- self.gemini_model = GenerativeModel(MODEL_NAME)
212
- return True
213
- except Exception as e:
214
- logger.error(f"Model init failed: {str(e)}")
215
- return False
216
 
217
- def generate_code(self, query: str, error: Optional[str] = None, previous_code: Optional[str] = None) -> str:
218
- prompt = self._generate_retry_prompt(query, error, previous_code) if error else self._generate_initial_prompt(query)
219
- try:
220
- response = self.gemini_model.generate_content(prompt)
221
- return self._extract_code(response.text)
222
- except Exception as e:
223
- if self.key_manager.available_keys and self.key_manager.configure():
224
- return self.generate_code(query, error, previous_code)
225
- raise
226
 
227
- def execute_query(self, query: str) -> Dict[str, Any]:
228
- self.repl = PythonREPL(self.df)
229
- result = None
230
 
231
- while self.current_retry < self.max_retries:
232
- try:
233
- code = self.generate_code(query,
234
- result["error_message"] if result else None,
235
- result["code"] if result else None)
236
- execution_result = self.repl.execute(code)
237
 
238
- if execution_result["error"]:
239
- self.current_retry += 1
240
- result = {
241
- "error_message": execution_result["error_message"],
242
- "code": code
243
- }
244
- else:
245
- return {
246
- "text": execution_result["output"],
247
- "csv_files": execution_result["files"]["csv"],
248
- "image_files": execution_result["files"]["images"]
249
- }
250
- except Exception as e:
251
- return {
252
- "error": f"Critical failure: {str(e)}",
253
- "csv_files": [],
254
- "image_files": []
255
- }
256
 
257
- return {
258
- "error": f"Failed after {self.max_retries} retries",
259
- "csv_files": [],
260
- "image_files": []
261
- }
262
-
263
- def gemini_llm_chat(csv_url: str, query: str) -> Dict[str, Any]:
264
- try:
265
- df = pd.read_csv(csv_url)
266
- agent = RethinkAgent(df=df)
267
 
268
- if not agent.initialize_model(API_KEYS):
269
- return {"error": "API configuration failed"}
270
 
271
- result = agent.execute_query(query)
272
 
273
- if "error" in result:
274
- return result
275
 
276
- return {
277
- "message": result["text"],
278
- "csv_files": result["csv_files"],
279
- "image_files": result["image_files"]
280
- }
281
- except Exception as e:
282
- logger.error(f"Processing failed: {str(e)}")
283
- return {
284
- "error": f"Processing error: {str(e)}",
285
- "csv_files": [],
286
- "image_files": []
287
- }
288
 
289
 
290
- async def generate_csv_report(csv_url: str, query: str) -> FileBoxProps:
291
- try:
292
- result = gemini_llm_chat(csv_url, query)
293
- logger.info(f"Raw result from gemini_llm_chat: {result}")
294
 
295
- csv_files = []
296
- image_files = []
297
 
298
- # Check if we got the expected response structure
299
- if isinstance(result, dict) and 'csv_files' in result and 'image_files' in result:
300
- # Process CSV files
301
- for csv_path in result['csv_files']:
302
- if os.path.exists(csv_path):
303
- file_name = os.path.basename(csv_path)
304
- try:
305
- unique_file_name = f"{uuid.uuid4()}_{file_name}"
306
- public_url = await upload_file_to_supabase(
307
- file_path=csv_path,
308
- file_name=unique_file_name
309
- )
310
- csv_files.append(FileProps(
311
- fileName=file_name,
312
- filePath=public_url,
313
- fileType="csv"
314
- ))
315
- os.remove(csv_path) # Clean up
316
- except Exception as upload_error:
317
- logger.error(f"Failed to upload CSV {file_name}: {str(upload_error)}")
318
- continue
319
 
320
- # Process image files
321
- for img_path in result['image_files']:
322
- if os.path.exists(img_path):
323
- file_name = os.path.basename(img_path)
324
- try:
325
- unique_file_name = f"{uuid.uuid4()}_{file_name}"
326
- public_url = await upload_file_to_supabase(
327
- file_path=img_path,
328
- file_name=unique_file_name
329
- )
330
- image_files.append(FileProps(
331
- fileName=file_name,
332
- filePath=public_url,
333
- fileType="image"
334
- ))
335
- os.remove(img_path) # Clean up
336
- except Exception as upload_error:
337
- logger.error(f"Failed to upload image {file_name}: {str(upload_error)}")
338
- continue
339
 
340
- return FileBoxProps(
341
- files=Files(
342
- csv_files=csv_files,
343
- image_files=image_files
344
- )
345
  )
346
- else:
347
- raise ValueError("Unexpected response format from gemini_llm_chat")
348
 
349
- except Exception as e:
350
- logger.error(f"Report generation failed: {str(e)}")
351
- # Return empty response but log the files we found
352
- if 'csv_files' in locals() and 'image_files' in locals():
353
- logger.info(f"Files that were generated but not processed: CSV: {result.get('csv_files', [])}, Images: {result.get('image_files', [])}")
354
- return FileBoxProps(
355
- files=Files(
356
- csv_files=[],
357
- image_files=[]
358
  )
359
- )
360
 
361
 
 
362
 
363
- # if __name__ == "__main__":
364
- # result = gemini_llm_chat("./documents/enterprise_sales_data.csv",
365
- # "Generate a detailed sales report of the last 6 months from all the aspects and include a bar chart showing the sales by region.")
366
- # print(json.dumps(result, indent=2))
 
1
+ # import json
2
+ # import numpy as np
3
+ # import pandas as pd
4
+ # import re
5
+ # import os
6
+ # import uuid
7
+ # import logging
8
+ # from io import StringIO
9
+ # import sys
10
+ # import traceback
11
+ # from typing import Optional, Dict, Any, List
12
+ # from pydantic import BaseModel, Field
13
+ # from google.generativeai import GenerativeModel, configure
14
+ # from dotenv import load_dotenv
15
+ # import seaborn as sns
16
+ # import datetime as dt
17
 
18
+ # from supabase_service import upload_file_to_supabase
19
 
20
+ # pd.set_option('display.max_columns', None)
21
+ # pd.set_option('display.max_rows', None)
22
+ # pd.set_option('display.max_colwidth', None)
23
 
24
+ # load_dotenv()
25
 
26
 
27
+ # API_KEYS = os.getenv("GEMINI_API_KEYS", "").split(",")[::-1]
28
+ # MODEL_NAME = 'gemini-2.0-flash'
29
 
30
+ # class FileProps(BaseModel):
31
+ # fileName: str
32
+ # filePath: str
33
+ # fileType: str # 'csv' | 'image'
34
 
35
+ # class Files(BaseModel):
36
+ # csv_files: List[FileProps]
37
+ # image_files: List[FileProps]
38
 
39
+ # class FileBoxProps(BaseModel):
40
+ # files: Files
41
 
42
+ # os.environ['MPLBACKEND'] = 'agg'
43
+ # import matplotlib.pyplot as plt
44
+ # plt.show = lambda: None
45
 
46
+ # logging.basicConfig(
47
+ # level=logging.INFO,
48
+ # format='%(asctime)s - %(levelname)s - %(message)s'
49
+ # )
50
+ # logger = logging.getLogger(__name__)
51
 
52
+ # class GeminiKeyManager:
53
+ # """Manage multiple Gemini API keys with failover"""
54
 
55
+ # def __init__(self, api_keys: List[str]):
56
+ # self.original_keys = api_keys.copy()
57
+ # self.available_keys = api_keys.copy()
58
+ # self.active_key = None
59
+ # self.failed_keys = {}
60
 
61
+ # def configure(self) -> bool:
62
+ # while self.available_keys:
63
+ # key = self.available_keys.pop(0)
64
+ # try:
65
+ # configure(api_key=key)
66
+ # self.active_key = key
67
+ # logger.info(f"Configured with key: {self._mask_key(key)}")
68
+ # return True
69
+ # except Exception as e:
70
+ # self.failed_keys[key] = str(e)
71
+ # logger.error(f"Key failed: {self._mask_key(key)}. Error: {str(e)}")
72
+ # logger.critical("All API keys failed")
73
+ # return False
74
 
75
+ # def _mask_key(self, key: str) -> str:
76
+ # return f"{key[:8]}...{key[-4:]}" if key else ""
77
 
78
+ # class PythonREPL:
79
+ # """Secure Python REPL with file generation tracking"""
80
 
81
+ # def __init__(self, df: pd.DataFrame):
82
+ # self.df = df
83
+ # self.output_dir = os.path.abspath(f'generated_outputs/{uuid.uuid4()}')
84
+ # os.makedirs(self.output_dir, exist_ok=True)
85
+ # self.local_env = {
86
+ # "pd": pd,
87
+ # "df": self.df.copy(),
88
+ # "plt": plt,
89
+ # "os": os,
90
+ # "uuid": uuid,
91
+ # "sns": sns,
92
+ # "json": json,
93
+ # "dt": dt,
94
+ # "output_dir": self.output_dir
95
+ # }
96
 
97
+ # def execute(self, code: str) -> Dict[str, Any]:
98
+ # print('Executing code...', code)
99
+ # old_stdout = sys.stdout
100
+ # sys.stdout = mystdout = StringIO()
101
+ # file_tracker = {
102
+ # 'csv_files': set(),
103
+ # 'image_files': set()
104
+ # }
105
 
106
+ # try:
107
+ # code = f"""
108
+ # import matplotlib.pyplot as plt
109
+ # plt.switch_backend('agg')
110
+ # {code}
111
+ # plt.close('all')
112
+ # """
113
+ # exec(code, self.local_env)
114
+ # self.df = self.local_env.get('df', self.df)
115
 
116
+ # # Track generated files
117
+ # for fname in os.listdir(self.output_dir):
118
+ # if fname.endswith('.csv'):
119
+ # file_tracker['csv_files'].add(fname)
120
+ # elif fname.lower().endswith(('.png', '.jpg', '.jpeg')):
121
+ # file_tracker['image_files'].add(fname)
122
 
123
+ # error = False
124
+ # except Exception as e:
125
+ # error_msg = traceback.format_exc()
126
+ # error = True
127
+ # finally:
128
+ # sys.stdout = old_stdout
129
 
130
+ # return {
131
+ # "output": mystdout.getvalue(),
132
+ # "error": error,
133
+ # "error_message": error_msg if error else None,
134
+ # "df": self.local_env.get('df', self.df),
135
+ # "output_dir": self.output_dir,
136
+ # "files": {
137
+ # "csv": [os.path.join(self.output_dir, f) for f in file_tracker['csv_files']],
138
+ # "images": [os.path.join(self.output_dir, f) for f in file_tracker['image_files']]
139
+ # }
140
+ # }
141
+
142
+ # class RethinkAgent(BaseModel):
143
+ # df: pd.DataFrame
144
+ # max_retries: int = Field(default=5, ge=1)
145
+ # gemini_model: Optional[GenerativeModel] = None
146
+ # current_retry: int = Field(default=0, ge=0)
147
+ # repl: Optional[PythonREPL] = None
148
+ # key_manager: Optional[GeminiKeyManager] = None
149
 
150
+ # class Config:
151
+ # arbitrary_types_allowed = True
152
 
153
+ # def _extract_code(self, response: str) -> str:
154
+ # code_match = re.search(r'```python(.*?)```', response, re.DOTALL)
155
+ # return code_match.group(1).strip() if code_match else response.strip()
156
 
157
+ # def _generate_initial_prompt(self, query: str) -> str:
158
+ # return f"""Generate DIRECT EXECUTION CODE (no functions, no explanations) following STRICT RULES:
159
 
160
+ # MANDATORY REQUIREMENTS:
161
+ # 1. Operate directly on existing 'df' variable
162
+ # 2. Save ALL final DataFrames to CSV using: df.to_csv(f'{{output_dir}}/descriptive_name.csv')
163
+ # 3. For visualizations: plt.savefig(f'{{output_dir}}/chart_name.png')
164
+ # 4. Use EXACTLY this structure:
165
+ # # Data processing
166
+ # df_processed = df[...] # filtering/grouping
167
+ # # Save results
168
+ # df_processed.to_csv(f'{{output_dir}}/result.csv')
169
+ # # Visualizations (if needed)
170
+ # plt.figure()
171
+ # ... plotting code ...
172
+ # plt.savefig(f'{{output_dir}}/chart.png')
173
+ # plt.close()
174
+
175
+ # FORBIDDEN:
176
+ # - Function definitions
177
+ # - Dummy data creation
178
+ # - Any code blocks besides pandas operations and matplotlib
179
+ # - Print statements showing dataframes
180
+
181
+ # DATAFRAME COLUMNS: {', '.join(self.df.columns)}
182
+ # DATAFRAME'S FIRST FIVE ROWS: {self.df.head().to_dict('records')}
183
+ # USER QUERY: {query}
184
+
185
+ # EXAMPLE RESPONSE FOR "Sales by region":
186
+ # # Data processing
187
+ # sales_by_region = df.groupby('region')['sales'].sum().reset_index()
188
+ # # Save results
189
+ # sales_by_region.to_csv(f'{{output_dir}}/sales_by_region.csv')
190
+ # """
191
+
192
+ # def _generate_retry_prompt(self, query: str, error: str, code: str) -> str:
193
+ # return f"""FIX THIS CODE (failed with: {error}) by STRICTLY FOLLOWING:
194
 
195
+ # 1. REMOVE ALL FUNCTION DEFINITIONS
196
+ # 2. ENSURE DIRECT DF OPERATIONS
197
+ # 3. USE EXPLICIT output_dir PATHS
198
+ # 4. ADD NECESSARY IMPORTS IF MISSING
199
+ # 5. VALIDATE COLUMN NAMES EXIST
200
 
201
+ # BAD CODE:
202
+ # {code}
203
 
204
+ # CORRECTED CODE:"""
205
 
206
+ # def initialize_model(self, api_keys: List[str]) -> bool:
207
+ # self.key_manager = GeminiKeyManager(api_keys)
208
+ # if not self.key_manager.configure():
209
+ # raise RuntimeError("API key initialization failed")
210
+ # try:
211
+ # self.gemini_model = GenerativeModel(MODEL_NAME)
212
+ # return True
213
+ # except Exception as e:
214
+ # logger.error(f"Model init failed: {str(e)}")
215
+ # return False
216
 
217
+ # def generate_code(self, query: str, error: Optional[str] = None, previous_code: Optional[str] = None) -> str:
218
+ # prompt = self._generate_retry_prompt(query, error, previous_code) if error else self._generate_initial_prompt(query)
219
+ # try:
220
+ # response = self.gemini_model.generate_content(prompt)
221
+ # return self._extract_code(response.text)
222
+ # except Exception as e:
223
+ # if self.key_manager.available_keys and self.key_manager.configure():
224
+ # return self.generate_code(query, error, previous_code)
225
+ # raise
226
 
227
+ # def execute_query(self, query: str) -> Dict[str, Any]:
228
+ # self.repl = PythonREPL(self.df)
229
+ # result = None
230
 
231
+ # while self.current_retry < self.max_retries:
232
+ # try:
233
+ # code = self.generate_code(query,
234
+ # result["error_message"] if result else None,
235
+ # result["code"] if result else None)
236
+ # execution_result = self.repl.execute(code)
237
 
238
+ # if execution_result["error"]:
239
+ # self.current_retry += 1
240
+ # result = {
241
+ # "error_message": execution_result["error_message"],
242
+ # "code": code
243
+ # }
244
+ # else:
245
+ # return {
246
+ # "text": execution_result["output"],
247
+ # "csv_files": execution_result["files"]["csv"],
248
+ # "image_files": execution_result["files"]["images"]
249
+ # }
250
+ # except Exception as e:
251
+ # return {
252
+ # "error": f"Critical failure: {str(e)}",
253
+ # "csv_files": [],
254
+ # "image_files": []
255
+ # }
256
 
257
+ # return {
258
+ # "error": f"Failed after {self.max_retries} retries",
259
+ # "csv_files": [],
260
+ # "image_files": []
261
+ # }
262
+
263
+ # def gemini_llm_chat(csv_url: str, query: str) -> Dict[str, Any]:
264
+ # try:
265
+ # df = pd.read_csv(csv_url)
266
+ # agent = RethinkAgent(df=df)
267
 
268
+ # if not agent.initialize_model(API_KEYS):
269
+ # return {"error": "API configuration failed"}
270
 
271
+ # result = agent.execute_query(query)
272
 
273
+ # if "error" in result:
274
+ # return result
275
 
276
+ # return {
277
+ # "message": result["text"],
278
+ # "csv_files": result["csv_files"],
279
+ # "image_files": result["image_files"]
280
+ # }
281
+ # except Exception as e:
282
+ # logger.error(f"Processing failed: {str(e)}")
283
+ # return {
284
+ # "error": f"Processing error: {str(e)}",
285
+ # "csv_files": [],
286
+ # "image_files": []
287
+ # }
288
 
289
 
290
+ # async def generate_csv_report(csv_url: str, query: str) -> FileBoxProps:
291
+ # try:
292
+ # result = gemini_llm_chat(csv_url, query)
293
+ # logger.info(f"Raw result from gemini_llm_chat: {result}")
294
 
295
+ # csv_files = []
296
+ # image_files = []
297
 
298
+ # # Check if we got the expected response structure
299
+ # if isinstance(result, dict) and 'csv_files' in result and 'image_files' in result:
300
+ # # Process CSV files
301
+ # for csv_path in result['csv_files']:
302
+ # if os.path.exists(csv_path):
303
+ # file_name = os.path.basename(csv_path)
304
+ # try:
305
+ # unique_file_name = f"{uuid.uuid4()}_{file_name}"
306
+ # public_url = await upload_file_to_supabase(
307
+ # file_path=csv_path,
308
+ # file_name=unique_file_name
309
+ # )
310
+ # csv_files.append(FileProps(
311
+ # fileName=file_name,
312
+ # filePath=public_url,
313
+ # fileType="csv"
314
+ # ))
315
+ # os.remove(csv_path) # Clean up
316
+ # except Exception as upload_error:
317
+ # logger.error(f"Failed to upload CSV {file_name}: {str(upload_error)}")
318
+ # continue
319
+
320
+ # # Process image files
321
+ # for img_path in result['image_files']:
322
+ # if os.path.exists(img_path):
323
+ # file_name = os.path.basename(img_path)
324
+ # try:
325
+ # unique_file_name = f"{uuid.uuid4()}_{file_name}"
326
+ # public_url = await upload_file_to_supabase(
327
+ # file_path=img_path,
328
+ # file_name=unique_file_name
329
+ # )
330
+ # image_files.append(FileProps(
331
+ # fileName=file_name,
332
+ # filePath=public_url,
333
+ # fileType="image"
334
+ # ))
335
+ # os.remove(img_path) # Clean up
336
+ # except Exception as upload_error:
337
+ # logger.error(f"Failed to upload image {file_name}: {str(upload_error)}")
338
+ # continue
339
+
340
+ # return FileBoxProps(
341
+ # files=Files(
342
+ # csv_files=csv_files,
343
+ # image_files=image_files
344
+ # )
345
+ # )
346
+ # else:
347
+ # raise ValueError("Unexpected response format from gemini_llm_chat")
348
 
349
+ # except Exception as e:
350
+ # logger.error(f"Report generation failed: {str(e)}")
351
+ # # Return empty response but log the files we found
352
+ # if 'csv_files' in locals() and 'image_files' in locals():
353
+ # logger.info(f"Files that were generated but not processed: CSV: {result.get('csv_files', [])}, Images: {result.get('image_files', [])}")
354
+ # return FileBoxProps(
355
+ # files=Files(
356
+ # csv_files=[],
357
+ # image_files=[]
358
+ # )
359
+ # )
360
+
361
+
362
+
363
+
364
+
365
+
366
+
367
+
368
+
369
+
370
+
371
+
372
+
373
+
374
+
375
+
376
+
377
+
378
+
379
+
380
+
381
+
382
+
383
+
384
+
385
+
386
+
387
+ # Newly modified code with OpenAI
388
+
389
+ # Import necessary modules
390
+ import asyncio
391
+ import os
392
+ import threading
393
+ from typing import Any, Dict, Union
394
+ import uuid
395
+ from fastapi.encoders import jsonable_encoder
396
+ from langchain_openai import ChatOpenAI
397
+ import numpy as np
398
+ import pandas as pd
399
+ from pandasai import SmartDataframe
400
+ from langchain_groq.chat_models import ChatGroq
401
+ from dotenv import load_dotenv
402
+ from pydantic import BaseModel
403
+ from csv_service import clean_data, extract_chart_filenames
406
+ from langchain_experimental.tools import PythonAstREPLTool
407
+ from langchain_experimental.agents import create_pandas_dataframe_agent
409
+ import matplotlib.pyplot as plt
410
+ import matplotlib
411
+ import seaborn as sns
412
+ from gemini_langchain_agent import langchain_gemini_csv_handler
413
+ from supabase_service import upload_file_to_supabase
414
+ from util_service import _prompt_generator, process_answer
416
+ import logging
417
+ matplotlib.use('Agg')
418
+
419
+
420
+ load_dotenv()
421
+
422
+ image_file_path = os.getenv("IMAGE_FILE_PATH")
423
+ image_not_found = os.getenv("IMAGE_NOT_FOUND")
424
+ allowed_hosts = os.getenv("ALLOWED_HOSTS", "").split(",")
425
+
426
+
427
+ # Load environment variables
428
+ groq_api_keys = os.getenv("GROQ_API_KEYS").split(",")
429
+ model_name = os.getenv("GROQ_LLM_MODEL")
430
+
431
+ openai_api_keys = os.getenv("OPENAI_API_KEYS").split(",")
433
+ openai_api_base = os.getenv("OPENAI_BASE_URL")
434
+
435
+ # Set up logging
436
+ logging.basicConfig(level=logging.INFO)
437
+ logger = logging.getLogger(__name__)
438
+
439
+ class CsvUrlRequest(BaseModel):
440
+ csv_url: str
441
+
442
+ class ImageRequest(BaseModel):
443
+ image_path: str
444
+
445
+ class CsvCommonHeadersRequest(BaseModel):
446
+ file_urls: list[str]
447
+
448
+ class CsvsMergeRequest(BaseModel):
449
+ file_urls: list[str]
450
+ merge_type: str
451
+ common_columns_name: list[str]
452
+
453
+ # Thread-safe key management for openai_chat
454
+ current_openai_key_index = 0
455
+ current_openai_key_lock = threading.Lock()
456
+
457
+ # Thread-safe key management for groq_chat
458
+ current_groq_key_index = 0
459
+ current_groq_key_lock = threading.Lock()
460
+
461
+ # Thread-safe key management for langchain_csv_chat
462
+ current_langchain_key_index = 0
463
+ current_langchain_key_lock = threading.Lock()
464
+
465
+
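The three index/lock pairs above all implement the same round-robin idea. A minimal sketch of that pattern, with hypothetical names (api_keys, next_key); the real functions below keep a separate counter per caller:

import threading

api_keys = ["key-A", "key-B", "key-C"]  # hypothetical placeholder keys
_key_index = 0
_key_lock = threading.Lock()

def next_key() -> str:
    # Read and advance the shared index atomically so concurrent
    # requests never hand out the same position twice.
    global _key_index
    with _key_lock:
        key = api_keys[_key_index % len(api_keys)]
        _key_index += 1
    return key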
466
+ # CHAT CODING STARTS FROM HERE
467
+ def handle_out_of_range_float(value):
468
+ if isinstance(value, float):
469
+ if np.isnan(value):
470
+ return None
471
+ elif np.isinf(value):
472
+ return "Infinity"
473
+ return value
474
+
475
+
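handle_out_of_range_float exists because NaN and infinity are not valid JSON. A small illustration, assuming strict encoding with allow_nan=False:

import json

raw = {"mean_fare": float("nan"), "max_fare": float("inf"), "rows": 891}
safe = {k: handle_out_of_range_float(v) for k, v in raw.items()}

# json.dumps(raw, allow_nan=False) would raise ValueError;
# the sanitized dict serializes cleanly instead.
print(json.dumps(safe, allow_nan=False))
# {"mean_fare": null, "max_fare": "Infinity", "rows": 891}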
476
+ # Modified groq_chat function with thread-safe key rotation
477
+ def groq_chat(csv_url: str, question: str):
478
+ global current_groq_key_index, current_groq_key_lock
479
+
480
+ while True:
481
+ with current_groq_key_lock:
482
+ if current_groq_key_index >= len(groq_api_keys):
483
+ return {"error": "All API keys exhausted."}
484
+ current_api_key = groq_api_keys[current_groq_key_index]
485
+
486
+ try:
487
+ # Delete cache file if exists
488
+ cache_db_path = "/workspace/cache/cache_db_0.11.db"
489
+ if os.path.exists(cache_db_path):
490
+ try:
491
+ os.remove(cache_db_path)
492
+ except Exception as e:
493
+ print(f"Error deleting cache DB file: {e}")
494
+
495
+ data = clean_data(csv_url)
496
+ llm = ChatGroq(model=model_name, api_key=current_api_key)
497
+ # Generate unique filename using UUID
498
+ chart_filename = f"chart_{uuid.uuid4()}.png"
499
+ chart_path = os.path.join("generated_charts", chart_filename)
500
+
501
+ # Configure SmartDataframe with chart settings
502
+ df = SmartDataframe(
503
+ data,
504
+ config={
505
+ 'llm': llm,
506
+ 'save_charts': True, # Enable chart saving
507
+ 'open_charts': False,
508
+ 'save_charts_path': os.path.dirname(chart_path), # Directory to save
509
+ 'custom_chart_filename': chart_filename # Unique filename
510
+ }
511
+ )
512
+
513
+ answer = df.chat(question)
514
+
515
+ # Process different response types
516
+ if isinstance(answer, pd.DataFrame):
517
+ processed = answer.applymap(handle_out_of_range_float).to_dict(orient="records")  # element-wise, not per-column
518
+ elif isinstance(answer, pd.Series):
519
+ processed = answer.apply(handle_out_of_range_float).to_dict()
520
+ elif isinstance(answer, list):
521
+ processed = [handle_out_of_range_float(item) for item in answer]
522
+ elif isinstance(answer, dict):
523
+ processed = {k: handle_out_of_range_float(v) for k, v in answer.items()}
524
+ else:
525
+ processed = {"answer": str(handle_out_of_range_float(answer))}
526
+
527
+ return processed
528
+
529
+ except Exception as e:
530
+ error_message = str(e)
531
+ if error_message:
532
+ with current_groq_key_lock:
533
+ current_groq_key_index += 1
534
+ if current_groq_key_index >= len(groq_api_keys):
535
+ print("All API keys exhausted.")
536
+ return None
537
+ else:
538
+ print(f"Error with API key index {current_groq_key_index}: {error_message}")
539
+ return None
540
+
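A usage sketch for groq_chat with placeholder values; it assumes GROQ_API_KEYS and GROQ_LLM_MODEL are set in the environment:

answer = groq_chat(
    "https://example.com/data/titanic.csv",      # placeholder CSV URL
    "What is the average fare per passenger class?",
)
# A JSON-safe dict/list on success, or None / {"error": ...}
# once every configured Groq key has been tried.
print(answer)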
541
+
542
+
543
+
544
+
545
+
546
+
547
+ # Modified langchain_csv_chat with thread-safe key rotation
548
+ def langchain_csv_chat(csv_url: str, question: str, chart_required: bool):
549
+ global current_langchain_key_index, current_langchain_key_lock
550
+
551
+ data = clean_data(csv_url)
552
+ attempts = 0
553
+
554
+ while attempts < len(groq_api_keys):
555
+ with current_langchain_key_lock:
556
+ if current_langchain_key_index >= len(groq_api_keys):
557
+ current_langchain_key_index = 0
558
+ api_key = groq_api_keys[current_langchain_key_index]
559
+ current_key = current_langchain_key_index
560
+ current_langchain_key_index += 1
561
+ attempts += 1
562
+
563
+ try:
564
+ llm = ChatGroq(model=model_name, api_key=api_key)
565
+ tool = PythonAstREPLTool(locals={
566
+ "df": data,
567
+ "pd": pd,
568
+ "np": np,
569
+ "plt": plt,
570
+ "sns": sns,
571
+ "matplotlib": matplotlib
572
+ })
573
+
574
+ agent = create_pandas_dataframe_agent(
575
+ llm,
576
+ data,
577
+ agent_type="tool-calling",
578
+ verbose=True,
579
+ allow_dangerous_code=True,
580
+ extra_tools=[tool],
581
+ return_intermediate_steps=True
582
+ )
583
+
584
+ prompt = _prompt_generator(question, chart_required)
585
+ result = agent.invoke({"input": prompt})
586
+ return result.get("output")
587
+
588
+ except Exception as e:
589
+ print(f"Error with key index {current_key}: {str(e)}")
590
+
591
+ # If all keys are exhausted, return None
592
+ print("All API keys have been exhausted.")
593
+ return None
594
+
595
+
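A hedged usage sketch for langchain_csv_chat; the URL and question are placeholders, and chart_required=False keeps the agent in text-only mode, as in the csv_chat orchestrator further down:

answer = langchain_csv_chat(
    "https://example.com/data/sales.csv",        # placeholder CSV URL
    "Which product line has the highest revenue?",
    chart_required=False,
)
# Returns the agent's "output" string, or None once every Groq key has failed.
print(answer)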
596
+ def handle_out_of_range_float(value):
597
+ if isinstance(value, float):
598
+ if np.isnan(value):
599
+ return None
600
+ elif np.isinf(value):
601
+ return "Infinity"
602
+ return value
603
+
604
+
605
+
606
+
607
+
608
+
609
+
610
+ # CHART CODING STARTS FROM HERE
611
+
612
+ instructions = """
613
+
614
+ - Please ensure that each value is clearly visible. You may need to adjust the font size, rotate the labels, or truncate long values to improve readability.
615
+ - For multiple charts, arrange them in a grid format (2x2, 3x3, etc.)
616
+ - Use colorblind-friendly palette
617
+ - Read the above instructions and follow them.
618
+
619
+ """
620
+
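The instructions above ask the model for readable labels, grid layouts and a colorblind-friendly palette; a purely illustrative matplotlib/seaborn sketch of that kind of output, with made-up data:

import matplotlib.pyplot as plt
import seaborn as sns

sns.set_palette("colorblind")                     # colorblind-friendly colors
fig, axes = plt.subplots(2, 2, figsize=(10, 8))   # 2x2 grid of charts

regions = ["North", "South", "East", "West"]
sales = [120, 95, 140, 80]

axes[0, 0].bar(regions, sales)
axes[0, 0].set_title("Sales by region")
axes[0, 0].tick_params(axis="x", rotation=45)     # rotate labels for readability

# ...the remaining panels would be filled in the same way...
fig.tight_layout()
fig.savefig("example_grid.png")
plt.close(fig)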
621
+ # Thread-safe configuration for chart endpoints
622
+ current_groq_chart_key_index = 0
623
+ current_groq_chart_lock = threading.Lock()
624
+
625
+ current_langchain_chart_key_index = 0
626
+ current_langchain_chart_lock = threading.Lock()
627
+
628
+ def model():
629
+ global current_groq_chart_key_index, current_groq_chart_lock
630
+ with current_groq_chart_lock:
631
+ if current_groq_chart_key_index >= len(groq_api_keys):
632
+ raise Exception("All API keys exhausted for chart generation")
633
+ api_key = groq_api_keys[current_groq_chart_key_index]
634
+ return ChatGroq(model=model_name, api_key=api_key)
635
+
636
+ def groq_chart(csv_url: str, question: str):
637
+ global current_groq_chart_key_index, current_groq_chart_lock
638
+
639
+ for attempt in range(len(groq_api_keys)):
640
+ try:
641
+ # Clean cache before processing
642
+ cache_db_path = "/workspace/cache/cache_db_0.11.db"
643
+ if os.path.exists(cache_db_path):
644
+ try:
645
+ os.remove(cache_db_path)
646
+ except Exception as e:
647
+ print(f"Cache cleanup error: {e}")
648
+
649
+ data = clean_data(csv_url)
650
+ with current_groq_chart_lock:
651
+ current_api_key = groq_api_keys[current_groq_chart_key_index]
652
+
653
+ llm = ChatGroq(model=model_name, api_key=current_api_key)
654
+
655
+ # Generate unique filename using UUID
656
+ chart_filename = f"chart_{uuid.uuid4()}.png"
657
+ chart_path = os.path.join("generated_charts", chart_filename)
658
+
659
+ # Configure SmartDataframe with chart settings
660
+ df = SmartDataframe(
661
+ data,
662
+ config={
663
+ 'llm': llm,
664
+ 'save_charts': True, # Enable chart saving
665
+ 'open_charts': False,
666
+ 'save_charts_path': os.path.dirname(chart_path), # Directory to save
667
+ 'custom_chart_filename': chart_filename # Unique filename
668
+ }
669
+ )
670
+
671
+ answer = df.chat(question + instructions)
672
+
673
+ if process_answer(answer):
674
+ return "Chart not generated"
675
+ return answer
676
+
677
+ except Exception as e:
678
+ error = str(e)
679
+ if "429" in error or error is not None:
680
+ with current_groq_chart_lock:
681
+ current_groq_chart_key_index = (current_groq_chart_key_index + 1) % len(groq_api_keys)
682
+ else:
683
+ print(f"Chart generation error: {error}")
684
+ return {"error": error}
685
+
686
+ print("All API keys exhausted for chart generation")
687
+ return None
688
+
689
+
690
+
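A usage sketch for groq_chart; on success it is expected to return a local chart path (that is how csv_chart below consumes it), while "Chart not generated" or None signal failure. Values are placeholders:

chart_path = groq_chart(
    "https://example.com/data/titanic.csv",      # placeholder CSV URL
    "Plot passenger count per embarkation port as a bar chart",
)
if chart_path and chart_path != "Chart not generated":
    print(f"Chart saved locally at: {chart_path}")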
691
+ def langchain_csv_chart(csv_url: str, question: str, chart_required: bool):
692
+ global current_langchain_chart_key_index, current_langchain_chart_lock
693
+
694
+ data = clean_data(csv_url)
695
+
696
+ for attempt in range(len(groq_api_keys)):
697
+ try:
698
+ with current_langchain_chart_lock:
699
+ api_key = groq_api_keys[current_langchain_chart_key_index]
700
+ current_key = current_langchain_chart_key_index
701
+ current_langchain_chart_key_index = (current_langchain_chart_key_index + 1) % len(groq_api_keys)
702
+
703
+ llm = ChatGroq(model=model_name, api_key=api_key)
704
+ tool = PythonAstREPLTool(locals={
705
+ "df": data,
706
+ "pd": pd,
707
+ "np": np,
708
+ "plt": plt,
709
+ "sns": sns,
710
+ "matplotlib": matplotlib,
711
+ "uuid": uuid
712
+ })
713
+
714
+ agent = create_pandas_dataframe_agent(
715
+ llm,
716
+ data,
717
+ agent_type="tool-calling",
718
+ verbose=True,
719
+ allow_dangerous_code=True,
720
+ extra_tools=[tool],
721
+ return_intermediate_steps=True
722
+ )
723
+
724
+ result = agent.invoke({"input": _prompt_generator(f"{question} and use this csv_url: {csv_url} to read the csv file", True)})
725
+ output = result.get("output", "")
726
+
727
+ # Verify chart file creation
728
+ chart_files = extract_chart_filenames(output)
729
+ if len(chart_files) > 0:
730
+ return chart_files
731
+
732
+ if attempt < len(groq_api_keys) - 1:
733
+ print(f"Langchain chart error (key {current_key}): {output}")
734
+
735
+ except Exception as e:
736
+ print(f"Langchain chart error (key {current_key}): {str(e)}")
737
+
738
+ print("All API keys exhausted for chart generation")
739
+ return None
740
+
741
+
742
+ ####################################### OpenAI + PandasAI #######################################
743
+
744
+
745
+
746
+
747
+ # Modified openai_chat function with thread-safe key rotation
748
+ openai_model_name = 'gpt-4o'
749
+
750
+ def openai_chat(csv_url: str, question: str):
751
+ global current_openai_key_index, current_openai_key_lock
752
+
753
+ while True:
754
+ with current_openai_key_lock:
755
+ if current_openai_key_index >= len(openai_api_keys):
756
+ return {"error": "All API keys exhausted."}
757
+ current_api_key = openai_api_keys[current_openai_key_index]
758
+
759
+ try:
760
+ # Delete cache file if exists
761
+ cache_db_path = "/workspace/cache/cache_db_0.11.db"
762
+ if os.path.exists(cache_db_path):
763
+ try:
764
+ os.remove(cache_db_path)
765
+ except Exception as e:
766
+ print(f"Error deleting cache DB file: {e}")
767
+
768
+ data = clean_data(csv_url)
769
+ llm = ChatOpenAI(model=openai_model_name, api_key=current_api_key, base_url=openai_api_base)
770
+ # Generate unique filename using UUID
771
+ chart_filename = f"chart_{uuid.uuid4()}.png"
772
+ chart_path = os.path.join("generated_charts", chart_filename)
773
 
774
+ # Configure SmartDataframe with chart settings
775
+ df = SmartDataframe(
776
+ data,
777
+ config={
778
+ 'llm': llm,
779
+ 'save_charts': True, # Enable chart saving
780
+ 'open_charts': False,
781
+ 'save_charts_path': os.path.dirname(chart_path), # Directory to save
782
+ 'custom_chart_filename': chart_filename # Unique filename
783
+ }
784
  )
785
 
786
+ answer = df.chat(question)
787
+ # Process different response types
788
+ if isinstance(answer, pd.DataFrame):
789
+ processed = answer.applymap(handle_out_of_range_float).to_dict(orient="records")  # element-wise, not per-column
790
+ elif isinstance(answer, pd.Series):
791
+ processed = answer.apply(handle_out_of_range_float).to_dict()
792
+ elif isinstance(answer, list):
793
+ processed = [handle_out_of_range_float(item) for item in answer]
794
+ elif isinstance(answer, dict):
795
+ processed = {k: handle_out_of_range_float(v) for k, v in answer.items()}
796
+ else:
797
+ processed = {"answer": str(handle_out_of_range_float(answer))}
798
+
799
+ return processed
800
+
801
+ except Exception as e:
802
+ error_message = str(e)
803
+ if error_message:
804
+ with current_openai_key_lock:
805
+ current_openai_key_index += 1
806
+ if current_openai_key_index >= len(openai_api_keys):
807
+ print("All API keys exhausted.")
808
+ return None
809
+ else:
810
+ print(f"Error with API key index {current_openai_key_index}: {error_message}")
811
+ return None
812
+
813
+
814
+
815
+
816
+
817
+
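A usage sketch for openai_chat, mirroring groq_chat. The values are placeholders, and the call assumes OPENAI_API_KEYS (and optionally OPENAI_BASE_URL, which ChatOpenAI accepts as base_url for an OpenAI-compatible endpoint) are set:

result = openai_chat(
    "https://example.com/data/sales.csv",        # placeholder CSV URL
    "Which month had the highest total revenue?",
)
# Same contract as groq_chat: a JSON-safe structure on success,
# None or {"error": ...} once all OpenAI keys are exhausted.
print(result)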
818
+ def openai_chart(csv_url: str, question: str):
819
+ global current_openai_key_index, current_openai_key_lock
820
+
821
+ while True:
822
+ with current_openai_key_lock:
823
+ if current_openai_key_index >= len(openai_api_keys):
824
+ return {"error": "All API keys exhausted."}
825
+ current_api_key = openai_api_keys[current_openai_key_index]
826
+
827
+ try:
828
+ # Delete cache file if exists
829
+ cache_db_path = "/workspace/cache/cache_db_0.11.db"
830
+ if os.path.exists(cache_db_path):
831
+ try:
832
+ os.remove(cache_db_path)
833
+ except Exception as e:
834
+ print(f"Error deleting cache DB file: {e}")
835
+
836
+ data = clean_data(csv_url)
837
+ llm = ChatOpenAI(model=openai_model_name, api_key=current_api_key, base_url=openai_api_base)
838
+ # Generate unique filename using UUID
839
+ chart_filename = f"chart_{uuid.uuid4()}.png"
840
+ chart_path = os.path.join("generated_charts", chart_filename)
841
+
842
+ # Configure SmartDataframe with chart settings
843
+ df = SmartDataframe(
844
+ data,
845
+ config={
846
+ 'llm': llm,
847
+ 'save_charts': True, # Enable chart saving
848
+ 'open_charts': False,
849
+ 'save_charts_path': os.path.dirname(chart_path), # Directory to save
850
+ 'custom_chart_filename': chart_filename # Unique filename
851
+ }
852
  )
853
+
854
+ answer = df.chat(question + instructions)
855
+
856
+ if process_answer(answer):
857
+ return "Chart not generated"
858
+ return answer
859
+
860
+ except Exception as e:
861
+ error = str(e)
862
+ print(f"Error with API key index {current_openai_key_index}: {error}")
863
+ if "429" in error or error is not None:
864
+ with current_openai_key_lock:
865
+ current_openai_key_index = (current_openai_key_index + 1) % len(openai_api_keys)
866
+ else:
867
+ print(f"Chart generation error: {error}")
868
+ return {"error": error}
869
+
870
+ print("All API keys exhausted for chart generation")
871
+ return None
872
+
873
+
874
+
875
+
876
+
877
+ ####################################### Start with lc_gemini #######################################
878
+
879
+
880
+ # async def csv_chat(csv_url: str, query: str):
881
+ # """
882
+ # Generate a response based on the provided CSV URL and query.
883
+ # Prioritizes LangChain-Gemini, then LangChain-Groq, then raw OpenAI and finally raw Groq as fallback.
884
+
885
+ # Parameters:
886
+ # - csv_url (str): The URL of the CSV file.
887
+ # - query (str): The query for generating the response.
888
+
889
+ # Returns:
890
+ # - dict: A dictionary containing the generated response.
891
+
892
+ # Example:
893
+ # - csv_url: "https://example.com/data.csv"
894
+ # - query: "What is the total sales for the year 2022?"
895
+ # Returns:
896
+ # - dict: {"answer": "The total sales for 2022 is $100,000."}
897
+ # """
898
+ # try:
899
+ # updated_query = f"{query} and Do not show any charts or graphs."
900
+
901
+ # # --- 1. First Attempt: LangChain Gemini ---
902
+ # try:
903
+ # gemini_answer = await asyncio.to_thread(
904
+ # langchain_gemini_csv_handler, csv_url, updated_query, False
905
+ # )
906
+ # print("LangChain-Gemini answer:", gemini_answer)
907
+
908
+ # if not process_answer(gemini_answer) or gemini_answer is None:
909
+ # return {"answer": jsonable_encoder(gemini_answer)}
910
+
911
+ # raise Exception("LangChain-Gemini response not usable, falling back to LangChain-Groq")
912
+
913
+ # except Exception as gemini_error:
914
+ # print(f"LangChain-Gemini error: {str(gemini_error)}")
915
+
916
+ # # --- 2. Second Attempt: LangChain Groq ---
917
+ # try:
918
+ # lang_groq_answer = await asyncio.to_thread(
919
+ # langchain_csv_chat, csv_url, updated_query, False
920
+ # )
921
+ # print("LangChain-Groq answer:", lang_groq_answer)
922
+
923
+ # if not process_answer(lang_groq_answer):
924
+ # return {"answer": jsonable_encoder(lang_groq_answer)}
925
+
926
+ # raise Exception("LangChain-Groq response not usable, falling back to raw Groq")
927
+
928
+ # except Exception as lang_groq_error:
929
+ # print(f"LangChain-Groq error: {str(lang_groq_error)}")
930
+
931
+ # --- 3. Third Attempt: Raw OpenAI Chat ---
932
+ # try:
933
+ # raw_openai_answer = await asyncio.to_thread(openai_chat, csv_url, updated_query)
934
+ # print("Raw OpenAI answer:", raw_openai_answer)
935
+
936
+ # if process_answer(raw_openai_answer) == "Empty response received." or raw_openai_answer is None:
937
+ # return {"answer": "Sorry, I couldn't find relevant data..."}
938
+
939
+ # if process_answer(raw_openai_answer):
940
+ # except Exception as openai_exception:
941
+ # print(f"Raw OpenAI error: {str(openai_exception)}")
942
+
943
+
944
+ # # --- 4. Final Attempt: Raw Groq Chat ---
945
+ # try:
946
+ # raw_groq_answer = await asyncio.to_thread(groq_chat, csv_url, updated_query)
947
+ # print("Raw Groq answer:", raw_groq_answer)
948
+
949
+ # if process_answer(raw_groq_answer) == "Empty response received." or raw_groq_answer is None:
950
+ # return {"answer": "Sorry, I couldn't find relevant data..."}
951
+
952
+ # if process_answer(raw_groq_answer):
953
+ # raise Exception("All fallbacks exhausted")
954
+
955
+ # return {"answer": jsonable_encoder(raw_groq_answer)}
956
+
957
+ # except Exception as raw_groq_error:
958
+ # print(f"Raw Groq error: {str(raw_groq_error)}")
959
+ # return {"answer": "error"}
960
+
961
+ # except Exception as e:
962
+ # print(f"Unexpected error: {str(e)}")
963
+ # return {"answer": "error"}
964
+
965
+
966
+
967
+
968
+
969
+
970
+
971
+
972
+ # async def csv_chart(csv_url: str, query: str):
973
+ # """
974
+ # Generate a chart based on the provided CSV URL and query.
975
+ # Prioritizes raw OpenAI, then raw Groq, then LangChain Gemini, and finally LangChain Groq as fallback.
976
+
977
+ # Parameters:
978
+ # - csv_url (str): The URL of the CSV file.
979
+ # - query (str): The query for generating the chart.
980
+
981
+ # Returns:
982
+ # - dict: A dictionary containing either:
983
+ # - {"image_url": "https://example.com/chart.png"} on success, or
984
+ # - {"error": "error message"} on failure
985
+
986
+ # Example:
987
+ # - csv_url: "https://example.com/data.csv"
988
+ # - query: "Show sales trends as a line chart"
989
+ # Returns:
990
+ # - dict: {"image_url": "https://storage.example.com/chart_uuid.png"}
991
+ # """
992
+
993
+ # async def upload_and_return(image_path: str) -> dict:
994
+ # """Helper function to handle image uploads"""
995
+ # unique_name = f'{uuid.uuid4()}.png'
996
+ # public_url = await upload_file_to_supabase(image_path, unique_name)
997
+ # print(f"Uploaded chart: {public_url}")
998
+ # os.remove(image_path) # Remove the local image file after upload
999
+ # return {"image_url": public_url}
1000
+
1001
+ # try:
1002
+ # # --- 1. First Attempt: Raw OpenAI ---
1003
+ # try:
1004
+ # openai_result = await asyncio.to_thread(openai_chart, csv_url, query)
1005
+ # print(f"OpenAI chart result:", openai_result)
1006
+
1007
+ # if openai_result and openai_result != 'Chart not generated':
1008
+ # return await upload_and_return(openai_result)
1009
+
1010
+ # raise Exception("OpenAI failed to generate chart")
1011
+
1012
+ # except Exception as openai_error:
1013
+ # print(f"OpenAI failed ({str(openai_error)}), trying LangChain Gemini...")
1014
+
1015
+ # # --- 2.. First Attempt: Raw Groq ---
1016
+ # try:
1017
+ # groq_result = await asyncio.to_thread(groq_chart, csv_url, query)
1018
+ # print(f"Raw Groq chart result:", groq_result)
1019
+
1020
+ # if groq_result and groq_result != 'Chart not generated':
1021
+ # return await upload_and_return(groq_result)
1022
+
1023
+ # raise Exception("Raw Groq failed to generate chart")
1024
+
1025
+ # except Exception as groq_error:
1026
+ # print(f"Raw Groq failed ({str(groq_error)}), trying LangChain Gemini...")
1027
+
1028
+ # --- 3. Third Attempt: LangChain Gemini ---
1029
+ # try:
1030
+ # gemini_result = await asyncio.to_thread(
1031
+ # langchain_gemini_csv_handler, csv_url, query, True
1032
+ # )
1033
+ # print("LangChain Gemini chart result:", gemini_result)
1034
+
1035
+ # # --- i) If Gemini result is a string, return it ---
1036
+ # if gemini_result and isinstance(gemini_result, str):
1037
+ # clean_path = gemini_result.strip()
1038
+ # return await upload_and_return(clean_path)
1039
+
1040
+ # # --- ii) If Gemini result is a list, return the first element ---
1041
+ # if gemini_result and isinstance(gemini_result, list) and len(gemini_result) > 0:
1042
+ # return await upload_and_return(gemini_result[0])
1043
+
1044
+ # raise Exception("LangChain Gemini returned empty result")
1045
+
1046
+ # except Exception as gemini_error:
1047
+ # print(f"LangChain Gemini failed ({str(gemini_error)}), trying LangChain Groq...")
1048
+
1049
+ # # --- 4. Final Attempt: LangChain Groq ---
1050
+ # try:
1051
+ # lc_groq_paths = await asyncio.to_thread(
1052
+ # langchain_csv_chart, csv_url, query, True
1053
+ # )
1054
+ # print("LangChain Groq chart result:", lc_groq_paths)
1055
+
1056
+ # if isinstance(lc_groq_paths, list) and lc_groq_paths:
1057
+ # return await upload_and_return(lc_groq_paths[0])
1058
+
1059
+ # return {"error": "All chart generation methods failed"}
1060
+
1061
+ # except Exception as lc_groq_error:
1062
+ # print(f"LangChain Groq failed: {str(lc_groq_error)}")
1063
+ # return {"error": "Could not generate chart"}
1064
+
1065
+ # except Exception as e:
1066
+ # print(f"Critical error: {str(e)}")
1067
+ # return {"error": "Internal system error"}
1068
+
1069
+
1070
+
1071
+ ####################################### Optimized Version #######################################
1072
+
1073
+
1074
+ async def csv_chat(csv_url: str, query: str) -> Dict[str, Any]:
1075
+ """
1076
+ Generate a response based on the provided CSV URL and query.
1077
+ Prioritizes LangChain-Gemini, then LangChain-Groq, then raw OpenAI and finally raw Groq as fallback.
1078
+
1079
+ Parameters:
1080
+ - csv_url (str): The URL of the CSV file.
1081
+ - query (str): The query for generating the response.
1082
+
1083
+ Returns:
1084
+ - dict: A dictionary containing the generated response or error message.
1085
+
1086
+ Example:
1087
+ - csv_url: "https://example.com/data.csv"
1088
+ - query: "What is the total sales for the year 2022?"
1089
+ Returns:
1090
+ - dict: {"answer": "The total sales for 2022 is $100,000."}
1091
+ """
1092
+ updated_query = f"{query} and Do not show any charts or graphs."
1093
+ fallback_answer = "Sorry, I couldn't find relevant data..."
1094
+ error_answer = "An error occurred while processing your request."
1095
+
1096
+ async def try_chat_method(method_name: str, method, *args) -> Dict[str, Any]:
1097
+ """Attempt to get answer from a specific chat method"""
1098
+ try:
1099
+ logger.info(f"Attempting {method_name}")
1100
+ answer = await asyncio.to_thread(method, *args)
1101
+
1102
+ if answer is None:
1103
+ logger.warning(f"{method_name} returned None")
1104
+ return {"status": "empty", "answer": None}
1105
+
1106
+ processed = process_answer(answer)
1107
+ if processed == "Empty response received.":
1108
+ logger.warning(f"{method_name} returned empty response")
1109
+ return {"status": "empty", "answer": answer}
1110
+ elif processed:
1111
+ logger.warning(f"{method_name} response not usable")
1112
+ return {"status": "invalid", "answer": answer}
1113
+ else:
1114
+ logger.info(f"{method_name} succeeded")
1115
+ return {"status": "success", "answer": answer}
1116
+
1117
+ except Exception as e:
1118
+ logger.error(f"{method_name} failed: {str(e)}")
1119
+ return {"status": "error", "error": str(e)}
1120
+
1121
+ # Define the methods to try in priority order
1122
+ chat_methods = [
1123
+ ("LangChain-Gemini", langchain_gemini_csv_handler, csv_url, updated_query, False),
1124
+ ("LangChain-Groq", langchain_csv_chat, csv_url, updated_query, False),
1125
+ ("Raw OpenAI", openai_chat, csv_url, updated_query),
1126
+ ("Raw Groq", groq_chat, csv_url, updated_query),
1127
+ ]
1128
+
1129
+ for method_name, method, *args in chat_methods:
1130
+ result = await try_chat_method(method_name, method, *args)
1131
+
1132
+ if result["status"] == "success":
1133
+ return {"answer": jsonable_encoder(result["answer"])}
1134
+ elif result["status"] == "empty":
1135
+ return {"answer": fallback_answer}
1136
+
1137
+ # If all methods failed or returned invalid responses
1138
+ logger.error("All chat methods failed to produce a valid response")
1139
+ return {"answer": error_answer}
1140
+
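Since csv_chat is async, a minimal sketch of driving it from a script (placeholder URL and query; requires the environment keys used above):

import asyncio

async def _demo_chat() -> None:
    response = await csv_chat(
        "https://example.com/data/titanic.csv",   # placeholder CSV URL
        "How many passengers survived, grouped by class?",
    )
    print(response["answer"])

# asyncio.run(_demo_chat())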
1141
+
1142
+
1143
+
1144
+
1145
+
1146
+
1147
+
1148
+
1149
+ async def csv_chart(csv_url: str, query: str) -> Dict[str, str]:
1150
+ """
1151
+ Generate a chart based on the provided CSV URL and query.
1152
+ Prioritizes raw OpenAI, then raw Groq, then LangChain Gemini, and finally LangChain Groq as fallback.
1153
+
1154
+ Parameters:
1155
+ - csv_url (str): The URL of the CSV file.
1156
+ - query (str): The query for generating the chart.
1157
+
1158
+ Returns:
1159
+ - dict: A dictionary containing either:
1160
+ - {"image_url": "https://example.com/chart.png"} on success, or
1161
+ - {"error": "error message"} on failure
1162
+
1163
+ Example:
1164
+ - csv_url: "https://example.com/data.csv"
1165
+ - query: "Show sales trends as a line chart"
1166
+ Returns:
1167
+ - dict: {"image_url": "https://storage.example.com/chart_uuid.png"}
1168
+ """
1169
+ async def upload_and_return(image_path: str) -> Dict[str, str]:
1170
+ """Helper function to handle image uploads and cleanup"""
1171
+ try:
1172
+ if not os.path.exists(image_path):
1173
+ raise FileNotFoundError(f"Image file not found at {image_path}")
1174
+
1175
+ unique_name = f'{uuid.uuid4()}.png'
1176
+ public_url = await upload_file_to_supabase(image_path, unique_name)
1177
+ logger.info(f"Uploaded chart: {public_url}")
1178
+
1179
+ try:
1180
+ os.remove(image_path)
1181
+ except OSError as e:
1182
+ logger.warning(f"Failed to remove local image file: {e}")
1183
+
1184
+ return {"image_url": public_url}
1185
+ except Exception as e:
1186
+ logger.error(f"Error in upload_and_return: {e}")
1187
+ raise e
1188
+
1189
+ async def try_generation(method_name: str, method, *args) -> Union[str, None]:
1190
+ """Attempt chart generation with a specific method"""
1191
+ try:
1192
+ logger.info(f"Attempting chart generation with {method_name}")
1193
+ result = await asyncio.to_thread(method, *args)
1194
+
1195
+ if not result or result == 'Chart not generated':
1196
+ raise ValueError(f"{method_name} returned empty or invalid result")
1197
+
1198
+ if isinstance(result, str):
1199
+ return result.strip()
1200
+ elif isinstance(result, list) and result:
1201
+ return result[0]
1202
+
1203
+ raise ValueError(f"{method_name} returned unexpected result type")
1204
+ except Exception as e:
1205
+ logger.warning(f"{method_name} failed: {str(e)}")
1206
+ return None
1207
+
1208
+ generation_methods = [
1209
+ ("Raw OpenAI", openai_chart, csv_url, query),
1210
+ ("Raw Groq", groq_chart, csv_url, query),
1211
+ ("LangChain Gemini", lambda u, q: langchain_gemini_csv_handler(u, q, True), csv_url, query),
1212
+ ("LangChain Groq", lambda u, q: langchain_csv_chart(u, q, True), csv_url, query),
1213
+ ]
1214
+
1215
+ for attempt, (method_name, method, *args) in enumerate(generation_methods, 1):
1216
+ try:
1217
+ result = await try_generation(method_name, method, *args)
1218
+ if result:
1219
+ return await upload_and_return(result)
1220
+ except Exception as e:
1221
+ logger.error(f"Error processing {method_name}: {e}")
1222
+ if attempt == len(generation_methods):
1223
+ logger.error("All chart generation methods failed")
1224
+ return {"error": "Could not generate chart using any available method"}
1225
+
1226
+ return {"error": "All chart generation methods failed"}
1227
 
1228
 
1229
+ # Example usage:
1230
 
1231
+ # csv_url = './documents/titanic.csv'
1232
+ # query = "Create a pie chart of male vs female passengers?"
1233
+ # result = openai_chart(csv_url, query)
1234
+ # print(result)
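A comparable sketch for the async chart orchestrator, kept commented out like the example above; it assumes the same local CSV and a configured Supabase bucket for the upload step:

# import asyncio
# chart = asyncio.run(csv_chart('./documents/titanic.csv', "Create a pie chart of male vs female passengers?"))
# print(chart)  # {"image_url": "..."} on success, {"error": "..."} on failure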