Spaces:

poemsforaphrodite
/

crew-climate

Sleeping

App Files Files Community

crew-climate / app.py

poemsforaphrodite

Update app.py

db301e1 verified 10 months ago

raw

history blame contribute delete

8.37 kB

	import os
	from dotenv import load_dotenv
	import streamlit as st
	from crewai import Agent, Task, Crew
	from crewai_tools import SerperDevTool, WebsiteSearchTool, FileReadTool
	from openai import OpenAI
	import tempfile
	import time

	# Load environment variables from a local .env file, if one is present.
	load_dotenv()

	# Get API keys from environment variables (None when a variable is unset).
	SERPER_API_KEY = os.getenv("SERPER_API_KEY")
	OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")

	# Initialize the OpenAI client shared by the rest of this module.
	client = OpenAI(api_key=OPENAI_API_KEY)


	@st.cache_resource
	def _get_climate_strategy_assistant():
	    """Create the "Climate Strategy Assistant" once and reuse it.

	    Streamlit re-executes this script from the top on every widget
	    interaction. Creating the assistant directly at module level therefore
	    registered a brand-new assistant with OpenAI on each rerun.
	    st.cache_resource keeps the first result and hands it back on later
	    reruns instead of calling the API again.

	    Returns:
	        The assistant object returned by client.beta.assistants.create.
	    """
	    return client.beta.assistants.create(
	        name="Climate Strategy Assistant",
	        instructions="You are an expert in climate strategy. Analyze climate strategy documents and provide relevant insights.",
	        model="gpt-4o",
	        tools=[{"type": "file_search"}],
	    )


	# Create assistant (cached across reruns, see above).
	assistant = _get_climate_strategy_assistant()

	# Tools handed to the agents below. The file reader is pointed at
	# analysis.txt, the same default filename save_processed_content writes to.
	file_tool = FileReadTool(file_path="analysis.txt")
	search_tool = SerperDevTool()
	web_rag_tool = WebsiteSearchTool()

	# Agent that works from the saved analysis file.
	analyst = Agent(
	    role="Climate Strategy Analyst",
	    goal=(
	        "Analyze the climate strategy plan to identify key requirements "
	        "and objectives."
	    ),
	    backstory=(
	        "An expert in climate strategy with experience in sustainable "
	        "solutions."
	    ),
	    tools=[file_tool],
	    verbose=True,
	)

	# Agent that gets the two search tools.
	researcher = Agent(
	    role="Climate Tech Researcher",
	    goal=(
	        "Find and list specific climate tech companies that provide "
	        "solutions aligning with the strategy plan."
	    ),
	    backstory=(
	        "A researcher specialized in identifying and evaluating climate "
	        "technology solutions, with a focus on practical implementations."
	    ),
	    tools=[search_tool, web_rag_tool],
	    verbose=True,
	)

	# First task: the analyst extracts requirements from analysis.txt.
	analyze_strategy = Task(
	    description=(
	        "Analyze the climate strategy plan from analysis.txt and extract "
	        "key requirements."
	    ),
	    expected_output=(
	        "A detailed list of key requirements and objectives from the "
	        "climate strategy plan."
	    ),
	    agent=analyst,
	)

	# Second task: the researcher lists matching companies. Its output_file is
	# the same path that run_crew reads back.
	search_companies = Task(
	    description=(
	        "Search for and list specific climate tech companies that offer "
	        "solutions meeting the extracted strategy requirements. "
	        "Provide company names, brief descriptions of their solutions, "
	        "and how they align with the strategy needs."
	    ),
	    expected_output=(
	        "A detailed list of climate tech companies, including company "
	        "names, solution descriptions, and how they align with the "
	        "strategy requirements."
	    ),
	    agent=researcher,
	    output_file="research_results/company_recommendations.md",
	)

	# Crew wiring: both agents, tasks listed analysis-first, planning enabled.
	crew = Crew(
	    agents=[analyst, researcher],
	    tasks=[analyze_strategy, search_companies],
	    verbose=True,
	    planning=True,
	)

	def process_file_with_assistant(file, file_type, category, reports_needed, user_feedback):
	    """Upload a file to OpenAI and return an assistant-written analysis of it.

	    A dedicated assistant and thread are created for the call, the file is
	    attached to a user message with the file_search tool, and the run is
	    polled once per second until it finishes.

	    Args:
	        file: The file to upload; passed straight to client.files.create.
	        file_type: Label used in the assistant name, its instructions and
	            the log messages (e.g. "PDF").
	        category: Topic the analysis should focus on.
	        reports_needed: Iterable of report names, joined with ", " into the
	            assistant instructions and the user message.
	        user_feedback: Earlier feedback text embedded in the instructions.

	    Returns:
	        The text of the first assistant message in the thread listing, or
	        None when there is no assistant message, the run ends without
	        completing, or any exception is raised (the error is printed).
	    """
	    print(f"Starting {file_type} processing with Assistant")

	    # Statuses from which this code can never reach 'completed'. Without
	    # this check the polling loop below would spin forever on a failed run.
	    # 'requires_action' is included because no tool outputs are ever submitted.
	    unsuccessful_statuses = {'failed', 'cancelled', 'expired', 'incomplete', 'requires_action'}

	    # Tracked outside the try so the finally clause can clean up whatever
	    # was actually created before an error occurred.
	    uploaded_file = None
	    assistant = None
	    thread = None
	    try:
	        # Upload the file to OpenAI
	        uploaded_file = client.files.create(
	            file=file,
	            purpose='assistants'
	        )
	        print(f"File uploaded successfully. File ID: {uploaded_file.id}")

	        # Create an assistant
	        assistant = client.beta.assistants.create(
	            name=f"{file_type} Analyzer",
	            instructions=f"You are an expert in analyzing {file_type} files, focusing on {category}. Provide insights and summaries of the content based on the following reports: {', '.join(reports_needed)}. Consider the user's previous feedback: {user_feedback}. Provide your response in plain text format without any formatting, bullet points, numbering, or source citations. Do not use asterisks, hashes, or any other special characters for emphasis or structure.",
	            model="gpt-4o",
	            tools=[{"type": "file_search"}]
	        )
	        print(f"Assistant created. Assistant ID: {assistant.id}")

	        # Create a thread
	        thread = client.beta.threads.create()
	        print(f"Thread created. Thread ID: {thread.id}")

	        # Add a message to the thread
	        message = client.beta.threads.messages.create(
	            thread_id=thread.id,
	            role="user",
	            content=f"Please analyze this file and provide insights for the {category} category, focusing on the following reports: {', '.join(reports_needed)}.",
	            attachments=[
	                {"file_id": uploaded_file.id, "tools": [{"type": "file_search"}]}
	            ]
	        )
	        print(f"Message added to thread. Message ID: {message.id}")

	        # Run the assistant
	        run = client.beta.threads.runs.create(
	            thread_id=thread.id,
	            assistant_id=assistant.id,
	            additional_instructions="Use the uploaded file to answer the question. Provide your response in plain text format without any formatting, bullet points, numbering, or source citations. Do not use asterisks, hashes, or any other special characters for emphasis or structure."
	        )
	        print(f"Run created. Run ID: {run.id}")

	        # Wait for the run to complete, giving up on unsuccessful end states
	        while run.status != 'completed':
	            if run.status in unsuccessful_statuses:
	                print(f"Error in processing {file_type}: run ended with status '{run.status}'")
	                return None
	            time.sleep(1)
	            run = client.beta.threads.runs.retrieve(thread_id=thread.id, run_id=run.id)
	            print(f"Run status: {run.status}")

	        # Retrieve the messages
	        messages = client.beta.threads.messages.list(thread_id=thread.id)

	        # Extract the assistant's response (first assistant message listed)
	        analysis_result = next((msg.content[0].text.value for msg in messages if msg.role == 'assistant'), None)

	        print(f"{file_type} analysis completed successfully")
	        return analysis_result
	    except Exception as e:
	        print(f"Error in processing {file_type}: {str(e)}")
	        return None
	    finally:
	        # Every call creates its own assistant, thread and file; remove them
	        # so repeated analyses do not accumulate in the OpenAI account.
	        _delete_remote_resource("thread", client.beta.threads.delete, thread)
	        _delete_remote_resource("assistant", client.beta.assistants.delete, assistant)
	        _delete_remote_resource("file", client.files.delete, uploaded_file)


	def _delete_remote_resource(label, delete_fn, resource):
	    """Best-effort deletion of an OpenAI resource; failures are only printed."""
	    if resource is None:
	        return
	    try:
	        delete_fn(resource.id)
	    except Exception as e:
	        # Cleanup must never mask the analysis result or the original error.
	        print(f"Could not delete {label} {resource.id}: {str(e)}")

	# PDF-specific convenience wrapper around process_file_with_assistant
	def process_pdf_with_assistant(uploaded_file):
	    """Analyze an uploaded PDF as a climate strategy document.

	    Delegates to process_file_with_assistant with fixed settings: file type
	    "PDF", category "climate strategy", a single "key points summary"
	    report and empty user feedback. Returns whatever that call returns.
	    """
	    pdf_settings = {
	        "file_type": "PDF",
	        "category": "climate strategy",
	        "reports_needed": ["key points summary"],
	        "user_feedback": "",
	    }
	    return process_file_with_assistant(file=uploaded_file, **pdf_settings)

	def save_processed_content(content, filename='analysis.txt'):
	    """Save the processed content to a UTF-8 text file.

	    Args:
	        content: Text to write. None means there is nothing to save; an
	            empty string is still written (producing an empty file).
	        filename: Destination path; an existing file is overwritten.

	    Returns:
	        None. When content is None a notice is printed and no file is
	        created or modified.
	    """
	    if content is None:
	        print("No content to save.")
	        return

	    # Explicit encoding: the platform default depends on the locale, and
	    # non-ASCII characters in the text would raise UnicodeEncodeError on
	    # locales whose default codec cannot represent them.
	    with open(filename, 'w', encoding='utf-8') as f:
	        f.write(content)

	def run_crew():
	    """Run the crew and return the company recommendations as text.

	    Returns:
	        The contents of research_results/company_recommendations.md, the
	        output_file configured on the search_companies task. If that file
	        does not exist after the run, the value returned by crew.kickoff()
	        is returned as a string instead.
	    """
	    # Execute all crew tasks
	    result = crew.kickoff()

	    # Read and return the content of the output file
	    try:
	        with open('research_results/company_recommendations.md', 'r') as f:
	            return f.read()
	    except FileNotFoundError:
	        # NOTE(review): presumably the kickoff result carries the final
	        # task's output, i.e. the same recommendations - confirm against
	        # the installed crewai version. Either way this avoids crashing
	        # the app when the file was not written.
	        return str(result)

	# Initialize session state variables. Streamlit reruns this script on every
	# interaction, so results that must survive a rerun live in session_state.
	if 'pdf_processed' not in st.session_state:
	    st.session_state.pdf_processed = False
	if 'processed_content' not in st.session_state:
	    st.session_state.processed_content = None

	# Streamlit interface
	st.title("Climate Tech Company Finder")
	st.write("Upload a PDF to analyze climate strategy and find relevant companies.")

	# PDF Upload
	uploaded_pdf = st.file_uploader("Upload your climate strategy PDF", type=["pdf"])

	if uploaded_pdf is not None:
	    # Discard the stored analysis when a different file is uploaded.
	    # Otherwise pdf_processed stays True and the previous document's
	    # summary is shown (and used by the crew) for the new upload.
	    pdf_identity = (uploaded_pdf.name, uploaded_pdf.size)
	    if 'pdf_identity' not in st.session_state or st.session_state.pdf_identity != pdf_identity:
	        st.session_state.pdf_identity = pdf_identity
	        st.session_state.pdf_processed = False
	        st.session_state.processed_content = None

	    # Button to trigger PDF analysis. st.button is evaluated first so the
	    # button is always rendered; the stored flag keeps the results visible
	    # on later reruns where the button itself reads False.
	    if st.button("Run PDF Analysis") or st.session_state.pdf_processed:
	        if not st.session_state.pdf_processed:
	            with st.spinner("Processing PDF..."):
	                # Process PDF with Assistants API
	                st.session_state.processed_content = process_pdf_with_assistant(uploaded_pdf)

	            if st.session_state.processed_content:
	                # Save processed content to analysis.txt
	                # NOTE(review): analysis.txt is one shared path on disk, so
	                # concurrent sessions would overwrite each other - confirm
	                # whether the app is expected to serve several users.
	                save_processed_content(st.session_state.processed_content, 'analysis.txt')
	                st.session_state.pdf_processed = True
	                st.success("PDF processed successfully.")
	            else:
	                st.error("Failed to process the PDF. Please try again.")

	        if st.session_state.pdf_processed:
	            # Display the PDF analysis to the user
	            st.subheader("PDF Analysis")
	            st.text_area("Key Points Summary", st.session_state.processed_content, height=200)

	            # Only show the crew analysis button after PDF analysis is complete
	            if st.button("Run Crew Analysis"):
	                with st.spinner("Running crew analysis..."):
	                    result = run_crew()
	                st.subheader("Company Recommendations")
	                st.markdown(result)  # Use markdown to preserve formatting
	else:
	    st.info("Please upload a climate strategy PDF to begin.")