dromerosm committed
Commit ce281ba (parent: c85a52f)

Update app.py

Files changed (1)
  1. app.py +43 -47
app.py CHANGED
@@ -9,6 +9,17 @@ from langchain_cohere import ChatCohere
 from langchain_community.tools import DuckDuckGoSearchRun, DuckDuckGoSearchResults
 from crewai_tools import tool, SeleniumScrapingTool, ScrapeWebsiteTool
 
+# Ensure essential environment variables are set
+cohere_api_key = os.getenv('COHERE_API_KEY')
+if not cohere_api_key:
+    raise EnvironmentError("COHERE_API_KEY is not set in environment variables")
+groq_api_key = os.getenv("GROQ_API_KEY")
+if not groq_api_key:
+    raise EnvironmentError("GROQ_API_KEY is not set in environment variables")
+
+# Initialize API clients
+co = cohere.Client(cohere_api_key)
+
 # Define the DuckDuckGoSearch tool using the decorator for tool registration
 # @tool('DuckDuckGoSearch')
 # def search(search_query: str):
@@ -17,7 +28,7 @@ from crewai_tools import tool, SeleniumScrapingTool, ScrapeWebsiteTool
 
 # Define the DuckDuckGoSearch tool
 @tool('DuckDuckGoResults')
-def search_results(search_query: str):
+def search_results(search_query: str) -> dict:
     """
     Performs a web search using the DuckDuckGo search engine to gather and return a collection of search results.
     This tool automates the retrieval of web-based information related to a specified query.
@@ -33,14 +44,10 @@ def search_results(search_query: str):
     - Output: [snippet: The telecommunications and media industry is at the forefront of integrating generative AI into their operations, viewing it as a catalyst for growth and innovation. Industry leaders are enthusiastic about its ability to not only enhance the current processes but also spearhead new innovations, create new opportunities, unlock new sources of ..., title: Generative AI in the telecom industry | Google Cloud Blog, link: https://cloud.google.com/blog/topics/telecommunications/generative-ai-in-the-telecom-industry], ...]
 
     """
-    return DuckDuckGoSearchResults().run(search_query)
-
-# Retrieve the Cohere API key from environment variables
-cohere_api_key = os.getenv('COHERE_API_KEY')
-co = cohere.Client(cohere_api_key)
+    return DuckDuckGoSearchResults(max_results=3).run(search_query)
 
 @tool('WebScrapper')
-def web_scrapper(url: str, topic: str):
+def web_scrapper(url: str, topic: str) -> str:
     """
     A tool designed to extract and read the content of a specified link and generate a summary on a specific topic.
     It is capable of handling various types of web pages by making HTTP requests and parsing the received HTML content.
@@ -52,7 +59,7 @@ def web_scrapper(url: str, topic: str):
     - topic (str): The specific topic on which to generate a summary.
 
     Returns:
-    - text: summary of the url on the topic
+    - summary (str): summary of the url on the topic
     """
     # Scrape content from the specified URL
     scraper = ScrapeWebsiteTool(website_url=url)
@@ -66,6 +73,7 @@ def web_scrapper(url: str, topic: str):
         model='command-r-plus',
         message=prompt,
         temperature=0.2,
+        max_tokens=300,
         chat_history=[],
         prompt_truncation='AUTO'
     )
@@ -93,35 +101,28 @@ def kickoff_crew(topic: str) -> dict:
     # Define Agents with Groq LLM
     researcher = Agent(
         role='Researcher',
-        goal='Collect detailed information on {topic}',
+        goal='Collect detailed information on topic ## {topic} ##',
         tools=[search_results, web_scrapper],
-        llm=selected_llm, # Assigning the Groq LLM here
+        llm=selected_llm, # Assigning the Groq LLM here
         backstory=(
-            "As a diligent researcher, you explore the depths of the internet to "
-            "unearth crucial information and insights on the assigned topics. "
-            "With a keen eye for detail and a commitment to accuracy, you meticulously document every source "
-            "and piece of data gathered. Your research is thorough, ensuring that no stone is left unturned. "
-            "This dedication not only enhances the quality of the information but also ensures "
-            "reliability and trustworthiness in your findings."
-            "To achieve your objectives, think carefully about the {topic}, develop strategies to expand "
-            "and follows a step-by-step strategy to build conclusions."
+            "You are a meticulous researcher, skilled at navigating vast amounts of information to extract essential insights on any given topic. "
+            "Your dedication to detail ensures the reliability and thoroughness of your findings. "
+            "With a strategic approach, you carefully analyze and document data, aiming to provide accurate and trustworthy results."
         ),
         allow_delegation=False,
         max_iter=5,
         verbose=True, # Optional
     )
+
 
     editor = Agent(
         role='Editor',
-        goal='Compile and refine the information into a comprehensive report on {topic}',
-        llm=selected_llm, # Assigning the Groq LLM here
+        goal='Compile and refine the information into a comprehensive report on topic ## {topic} ##',
+        llm=selected_llm, # Assigning the Groq LLM here
         backstory=(
-            "With a keen eye for detail and a strong command of language, you transform "
-            "raw data into polished, insightful reports that are both informative and engaging. "
-            "Your expertise in editing ensures that every report is not only thorough but also "
-            "clearly communicates the key findings in a manner that is accessible to all readers. "
-            "As an editor, your role is crucial in shaping the final presentation of data, making "
-            "complex information easy to understand and appealing to the audience."
+            "As an expert editor, you specialize in transforming raw data into clear, engaging reports. "
+            "Your strong command of language and attention to detail ensure that each report not only conveys essential insights "
+            "but is also easily understandable and appealing to diverse audiences. "
         ),
         allow_delegation=False,
         max_iter=3,
@@ -131,39 +132,34 @@ def kickoff_crew(topic: str) -> dict:
     # Define Tasks
     research_task = Task(
         description=(
-            "First, use DuckDuckGoResults tool to gather snippets from search results about ## {topic} ##. "
-            "If you need to expand the search on the ## {topic} ##, generate new search queries. "
-            "Then, use the WebScrapper tool to extract additional information and insights from all links or URLs that appear significant regarding {topic} after analyzing the snippets of the search results. "
-            "Compile your findings into an initial draft, ensuring to include all sources with their titles and links relevant to the topic. "
-            "Throughout this process, maintain a high standard of accuracy and ensure that no information is fabricated or misrepresented."
+            "Use the DuckDuckGoResults tool to collect initial search snippets on ##{topic}##. "
+            "If more detailed searches are required, generate and execute new queries related to ##{topic}##. "
+            "Subsequently, employ the WebScrapper tool to delve deeper into significant URLs identified from the snippets, extracting further information and insights. "
+            "Compile these findings into a preliminary draft, documenting all relevant sources, titles, and links associated with the topic. "
+            "Ensure high accuracy throughout the process and avoid any fabrication or misrepresentation of information."
         ),
         expected_output=(
-            "A draft report containing all relevant information about the topic and sources used. "
-            "The report should be well-structured, including an introduction, a detailed body with organized sections according to different aspects of the topic, and a conclusion. "
-            "Each section should cite sources accurately and provide a comprehensive overview of the findings."
+            "A structured draft report about the topic, featuring an introduction, a detailed main body organized by different aspects of the topic, and a conclusion. "
+            "Each section should properly cite sources, providing a thorough overview of the information gathered."
        ),
        agent=researcher
    )
+
 
    edit_task = Task(
        description=(
-            "Review and refine the draft report produced by the research task. Organize the content methodically, "
-            "ensuring that the structure is logical and enhances the flow of information. Check all factual data for accuracy, "
-            "correct any discrepancies, and ensure that the information is current and well-supported by sources. "
-            "Enhance the readability of the report by improving language clarity, adjusting sentence structure, and ensuring consistency in tone. "
-            "Include a dedicated section that lists all sources used in the research_task. "
-            "Each source used in the analysis should be presented as a bullet point in the follwint format: "
-            "- title: link "
-            "Ensure that all sources you include in the final report exist by scrapping them if necessary. "
-            "This section should be comprehensive, clearly formatted, and easy to navigate, providing full transparency on the references used."
+            "Review and refine the initial draft report from the research task. Organize the content logically to enhance information flow. "
+            "Verify the accuracy of all data, correct discrepancies, and update information to ensure it reflects current knowledge and is well-supported by sources. "
+            "Improve the report’s readability by enhancing language clarity, adjusting sentence structures, and maintaining a consistent tone. "
+            "Include a section listing all sources used, formatted as bullet points like so: '- title: link'."
        ),
        expected_output=(
-            "A finalized comprehensive report on ## {topic} ##. The report should be polished, with a clear and engaging narrative "
-            "that accurately reflects the research findings. It should include an introduction, a detailed and extensive discussion section, a concise conclusion, "
-            "and a well-organized source list. The document should be free of grammatical errors and ready for publication or presentation."
+            "A polished, comprehensive report on topic ## {topic} ##, with a clear, professional narrative that accurately reflects the research findings. "
+            "The report should include an introduction, an extensive discussion section, a concise conclusion, and a well-organized source list. "
+            "Ensure the document is grammatically correct and ready for publication or presentation."
        ),
        agent=editor,
-        context=[research_task]
+        # context=[research_task]
    )
 
    # Forming the Crew
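
For reference, the fail-fast environment checks added at the top of app.py follow a pattern that can be factored into a small helper. The sketch below is illustrative only: the require_env helper is not part of this commit, but it reproduces the same behaviour for the two keys the app now requires.

import os

def require_env(name: str) -> str:
    """Return the value of a required environment variable, failing fast if it is missing."""
    value = os.getenv(name)
    if not value:
        # Same error type and message style as the checks added in this commit
        raise EnvironmentError(f"{name} is not set in environment variables")
    return value

# The two keys app.py now validates on startup
cohere_api_key = require_env("COHERE_API_KEY")
groq_api_key = require_env("GROQ_API_KEY")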