parent 9e2fda0a62
commit 4480ead6aa
@@ -0,0 +1,66 @@
"""
Paper Swarm

1. Scrape https://huggingface.co/papers for all papers by searching the page for every link containing /papers/, then follow each link, grab the header and the abstract,
   along with the various links, and add them to a txt file for each paper on https://huggingface.co/papers.

2. Feed prompts iteratively into Anthropic for summarization plus a value score on impact, reliability, novelty, and other paper-ranking mechanisms
   (a rough sketch of this step appears at the end of this file).

3. Store papers in a database with metadata so agents can use retrieval
   (a rough sketch of this step appears at the end of this file).

4. Discord Bot // Twitter Bot
"""

import requests
from bs4 import BeautifulSoup
import os
from urllib.parse import urljoin


class Paper:
    """Container for one scraped paper and its metadata."""

    def __init__(self, title, date, authors, abstract):
        self.title = title
        self.date = date
        self.authors = authors
        self.abstract = abstract


class Scraper:
    """Scrapes paper links and paper details from https://huggingface.co/papers."""

    def __init__(self, url):
        self.url = url

    def get_paper_links(self):
        # Collect every link on the index page that points at a /papers/ URL.
        response = requests.get(self.url)
        soup = BeautifulSoup(response.text, 'html.parser')
        links = [a['href'] for a in soup.find_all('a', href=True) if '/papers/' in a['href']]
        return links

    def get_paper_details(self, link):
        # The hrefs scraped above are absolute paths such as "/papers/<id>", so join
        # them against the site root; naive concatenation with self.url produces
        # /papers/papers/<id> and a 404 page (see the sample output file below).
        response = requests.get(urljoin(self.url, link))
        soup = BeautifulSoup(response.text, 'html.parser')
        title = soup.find('h1').text.strip()
        date_tag = soup.find('time')
        date = date_tag.text if date_tag else 'Unknown'
        authors = [author.text for author in soup.find_all('span', class_='author')]
        abstract_tag = soup.find('div', class_='abstract')
        abstract = abstract_tag.text if abstract_tag else 'Abstract not found'
        return Paper(title, date, authors, abstract)


class FileWriter:
    """Writes one txt file per paper into the target directory."""

    def __init__(self, directory):
        self.directory = directory
        os.makedirs(self.directory, exist_ok=True)  # make sure the target directory exists

    def write_paper(self, paper):
        # Note: titles containing path separators will still produce a bad path here.
        with open(os.path.join(self.directory, paper.title + '.txt'), 'w') as f:
            f.write(f"h1: {paper.title}\n")
            f.write(f"Published on {paper.date}\n")
            f.write("Authors:\n")
            for author in paper.authors:
                f.write(f"{author}\n")
            f.write("Abstract\n")
            f.write(paper.abstract)


scraper = Scraper('https://huggingface.co/papers')
file_writer = FileWriter('images')

links = scraper.get_paper_links()
for link in links:
    paper = scraper.get_paper_details(link)
    file_writer.write_paper(paper)
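

# Step 2 from the module docstring is not implemented in this commit. Below is a
# minimal sketch of what the Anthropic summarization / scoring pass could look
# like, assuming the `anthropic` SDK is installed and ANTHROPIC_API_KEY is set;
# the model name and the scoring prompt are placeholders, not the author's choices.
def summarize_and_score(paper):
    import anthropic  # optional dependency, imported lazily for this sketch

    client = anthropic.Anthropic()  # reads ANTHROPIC_API_KEY from the environment
    prompt = (
        "Summarize the following paper and rate it from 1-10 on impact, "
        "reliability, and novelty.\n\n"
        f"Title: {paper.title}\n\nAbstract: {paper.abstract}"
    )
    message = client.messages.create(
        model="claude-3-haiku-20240307",  # placeholder model name
        max_tokens=512,
        messages=[{"role": "user", "content": prompt}],
    )
    return message.content[0].text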
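

# Step 3 from the module docstring is likewise not implemented here. A minimal
# sketch of storing papers with their metadata in a local SQLite database for
# later retrieval; the database path, table name, and schema are assumptions.
def store_paper(db_path, paper):
    import sqlite3  # stdlib, imported here to keep the sketch self-contained

    # Create the table on first use, then upsert the paper keyed by title.
    conn = sqlite3.connect(db_path)
    conn.execute(
        "CREATE TABLE IF NOT EXISTS papers ("
        "title TEXT PRIMARY KEY, date TEXT, authors TEXT, abstract TEXT)"
    )
    conn.execute(
        "INSERT OR REPLACE INTO papers (title, date, authors, abstract) "
        "VALUES (?, ?, ?, ?)",
        (paper.title, paper.date, ", ".join(paper.authors), paper.abstract),
    )
    conn.commit()
    conn.close()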
@@ -0,0 +1,5 @@
h1: 404
Published on Unknown
Authors:
Abstract
Abstract not found
@@ -1,2 +0,0 @@
# Agents
* Agents are the fundamental building blocks of a swarm, they are indivi