manuelsh · September 11, 2024 17:39 · manuelsh · Sep 11, 2024
diff --git a/get_github_stars.py b/get_github_stars.py
 import os
 import re

 import pandas as pd
 import requests

 # Load the whole README into memory so its tool entries can be parsed.
 file_path = 'README.md'

 # Decode explicitly as UTF-8: without `encoding`, open() falls back to the
 # platform locale and can fail or mis-decode non-ASCII text in the README.
 with open(file_path, 'r', encoding='utf-8') as file:
    file_content = file.read()

 # Extract tool entries from the README, keeping only those whose URL points to GitHub

 def _first_content_line(section, heading):
    """Return the first non-blank line that follows ``heading`` in ``section``.

    Returns ``None`` when no line equals ``heading`` (ignoring surrounding
    whitespace), or when another heading (a line starting with ``#``) or the
    end of the text is reached before any content.
    """
    remaining = iter(section.splitlines())
    for line in remaining:
        if line.strip() == heading:
            break
    else:
        return None

    # The same iterator continues right after the heading line.
    for line in remaining:
        text = line.strip()
        if not text:
            continue
        return None if text.startswith('#') else text
    return None


 def extract_tool_info_github_only(markdown_text):
    """Collect name, URL, category and description of GitHub-hosted tools.

    Tool entries are located by their ``## [Name](URL)`` heading. For each
    entry whose URL is on github.com, the first content line under
    ``### Category`` and under ``### Description`` is extracted. Blank lines
    after a heading are skipped, and a value on the very last line of a
    section (no trailing newline) is still found.

    Args:
        markdown_text: Markdown document to scan.

    Returns:
        A list of ``[name, url, category, description]`` lists in document
        order. ``category`` falls back to ``"N/A"`` and ``description`` to
        ``"No description available"`` when nothing could be extracted.
    """
    # With two capture groups, re.split yields
    # [preamble, name1, url1, body1, name2, url2, body2, ...].
    pieces = re.split(r'## \[(.*?)\]\((.*?)\)', markdown_text)

    tool_data = []
    for name, url, body in zip(pieces[1::3], pieces[2::3], pieces[3::3]):
        url = url.strip()

        # Check the host itself rather than a substring, so look-alike
        # domains such as "github.community" are not treated as GitHub.
        if not re.match(r'https?://(?:www\.)?github\.com(?:/|$)', url):
            continue

        category = _first_content_line(body, '### Category')
        description = _first_content_line(body, '### Description')

        tool_data.append([
            name.strip(),
            url,
            category or "N/A",
            description or "No description available",
        ])

    return tool_data



 # Parse the README text, keeping only the entries hosted on GitHub
 tools_info = extract_tool_info_github_only(file_content)

 # Tabulate the parsed rows, one column per extracted field
 df_tools = pd.DataFrame(
    data=tools_info,
    columns=['Name', 'GitHub URL', 'Category', 'Description'],
 )

 # Print a preview of the first rows
 print(df_tools.head())



 # Function to get the star count from GitHub API
 def get_repo_stars(owner, repo, token=None):
    """Return the star count of ``owner/repo`` from the GitHub REST API.

    Args:
        owner: Account or organisation that owns the repository.
        repo: Repository name.
        token: Optional GitHub access token. When omitted, the
            ``GITHUB_TOKEN`` environment variable is used if it is set, so
            callers that pass no token can still make authenticated calls
            (unauthenticated calls are tightly rate-limited by GitHub).

    Returns:
        The ``stargazers_count`` value from the response (0 if the field is
        missing), or ``None`` when the API answers with a non-200 status.

    Raises:
        requests.RequestException: On connection failure or timeout; left
            to the caller to handle.
    """
    url = f"https://api.github.com/repos/{owner}/{repo}"

    if token is None:
        token = os.environ.get('GITHUB_TOKEN')

    headers = {}
    if token:
        headers['Authorization'] = f'token {token}'

    # requests never times out by default; bound the wait so a single
    # stalled connection cannot hang the whole run.
    response = requests.get(url, headers=headers, timeout=10)

    if response.status_code != 200:
        print(f"Failed to retrieve data for {owner}/{repo}: {response.status_code}")
        return None

    return response.json().get('stargazers_count', 0)

 # Add a new column for the stars; rows that are skipped below keep None
 df_tools['Stars'] = None

 # Look up the star count of every row whose URL names a repository
 for index, github_url in df_tools['GitHub URL'].items():
    if pd.isna(github_url):
        continue

    # Keep only what follows the host, then drop any query string/fragment.
    _, host_found, repo_path = github_url.partition("github.com/")
    if not host_found:
        continue
    repo_path = repo_path.split('?', 1)[0].split('#', 1)[0]

    # The first two non-empty path segments are owner and repository. This
    # tolerates a trailing slash and deeper paths such as /tree/main/...,
    # which an exact "two segments" check would silently skip.
    path_parts = [part for part in repo_path.split('/') if part]
    if len(path_parts) < 2:
        # Organisation or profile page: there is no repository to query.
        continue
    owner, repo = path_parts[:2]
    if repo.endswith('.git'):
        repo = repo[:-len('.git')]

    try:
        stars = get_repo_stars(owner, repo)
    except Exception as e:
        # Best effort: report the failure and carry on with the next row.
        print(f"Error fetching stars for {github_url}: {e}")
        df_tools.at[index, 'Stars'] = 'Error'
    else:
        df_tools.at[index, 'Stars'] = stars

 # Write the table, including the 'Stars' column, to CSV without the index
 output_csv_path = "tools_info_with_stars.csv"
 df_tools.to_csv(path_or_buf=output_csv_path, index=False)

 print(f"Updated data saved to {output_csv_path}")


 # Coerce 'Stars' to numbers; values that cannot be parsed become NaN
 df_tools['Stars'] = pd.to_numeric(df_tools['Stars'], errors='coerce')

 # Order the rows from most to fewest stars and renumber them from zero
 df_tools_sorted = df_tools.sort_values(by='Stars', ascending=False)
 df_tools_sorted = df_tools_sorted.reset_index(drop=True)

 # Print the ranked table as markdown, with a fixed column order
 print(
    df_tools_sorted.loc[
        :, ['Name', 'Stars', 'GitHub URL', 'Description', 'Category']
    ].to_markdown(index=False)
 )
	import requests
	import pandas as pd

	# Load the whole README into memory so its tool entries can be parsed.
	file_path = 'README.md'

	# Decode explicitly as UTF-8: without `encoding`, open() falls back to the
	# platform locale and can fail or mis-decode non-ASCII text in the README.
	with open(file_path, 'r', encoding='utf-8') as file:
	    file_content = file.read()

	# Extract tool entries from the README, keeping only those whose URL points to GitHub

	def _first_content_line(section, heading):
	    """Return the first non-blank line that follows ``heading`` in ``section``.

	    Returns ``None`` when no line equals ``heading`` (ignoring surrounding
	    whitespace), or when another heading (a line starting with ``#``) or
	    the end of the text is reached before any content.
	    """
	    remaining = iter(section.splitlines())
	    for line in remaining:
	        if line.strip() == heading:
	            break
	    else:
	        return None

	    # The same iterator continues right after the heading line.
	    for line in remaining:
	        text = line.strip()
	        if not text:
	            continue
	        return None if text.startswith('#') else text
	    return None


	def extract_tool_info_github_only(markdown_text):
	    """Collect name, URL, category and description of GitHub-hosted tools.

	    Tool entries are located by their ``## [Name](URL)`` heading. For each
	    entry whose URL is on github.com, the first content line under
	    ``### Category`` and under ``### Description`` is extracted. Blank
	    lines after a heading are skipped, and a value on the very last line
	    of a section (no trailing newline) is still found.

	    Args:
	        markdown_text: Markdown document to scan.

	    Returns:
	        A list of ``[name, url, category, description]`` lists in document
	        order. ``category`` falls back to ``"N/A"`` and ``description`` to
	        ``"No description available"`` when nothing could be extracted.
	    """
	    # The groups must be lazy "(.*?)"; a bare "(.?)" would only match
	    # names and URLs of at most one character. With two capture groups,
	    # re.split yields [preamble, name1, url1, body1, name2, url2, ...].
	    pieces = re.split(r'## \[(.*?)\]\((.*?)\)', markdown_text)

	    tool_data = []
	    for name, url, body in zip(pieces[1::3], pieces[2::3], pieces[3::3]):
	        url = url.strip()

	        # Check the host itself rather than a substring, so look-alike
	        # domains such as "github.community" are not treated as GitHub.
	        if not re.match(r'https?://(?:www\.)?github\.com(?:/|$)', url):
	            continue

	        category = _first_content_line(body, '### Category')
	        description = _first_content_line(body, '### Description')

	        tool_data.append([
	            name.strip(),
	            url,
	            category or "N/A",
	            description or "No description available",
	        ])

	    return tool_data



	# Parse the README text, keeping only the entries hosted on GitHub
	tools_info = extract_tool_info_github_only(file_content)

	# Tabulate the parsed rows, one column per extracted field
	df_tools = pd.DataFrame(
	    data=tools_info,
	    columns=['Name', 'GitHub URL', 'Category', 'Description'],
	)

	# Print a preview of the first rows
	print(df_tools.head())



	# Function to get the star count from GitHub API
	def get_repo_stars(owner, repo, token=None):
	    """Return the star count of ``owner/repo`` from the GitHub REST API.

	    Args:
	        owner: Account or organisation that owns the repository.
	        repo: Repository name.
	        token: Optional GitHub access token. When omitted, the
	            ``GITHUB_TOKEN`` environment variable is used if it is set,
	            so callers that pass no token can still make authenticated
	            calls (unauthenticated calls are tightly rate-limited).

	    Returns:
	        The ``stargazers_count`` value from the response (0 if the field
	        is missing), or ``None`` when the API answers with a non-200
	        status.

	    Raises:
	        requests.RequestException: On connection failure or timeout; left
	            to the caller to handle.
	    """
	    url = f"https://api.github.com/repos/{owner}/{repo}"

	    if token is None:
	        token = os.environ.get('GITHUB_TOKEN')

	    headers = {}
	    if token:
	        headers['Authorization'] = f'token {token}'

	    # requests never times out by default; bound the wait so a single
	    # stalled connection cannot hang the whole run.
	    response = requests.get(url, headers=headers, timeout=10)

	    if response.status_code != 200:
	        print(f"Failed to retrieve data for {owner}/{repo}: {response.status_code}")
	        return None

	    return response.json().get('stargazers_count', 0)

	# Add a new column for the stars; rows that are skipped below keep None
	df_tools['Stars'] = None

	# Look up the star count of every row whose URL names a repository
	for index, github_url in df_tools['GitHub URL'].items():
	    if pd.isna(github_url):
	        continue

	    # Keep only what follows the host, then drop any query string/fragment.
	    _, host_found, repo_path = github_url.partition("github.com/")
	    if not host_found:
	        continue
	    repo_path = repo_path.split('?', 1)[0].split('#', 1)[0]

	    # The first two non-empty path segments are owner and repository. This
	    # tolerates a trailing slash and deeper paths such as /tree/main/...,
	    # which an exact "two segments" check would silently skip.
	    path_parts = [part for part in repo_path.split('/') if part]
	    if len(path_parts) < 2:
	        # Organisation or profile page: there is no repository to query.
	        continue
	    owner, repo = path_parts[:2]
	    if repo.endswith('.git'):
	        repo = repo[:-len('.git')]

	    try:
	        stars = get_repo_stars(owner, repo)
	    except Exception as e:
	        # Best effort: report the failure and carry on with the next row.
	        print(f"Error fetching stars for {github_url}: {e}")
	        df_tools.at[index, 'Stars'] = 'Error'
	    else:
	        df_tools.at[index, 'Stars'] = stars

	# Write the table, including the 'Stars' column, to CSV without the index
	output_csv_path = "tools_info_with_stars.csv"
	df_tools.to_csv(path_or_buf=output_csv_path, index=False)

	print(f"Updated data saved to {output_csv_path}")


	# Coerce 'Stars' to numbers; values that cannot be parsed become NaN
	df_tools['Stars'] = pd.to_numeric(df_tools['Stars'], errors='coerce')

	# Order the rows from most to fewest stars and renumber them from zero
	df_tools_sorted = df_tools.sort_values(by='Stars', ascending=False)
	df_tools_sorted = df_tools_sorted.reset_index(drop=True)

	# Print the ranked table as markdown, with a fixed column order
	print(
	    df_tools_sorted.loc[
	        :, ['Name', 'Stars', 'GitHub URL', 'Description', 'Category']
	    ].to_markdown(index=False)
	)
Name	Stars	GitHub URL	Description	Category
MetaGPT	43543	https://github.com/geekan/MetaGPT	MetaGPT is a multi-agent framework that, given one line requirement, returns PRD, Design, Tasks, or Repo.	Multi-agent, Coding, Build your own
AutoGen	30685	https://github.com/microsoft/autogen	- A framework for developing LLM (Large Language Model) applications with multiple conversational agents.	General purpose, Build your own, Multi-agent
GPT Pilot	29516	https://github.com/Pythagora-io/gpt-pilot	GPT Pilot is an AI agent that codes the entire app as you oversee the code being written	Coding
ChatDev	25040	https://github.com/OpenBMB/ChatDev	- ChatDev is a virtual software company driven by a multitude of intelligent agents assuming different roles such as CEO, CPO, CTO, programmer, reviewer, tester, and art designer, each represented by unique icons.	Coding, Multi-agent
JARVIS	23538	https://github.com/microsoft/JARVIS	JARVIS is a system to connect LLMs with the ML community.	General purpose
BabyAGI	19918	https://github.com/yoheinakajima/babyagi	- A pared-down version of the original Task-Driven Autonomous Agent	General purpose
Local GPT	19783	https://github.com/PromtEngineer/localGPT	LocalGPT is an open-source initiative that allows you to converse with your documents without compromising your privacy. Inspired by privateGPT, allows using your own documents as an information source	Research, Data analysis, General purpose
CrewAI	19049	https://github.com/joaomdmoura/crewai	- Cutting-edge framework for orchestrating role-playing, autonomous AI agents.	Build-your-own, SDK for agents, Multi-agent
Devika	18243	https://github.com/stitionai/devika	- Devika is an Agentic AI Software Engineer that can understand high-level human instructions, break them down into steps, research relevant information, and write code to achieve the given objective.	Coding, general purpose
Aider	17877	https://github.com/paul-gauthier/aider	- Aider is a command line tool that lets you pair program with GPT-3.5/GPT-4, to edit code stored in your local git repository	Coding, GitHub
GPT Researcher	13973	https://github.com/assafelovic/gpt-researcher	GPT Researcher is a GPT-based autonomous agent that does online comprehensive research on any given topic	Research, Science
MemGPT	11349	https://github.com/cpacker/MemGPT	- A system that intelligently manages different memory tiers in LLMs to effectively provide the extended context within the LLM's limited context window.	Memory management, Data analysis
GPT Migrate	6802	https://github.com/0xpayne/gpt-migrate	GOT Migrate easily migrates your codebase from one framework or language to another.	Coding
DevOpsGPT	6473	https://github.com/kuafuai/DevOpsGPT	Welcome to the AI Driven Software Development Automation Solution, abbreviated as DevOpsGPT. We combine LLM (Large Language Model) with DevOps tools to convert natural language requirements into working software. This innovative feature greatly improves development efficiency, shortens development cycles, and reduces communication costs, resulting in higher-quality software delivery.	Coding
CAMEL	5308	https://github.com/camel-ai/camel	- CAMEL is an open-source library designed for the study of autonomous and communicative agents.	General purpose
Agents	5157	https://github.com/aiwaves-cn/agents	- Long-short Term Memory: Language agents in the library are equipped with both long-term memory implemented via VectorDB + Semantic Search and short-term memory (working memory) maintained and updated by an LLM.	General purpose, Build your own, Multi-agent
AgentVerse	4028	https://github.com/OpenBMB/AgentVerse	- Assembles multiple agents to collaboratively accomplish tasks.	General purpose, Build your own, Multi-agent
Devon	3132	https://github.com/entropy-research/Devon	- Open-source alternative to Devin by Entropy research	Coding, general purpose
Mini AGI	2792	https://github.com/muellerberndt/mini-agi	- MiniAGI is a minimal general-purpose autonomous agent based on GPT-3.5 / GPT-4	General purpose
Mentat	2498	https://github.com/biobootloader/mentat	Mentat is the AI tool that assists you with any coding task, right from your command line.	Coding
Langroid	2277	https://github.com/langroid/langroid		General purpose, Build your own
dotagent	2180	https://github.com/dot-agent/dotagent	- An agent management system that facilitates the creation of robust AI applications and experimental autonomous agents through a rich suite of developer tools.	Build-your-own
GPT Discord	1805	https://github.com/Kav-K/GPTDiscord	- GPT Discord is a robust, all-in-one GPT interface for Discord.	Content creation, Productivity, General purpose, Discord
DevGPT	1741	https://github.com/jina-ai/dev-gpt	- "Tell your AI team what microservice you want to build, and they will do it for you. Your imagination is the limit!!	Coding, Multi-agent
DemoGPT	1672	https://github.com/melih-unsal/DemoGPT	- DemoGPT leverages the power of Language Models (LLMs) to provide fast and effective demo creation for applications.	Build-your-own, General purpose
AI Legion	1339	https://github.com/eumemic/ai-legion	- An LLM-powered autonomous agent platform	Multi-agent, Build-your-own
AutoPR	1233	https://github.com/irgolic/AutoPR	- Triggered by adding a label containing AutoPR to an issue, AutoPR will:	Coding, GitHub
CodeFuse-ChatBot	1123	https://github.com/codefuse-ai/codefuse-chatbot	- An intelligent assistant serving the entire software development lifecycle, powered by a Multi-Agent Framework, working with DevOps Toolkits, Code&Doc Repo RAG, etc.	Coding
IX	1005	https://github.com/kreneskyp/ix	IX is a platform for building, debugging, and deploying collaborative Agents and cognitive workflows.	Build your own, Multi-agent
LLM Agents	925	https://github.com/mpaepper/llm_agents	A minimalistic library for building agents that leverage large language models to automate tasks through a loop of commands and tool integrations.	Coding
Adala	911	https://github.com/HumanSignal/Adala		General purpose, Build your own, Multi-agent
AIlice	785	https://github.com/myshell-ai/AIlice	- "An Agent in the form of a chatbot independently plans tasks given in natural language and dynamically creates an agents calling tree to execute tasks.	General purpose, Personal assistant, Productivity
Automata	604	https://github.com/emrgnt-cmplxty/automata	- Model: GPT 4	Coding
ChemCrow	581	https://github.com/ur-whitelab/chemcrow-public	- ChemCrow is an open source package for the accurate solution of reasoning-intensive chemical tasks	Science, Chemistry
Multi GPT	547	https://github.com/rumpfmax/Multi-GPT	- An experimental open-source attempt to make GPT-4 fully autonomous	General purpose
AgentForge	494	https://github.com/DataBassGit/AgentForge	- A low-code framework designed for the swift creation, testing, and iteration of AI-powered autonomous agents and Cognitive Architectures, compatible with various LLM models.	General purpose, Build your own, Multi-agent
data-to-paper	438	https://github.com/Technion-Kishony-lab/data-to-paper	data-to-paper is a framework for systematically navigating the power of AI to perform complete end-to-end	Science, Research, Multi-agent
BambooAI	436	https://github.com/pgalko/BambooAI	- BambooAI runs in a loop (until user decides to end it).	Data analysis
BeeBot	392	https://github.com/AutoPackAI/beebot	- "BeeBot is currently a work in progress and should be treated as an early stage research project. Its focus is not on production usage at this time."	General purpose, Productivity
GeniA	364	https://github.com/genia-dev/GeniA	- GeniA is able to work along side you on your production enviroment, executing tasks on your behalf in your dev & cloud environments, AWS/k8s/Argo/GitHub etc.	Coding
GPT Runner	346	https://github.com/nicepkg/gpt-runner	- Conversation with your files which selected by you, no embedding, no vector database!	Research, Science
Multiagent Debate	330	https://github.com/composable-models/llm_multiagent_debate	Multiagent Debate is an implementation of the paper "Improving Factuality and Reasoning in Language Models through Multiagent Debate".	General purpose, Multi-agent
Autonomous HR Chatbot	327	https://github.com/stepanogil/autonomous-hr-chatbot	- A prototype enterprise application - an Autonomous HR Assistant powered by GPT-3.5.	HR, Business intelligence, Productivity
Lemon Agent	311	https://github.com/felixbrock/lemon-agent	Lemon agent is a Plan-Validate-Solve (PVS) Agent for accurate, reliable and reproducable workflow automation	Productivity, Coding
AgentPilot	295	https://github.com/jbexta/AgentPilot		General purpose
English Compiler	283	https://github.com/uilicious/english-compiler	- OC AI based Compiler, for converting english based markdown specs, into functional code	Coding
MemFree	282	https://github.com/memfreeme/memfree		Open Source, AI Search, Build your own
Agent4Rec	241	https://github.com/LehengTHU/Agent4Rec	- Agent4Rec is a recommender system simulator that utilizes 1,000 LLM-empowered generative agents.	General purpose, Build your own, Multi-agent
MutahunterAI	224	https://github.com/codeintegrity-ai/mutahunter	- Use Mutahunter to generate unit tests for your codebase, that specifically target the code vulnerabilities. By targeting the exact weaknesses in the code, we boost developer productivity.	Developer tools, Software security, Multi-agent, General purpose
bumpgen	92	https://github.com/xeol-io/bumpgen	- Put dependency management and upgrades on autopilot	Coding
Cody by ajhous44	50	https://github.com/ajhous44/cody	- An AI assistant designed to let you interactively query your codebase using natural language.	Coding
L2MAC	49	https://github.com/samholt/l2mac	L2MAC is a multi-agent generation framework that, a single input prompt can generate an extensive unbounded output, such as an entire codebase or an entire book.	Multi-agent, Coding, Build your own
NLSOM	41	https://github.com/mczhuge/NLSOM	- Natural Language-Based Societies of Mind - concept with societies and communities of agents	Science, Multimodal, Social, Multi-agent
Blinky	39	https://github.com/seahyinghang8/blinky	- Blinky is an open-source AI debugging agent for VSCode that uses LLMs to help identify and fix backend code errors (inspired by SWE-agent).	Coding, Debugging
BabyCommandAGI	34	https://github.com/saten-private/BabyCommandAGI	- gent designed to test what happens when you combine CLI and LLM, which are more traditional interfaces than GUI (created by @saten-private)	General purpose, Coding
BabyFoxAGI	nan	https://github.com/yoheinakajima/babyagi/tree/main/classic/babyfoxagi	- A mod of BabyElfAGI, in a series of mods w the naming of BabyAGI in alphabetical order	General purpose
Clippy	nan	https://github.com/ennucore/clippy/	- The purpose of Clippy is to elop code for or with the user.	Coding
Friday	nan	https://github.com/amirrezasalimi/friday/	- A developer assistant able to make whole nodejs project with unlimited prompts	Coding
Loop GPT	nan	https://github.com/farizrahman4u/loopgpt/tree/main	Loop GPT is a re-implementation of the popular Auto-GPT project as a proper python package, written with modularity and extensibility in mind	General purpose
OpenAgents	nan	https://github.com/xlang-ai/OpenAgents	OpenAgents is an Open Platform for Language Agents in the Wild, ChatGPT Plus Replica for Researchers, Developers, and General Users.	General purpose
OpenAGI	nan	https://github.com/agiresearch/OpenAGI	OpenAGI is an open-source AGI R&D platform that enables agents for both benchmark tasks and open-ended tasks	General purpose
OpenDevin	nan	https://github.com/OpenDevin/OpenDevin	- The OpenDevin project is born out of a desire to replicate, enhance, and innovate beyond the original Devin model.	Coding, general purpose
PromethAI	nan	https://github.com/topoteretes/PromethAI-Backend	- "Personalized AI assistant that decomposes problems, offers solutions, and lets you use Agent actions to automate your flows"	Productivity, General purpose
Smol developer	nan	https://github.com/smol-ai/developer	Smol is your own junior developer. Deployed in few seconds via e2b	Coding
Stackwise	nan	https://github.com/stackwiseai/stackwise	Stackwise is a VS Code extension that writes and imports nodejs functions so that you can write code without context switching	Tool for agents, Coding
Suspicion Agent	nan	https://github.com/CR-Gjx/Suspicion-Agent	- Playing Imperfect Information Games with Theory of Mind Aware GPT-4	General purpose
SWE Agent	nan	https://github.com/princeton-nlp/SWE-agent	- This Devin alternative scores 12.3% on the FULL swe benchmark	Coding, general purpose
Taxy AI	nan	https://github.com/TaxyAI/browser-extension	- Taxy uses GPT-4 to control your browser and perform repetitive actions on your behalf	General purpose, Productivity
Teenage AGI	nan	https://github.com/seanpixel/Teenage-AGI/blob/main/README.md#experiments	A BabyAGI-inspired agent that can recall infinite memory, "thinks" before making action, and doesn't lose memory after being shutting down	General purpose
UFO	nan	https://github.com/microsoft/UFO	- Agent by Microsoft	Multi-agent, GUI Agent
WorkGPT	nan	https://github.com/team-openpm/workgpt	- WorkGPT is an agent framework in a similar fashion to AutoGPT or LangChain. You give it a directive and an array of APIs and it will converse back and forth with the AI until its directive is complete.	Coding
XAgent	nan	https://github.com/OpenBMB/XAgent	XAgent is an open-source experimental Large Language Model (LLM) driven autonomous agent that can automatically solve various tasks	General purpose, Coding
yAgents	nan	https://github.com/yeagerai/yeagerai-agent	yAgents is an Agent-Builder Agent made by Yeager.ai capable of designing, coding and debugging its own tools.	Coding, Build-your-own
Yourgoal	nan	https://github.com/pj4533/yourgoal/?utm_source=awesome-ai-agents	- "This is a Swift port of BabyAGI, an example of an AI-powered task management system that uses OpenAI and Pinecone APIs to create, prioritize, and execute tasks. The main idea behind this system is that it creates tasks based on the result of previous tasks and a predefined objective."	General purpose
Artisian AI	nan	https://github.com/Artisan-AI	- YC company	Multi-agent, Build-your-own
GitHub Copilot X	nan	https://github.com/features/preview/copilot-x	- AI pair programmer	Coding, GitHub
Instrukt	nan	https://github.com/blob42/Instrukt	- Enables users to create and instruct modular AI agents, generate document indexes for question-answering, and attach tools to agents for enhanced functionalities.	Coding, Build-your-own