Spaces:
Running
Running
import requests | |
import csv | |
# Set the GitHub repository and the API endpoint | |
repo_url = "https://api.github.com/repos/pytorch/pytorch" | |
issues_endpoint = f"{repo_url}/issues" | |
# Initialize an empty list to store all issues | |
all_issues = [] | |
page = 1 | |
while True: | |
# Set the parameters for the API request | |
params = { | |
'state': 'open', # Change to 'closed' for closed issues | |
'per_page': 100, # Number of issues per page (adjust as needed) | |
'page': page | |
} | |
# Send the GET request to fetch issues | |
response = requests.get(issues_endpoint, params=params) | |
# Check if the request was successful (status code 200) | |
if response.status_code == 200: | |
issues = response.json() | |
if not issues: | |
break # No more issues to fetch | |
all_issues.extend(issues) | |
page += 1 | |
else: | |
print(f"Failed to retrieve issues. Status code: {response.status_code}") | |
break | |
# Open a CSV file for writing | |
with open('torch_github_issues.csv', mode='w', newline='') as csv_file: | |
fieldnames = ['Serial Number', 'Issue Number', 'Title', 'Labels', 'Body','Comments'] | |
writer = csv.DictWriter(csv_file, fieldnames=fieldnames) | |
# Write the header row | |
writer.writeheader() | |
# Write the issues data to the CSV file | |
for serial, issue in enumerate(all_issues, start=1): | |
writer.writerow({ | |
'Serial Number': serial, | |
'Issue Number': issue['number'], | |
'Title': issue['title'], | |
'Labels': ', '.join(label['name'] for label in issue['labels']), | |
'Body': issue['body'], | |
'Comments': issue['comments'] | |
}) | |
print(f"Data written to github_issues.csv") | |