|
| 1 | +from dataclasses import asdict |
| 2 | +from typing import Generator |
| 3 | +from time import sleep |
| 4 | + |
| 5 | +import requests |
| 6 | + |
| 7 | +from src.constants import TIMEDELTA |
| 8 | +from src.repo_dataclasses import PullRequestData |
| 9 | +from src.interface_wrapper import IRepositoryAPI, Repository |
| 10 | +from src.utils import logger |
| 11 | + |
| 12 | + |
| 13 | +# -----------GraphQLAPI block-------------- |
| 14 | + |
def _get_nested(node, *keys):
    """Follow ``keys`` through nested dicts, returning None at the first empty level."""
    current = node
    for key in keys:
        if not current:
            return None
        current = current.get(key)
    return current


def log_repositories_pr_by_graphql(
    owner,
    repo_name,
    token,
    csv_name,
    first_n=100,
    max_retries=None,
    request_timeout=30,
):
    """Fetch every pull request of one repository via GitHub GraphQL and log it.

    Pages through ``repository.pullRequests`` (all states, newest first),
    converts each node to a ``PullRequestData`` and writes it with
    ``logger.log_to_csv`` and ``logger.log_to_stdout``.

    Args:
        owner: Login of the repository owner.
        repo_name: Repository name (without the owner part).
        token: Token sent as ``Authorization: Bearer <token>``.
        csv_name: Target passed through to ``logger.log_to_csv``.
        first_n: Page size requested per GraphQL call.
        max_retries: Maximum number of consecutive failed attempts for one
            page before giving up on this repository. ``None`` (default)
            retries indefinitely.
        request_timeout: Timeout in seconds for each HTTP request, so a
            stalled connection is retried instead of hanging forever.
    """
    headers = {"Authorization": f"Bearer {token}", "Content-Type": "application/json"}

    query = """
    query GetPRData($owner: String!, $repo: String!, $first: Int!, $after: String) {
      repository(owner: $owner, name: $repo) {
        nameWithOwner
        pullRequests(first: $first, after: $after, states: [OPEN, CLOSED, MERGED], orderBy: {field: CREATED_AT, direction: DESC}) {
          totalCount
          pageInfo {
            hasNextPage
            endCursor
          }
          nodes {
            title
            number
            state
            createdAt

            author {
              login
              ... on User {
                name
                email
              }
            }

            baseRef {
              name
              target {
                oid
              }
            }

            headRef {
              name
              target {
                oid
              }
            }

            changedFiles
            additions
            deletions

            mergedAt
            mergedBy {
              login
              ... on User {
                name
                email
              }
            }

            assignees(first: 10) {
              nodes {
                login
                name
              }
            }

            labels(first: 20) {
              nodes {
                name
                color
              }
            }
          }
        }
      }
    }
    """

    retry_delay = 100 * TIMEDELTA
    has_next_page = True
    after_cursor = None
    processed_count = 0
    failed_attempts = 0

    while has_next_page:
        variables = {
            "owner": owner,
            "repo": repo_name,
            "first": first_n,
            "after": after_cursor,
        }

        # graphql_data stays None on any failure so that every failure kind
        # (transport, HTTP status, bad JSON, GraphQL errors) shares one retry path.
        graphql_data = None
        try:
            response = requests.post(
                "https://api.github.com/graphql",
                headers=headers,
                json={"query": query, "variables": variables},
                timeout=request_timeout,
            )
        except requests.RequestException as exc:
            logger.log_error(f"GraphQL request failed: {exc}")
        else:
            if response.status_code != 200:
                logger.log_error(
                    f"GraphQL request failed: {response.status_code} - {response.text}"
                )
            else:
                try:
                    payload = response.json()
                except ValueError as exc:
                    logger.log_error(f"GraphQL response is not valid JSON: {exc}")
                else:
                    if "errors" in payload:
                        logger.log_error(f"GraphQL errors: {payload['errors']}")
                    else:
                        graphql_data = payload

        if graphql_data is None:
            failed_attempts += 1
            if max_retries is not None and failed_attempts > max_retries:
                logger.log_error(
                    f"Giving up on {owner}/{repo_name} after {max_retries} retries"
                )
                return
            logger.log_to_stdout(f"Sleep to {retry_delay} and retry")
            sleep(retry_delay)
            continue

        # The page was fetched successfully; the retry budget applies per page.
        failed_attempts = 0

        repo_data = _get_nested(graphql_data, "data", "repository")
        if not repo_data:
            logger.log_error(f"Repository {owner}/{repo_name} is missing in GraphQL response")
            return

        pull_requests = repo_data["pullRequests"]
        page_info = pull_requests["pageInfo"]
        has_next_page = page_info["hasNextPage"]
        after_cursor = page_info["endCursor"]

        prs = pull_requests["nodes"] or []
        processed_count += len(prs)

        # Bound to a local so the f-string does not nest same-type quotes,
        # which is a syntax error on Python versions before 3.12.
        total_count = pull_requests["totalCount"]
        logger.log_to_stdout(f"Processing {processed_count} / {total_count}")

        for pr in prs:
            # labels (or its nodes) may come back as null; treat that as "no labels".
            label_nodes = _get_nested(pr, "labels", "nodes") or []

            pr_data = PullRequestData(
                repository_name=repo_data["nameWithOwner"],
                title=pr["title"],
                id=pr["number"],
                state=str(pr["state"]).lower(),
                commit_into=_get_nested(pr, "baseRef", "target", "oid"),
                commit_from=_get_nested(pr, "headRef", "target", "oid"),
                created_at=pr["createdAt"],
                # name/email are only selected for User actors, so they can be absent.
                creator_name=_get_nested(pr, "author", "name"),
                creator_login=_get_nested(pr, "author", "login"),
                creator_email=_get_nested(pr, "author", "email"),
                changed_files=pr["changedFiles"],
                comment_body=None,
                comment_created_at=None,
                comment_author_name=None,
                comment_author_login=None,
                comment_author_email=None,
                merger_name=_get_nested(pr, "mergedBy", "name"),
                merger_login=_get_nested(pr, "mergedBy", "login"),
                merger_email=_get_nested(pr, "mergedBy", "email"),
                source_branch=_get_nested(pr, "headRef", "name"),
                target_branch=_get_nested(pr, "baseRef", "name"),
                assignee_story=None,
                related_issues=None,
                labels=", ".join(label["name"] for label in label_nodes if label),
                milestone=None,
            )

            pr_info = asdict(pr_data)
            logger.log_to_csv(csv_name, list(pr_info.keys()), pr_info)
            logger.log_to_stdout(pr_info)
| 188 | + |
| 189 | + |
def log_pull_requests_by_graphql(
    binded_repos: Generator[tuple[IRepositoryAPI, Repository, str], None, None],
    csv_name: str,
):
    """Write the CSV header, then log the pull requests of every bound repository.

    Args:
        binded_repos: Yields ``(api, repository, token)`` triples; only the
            repository and the token are used here.
        csv_name: Target passed through to ``logger.log_to_csv``.
    """
    # The header row is the field names of a default-constructed PullRequestData.
    header_fields = list(asdict(PullRequestData()))
    logger.log_to_csv(csv_name, header_fields)

    for _api, repository, access_token in binded_repos:
        logger.log_title(repository.name)
        log_repositories_pr_by_graphql(
            owner=repository.owner.login,
            repo_name=repository.name,
            token=access_token,
            csv_name=csv_name,
        )
        # Pause between repositories before issuing the next batch of requests.
        sleep(100 * TIMEDELTA)
0 commit comments