-
Notifications
You must be signed in to change notification settings - Fork 13
/
Copy pathget-prs
executable file
·152 lines (135 loc) · 5.83 KB
/
get-prs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
#!/usr/bin/env python3
#
# Copyright 2021 Proofcraft Pty Ltd
# Copyright 2022 Axel Heider ([email protected])
#
# SPDX-License-Identifier: BSD-2-Clause
#
#
# Parse a PR description body for comments of the form
# "[T|t]est with[:]? <ref> ((, | and) <ref>)*"
# where
# <ref> = "<org>/<repo>#<id>" | "https://github.com/<org>/<repo>/pull/<id>"
#
# For URLs in comments, the Github GUI displays URLs pointing to PRs on Github
# as "<org>/<repo>#<id>", even if "https://github.com/<org>/<repo>/pull/<id>" is
# what the parser finds. For convenience, we support both forms.
#
# Expects a GitHub event file to be available for the PR number.
#
# Outputs space separated list of "org/repo#id"
# Outputs empty string if no such references.
#
# Fails if not a PR.
import json
import os
import re
import sys
from github import Github
# Using "(?:...)" makes a regex a non-capturing group, which is an atomic
# expression that operators can be applied to safely.
def regex_atom(regex):
return f"(?:{regex})"
test_start_re = regex_atom("[Tt]est with:?")
org_re = regex_atom("[a-zA-Z0-9_-]+")
repo_re = regex_atom("[a-zA-Z0-9_-]+")
pr_id_re = regex_atom("[0-9]+")
# Any match of "pr_ref" will yield a 3-tupel, where either the first element or
# the last two elements ("org_re/repo_re" and "pr_id_re") are not empty. That
# nicely allows determining what PR reference form we have found.
pr_ref_short_re = regex_atom(f"({org_re}/{repo_re}#{pr_id_re})")
pr_ref_url_re = regex_atom(f"https://github.com/({org_re}/{repo_re})/pull/({pr_id_re})")
pr_ref_re = regex_atom(f"{pr_ref_short_re}|{pr_ref_url_re}")
# For the reference list, multiple commas or spaces work ("<ref>, ,, <ref>"),
# it's practically support of empty items. The Oxford comma ("<ref>, and <ref>")
# is also supported.
ref_sep_re = regex_atom("[, ]+(?:and)?[ ]*")
pr_list_next_item_re = regex_atom(f"{ref_sep_re}{pr_ref_re}")
pr_list_re = regex_atom(f"{pr_ref_re}{pr_list_next_item_re}*")
# Finally, the complete regex can be build. In Python the number of groups that
# match an expression is fixed. For repeating matches like in the list, only the
# last match is returned for each group. To work around this, a matching group
# for the whole reference list is used and then decomposed in a second step.
test_with_prs_cre = re.compile(f"{test_start_re}[ ]+({pr_list_re})")
pr_ref_cre = re.compile(pr_ref_re)
def find_pr_to_test_with(text):
prs = []
if text is not None:
for line in text.splitlines():
m = test_with_prs_cre.match(line)
if m:
for t in pr_ref_cre.findall(m.group(0)):
prs.append(t[0] if t[0] else f"{t[1]}#{t[2]}")
return prs
def unit_test():
a = find_pr_to_test_with(
"This is a test\n" \
"-- Good case tests for basic things:\n" \
"Test with: org101/repo101#101\n" \
"test with https://github.com/org102/repo102/pull/102\n" \
"Test with: \n" \
"-- Good case tests for lists:\n" \
"Test with: org103/repo103#103 and org104/repo104#104," \
"https://github.com/org105/repo105/pull/105, and org106/repo106#106\n" \
"-- Trailing list separators are accepted:\n" \
"Test with: https://github.com/org107/repo107/pull/107,\n" \
"Test with: org108/repo108#108 and \n" \
"-- Space separators are accepted:\n" \
"Test with: org109/repo109#109 org110/repo110#110\n" \
"-- Multiple commas are supported:\n" \
"Test with: org111/repo111#111,, , , and org112/repo112#112\n" \
"-- Lines with trailing data are accepted, references there are ignored\n" \
"Test with: org113/repo113#113 android org901/repo901#901\n"\
"-- A proper separator is required, otherwise it's considered a comment\n" \
"-- This can become quite odd\n" \
"Test with: org114/repo114#114org902/repo902#902\n" \
"Test with: org115/repo115#115 org116/repo116#116org903/repo903#903\n" \
"Test with: org117/repo117#117andorg904/repo904#904\n" \
"Test with: org118/repo118#118gliberishorg905/repo905#905\n" \
"-- Leading space makes the parser ignore things:\n" \
" Test with: https://github.com/org906/repo906/pull/906\n" \
"*** TEST END ***"
)
print("matches:", a)
assert a[0] == "org101/repo101#101"
assert a[1] == "org102/repo102#102"
assert a[2] == "org103/repo103#103"
assert a[3] == "org104/repo104#104"
assert a[4] == "org105/repo105#105"
assert a[5] == "org106/repo106#106"
assert a[6] == "org107/repo107#107"
assert a[7] == "org108/repo108#108"
assert a[8] == "org109/repo109#109"
assert a[9] == "org110/repo110#110"
assert a[10] == "org111/repo111#111"
assert a[11] == "org112/repo112#112"
assert a[12] == "org113/repo113#113"
assert a[13] == "org114/repo114#114"
assert a[14] == "org115/repo115#115"
assert a[15] == "org116/repo116#116"
assert a[16] == "org117/repo117#117"
assert a[17] == "org118/repo118#118"
assert len(a) == 18
def main():
if os.environ['GITHUB_EVENT_NAME'] != 'pull_request' and \
os.environ['GITHUB_EVENT_NAME'] != 'pull_request_target':
print('Not a pull request')
sys.exit(1)
with open(os.environ['GITHUB_EVENT_PATH']) as f:
event = json.load(f)
issue_id = int(event['number'])
# optional auth token
token = os.environ.get('INPUT_TOKEN')
# if INPUT_TOKEN is set, but the empty string, use None instead
if not token:
token = None
# get body dynamically so we don't miss updates on test re-run:
gh = Github(login_or_token=token)
repo = gh.get_repo(os.environ['GITHUB_REPOSITORY'])
issue = repo.get_issue(number=issue_id)
# parse the issue body
prs = find_pr_to_test_with(issue.body)
print(" ".join(prs))
if __name__ == '__main__':
#unit_test()
main()