# Copyright (C) 2020-2023 Free Software Foundation, Inc.
#
# This file is part of GCC.
#
# GCC is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 3, or (at your option)
# any later version.
#
# GCC is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with GCC; see the file COPYING. If not, write to
# the Free Software Foundation, 51 Franklin Street, Fifth Floor,
# Boston, MA 02110-1301, USA.

# This script parses a .diff file generated with 'diff -up' or 'diff -cp'
# and adds a skeleton ChangeLog file to the file. It does not try to be
# too smart when parsing function names, but it produces a reasonable
# approximation.
#
# Author: Martin Liska <mliska@suse.cz>

import argparse
import datetime
import json
import os
import re
import subprocess
import sys
from itertools import takewhile

import requests

from unidiff import PatchSet

# Limits used by append_changelog_line() when deciding whether a
# ChangeLog entry fits on a single line.
# NOTE(review): these two names are referenced by append_changelog_line()
# but were not defined anywhere in this file; confirm the values.
LINE_LIMIT = 100
TAB_WIDTH = 8

# Lower-cased prefix of the commit-message trailer recognised by
# skip_line_in_changelog().
CO_AUTHORED_BY_PREFIX = 'co-authored-by: '

# 'PR component/number' preceded by a comment leader
# ('//', '/*', 'C', 'c', '*' or '!').
pr_regex = re.compile(r'(\/(\/|\*)|[Cc*!])\s+(?P<pr>PR [a-z+-]+\/[0-9]+)')
# Splits a 'PR component/number' string into its two parts.
prnum_regex = re.compile(r'PR (?P<comp>[a-z+-]+)/(?P<num>[0-9]+)')
# 'DR number' preceded by the same comment leaders as pr_regex.
dr_regex = re.compile(r'(\/(\/|\*)|[Cc*!])\s+(?P<dr>DR [0-9]+)')
# A dg-error / dg-warning directive.
dg_regex = re.compile(r'{\s+dg-(error|warning)')
# 'prNNNN' (four or more digits) inside a file name.
pr_filename_regex = re.compile(r'(^|[\W_])[Pp][Rr](?P<pr>\d{4,})')
# A line that starts in column 0 with an identifier character or '#'.
identifier_regex = re.compile(r'^([a-zA-Z0-9_#].*)')
# A line that opens a C block comment.
comment_regex = re.compile(r'^\/\*')
# class/struct/union/enum declaration, with an optional GTY(...) marker.
struct_regex = re.compile(r'^(class|struct|union|enum)\s+'
                          r'(GTY\(.*\)\s+)?([a-zA-Z0-9_]+)')
# '#define NAME' or '#undef NAME'.
macro_regex = re.compile(r'#\s*(define|undef)\s+([a-zA-Z0-9_]+)')
# 'DEFxxx (NAME' style macro invocations.
super_macro_regex = re.compile(r'^DEF[A-Z0-9_]+\s*\(([a-zA-Z0-9_]+)')
# An identifier followed by an opening parenthesis.
fn_regex = re.compile(r'([a-zA-Z_][^()\s]*)\s*\([^*]')
# An innermost '<...>' group.
template_and_param_regex = re.compile(r'<[^<>]*>')
# '(define... "name"' forms in .md files.
md_def_regex = re.compile(r'\(define.*\s+"(.*)"')
# REST query returning the summary and component of one bug; '%s' is the
# bug id.
bugzilla_url = 'https://gcc.gnu.org/bugzilla/rest.cgi/bug?id=%s&' \
               'include_fields=summary,component'

# File extensions for which function names are extracted from hunks.
function_extensions = {'.c', '.cpp', '.C', '.cc', '.h', '.inc', '.def', '.md'}

# NB: Makefile.in isn't listed as it's not always generated.
generated_files = {'aclocal.m4', 'config.h.in', 'configure'}

help_message = """\
Generate ChangeLog template for PATCH.
PATCH must be generated using diff(1)'s -up or -cp options
(or their equivalent in git).
"""

# Path of this script, and the directory two levels above it, which
# find_changelog() uses as the base for ChangeLog look-ups.
script_folder = os.path.realpath(__file__)
root = os.path.dirname(os.path.dirname(script_folder))
def find_changelog(path):
    """Return the directory whose ChangeLog file covers PATH.

    Starting from the directory part of PATH, walk towards the top and
    return the first directory (relative to the module-level ``root``)
    that contains a file named 'ChangeLog'.  When the walk reaches the
    top without finding one, the empty string is returned.
    """
    folder = os.path.split(path)[0]
    while True:
        if os.path.exists(os.path.join(root, folder, 'ChangeLog')):
            return folder
        parent = os.path.dirname(folder)
        # os.path.dirname('/') is '/', so an absolute PATH would never
        # reach '' and the loop would spin forever; stop as soon as no
        # progress is made.
        if parent == '' or parent == folder:
            return ''
        folder = parent
def extract_function_name(line):
    """Return the name of the entity that LINE appears to declare.

    The patterns are tried in this order: struct-like declaration
    (returned as 'keyword name'), '#define'/'#undef' macro, 'DEFxxx (name'
    macro invocation, and finally a function-like 'name ('.  Lines that
    open a C block comment, and lines matching none of the patterns,
    yield None.
    """
    if comment_regex.match(line):
        return None

    m = struct_regex.search(line)
    if m:
        # Struct declaration
        return m.group(1) + ' ' + m.group(3)

    m = macro_regex.search(line)
    if m:
        # Macro definition
        return m.group(2)

    m = super_macro_regex.search(line)
    if m:
        # Supermacro
        return m.group(1)

    m = fn_regex.search(line)
    if m:
        # Discard template and function parameters.
        fn = m.group(1)
        fn = re.sub(template_and_param_regex, '', fn)
        return fn.rstrip()

    return None
def try_add_function(functions, line):
    """Append the name extracted from LINE to FUNCTIONS if it is new.

    FUNCTIONS is modified in place.  The return value tells whether a
    name could be extracted from LINE at all, regardless of whether it
    was already present in FUNCTIONS.
    """
    fn = extract_function_name(line)
    if fn and fn not in functions:
        functions.append(fn)
    return bool(fn)
def sort_changelog_files(changed_file):
    """Sort key that places added and removed files after modified ones.

    The key is the tuple (is_added_file, is_removed_file); because False
    sorts before True, files with neither flag come first, then removed
    files, then added files.
    """
    return (changed_file.is_added_file, changed_file.is_removed_file)
def get_pr_titles(prs):
    """Return 'PR component/id - summary' lines for the entries of PRS.

    Each entry is looked up through the Bugzilla REST URL in
    ``bugzilla_url``.  When exactly one bug is returned, the entry in PRS
    is rewritten in place to 'PR <component>/<id>' using the component
    reported by Bugzilla, and a title line is collected (duplicates are
    dropped).  The collected lines are joined with newlines; when at least
    one title was found an extra empty element is appended first, so the
    result ends with a blank separator line.  An empty string is returned
    when no title was found.
    """
    output = []
    for idx, pr in enumerate(prs):
        # Only the numeric id after the last '/' is sent to Bugzilla.
        pr_id = pr.split('/')[-1]
        r = requests.get(bugzilla_url % pr_id)
        bugs = r.json()['bugs']
        if len(bugs) == 1:
            prs[idx] = 'PR %s/%s' % (bugs[0]['component'], pr_id)
            out = '%s - %s\n' % (prs[idx], bugs[0]['summary'])
            if out not in output:
                output.append(out)
    if output:
        output.append('')
    return '\n'.join(output)
def append_changelog_line(out, relative_path, text):
    """Return OUT extended with a ChangeLog entry for RELATIVE_PATH.

    The entry is written as '\\t* path: text' on one line when that line,
    with each tab counted as TAB_WIDTH columns, is at most LINE_LIMIT
    characters long.  Otherwise TEXT is moved to its own tab-indented
    continuation line.  Strings are immutable, so callers must use the
    returned value.
    """
    line = f'\t* {relative_path}:'
    if len(line.replace('\t', ' ' * TAB_WIDTH) + ' ' + text) <= LINE_LIMIT:
        out += f'{line} {text}\n'
    else:
        out += f'{line}\n'
        out += f'\t{text}\n'
    return out
def get_rel_path_if_prefixed(path, folder):
    """Return PATH with the leading FOLDER prefix removed.

    When PATH starts with FOLDER, the prefix and any '/' characters that
    follow it are stripped.  Otherwise PATH is returned unchanged.
    """
    if path.startswith(folder):
        return path[len(folder):].lstrip('/')
    return path
def generate_changelog(data, no_functions=False, fill_pr_titles=False,
                       additional_prs=None):
    """Build a ChangeLog skeleton for the patch in DATA.

    DATA is handed to unidiff's PatchSet.  Each file of the patch is
    assigned to a ChangeLog directory through find_changelog(), and one
    entry per file is produced under a '<dir>/ChangeLog:' heading.

    NO_FUNCTIONS suppresses the extraction of function names from hunks.
    FILL_PR_TITLES prepends the titles returned by get_pr_titles().
    ADDITIONAL_PRS is an optional list of PR identifiers to list besides
    those found in the patch; entries containing '/' get a 'PR ' prefix
    when they lack one.

    Side effect: the module-level list ``prs`` is rebound to the PR/DR
    entries that were collected; the script entry point reads it after
    this function returns.

    Returns the generated text.
    """
    global prs
    prs = []

    changelogs = {}
    changelog_list = []
    out = ''
    diff = PatchSet(data)

    if additional_prs:
        for apr in additional_prs:
            if not apr.startswith('PR ') and '/' in apr:
                apr = 'PR ' + apr
            if apr not in prs:
                prs.append(apr)
    for file in diff:
        # skip files that can't be parsed
        if file.path == '/dev/null':
            continue
        changelog = find_changelog(file.path)
        if changelog not in changelogs:
            changelogs[changelog] = []
            changelog_list.append(changelog)
        changelogs[changelog].append(file)

        # Extract PR entries from newly added tests
        if 'testsuite' in file.path and file.is_added_file:
            # Only search first ten lines as later lines may
            # contains commented code which a note that it
            # has not been tested due to a certain PR or DR.
            this_file_prs = []
            hunks = list(file)
            if hunks:
                for line in hunks[0][0:10]:
                    m = pr_regex.search(line.value)
                    if m:
                        pr = m.group('pr')
                        if pr not in prs:
                            prs.append(pr)
                            this_file_prs.append(pr.split('/')[-1])
                    else:
                        m = dr_regex.search(line.value)
                        if m:
                            dr = m.group('dr')
                            if dr not in prs:
                                prs.append(dr)
                                this_file_prs.append(dr.split('/')[-1])
                        elif dg_regex.search(line.value):
                            # Found dg-warning/dg-error line
                            break

            # PR number in the file name
            fname = os.path.basename(file.path)
            m = pr_filename_regex.search(fname)
            if m:
                pr = m.group('pr')
                pr2 = 'PR ' + pr
                if pr not in this_file_prs and pr2 not in prs:
                    prs.append(pr2)

    if fill_pr_titles:
        out += get_pr_titles(prs)

    # print list of PR entries before ChangeLog entries
    if prs:
        if not out:
            out += '\n'
        for pr in prs:
            out += '\t%s\n' % pr
        out += '\n'

    # sort ChangeLog so that 'testsuite' is at the end
    for changelog in sorted(changelog_list, key=lambda x: 'testsuite' in x):
        files = changelogs[changelog]
        out += '%s:\n' % os.path.join(changelog, 'ChangeLog')
        out += '\n'
        # new and deleted files should be at the end
        for file in sorted(files, key=sort_changelog_files):
            assert file.path.startswith(changelog)
            in_tests = 'testsuite' in changelog or 'testsuite' in file.path
            relative_path = get_rel_path_if_prefixed(file.path, changelog)
            functions = []
            if file.is_added_file:
                msg = 'New test.' if in_tests else 'New file.'
                out = append_changelog_line(out, relative_path, msg)
            elif file.is_removed_file:
                out = append_changelog_line(out, relative_path, 'Removed.')
            elif hasattr(file, 'is_rename') and file.is_rename:
                # A file can be theoretically moved to a location that
                # belongs to a different ChangeLog. Let user fix it.
                #
                # Since unidiff 0.7.0, path.file == path.target_file[2:],
                # it used to be path.source_file[2:]
                relative_path = get_rel_path_if_prefixed(file.source_file[2:],
                                                         changelog)
                out = append_changelog_line(out, relative_path, 'Moved to...')
                new_path = get_rel_path_if_prefixed(file.target_file[2:],
                                                    changelog)
                out += f'\t* {new_path}: ...here.\n'
            elif os.path.basename(file.path) in generated_files:
                # Use the shared helper (and keep its result) so that long
                # paths are wrapped like every other entry.
                out = append_changelog_line(out, relative_path,
                                            'Regenerate.')
            else:
                if not no_functions:
                    for hunk in file:
                        # Do not add function names for testsuite files
                        extension = os.path.splitext(relative_path)[1]
                        if not in_tests and extension in function_extensions:
                            # last_fn: most recent context line that looks
                            # like a declaration and has not been used yet.
                            last_fn = None
                            # modified_visited: an added/removed line was
                            # seen since last_fn was recorded.
                            modified_visited = False
                            # success: this hunk contributed some name.
                            success = False
                            for line in hunk:
                                m = identifier_regex.match(line.value)
                                if line.is_added or line.is_removed:
                                    # special-case definition in .md files
                                    m2 = md_def_regex.match(line.value)
                                    if extension == '.md' and m2:
                                        fn = m2.group(1)
                                        if fn not in functions:
                                            functions.append(fn)
                                            last_fn = None
                                            success = True

                                    if not line.value.strip():
                                        continue
                                    modified_visited = True
                                    if m and try_add_function(functions,
                                                              m.group(1)):
                                        last_fn = None
                                        success = True
                                elif line.is_context:
                                    if last_fn and modified_visited:
                                        try_add_function(functions, last_fn)
                                        last_fn = None
                                        modified_visited = False
                                        success = True
                                    elif m:
                                        last_fn = m.group(1)
                                        modified_visited = False
                            if not success:
                                # Fall back to the hunk's section header.
                                try_add_function(functions,
                                                 hunk.section_header)
                if functions:
                    out += '\t* %s (%s):\n' % (relative_path, functions[0])
                    for fn in functions[1:]:
                        out += '\t(%s):\n' % fn
                else:
                    out += '\t* %s:\n' % relative_path
        out += '\n'
    return out
def update_copyright(data):
    """Prepend an 'Update copyright years.' entry to affected ChangeLogs.

    DATA is handed to unidiff's PatchSet.  For every file of the patch the
    covering ChangeLog (see find_changelog()) is rewritten once, with a
    new entry dated today and attributed to the user name and e-mail
    reported by 'git config', followed by the previous content.

    The ChangeLog path is opened as given, i.e. relative to the current
    working directory.
    """
    current_timestamp = datetime.datetime.now().strftime('%Y-%m-%d')
    # An argument list avoids going through the shell.
    username = subprocess.check_output(['git', 'config', 'user.name'],
                                       encoding='utf8').strip()
    email = subprocess.check_output(['git', 'config', 'user.email'],
                                    encoding='utf8').strip()

    changelogs = set()
    diff = PatchSet(data)

    for file in diff:
        changelog = os.path.join(find_changelog(file.path), 'ChangeLog')
        if changelog not in changelogs:
            changelogs.add(changelog)
            with open(changelog) as f:
                content = f.read()
            with open(changelog, 'w+') as f:
                # GNU ChangeLog header: date, name and e-mail separated
                # by two spaces.
                f.write(f'{current_timestamp}  {username}  <{email}>\n\n')
                f.write('\tUpdate copyright years.\n\n')
                f.write(content)
def skip_line_in_changelog(line):
    """Predicate for takewhile(): is LINE part of the leading message?

    Returns False for a line that starts with the co-authored-by prefix
    (compared case-insensitively) or with '#', and True for every other
    line, so takewhile() stops at the first such trailer or comment line.
    """
    if line.lower().startswith(CO_AUTHORED_BY_PREFIX) or line.startswith('#'):
        return False
    return True
if __name__ == '__main__':
    # Extra command-line arguments can be supplied as a JSON list in the
    # GCC_MKLOG_ARGS environment variable.
    extra_args = os.getenv('GCC_MKLOG_ARGS')
    if extra_args:
        sys.argv += json.loads(extra_args)

    parser = argparse.ArgumentParser(description=help_message)
    parser.add_argument('input', nargs='?',
                        help='Patch file (or missing, read standard input)')
    parser.add_argument('-b', '--pr-numbers', action='store',
                        type=lambda arg: arg.split(','), nargs='?',
                        help='Add the specified PRs (comma separated)')
    parser.add_argument('-s', '--no-functions', action='store_true',
                        help='Do not generate function names in ChangeLogs')
    parser.add_argument('-p', '--fill-up-bug-titles', action='store_true',
                        help='Download title of mentioned PRs')
    parser.add_argument('-d', '--directory',
                        help='Root directory where to search for ChangeLog '
                        'files')
    parser.add_argument('-c', '--changelog',
                        help='Append the ChangeLog to a git commit message '
                        'file')
    parser.add_argument('--update-copyright', action='store_true',
                        help='Update copyright in ChangeLog files')
    args = parser.parse_args()
    if args.input == '-':
        args.input = None
    if args.directory:
        # Overrides the module-level default used by find_changelog().
        root = args.directory

    data = open(args.input, newline='\n') if args.input else sys.stdin
    try:
        if args.update_copyright:
            update_copyright(data)
        else:
            output = generate_changelog(data, args.no_functions,
                                        args.fill_up_bug_titles,
                                        args.pr_numbers)
            if args.changelog:
                with open(args.changelog) as f:
                    lines = f.read().split('\n')
                # 'start' is the existing message up to the first
                # co-authored-by trailer or '#' comment line; 'end' is the
                # rest, which is written back after the ChangeLog.
                start = list(takewhile(skip_line_in_changelog, lines))
                end = lines[len(start):]
                with open(args.changelog, 'w') as f:
                    if not start or not start[0]:
                        if len(prs) == 1:
                            # initial commit subject line
                            # 'component: [PRnnnnn]'
                            m = prnum_regex.match(prs[0])
                            if m:
                                title = (f'{m.group("comp")}: '
                                         f'[PR{m.group("num")}]')
                                start.insert(0, title)
                    if start:
                        # append empty line
                        if start[-1] != '':
                            start.append('')
                    else:
                        # append 2 empty lines
                        start = 2 * ['']
                    f.write('\n'.join(start))
                    f.write('\n')
                    f.write(output)
                    f.write('\n'.join(end))
            else:
                print(output, end='')
    finally:
        # Close the patch file if one was opened; leave stdin alone.
        if data is not sys.stdin:
            data.close()