git-interface: Add test suite and basic tests
[aur.git] / git-interface / git-update.py
blob 28207203a52f87e8a9396aad8c78119541800afe
1 #!/usr/bin/python3
3 import os
4 import pygit2
5 import re
6 import subprocess
7 import sys
8 import time
10 import srcinfo.parse
11 import srcinfo.utils
13 import config
14 import db
# Command that update_notify() runs to send package update notifications.
notify_cmd = config.get('notifications', 'notify-cmd')

# Path of the Git repository that is opened with pygit2 further down.
repo_path = config.get('serve', 'repo-path')
# Regular expression every pkgbase found in a pushed .SRCINFO must match.
repo_regex = config.get('serve', 'repo-regex')

# Upper limit that blob.size of every pushed blob is checked against
# (presumably in bytes -- confirm against the configuration file).
max_blob_size = config.getint('update', 'max-blob-size')
def size_humanize(num):
    """Format a size as a short string with a binary unit suffix.

    The value is divided by 1024 until its magnitude drops below 2048 and
    is then rendered with the matching unit. Values that are still ``int``
    (i.e. never divided) are printed without decimals, everything else with
    two decimals. Sizes beyond the ZiB range are reported in YiB.
    """
    suffixes = ('B', 'KiB', 'MiB', 'GiB', 'TiB', 'PiB', 'EiB', 'ZiB')
    for suffix in suffixes:
        if abs(num) >= 2048.0:
            # Still too large for this unit; move on to the next one.
            num /= 1024.0
            continue
        template = "{}{}" if isinstance(num, int) else "{:.2f}{}"
        return template.format(num, suffix)
    return "{:.2f}{}".format(num, 'YiB')
def extract_arch_fields(pkginfo, field):
    """Collect the values of a field together with their architecture.

    Returns a list of ``{"value": ..., "arch": ...}`` dictionaries. Values
    stored under ``field`` itself come first with ``arch`` set to ``None``;
    they are followed by the values stored under ``field_i686`` and
    ``field_x86_64`` (in that order), tagged with the respective
    architecture name.
    """
    lookups = [(field, None)]
    lookups.extend((field + '_' + arch, arch) for arch in ('i686', 'x86_64'))

    collected = []
    for key, arch in lookups:
        if key not in pkginfo:
            continue
        collected.extend({"value": item, "arch": arch}
                         for item in pkginfo[key])
    return collected
def parse_dep(depstring):
    """Split a dependency string into a name part and a version condition.

    Everything after the first ``': '`` is treated as a description. The
    version condition is whatever follows the first ``<``, ``=`` or ``>``
    in the part before the description. Returns ``(name, condition)``; when
    a description is present it is appended to the name as
    ``name + ': ' + description``.
    """
    dep, _, description = depstring.partition(': ')
    name = re.sub(r'(<|=|>).*', '', dep)
    condition = dep[len(name):]

    if not description:
        return (name, condition)
    return (name + ': ' + description, condition)
def save_metadata(metadata, conn, user):
    """Rewrite the database records of a package base from parsed metadata.

    Looks up the package base named by ``metadata['pkgbase']``, records
    ``user`` as its packager (and as its maintainer if it has none), deletes
    the packages currently attached to it and inserts every package listed
    in ``metadata`` again, together with its sources, dependencies,
    relations, licenses and groups. If the package base had no maintainer
    before, ``user`` is also put on its notification list.

    metadata -- parsed .SRCINFO data, as consumed by the srcinfo.utils helpers
    conn     -- database connection offering execute() and commit()
    user     -- user name of the account performing the update
    """
    # Find the package base and remember whether it was orphaned.
    base_name = metadata['pkgbase']
    cur = conn.execute("SELECT ID, MaintainerUID FROM PackageBases "
                       "WHERE Name = ?", [base_name])
    pkgbase_id, maintainer_uid = cur.fetchone()
    was_orphan = not maintainer_uid

    # Translate the user name into a user ID.
    cur = conn.execute("SELECT ID FROM Users WHERE Username = ?", [user])
    user_id = int(cur.fetchone()[0])

    # Refresh the package base, adopt it if orphaned, drop its packages.
    now = int(time.time())
    conn.execute("UPDATE PackageBases SET ModifiedTS = ?, "
                 "PackagerUID = ?, OutOfDateTS = NULL WHERE ID = ?",
                 [now, user_id, pkgbase_id])
    conn.execute("UPDATE PackageBases SET MaintainerUID = ? "
                 "WHERE ID = ? AND MaintainerUID IS NULL",
                 [user_id, pkgbase_id])
    conn.execute("DELETE FROM Packages WHERE PackageBaseID = ?",
                 [pkgbase_id])

    for pkgname in srcinfo.utils.get_package_names(metadata):
        pkginfo = srcinfo.utils.get_merged_package(pkgname, metadata)

        # The epoch only shows up in the version string when it is positive.
        epoch = int(pkginfo['epoch']) if 'epoch' in pkginfo else 0
        if epoch > 0:
            ver = '{:d}:{:s}-{:s}'.format(epoch, pkginfo['pkgver'],
                                          pkginfo['pkgrel'])
        else:
            ver = '{:s}-{:s}'.format(pkginfo['pkgver'], pkginfo['pkgrel'])

        # Optional fields are stored as NULL when absent.
        for optional in ('pkgdesc', 'url'):
            pkginfo.setdefault(optional, None)

        # Insert the package row and keep its ID for the child tables.
        cur = conn.execute("INSERT INTO Packages (PackageBaseID, Name, "
                           "Version, Description, URL) "
                           "VALUES (?, ?, ?, ?, ?)",
                           [pkgbase_id, pkginfo['pkgname'], ver,
                            pkginfo['pkgdesc'], pkginfo['url']])
        conn.commit()
        pkgid = cur.lastrowid

        # Sources.
        for src in extract_arch_fields(pkginfo, 'source'):
            conn.execute("INSERT INTO PackageSources (PackageID, Source, "
                         "SourceArch) VALUES (?, ?, ?)",
                         [pkgid, src['value'], src['arch']])

        # Dependencies of every kind.
        dep_kinds = ('depends', 'makedepends', 'checkdepends', 'optdepends')
        for dep_kind in dep_kinds:
            cur = conn.execute("SELECT ID FROM DependencyTypes "
                               "WHERE Name = ?", [dep_kind])
            dep_kind_id = cur.fetchone()[0]
            for entry in extract_arch_fields(pkginfo, dep_kind):
                dep_name, dep_cond = parse_dep(entry['value'])
                dep_arch = entry['arch']
                conn.execute("INSERT INTO PackageDepends (PackageID, "
                             "DepTypeID, DepName, DepCondition, DepArch) "
                             "VALUES (?, ?, ?, ?, ?)",
                             [pkgid, dep_kind_id, dep_name, dep_cond,
                              dep_arch])

        # Relations (conflicts, provides, replaces).
        for rel_kind in ('conflicts', 'provides', 'replaces'):
            cur = conn.execute("SELECT ID FROM RelationTypes WHERE Name = ?",
                               [rel_kind])
            rel_kind_id = cur.fetchone()[0]
            for entry in extract_arch_fields(pkginfo, rel_kind):
                rel_name, rel_cond = parse_dep(entry['value'])
                rel_arch = entry['arch']
                conn.execute("INSERT INTO PackageRelations (PackageID, "
                             "RelTypeID, RelName, RelCondition, RelArch) "
                             "VALUES (?, ?, ?, ?, ?)",
                             [pkgid, rel_kind_id, rel_name, rel_cond,
                              rel_arch])

        # Licenses; unknown license names are created on the fly.
        for license_name in pkginfo.get('license', ()):
            cur = conn.execute("SELECT ID FROM Licenses WHERE Name = ?",
                               [license_name])
            found = cur.fetchone()
            if not found:
                cur = conn.execute("INSERT INTO Licenses (Name) "
                                   "VALUES (?)", [license_name])
                conn.commit()
                license_id = cur.lastrowid
            else:
                license_id = found[0]
            conn.execute("INSERT INTO PackageLicenses (PackageID, "
                         "LicenseID) VALUES (?, ?)",
                         [pkgid, license_id])

        # Groups; unknown group names are created on the fly.
        for group_name in pkginfo.get('groups', ()):
            cur = conn.execute("SELECT ID FROM Groups WHERE Name = ?",
                               [group_name])
            found = cur.fetchone()
            if not found:
                cur = conn.execute("INSERT INTO Groups (Name) VALUES (?)",
                                   [group_name])
                conn.commit()
                group_id = cur.lastrowid
            else:
                group_id = found[0]
            conn.execute("INSERT INTO PackageGroups (PackageID, "
                         "GroupID) VALUES (?, ?)", [pkgid, group_id])

    # A user who picks up an orphaned package base gets notifications for
    # it, unless already subscribed.
    if was_orphan:
        cur = conn.execute("SELECT COUNT(*) FROM PackageNotifications WHERE "
                           "PackageBaseID = ? AND UserID = ?",
                           [pkgbase_id, user_id])
        already_subscribed = cur.fetchone()[0]
        if already_subscribed == 0:
            conn.execute("INSERT INTO PackageNotifications "
                         "(PackageBaseID, UserID) VALUES (?, ?)",
                         [pkgbase_id, user_id])

    conn.commit()
def update_notify(conn, user, pkgbase_id):
    """Launch the notification command for an updated package base.

    Resolves ``user`` to its numeric ID via ``conn`` and starts
    ``notify_cmd`` with the arguments ``update``, the user ID and
    ``pkgbase_id``. The child process is started but not waited for.
    """
    row = conn.execute("SELECT ID FROM Users WHERE Username = ?",
                       [user]).fetchone()
    user_id = int(row[0])

    argv = (notify_cmd, 'update', str(user_id), str(pkgbase_id))
    subprocess.Popen(argv)
def die(msg):
    """Report ``msg`` as an error on stderr and terminate with status 1.

    Raises SystemExit; this function never returns.
    """
    sys.stderr.write("error: {:s}\n".format(msg))
    # Use sys.exit() rather than the exit() helper: the latter is installed
    # by the site module for interactive use and is not always available.
    sys.exit(1)
def warn(msg):
    """Print ``msg`` on stderr, prefixed with ``warning: ``."""
    print("warning: {:s}".format(msg), file=sys.stderr)
def die_commit(msg, commit):
    """Report an error tied to a specific commit and terminate with status 1.

    msg    -- description of the problem
    commit -- identifier of the offending commit, as a string

    Writes three ``error:`` lines to stderr (a header, the commit and the
    message). Raises SystemExit; this function never returns.
    """
    sys.stderr.write("error: The following error "
                     "occurred when parsing commit\n")
    sys.stderr.write("error: {:s}:\n".format(commit))
    sys.stderr.write("error: {:s}\n".format(msg))
    # Use sys.exit() rather than the exit() helper: the latter is installed
    # by the site module for interactive use and is not always available.
    sys.exit(1)
# Open the Git repository configured as repo-path.
repo = pygit2.Repository(repo_path)

# The acting user, the target package base and the privilege flag are
# handed over through the environment.
environ = os.environ
user = environ.get("AUR_USER")
pkgbase = environ.get("AUR_PKGBASE")
privileged = environ.get("AUR_PRIVILEGED", '0') == '1'
# Privileged users only get a warning where others are rejected.
if privileged:
    warn_or_die = warn
else:
    warn_or_die = die

# Two invocation forms are accepted: "restore", or the three arguments
# <refname> <old-sha1> <new-sha1>.
argc = len(sys.argv)
if argc == 2 and sys.argv[1] == "restore":
    pkgbase_ref = 'refs/heads/' + pkgbase
    if pkgbase_ref not in repo.listall_references():
        die('{:s}: repository not found: {:s}'.format(sys.argv[1], pkgbase))
    refname = "refs/heads/master"
    sha1_old = sha1_new = repo.lookup_reference(pkgbase_ref).target
elif argc == 4:
    refname, sha1_old, sha1_new = sys.argv[1:4]
else:
    die("invalid arguments")

if refname != "refs/heads/master":
    die("pushing to a branch other than master is restricted")

conn = db.Connection()
# Detect and deny non-fast-forwards: if any commit reachable from the old
# tip is not reachable from the new tip, history would be lost.
if sha1_old != "0000000000000000000000000000000000000000" and not privileged:
    walker = repo.walk(sha1_old, pygit2.GIT_SORT_TOPOLOGICAL)
    walker.hide(sha1_new)
    if next(walker, None) is not None:
        die("denying non-fast-forward (you should pull first)")

# Prepare the walker that validates new commits, i.e. those reachable from
# the new tip but not from the old one.
walker = repo.walk(sha1_new, pygit2.GIT_SORT_TOPOLOGICAL)
if sha1_old != "0000000000000000000000000000000000000000":
    walker.hide(sha1_old)

# Validate all new commits.
for commit in walker:
    # Both metadata files are mandatory in every commit.
    for fname in ('.SRCINFO', 'PKGBUILD'):
        if fname not in commit.tree:
            die_commit("missing {:s}".format(fname), str(commit.id))

    # Only plain files of limited size are allowed at the top level.
    for treeobj in commit.tree:
        blob = repo[treeobj.id]

        if isinstance(blob, pygit2.Tree):
            die_commit("the repository must not contain subdirectories",
                       str(commit.id))

        if not isinstance(blob, pygit2.Blob):
            # Format the entry's name: passing the entry object itself to a
            # ':s' format spec raises TypeError instead of reporting the
            # error.
            die_commit("not a blob object: {:s}".format(treeobj.name),
                       str(commit.id))

        if blob.size > max_blob_size:
            die_commit("maximum blob size ({:s}) exceeded".format(
                size_humanize(max_blob_size)), str(commit.id))

    # Parse .SRCINFO and report every parser error at once.
    metadata_raw = repo[commit.tree['.SRCINFO'].id].data.decode()
    (metadata, errors) = srcinfo.parse.parse_srcinfo(metadata_raw)
    if errors:
        sys.stderr.write("error: The following errors occurred "
                         "when parsing .SRCINFO in commit\n")
        sys.stderr.write("error: {:s}:\n".format(str(commit.id)))
        for error in errors:
            for err in error['error']:
                sys.stderr.write("error: line {:d}: {:s}\n".format(
                    error['line'], err))
        # sys.exit() instead of the site-provided exit() helper, which is
        # not guaranteed to exist outside interactive sessions.
        sys.exit(1)

    metadata_pkgbase = metadata['pkgbase']
    if not re.match(repo_regex, metadata_pkgbase):
        die_commit('invalid pkgbase: {:s}'.format(metadata_pkgbase),
                   str(commit.id))

    for pkgname in set(metadata['packages'].keys()):
        pkginfo = srcinfo.utils.get_merged_package(pkgname, metadata)

        for field in ('pkgver', 'pkgrel', 'pkgname'):
            if field not in pkginfo:
                die_commit('missing mandatory field: {:s}'.format(field),
                           str(commit.id))

        if 'epoch' in pkginfo and not pkginfo['epoch'].isdigit():
            die_commit('invalid epoch: {:s}'.format(pkginfo['epoch']),
                       str(commit.id))

        if not re.match(r'[a-z0-9][a-z0-9\.+_-]*$', pkginfo['pkgname']):
            die_commit('invalid package name: {:s}'.format(
                pkginfo['pkgname']), str(commit.id))

        for field in ('pkgname', 'pkgdesc', 'url'):
            if field in pkginfo and len(pkginfo[field]) > 255:
                die_commit('{:s} field too long: {:s}'.format(
                    field, pkginfo[field]), str(commit.id))

        # Files referenced by the metadata must be part of the commit.
        for field in ('install', 'changelog'):
            if field in pkginfo and not pkginfo[field] in commit.tree:
                die_commit('missing {:s} file: {:s}'.format(
                    field, pkginfo[field]), str(commit.id))

        for field in extract_arch_fields(pkginfo, 'source'):
            fname = field['value']
            # Sources containing "://" or "lp:" are not looked up in the
            # commit tree.
            if "://" in fname or "lp:" in fname:
                continue
            if fname not in commit.tree:
                die_commit('missing source file: {:s}'.format(fname),
                           str(commit.id))
# Display a warning if .SRCINFO is unchanged.
if sha1_old not in ("0000000000000000000000000000000000000000", sha1_new):
    srcinfo_id_old = repo[sha1_old].tree['.SRCINFO'].id
    srcinfo_id_new = repo[sha1_new].tree['.SRCINFO'].id
    if srcinfo_id_old == srcinfo_id_new:
        warn(".SRCINFO unchanged. The package database will not be updated!")

# Read .SRCINFO from the HEAD commit.
metadata_raw = repo[repo[sha1_new].tree['.SRCINFO'].id].data.decode()
(metadata, errors) = srcinfo.parse.parse_srcinfo(metadata_raw)

# Ensure that the package base name matches the repository name.
metadata_pkgbase = metadata['pkgbase']
if metadata_pkgbase != pkgbase:
    die('invalid pkgbase: {:s}, expected {:s}'.format(metadata_pkgbase,
                                                      pkgbase))

# Ensure that packages are neither blacklisted nor overwritten.
pkgbase = metadata['pkgbase']
cur = conn.execute("SELECT ID FROM PackageBases WHERE Name = ?", [pkgbase])
row = cur.fetchone()
# 0 is used as the ID when the package base has no database row.
pkgbase_id = row[0] if row else 0

cur = conn.execute("SELECT Name FROM PackageBlacklist")
blacklist = [row[0] for row in cur.fetchall()]

cur = conn.execute("SELECT Name, Repo FROM OfficialProviders")
providers = dict(cur.fetchall())

for pkgname in srcinfo.utils.get_package_names(metadata):
    pkginfo = srcinfo.utils.get_merged_package(pkgname, metadata)
    pkgname = pkginfo['pkgname']

    if pkgname in blacklist:
        warn_or_die('package is blacklisted: {:s}'.format(pkgname))
    if pkgname in providers:
        # Keep the official repository name in its own variable. Binding it
        # to "repo" would replace the pygit2 repository object and make the
        # create_reference() calls below fail whenever warn_or_die() only
        # warns.
        official_repo = providers[pkgname]
        warn_or_die('package already provided by [{:s}]: {:s}'.format(
            official_repo, pkgname))

    # A package name may only belong to a single package base.
    cur = conn.execute("SELECT COUNT(*) FROM Packages WHERE Name = ? AND " +
                       "PackageBaseID <> ?", [pkgname, pkgbase_id])
    if cur.fetchone()[0] > 0:
        die('cannot overwrite package: {:s}'.format(pkgname))

# Store package base details in the database.
save_metadata(metadata, conn, user)

# Create (or update) a branch with the name of the package base for better
# accessibility.
repo.create_reference('refs/heads/' + pkgbase, sha1_new, True)

# Work around a Git bug: The HEAD ref is not updated when using gitnamespaces.
# This can be removed once the bug fix is included in Git mainline. See
# http://git.661346.n2.nabble.com/PATCH-receive-pack-Create-a-HEAD-ref-for-ref-namespace-td7632149.html
# for details.
repo.create_reference('refs/namespaces/' + pkgbase + '/HEAD', sha1_new, True)

# Send package update notifications.
update_notify(conn, user, pkgbase_id)

# Close the database.
conn.close()