Author: sebb
Date: Wed Sep 13 12:29:06 2023
New Revision: 1912284
URL: http://svn.apache.org/viewvc?rev=1912284&view=rev
Log:
Eliminate file types that cannot be sources
Modified:
comdev/projects.apache.org/trunk/scripts/cronjobs/parsereleases.py
Modified: comdev/projects.apache.org/trunk/scripts/cronjobs/parsereleases.py
URL:
http://svn.apache.org/viewvc/comdev/projects.apache.org/trunk/scripts/cronjobs/parsereleases.py?rev=1912284&r1=1912283&r2=1912284&view=diff
==============================================================================
--- comdev/projects.apache.org/trunk/scripts/cronjobs/parsereleases.py
(original)
+++ comdev/projects.apache.org/trunk/scripts/cronjobs/parsereleases.py Wed Sep
13 12:29:06 2023
@@ -78,7 +78,17 @@ def cleanReleases(committeeId):
del releases[committeeId]
del files[committeeId]
+# all source releases must be one of these
+VALID_TYPES = ['tgz', 'gz', 'zip', 'xz', 'bz2']
+
+# for gz, xz and bz2, the next extension must be tar
+TAR_TYPES = ['gz', 'xz', 'bz2']
+
def parseFile(committeeId, file, date, path):
+ parts = file.split('.')
+ ext = parts.pop() # final extension
+ if not ext in VALID_TYPES or (ext in TAR_TYPES and parts.pop() != 'tar'):
+ return
if not
re.search(r"(MD5SUM|SHA1SUM|\.s?nupkg|\.md5|\.mds|\.sh1|\.sh2|\.sha|\.asc|\.sig|\.bin|\.pom|\.jar|\.whl|\.pdf|\.xml|\.xsd|\.html|\.txt|\.cfg|\.ish|\.pl|RELEASE.NOTES|LICENSE|KEYS|CHANGELOG|NOTICE|MANIFEST|Changes|readme|x86|amd64|-manual\.|-docs\.|-docs-|-doc-|Announcement|current|-deps|-dependencies|binary|-bin-|-bin\.|-javadoc-|-distro|rat_report|\.png|\.jpg|\.gif|\.sqlite|\.yaml|\.yml|\.prov)",
file, flags=re.IGNORECASE):
filename = cleanFilename(file)
if len(filename) > 1: