scripts: add missing regex for dl_cleanup script
[openwrt/staging/hauke.git] / scripts / dl_cleanup.py
1 #!/usr/bin/env python3
2 """
3 # OpenWrt download directory cleanup utility.
4 # Delete all but the very last version of the program tarballs.
5 #
6 # Copyright (C) 2010-2015 Michael Buesch <m@bues.ch>
7 # Copyright (C) 2013-2015 OpenWrt.org
8 """
9
10 from __future__ import print_function
11
12 import sys
13 import os
14 import re
15 import getopt
16
17 # Commandline options
18 opt_dryrun = False
19
20
21 def parseVer_1234(match, filepath):
22 progname = match.group(1)
23 progversion = (int(match.group(2)) << 64) |\
24 (int(match.group(3)) << 48) |\
25 (int(match.group(4)) << 32) |\
26 (int(match.group(5)) << 16)
27 return (progname, progversion)
28
29 def parseVer_123(match, filepath):
30 progname = match.group(1)
31 try:
32 patchlevel = match.group(5)
33 except IndexError as e:
34 patchlevel = None
35 if patchlevel:
36 patchlevel = ord(patchlevel[0])
37 else:
38 patchlevel = 0
39 progversion = (int(match.group(2)) << 64) |\
40 (int(match.group(3)) << 48) |\
41 (int(match.group(4)) << 32) |\
42 patchlevel
43 return (progname, progversion)
44
45 def parseVer_12(match, filepath):
46 progname = match.group(1)
47 try:
48 patchlevel = match.group(4)
49 except IndexError as e:
50 patchlevel = None
51 if patchlevel:
52 patchlevel = ord(patchlevel[0])
53 else:
54 patchlevel = 0
55 progversion = (int(match.group(2)) << 64) |\
56 (int(match.group(3)) << 48) |\
57 patchlevel
58 return (progname, progversion)
59
60 def parseVer_r(match, filepath):
61 progname = match.group(1)
62 progversion = (int(match.group(2)) << 64)
63 return (progname, progversion)
64
65 def parseVer_ymd_GIT_SHASUM(match, filepath):
66 progname = match.group(1)
67 progversion = (int(match.group(2)) << 64) |\
68 (int(match.group(3)) << 48) |\
69 (int(match.group(4)) << 32)
70 return (progname, progversion)
71
72 def parseVer_ymd(match, filepath):
73 progname = match.group(1)
74 progversion = (int(match.group(2)) << 64) |\
75 (int(match.group(3)) << 48) |\
76 (int(match.group(4)) << 32)
77 return (progname, progversion)
78
79 def parseVer_GIT(match, filepath):
80 progname = match.group(1)
81 st = os.stat(filepath)
82 progversion = int(st.st_mtime) << 64
83 return (progname, progversion)
84
85 extensions = (
86 ".tar.gz",
87 ".tar.bz2",
88 ".tar.xz",
89 ".orig.tar.gz",
90 ".orig.tar.bz2",
91 ".orig.tar.xz",
92 ".zip",
93 ".tgz",
94 ".tbz",
95 ".txz",
96 )
97
98 versionRegex = (
99 (re.compile(r"(.+)[-_](\d+)\.(\d+)\.(\d+)\.(\d+)"), parseVer_1234), # xxx-1.2.3.4
100 (re.compile(r"(.+)[-_](\d\d\d\d)-?(\d\d)-?(\d\d)-"), parseVer_ymd_GIT_SHASUM), # xxx-YYYY-MM-DD-GIT_SHASUM
101 (re.compile(r"(.+)[-_](\d\d\d\d)-?(\d\d)-?(\d\d)"), parseVer_ymd), # xxx-YYYY-MM-DD
102 (re.compile(r"(.+)[-_]([0-9a-fA-F]{40,40})"), parseVer_GIT), # xxx-GIT_SHASUM
103 (re.compile(r"(.+)[-_](\d+)\.(\d+)\.(\d+)(\w?)"), parseVer_123), # xxx-1.2.3a
104 (re.compile(r"(.+)[-_](\d+)_(\d+)_(\d+)"), parseVer_123), # xxx-1_2_3
105 (re.compile(r"(.+)[-_](\d+)\.(\d+)(\w?)"), parseVer_12), # xxx-1.2a
106 (re.compile(r"(.+)[-_]r?(\d+)"), parseVer_r), # xxx-r1111
107 )
108
109 blacklist = [
110 ("linux", re.compile(r"linux-\d.*")),
111 ("gcc", re.compile(r"gcc-.*")),
112 ("wl_apsta", re.compile(r"wl_apsta.*")),
113 (".fw", re.compile(r".*\.fw")),
114 (".arm", re.compile(r".*\.arm")),
115 (".bin", re.compile(r".*\.bin")),
116 ("rt-firmware", re.compile(r"RT[\d\w]+_Firmware.*")),
117 ]
118
119 class EntryParseError(Exception): pass
120
121 class Entry:
122 def __init__(self, directory, filename):
123 self.directory = directory
124 self.filename = filename
125 self.progname = ""
126 self.fileext = ""
127
128 for ext in extensions:
129 if filename.endswith(ext):
130 filename = filename[0:0-len(ext)]
131 self.fileext = ext
132 break
133 else:
134 print(self.filename, "has an unknown file-extension")
135 raise EntryParseError("ext")
136 for (regex, parseVersion) in versionRegex:
137 match = regex.match(filename)
138 if match:
139 (self.progname, self.version) = parseVersion(
140 match, directory + "/" + filename + self.fileext)
141 break
142 else:
143 print(self.filename, "has an unknown version pattern")
144 raise EntryParseError("ver")
145
146 def getPath(self):
147 return (self.directory + "/" + self.filename).replace("//", "/")
148
149 def deleteFile(self):
150 path = self.getPath()
151 print("Deleting", path)
152 if not opt_dryrun:
153 os.unlink(path)
154
155 def __ge__(self, y):
156 return self.version >= y.version
157
158 def usage():
159 print("OpenWrt download directory cleanup utility")
160 print("Usage: " + sys.argv[0] + " [OPTIONS] <path/to/dl>")
161 print("")
162 print(" -d|--dry-run Do a dry-run. Don't delete any files")
163 print(" -B|--show-blacklist Show the blacklist and exit")
164 print(" -w|--whitelist ITEM Remove ITEM from blacklist")
165
166 def main(argv):
167 global opt_dryrun
168
169 try:
170 (opts, args) = getopt.getopt(argv[1:],
171 "hdBw:",
172 [ "help", "dry-run", "show-blacklist", "whitelist=", ])
173 if len(args) != 1:
174 usage()
175 return 1
176 except getopt.GetoptError as e:
177 usage()
178 return 1
179 directory = args[0]
180
181 if not os.path.exists(directory):
182 print("Can't find dl path", directory)
183 return 1
184
185 for (o, v) in opts:
186 if o in ("-h", "--help"):
187 usage()
188 return 0
189 if o in ("-d", "--dry-run"):
190 opt_dryrun = True
191 if o in ("-w", "--whitelist"):
192 for i in range(0, len(blacklist)):
193 (name, regex) = blacklist[i]
194 if name == v:
195 del blacklist[i]
196 break
197 else:
198 print("Whitelist error: Item", v,\
199 "is not in blacklist")
200 return 1
201 if o in ("-B", "--show-blacklist"):
202 for (name, regex) in blacklist:
203 sep = "\t\t"
204 if len(name) >= 8:
205 sep = "\t"
206 print("%s%s(%s)" % (name, sep, regex.pattern))
207 return 0
208
209 # Create a directory listing and parse the file names.
210 entries = []
211 for filename in os.listdir(directory):
212 if filename == "." or filename == "..":
213 continue
214 for (name, regex) in blacklist:
215 if regex.match(filename):
216 if opt_dryrun:
217 print(filename, "is blacklisted")
218 break
219 else:
220 try:
221 entries.append(Entry(directory, filename))
222 except EntryParseError as e:
223 pass
224
225 # Create a map of programs
226 progmap = {}
227 for entry in entries:
228 if entry.progname in progmap.keys():
229 progmap[entry.progname].append(entry)
230 else:
231 progmap[entry.progname] = [entry,]
232
233 # Traverse the program map and delete everything but the last version
234 for prog in progmap:
235 lastVersion = None
236 versions = progmap[prog]
237 for version in versions:
238 if lastVersion is None or version >= lastVersion:
239 lastVersion = version
240 if lastVersion:
241 for version in versions:
242 if version is not lastVersion:
243 version.deleteFile()
244 if opt_dryrun:
245 print("Keeping", lastVersion.getPath())
246
247 return 0
248
249 if __name__ == "__main__":
250 sys.exit(main(sys.argv))