-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathcleanup-old-packages.py
More file actions
294 lines (247 loc) · 8.69 KB
/
cleanup-old-packages.py
File metadata and controls
294 lines (247 loc) · 8.69 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
# SPDX-FileCopyrightText: 2023 Intel Corporation
#
# SPDX-License-Identifier: Apache-2.0
"""Script to clean up old anaconda packages."""
import argparse
import re
from collections import defaultdict
from operator import itemgetter
try:
    from binstar_client.utils import bool_input, get_server_api, parse_specs
except ImportError as err:
    # Fail early with an actionable message instead of a bare import
    # traceback. ImportError is still an Exception subclass, so anything
    # catching the previous generic Exception keeps working.
    raise ImportError(
        "Script requires anaconda-client. Please install it in "
        "the same environment you are running this script."
    ) from err
QUOTAS = {
    # Default size limit in bytes for each known package; used as the
    # --max-size value when that option is not given on the command line.
    # Let's try keeping at least 1 GB free. Total quota is 3 GB.
    "dppy/dpctl": 1024**3,
    "dppy/dpnp": 1024**3,
    "dppy/numba-dpex": 256 * 1024**2,
    "dppy/numba-mlir": 512 * 1024**2,
    "dppy/dpbench": 128 * 1024**2,
    "dppy/dpcpp-llvm-spirv": 256 * 1024**2,
}
def is_dev_version(version: str) -> bool:
    """Tell whether a version string denotes a dev or rc pre-release.

    The string must start with ``X.Y.Z``, optionally followed by a dot, then
    ``dev`` or ``rc`` and at least one digit (e.g. ``1.2.3dev4``,
    ``1.2.3.rc1``). Anything after that prefix is ignored.

    Args:
        version: input version string

    Returns:
        True if input version is a development (dev/rc) version
    """
    # re.match only matches at the beginning of the string, so no explicit
    # "^" anchor is needed in the pattern.
    dev_pattern = r"\d+\.\d+\.\d+\.?(dev|rc)\d+"
    return re.match(dev_pattern, version) is not None
def build_number(file) -> int:
    """Read the build number out of a file's metadata.

    Handles both conda packages (``build_number`` attribute) and wheels
    (``build_no`` attribute). A missing attribute counts as 0 and the larger
    of the two values is returned.

    Args:
        file: anaconda's file metadata representing file stored in registry.

    Returns:
        Integer build number
    """
    conda_build = file.get("attrs", {}).get("build_number", 0)
    # the wheel attribute is stored as a string, so convert it first
    wheel_build = int(file.get("attrs", {}).get("build_no", 0))
    return wheel_build if wheel_build > conda_build else conda_build
def max_build(files: list) -> int:
    """Find the highest build number among the given files.

    Meant to be called with the files of a single version. An empty list
    yields 0.

    Args:
        files: anaconda's files metadata representing files stored in
            registry.

    Returns:
        Integer build number
    """
    builds = [build_number(entry) for entry in files]
    return max(builds, default=0)
def _cleanup_priority(is_dev, is_last_dev, is_latest_build):
    """Return the cleanup priority of one file; lower values go first.

    Args:
        is_dev: the file belongs to a dev/rc version
        is_last_dev: the file belongs to the most recent dev/rc version
        is_latest_build: the file has the highest build number of its version

    Returns:
        0 - superseded build of an outdated dev version
        1 - superseded build of a released version
        2 - latest build of an outdated dev version
        3 - superseded build of the most recent dev version
        4 - latest build of a release or of the most recent dev version
    """
    if is_latest_build:
        return 2 if is_dev and not is_last_dev else 4
    if not is_dev:
        return 1
    return 3 if is_last_dev else 0


def cleanup_packages(
    package_path,
    label,
    token,
    keep_count,
    max_size,
    max_priority,
    dry_run,
    force,
    verbose,
):
    """Clean up packages according to criteria. Run --help for more information.

    Every file of the package (optionally restricted to one label) gets a
    cleanup priority, then files are visited ordered by priority and upload
    time. A file is removed while at least one of the enabled criteria
    (``max_size``, ``max_priority``, ``keep_count``) still asks for it; the
    remaining files that share version and build number with the last removed
    file are removed as well. Processing stops at the first file that matches
    neither condition.

    Args:
        package_path: path to anaconda's package
        label: filter files by label; None means no filtering
        token: anaconda token
        keep_count: number of files to keep; None disables the criterion
        max_size: max size all the files can take. Files above the limit must
            be removed; None disables the criterion
        max_priority: files with cleanup priority up to and including this
            value must be removed; None disables the criterion
        dry_run: run without removing files. Shows files that will be removed.
            May not require token for this
        force: remove files without confirmation
        verbose: verbose output for the script execution
    """

    def print_verbose(*args):
        if verbose:
            print(*args)

    aserver_api = get_server_api(token, None)
    spec = parse_specs(package_path)

    package = aserver_api.package(spec.user, spec.package)
    versions = package["versions"]
    print_verbose("versions", versions)

    files = package["files"]
    if label is not None:
        files = [f for f in files if label in f["labels"]]

    files_by_version = defaultdict(list)
    for f in files:
        files_by_version[f["version"]].append(f)

    # NOTE: max() does not order semantic versions correctly, so the most
    # recent dev version is taken to be the last dev entry in `versions`
    # (presumably listed oldest to newest - verify against the API).
    last_dev = None
    for v in versions:
        if is_dev_version(v):
            last_dev = v
    print_verbose("last_dev:", last_dev)

    total_size = sum(f["size"] for f in files)
    print_verbose("total size:", total_size)

    # Walk the grouped files rather than `versions`, so that every file gets
    # a priority even if its version is not listed in `versions`.
    for version, version_files in files_by_version.items():
        is_dev = is_dev_version(version)
        latest_build = max_build(version_files)
        for file in version_files:
            file["cleanup_priority"] = _cleanup_priority(
                is_dev=is_dev,
                is_last_dev=version == last_dev,
                is_latest_build=build_number(file) == latest_build,
            )

    for file in files:
        print_verbose(
            "priority:",
            file["cleanup_priority"],
            "build:",
            build_number(file),
            file["full_name"],
        )
    print_verbose("")

    # lowest priority first; within the same priority, by upload time
    files.sort(key=itemgetter("cleanup_priority", "upload_time"))

    last_version, last_build = None, None
    cleanup_size = 0
    file_count = len(files)
    for index, file in enumerate(files):
        # number of files not yet processed, including the current one
        remaining = file_count - index
        version, build = file["version"], build_number(file)

        # check if we have to remove this file
        need_clean = (
            (max_size is not None and total_size > max_size)
            or (
                max_priority is not None
                and file["cleanup_priority"] <= max_priority
            )
            or (keep_count is not None and remaining > keep_count)
        )

        # clean up all files of the last removed version and build, even
        # when no criterion asks for it any more; otherwise we are done
        same_release = last_version == version and last_build == build
        if not need_clean and not same_release:
            break

        last_version, last_build = version, build

        if dry_run or force:
            print_verbose(f"Removing {file['full_name']}", need_clean)

        if not dry_run:
            remove_spec = parse_specs(file["full_name"])
            msg = f"Are you sure you want to remove file {remove_spec!s} ?"
            if force or bool_input(msg, False):
                aserver_api.remove_dist(
                    remove_spec.user,
                    remove_spec.package,
                    remove_spec.version,
                    remove_spec.basename,
                )

        # The size accounting advances for every visited file, whether or
        # not it was actually deleted; this is what lets a dry run simulate
        # the complete cleanup.
        total_size -= file["size"]
        cleanup_size += file["size"]

    print_verbose("Cleaned size:", cleanup_size)
if __name__ == "__main__":
    # Command-line entry point: parse options, apply the per-package default
    # quota and run the cleanup.
    parser = argparse.ArgumentParser(
        formatter_class=argparse.RawTextHelpFormatter
    )
    parser.add_argument(
        "--package",
        dest="package_path",
        type=str,
        required=True,
        help="path to anaconda's package",
    )
    parser.add_argument(
        "--label", type=str, default=None, help="filter files by label"
    )
    parser.add_argument(
        "--token", type=str, default="", help="anaconda token"
    )
    parser.add_argument(
        "--keep-count", type=int, default=None, help="number of files to keep"
    )
    parser.add_argument(
        "--max-size",
        type=int,
        default=None,
        help="max size all the files can take; files above the limit are "
        "removed",
    )
    parser.add_argument(
        "--max-priority",
        type=int,
        default=None,
        help="0 - removes builds for dev versions other than the most recent \n"
        " build, except for builds of the latest dev version;\n"
        "1 - same as above but also applies to released versions;\n"
        "2 - removes dev versions except for the last dev version;\n"
        "3 - in last dev version keep only the latest build;\n"
        "4 - removes regular builds and latest dev version (e.g. remove \n"
        " everything)\n"
        "Example:\n"
        "- pkg_v1.0_bld-0 priority: 1\n"
        "- pkg_v1.0_bld-1 priority: 4\n"
        "- pkg_v1.2dev1_bld-0 priority: 2\n"
        "- pkg_v2.0_bld-0 priority: 4\n"
        "- pkg_v2.1dev1_bld-0 priority: 0\n"
        "- pkg_v2.1dev1_bld-1 priority: 2\n"
        "- pkg_v2.1dev2_bld-0 priority: 3\n"
        "- pkg_v2.1dev2_bld-2 priority: 4\n"
        "The set of files considered by a given priority includes all the \n"
        "sets considered by lower priorities.\n",
    )
    parser.add_argument(
        "--dry-run",
        action="store_true",
        help="run without removing files; shows files that will be removed",
    )
    parser.add_argument(
        "--force",
        action="store_true",
        help="remove files without confirmation",
    )
    parser.add_argument(
        "--verbose", action="store_true", help="verbose output"
    )

    args = parser.parse_args()

    if args.max_size is None:
        # fall back to the quota configured for this package; stays None
        # when the package has no entry in QUOTAS
        args.max_size = QUOTAS.get(args.package_path)

    if (
        args.max_size is None
        and args.max_priority is None
        and args.keep_count is None
    ):
        # report a usage error (usage text + exit status 2) rather than a
        # traceback from a generic exception
        parser.error(
            "at least one of --keep-count, --max-size, --max-priority must be "
            "set"
        )

    cleanup_packages(
        package_path=args.package_path,
        label=args.label,
        token=args.token,
        keep_count=args.keep_count,
        max_priority=args.max_priority,
        max_size=args.max_size,
        dry_run=args.dry_run,
        force=args.force,
        verbose=args.verbose,
    )