forked from docker-archive/docker-registry
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdump_repos_data.py
executable file
·78 lines (63 loc) · 2.31 KB
/
dump_repos_data.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
#!/usr/bin/env python
import os
import sys
import simplejson as json
root_path = os.path.abspath(os.path.join(os.path.dirname(__file__), '..'))
sys.path.append(os.path.join(root_path, 'lib'))
import storage
store = storage.load()
def walk_all_tags():
for namespace_path in store.list_directory(store.repositories):
for repos_path in store.list_directory(namespace_path):
try:
for tag in store.list_directory(repos_path):
fname = tag.split('/').pop()
if not fname.startswith('tag_'):
continue
(namespace, repos) = repos_path.split('/')[-2:]
yield (namespace, repos, store.get_content(tag))
except OSError:
pass
def walk_ancestry(image_id):
try:
ancestry_data = store.get_content(store.image_ancestry_path(image_id))
ancestry = json.loads(ancestry_data)
return iter(ancestry)
except IOError:
print 'Ancestry file for {0} is missing'.format(image_id)
return []
def get_image_checksum(image_id):
checksum_path = store.image_checksum_path(image_id)
if not store.exists(checksum_path):
return
checksum = store.get_content(checksum_path)
return checksum.strip()
def dump_json(all_repos, all_checksums, filename):
data = []
for ((namespace, repos), images) in all_repos.iteritems():
images_checksums = []
for i in set(images):
images_checksums.append({'id': i, 'checksum': all_checksums[i]})
data.append({
'namespace': namespace,
'repository': repos,
'images': images_checksums
})
with open(filename, 'w') as f:
json.dump(data, f, indent=4)
if __name__ == '__main__':
if len(sys.argv) < 2:
print 'Usage: {0} <output_file>'.format(sys.argv[0])
sys.exit(1)
all_repos = {}
all_checksums = {}
for (namespace, repos, image_id) in walk_all_tags():
key = (namespace, repos)
if key not in all_repos:
all_repos[key] = []
for i in walk_ancestry(image_id):
all_repos[key].append(i)
if i in all_checksums:
continue
all_checksums[i] = get_image_checksum(i)
dump_json(all_repos, all_checksums, sys.argv[1])