forked from google/syzkaller
-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathcheck_links.py
executable file
·66 lines (50 loc) · 1.18 KB
/
check_links.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
#!/usr/bin/python
import os
import re
import sys
link_re = re.compile('\[' + '[^\[\]]+' + '\]' + '\(' + '([^\(\)]+)' + '\)')
if len(sys.argv) < 3:
print 'Usage: <root_dir> <doc_files>...'
sys.exit(1)
root = sys.argv[1]
docs = sys.argv[2:]
links = []
for doc in docs:
with open(doc) as f:
data = f.read()
r = link_re.findall(data)
for link in r:
links += [(doc, link)]
def filter_link((doc, link)):
if link.startswith('http'):
return False
if link.startswith('#'):
return False
return True
links = filter(filter_link, links)
def fix_link((doc, link)):
link = link.split('#')[0]
link = link.split('?')[0]
return (doc, link)
links = map(fix_link, links)
errors = []
def check_link((doc, link)):
path = os.path.dirname(doc)
full_link = None
if link[0] == '/':
link = link[1:]
full_link = os.path.join(root, link)
else:
full_link = os.path.join(root, path, link)
if not os.path.exists(full_link):
return False
return True
for link in links:
if not check_link(link):
errors += [link]
if len(errors) == 0:
print '%d links checked: OK' % (len(links),)
sys.exit(0)
for (doc, link) in errors:
print 'File %s linked from %s not found' % (link, doc)
sys.exit(2)