forked from circleci/circleci-docs
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdocs-stats.py
executable file
·70 lines (52 loc) · 2.21 KB
/
docs-stats.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
#!/usr/bin/env python3
### Docs Stats --
# This script iterates over our docs and checks the last time each file was updated.
# On completion, it should print out a table of files from least-recently updated to most recently.
import os
import glob
from pathlib import Path
updated_docs_metadata = []
docs_paths = (
'../jekyll/_cci2/*.md',
'../jekyll/_cci2/*.adoc',
'../jekyll/_cci2_ja/*.md',
'../jekyll/_cci2_ja/*.adoc',
)
def create_document_metadata(file_name, last_updated, last_updated_ts, file_path, file_dir):
"""Create a dict of metadata for each file;
a list of these dict are stored in updated_docs_metadata"""
f = {
"last_updated": last_updated,
"last_updated_ts": last_updated_ts,
"file_name": file_name,
"file_path": file_path,
"file_dir": file_dir
}
return f
def iterate_docs():
"""retrieve data on each doc using git and store in a global list."""
print("Checking last time updated...")
# for file in list(glob.glob('../jekyll/**/*.md')): # figure out why **/ glob is not working.
files = []
for path in docs_paths:
files.extend(glob.glob(path))
for file in files:
relative_date = os.popen('git log -1 --date=relative --format="%ad" -- ' + file).read()
epoch_date = os.popen('git log -1 --format="%ct" -- ' + file).read()
fpath = Path(file)
file_name = str(fpath.stem)
file_dir = str(fpath.parent.name)
name = file_name + str(fpath.suffix)
doc_data = create_document_metadata(name, relative_date, epoch_date, file, file_dir)
updated_docs_metadata.append(doc_data)
def print_docs_table():
print ("{:<4} | {:<9} | {:<50} | {:<20}".format('#', 'Dir', 'File','Last Updated'))
print ("----------------------------------------------------------------------------------")
for index, doc in enumerate(updated_docs_metadata):
print ("{:<4} | {:<9} | {:<50} | {:<20}".format(index, doc['file_dir'], doc["file_name"], doc["last_updated"].rstrip()))
def sort_by_date():
updated_docs_metadata.sort(key = lambda i: (i['file_dir'], i['last_updated_ts']))
# -------
iterate_docs()
sort_by_date()
print_docs_table()