forked from openedx/edx-documentation
-
Notifications
You must be signed in to change notification settings - Fork 0
/
dochealth.py
156 lines (132 loc) · 5.07 KB
/
dochealth.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
"""
Uses the readthedocs API to assess the publishing health of our books.
Results are written in two forms: readable output to stdout, and to health.csv.
Setting up authentication:
- Get an API token from https://readthedocs.org/accounts/tokens/
- Then, either:
1. Define a READTHEDOCS_TOKEN environment variable with the token, or
2. Edit or create your ~/.netrc file to have an entry like this:
machine readthedocs.org
login edx
password <your-readthedocs-api-token>
Running::
$ python dochealth.py
This will write information to the terminal, and also create a health.csv file
to import into a spreadsheet.
"""
import collections
import csv
import netrc
import os
import requests
import time
# Path of the CSV report this script writes (opened relative to the current directory).
CSV_FILE = "health.csv"
class ReadthedocsAuth:
    """Implement readthedocs.org "token: xxxxx" authentication for requests.

    Instances are callables meant to be passed as the ``auth=`` argument of
    a ``requests`` call: they add an ``Authorization: token <token>`` header
    to the outgoing request.
    """

    def __call__(self, req):
        """Attach the API token to *req* and return it.

        The token is taken from the READTHEDOCS_TOKEN environment variable
        when it is set and non-empty; otherwise from the password field of
        the ``readthedocs.org`` entry in ~/.netrc.

        Raises:
            RuntimeError: if no token is found in either place.
        """
        token = os.environ.get("READTHEDOCS_TOKEN") or self._netrc_token()
        if not token:
            # A real exception (not an assert) so the check survives `python -O`.
            raise RuntimeError(
                f"No API token! See the instructions in the {__file__} docstring."
            )
        req.headers["Authorization"] = f"token {token}"
        return req

    @staticmethod
    def _netrc_token():
        """Return the readthedocs.org password from ~/.netrc, or None if unavailable."""
        try:
            credentials = netrc.netrc().hosts.get("readthedocs.org")
        except FileNotFoundError:
            # No ~/.netrc at all: report it as "no token" instead of a bare I/O error.
            return None
        if credentials is None:
            return None
        # netrc entries are (login, account, password) tuples.
        return credentials[2]
def get_data(url, *, timeout=30, retry_delay=10):
    """GET *url* from the readthedocs API and return the decoded JSON body.

    Rate-limited (429) responses are retried indefinitely after a pause.

    Args:
        url: the API URL to fetch.
        timeout: seconds to wait on the server before the request is abandoned.
        retry_delay: seconds to sleep after a 429 response that carries no
            usable Retry-After header.

    Returns:
        The parsed JSON of the first 200 response.

    Raises:
        requests.HTTPError: for 4xx/5xx responses other than 429.
        RuntimeError: for any other non-200 status.
    """
    while True:
        resp = requests.get(url, auth=ReadthedocsAuth(), timeout=timeout)
        if resp.status_code == 200:
            return resp.json()
        if resp.status_code == 429:
            # Rate-limited. Wait as long as the server asks, else a fixed delay.
            try:
                delay = int(resp.headers.get("Retry-After", ""))
            except ValueError:
                # Header missing or in HTTP-date form.
                delay = retry_delay
            time.sleep(max(delay, 1))
            continue
        resp.raise_for_status()
        # raise_for_status() is silent for non-error codes; without this the
        # loop would re-request immediately and forever.
        raise RuntimeError(f"Unexpected status {resp.status_code} from {url}")
def normalize_url(url):
    """Return a canonical form of a repository URL for grouping.

    Trailing slashes and a trailing ".git" are removed, and an "http:" scheme
    is rewritten to "https:". Slashes are stripped before the ".git" check so
    that "…/repo.git/" normalizes the same way as "…/repo.git".

    Args:
        url: the repository URL string.

    Returns:
        The normalized URL string.
    """
    url = url.rstrip("/")
    if url.endswith(".git"):
        # Dropping ".git" can expose another slash (e.g. "repo/.git").
        url = url[:-4].rstrip("/")
    if url.startswith("http:"):
        url = "https:" + url[5:]
    return url
def date(timestamp):
    """Return the part of *timestamp* before its first "T" (all of it if there is none)."""
    day, _sep, _rest = timestamp.partition("T")
    return day
def _summarize_config(config, version):
    """Print and return the build-configuration details for one project.

    Args:
        config: the "config" value of an expanded build; may be falsy when
            the build has no configuration attached.
        version: the build's "version" value, used to trim the checkout
            prefix from the Sphinx conf file path.

    Returns:
        A (python_version, conf_file, requirements) tuple. All three are ""
        when there is no config; requirements is "" when the config has no
        requirements entry in its first install step.
    """
    if not config:
        return "", "", ""

    python_version = config["python"]["version"]
    print(f""" python version: {python_version}""")

    conf_file = config["sphinx"]["configuration"]
    if conf_file:
        # Keep only the path below the checkout directory.
        conf_file = conf_file.rpartition(f"checkouts/{version}/")[-1]
        print(f""" conf file: {conf_file}""")

    try:
        requirements = config["python"]["install"][0]["requirements"]
    except (KeyError, IndexError, TypeError):
        # No requirements entry: dump the config for inspection and record a
        # blank, instead of leaving the name unbound or stale for the CSV row.
        import pprint
        pprint.pprint(config)
        requirements = ""
    else:
        print(f""" requirements: {requirements}""")

    return python_version, conf_file, requirements


# newline="" is what the csv module asks for so it can control line endings itself.
with open(CSV_FILE, "w", newline="") as health_out:
    writer = csv.writer(health_out)
    writer.writerow([
        "repo",
        "title",
        "branch",
        "last_build",
        "succeeded",
        "last_good_build",
        "python_version",
        "conf_file",
        "requirements",
    ])

    data = get_data("https://readthedocs.org/api/v3/projects/?limit=100")
    # Only the first page is read; fail loudly (even under -O) rather than
    # silently reporting on a truncated project list.
    if data["next"] is not None:
        raise RuntimeError("Oops, more than 100 projects, have to update the code")
    print(f"{data['count']} projects")

    # Group the projects by normalized repository URL.
    by_repo = collections.defaultdict(list)
    for proj in data["results"]:
        url = normalize_url(proj["repository"]["url"])
        by_repo[url].append(proj)

    for url, projs in sorted(by_repo.items()):
        show_count = ""
        if len(projs) > 1:
            show_count = f" {len(projs)} projects"
        print(f"repo {url}:{show_count}")

        for proj in projs:
            show_branch = show_sub = ""
            branch = proj["default_branch"]
            super_proj = proj["subproject_of"]
            if super_proj:
                show_sub = f" (sub of: {super_proj['name']})"
            if branch != "master":
                show_branch = f" (branch {branch})"
            print(f""" "{proj["name"]}"{show_branch}{show_sub}""")

            builds_url = proj["_links"]["builds"] + "?limit=100"
            builds = get_data(builds_url)["results"]
            if not builds:
                # A project that has never been built: record it and move on
                # instead of crashing on builds[0].
                print(" ** no builds")
                writer.writerow([url, proj["name"], branch, "never", "", "never", "", "", ""])
                continue

            # The first result is the one reported as the latest build.
            build = builds[0]
            show_status = ""
            if not build["success"]:
                show_status = " failed"
            print(f""" latest build: {build["created"]}{show_status}""")

            if build["success"]:
                last_good = build
            else:
                # First successful build among the (up to 100) fetched, if any.
                last_good = next((b for b in builds if b["success"]), None)
            if last_good is None:
                print(" ** no successful build")
            else:
                print(f""" last success: {last_good["created"]}""")

            build_details = get_data(build["_links"]["_self"] + "?expand=config")
            version = build_details["version"]
            print(f""" version: {version}""")
            python_version, conf_file, requirements = _summarize_config(
                build_details["config"], version
            )

            writer.writerow([
                url,
                proj["name"],
                branch,
                date(build["created"]),
                "success" if build["success"] else "fail",
                date(last_good["created"]) if last_good else "never",
                python_version,
                conf_file,
                requirements,
            ])

print(f"Wrote {CSV_FILE}")