-
Notifications
You must be signed in to change notification settings - Fork 0
/
github-insights.py
164 lines (145 loc) · 6 KB
/
github-insights.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
from github import Github
from decouple import config
from prometheus_client import start_http_server, Gauge
from decouple import config
from apscheduler.schedulers.blocking import BlockingScheduler
from apscheduler.triggers.cron import CronTrigger
from prometheus_client import start_http_server, Gauge
from logfmt_logger import getLogger
ORG_NAME = config("ORG_NAME", default="")
USER_NAME = config("USER_NAME", default="")
REPO_TYPE = config("REPO_TYPE", default="public")
REPO_NAME_CONTAINS = config("REPO_NAME_CONTAINS", default="")
CRONTAB_SCHEDULE = config("CRONTAB_SCHEDULE", default="0 * * * *")
GITHUB_TOKEN = config('GITHUB_TOKEN')
github = Github(GITHUB_TOKEN)
logger = getLogger("github_traffic")
gh_traffic_views = Gauge(
"github_traffic_views",
"Number of views",
["repository"],
)
gh_traffic_unique_views = Gauge(
"github_traffic_unique_views",
"Number of unique views",
["repository"],
)
gh_traffic_clones = Gauge(
"github_traffic_clones",
"Number of clones",
["repository"],
)
gh_traffic_unique_clones = Gauge(
"github_traffic_unique_clones",
"Number of unique views",
["repository"],
)
gh_traffic_top_paths = Gauge(
"github_traffic_top_paths",
"Number of visits to top paths",
["repository", "path", "title"],
)
gh_traffic_top_unique_paths = Gauge(
"github_traffic_top_unique_paths",
"Number of unique visits to top paths",
["repository", "path", "title"],
)
gh_traffic_top_referrers = Gauge(
"github_traffic_top_referrers",
"Number of visits from top referrers",
["repository", "referrer"],
)
gh_traffic_top_unique_referrers = Gauge(
"github_traffic_top_unique_referrers",
"Number of unique visits from top referrers",
["repository", "referrer"],
)
gh_traffic_stars = Gauge(
"github_traffic_stars",
"Number of stars",
["repository"],
)
gh_traffic_api_requests_limit = Gauge(
"github_traffic_api_requests_limit",
"Requests limit from Github API limits",
)
gh_traffic_api_requests_remaining = Gauge(
"github_traffic_api_requests_remaining",
"Requests remaining from Github API limits",
)
def job_function():
api_limits = github.get_rate_limit().core
gh_traffic_api_requests_limit.set(api_limits.limit)
gh_traffic_api_requests_remaining.set(api_limits.remaining)
if(not ORG_NAME and not USER_NAME):
logger.error(f"Please fill ORG_NAME or USER_NAME in config")
if(ORG_NAME):
repositories = github.get_organization(ORG_NAME).get_repos(type=REPO_TYPE)
if(USER_NAME):
repositories = github.get_user(USER_NAME).get_repos(type=REPO_TYPE)
for repo in repositories:
if REPO_NAME_CONTAINS in repo.name:
repo_name = repo.name
toShow = dict()
toShow['repo'] = repo_name
try:
# Views stats
data_views = repo.get_views_traffic(per="day")
gh_traffic_views.labels(repo_name).set(data_views["views"][-1].count)
gh_traffic_unique_views.labels(repo_name).set(data_views["views"][-1].uniques)
toShow['views'] = data_views["views"][-1].count
toShow['unique_views'] = data_views["views"][-1].uniques
except Exception as e:
logger.error(f"Failed to extract views on {repo_name}: {e}")
try:
# Clones stats
data_clones = repo.get_clones_traffic(per="day")
gh_traffic_clones.labels(repo_name).set(data_clones["clones"][-1].count)
gh_traffic_unique_clones.labels(repo_name).set(data_clones["clones"][-1].uniques)
toShow['clones'] = data_clones["clones"][-1].count
toShow['unique_clones'] = data_clones["clones"][-1].uniques
except Exception as e:
logger.error(f"Failed to extract clones on {repo_name}: {e}")
try:
# Star stats
gh_traffic_stars.labels(repo_name).set(repo.stargazers_count)
toShow['stars'] = repo.stargazers_count
except Exception as e:
logger.error(f"Failed to get stars on {repo_name}: {e}")
try:
# Top Paths
total_count = 0
total_unique_count = 0
for path in repo.get_top_paths():
gh_traffic_top_paths.labels(repo_name, path.path, path.title).set(path.count)
total_count = total_count + path.count
gh_traffic_top_unique_paths.labels(repo_name, path.path, path.title).set(path.uniques)
total_unique_count = total_unique_count + path.uniques
toShow['sum(top_paths)'] = total_count
toShow['sum(top_unique_paths)'] = total_unique_count
except Exception as e:
logger.error(f"Failed to get top paths on {repo_name}: {e}")
try:
# Top Referrers
total_count = 0
total_unique_count = 0
for referrer in repo.get_top_referrers():
gh_traffic_top_referrers.labels(repo_name, referrer.referrer).set(referrer.count)
total_count = total_count + referrer.count
gh_traffic_top_unique_referrers.labels(repo_name, referrer.referrer).set(referrer.uniques)
total_unique_count = total_unique_count + referrer.uniques
toShow['sum(top_referrers)'] = total_count
toShow['sum(top_unique_referrers)'] = total_unique_count
except Exception as e:
logger.error(f"Failed to get top referrers on {repo_name}: {e}")
logger.info('Gather insights', extra={"context": toShow})
if __name__ == "__main__":
logger.info('Github traffic is running!')
# Start up the server to expose the metrics.
start_http_server(8001)
# Schedule run the job on startup.
job_function()
# Start scheduler
sched = BlockingScheduler()
sched.add_job(job_function, CronTrigger.from_crontab(CRONTAB_SCHEDULE))
sched.start()