Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
Wiki Replica
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Container Registry
Model registry
Operate
Environments
Monitor
Incidents
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
The Tor Project
TPA
Wiki Replica
Commits
95afe0df
Verified
Commit
95afe0df
authored
5 years ago
by
anarcat
Browse files
Options
Downloads
Patches
Plain Diff
add metrics in the report and a way to generate them
parent
40219ed5
No related branches found
Branches containing commit
No related tags found
No related merge requests found
Changes
2
Hide whitespace changes
Inline
Side-by-side
Showing
2 changed files
tsa/meeting/2019-09-09.mdwn
+22
-0
22 additions, 0 deletions
tsa/meeting/2019-09-09.mdwn
tsa/meeting/monthly-report
+155
-0
155 additions, 0 deletions
tsa/meeting/monthly-report
with
177 additions
and
0 deletions
tsa/meeting/2019-09-09.mdwn
+
22
−
0
View file @
95afe0df
...
...
@@ -184,3 +184,25 @@ plan.
# Next meeting
october 7th 1400UTC
# Metrics of the month
I figured I would bring back this tradition that Linus had going before
I started doing the reports, but that I omitted because of lack of time
and familiarity with the infrastructure. Now I'm a little more
comfortable so I made a script in the wiki which polls numbers from
various sources and makes a nice overview of what our infra looks
like. Access and transfer rates are over the last 30 days.
* hosts in Puppet: 76, LDAP: 79, Prometheus exporters: 121
* number of apache servers monitored: 32, hits per second: 168
* number of self-hosted nameservers: 5, mail servers: 10
* pending upgrades: 0, reboots: 0
* average load: 0.56, memory available: 357.18 GiB/934.53 GiB, running processes: 441
* bytes sent: 126.79 MB/s, received: 96.13 MB/s
Those metrics should be taken with a grain of salt: many of those might
not mean what you think they do, and some others might be gross
mischaracterizations as well. I hope to improve those reports as time
goes on.
This diff is collapsed.
Click to expand it.
tsa/meeting/monthly-report
0 → 100755
+
155
−
0
View file @
95afe0df
#!/usr/bin/python3
import
json
import
os
import
re
import
subprocess
import
requests
PUPPET_HOST
=
"
pauli.torproject.org
"
LDAP_HOST
=
"
alberti.torproject.org
"
PROMETHEUS_API
=
"
https://{HTTP_USER}:{HTTP_PASS}@prometheus.torproject.org/api/v1
"
.
format
(
**
os
.
environ
)
# noqa: E501
def
prom_query
(
query
):
resp
=
requests
.
get
(
PROMETHEUS_API
+
"
/query?query=
"
+
query
)
return
float
(
resp
.
json
()[
'
data
'
][
'
result
'
][
0
][
'
value
'
][
1
])
def
host_count_puppet
():
puppetdb_data
=
subprocess
.
check_output
([
'
ssh
'
,
PUPPET_HOST
,
'
curl -s -G
"
http://localhost:8080/pdb/query/v4/nodes
"'
])
# noqa: E501
return
len
(
json
.
loads
(
puppetdb_data
))
def
host_count_ldap
():
ldap_data
=
subprocess
.
check_output
([
'
ssh
'
,
LDAP_HOST
,
'
ldapsearch -ZZ -vLx -h db.torproject.org -b
"
ou=hosts,dc=torproject,dc=org
"
2>/dev/null
'
])
# noqa: E501
return
len
(
re
.
findall
(
r
'
^dn: host
'
,
ldap_data
.
decode
(
'
ascii
'
),
re
.
M
))
def
sizeof_fmt
(
num
,
suffix
=
'
B
'
,
units
=
None
,
power
=
None
,
sep
=
'
'
,
precision
=
2
,
sign
=
False
):
"""
format the given size as a human-readable size
"""
prefix
=
'
+
'
if
sign
and
num
>
0
else
''
for
unit
in
units
[:
-
1
]:
if
abs
(
round
(
num
,
precision
))
<
power
:
if
isinstance
(
num
,
int
):
return
"
{}{}{}{}{}
"
.
format
(
prefix
,
num
,
sep
,
unit
,
suffix
)
else
:
return
"
{}{:3.{}f}{}{}{}
"
.
format
(
prefix
,
num
,
precision
,
sep
,
unit
,
suffix
)
num
/=
float
(
power
)
return
"
{}{:.{}f}{}{}{}
"
.
format
(
prefix
,
num
,
precision
,
sep
,
units
[
-
1
],
suffix
)
def
sizeof_fmt_iec
(
num
,
suffix
=
'
B
'
,
sep
=
'
'
,
precision
=
2
,
sign
=
False
):
return
sizeof_fmt
(
num
,
suffix
=
suffix
,
power
=
1024
,
units
=
[
''
,
'
Ki
'
,
'
Mi
'
,
'
Gi
'
,
'
Ti
'
,
'
Pi
'
,
'
Ei
'
,
'
Zi
'
,
'
Yi
'
],
sep
=
sep
,
precision
=
precision
,
sign
=
sign
)
def
sizeof_fmt_decimal
(
num
,
suffix
=
'
B
'
,
sep
=
'
'
,
precision
=
2
,
sign
=
False
):
"""
# no rounding necessary for those
>>>
sizeof_fmt_decimal
(
0
)
'
0 B
'
>>>
sizeof_fmt_decimal
(
1
)
'
1 B
'
>>>
sizeof_fmt_decimal
(
142
)
'
142 B
'
>>>
sizeof_fmt_decimal
(
999
)
'
999 B
'
>>>
# rounding starts here
>>>
sizeof_fmt_decimal
(
1000
)
'
1.00 kB
'
>>>
# should be rounded away
>>>
sizeof_fmt_decimal
(
1001
)
'
1.00 kB
'
>>>
# should be rounded down
>>>
sizeof_fmt_decimal
(
1234
)
'
1.23 kB
'
>>>
# should be rounded up
>>>
sizeof_fmt_decimal
(
1235
)
'
1.24 kB
'
>>>
# rounded down as well
>>>
sizeof_fmt_decimal
(
1010
)
'
1.01 kB
'
>>>
# rounded down
>>>
sizeof_fmt_decimal
(
999990000
)
'
999.99 MB
'
>>>
# rounded down
>>>
sizeof_fmt_decimal
(
999990001
)
'
999.99 MB
'
>>>
# rounded up to next unit
>>>
sizeof_fmt_decimal
(
999995000
)
'
1.00 GB
'
>>>
# and all the remaining units, megabytes
>>>
sizeof_fmt_decimal
(
10
**
6
)
'
1.00 MB
'
>>>
# gigabytes
>>>
sizeof_fmt_decimal
(
10
**
9
)
'
1.00 GB
'
>>>
# terabytes
>>>
sizeof_fmt_decimal
(
10
**
12
)
'
1.00 TB
'
>>>
# petabytes
>>>
sizeof_fmt_decimal
(
10
**
15
)
'
1.00 PB
'
>>>
# exabytes
>>>
sizeof_fmt_decimal
(
10
**
18
)
'
1.00 EB
'
>>>
# zottabytes
>>>
sizeof_fmt_decimal
(
10
**
21
)
'
1.00 ZB
'
>>>
# yottabytes
>>>
sizeof_fmt_decimal
(
10
**
24
)
'
1.00 YB
'
>>>
# negative value
>>>
sizeof_fmt_decimal
(
-
1
)
'
-1 B
'
>>>
# negative value with rounding
>>>
sizeof_fmt_decimal
(
-
1010
)
'
-1.01 kB
'
"""
return
sizeof_fmt
(
num
,
suffix
=
suffix
,
power
=
1000
,
units
=
[
''
,
'
k
'
,
'
M
'
,
'
G
'
,
'
T
'
,
'
P
'
,
'
E
'
,
'
Z
'
,
'
Y
'
],
sep
=
sep
,
precision
=
precision
,
sign
=
sign
)
def
main
():
print
(
"
* hosts in Puppet: %d, LDAP: %d, Prometheus exporters: %d
"
%
(
host_count_puppet
(),
host_count_ldap
(),
prom_query
(
'
sum(up)
'
)))
print
(
"
* number of apache servers monitored: %d, hits per second: %d
"
%
(
prom_query
(
'
count(apache_up)
'
),
# XXX: wtf vs http_requests_total
prom_query
(
'
sum(rate(apache_accesses_total[30d]))
'
)))
print
(
"
* number of self-hosted nameservers: %d, mail servers: %d
"
%
(
prom_query
(
'
sum(bind_up)
'
),
prom_query
(
'
sum(postfix_up)
'
)))
print
(
"
* pending upgrades: %d, reboots: %d
"
%
(
prom_query
(
'
sum(apt_upgrades_pending)
'
),
prom_query
(
'
sum(node_reboot_required)
'
)))
print
(
"
* average load: %0.2f, memory available: %s/%s, running processes: %d
"
%
# noqa: E501
(
prom_query
(
'
avg(node_load15)
'
),
sizeof_fmt_iec
(
prom_query
(
'
sum(node_memory_MemFree_bytes)
'
)),
sizeof_fmt_iec
(
prom_query
(
'
sum(node_memory_MemTotal_bytes)
'
)),
prom_query
(
'
sum(node_procs_running)
'
)))
print
(
"
* bytes sent: %s/s, received: %s/s
"
%
(
sizeof_fmt_decimal
(
prom_query
(
'
sum(rate(node_network_transmit_bytes_total[30d]))
'
)),
# noqa: E501
sizeof_fmt_decimal
(
prom_query
(
'
sum(rate(node_network_receive_bytes_total[30d]))
'
))))
# noqa: E501
if
__name__
==
'
__main__
'
:
main
()
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment