-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathaggregate-access-log
executable file
·277 lines (219 loc) · 8.84 KB
/
aggregate-access-log
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
#!/usr/bin/env awk -f
BEGIN {
# derive class from matching hostname against regex patterns provided from environment variable
# export ACCESS_CLASSES='[["clj", "^clj-fe-"], ["app-topic", "app-topic.*$"]]'
# OR via mol-config
# config:
# /:
# ACCESS_CLASSES:
# - [ clj, '(clj-|bauhaus-)' ]
# - [ cc, '(cc-|cc[d])' ]
class="default"
"hostname" | getline hostname
while("echo \"$ACCESS_CLASSES\" | jq -r '.[] | .[0] +\" \"+.[1]'" | getline) {
_regex=$2
_class=$1
#printf "Checking if %s matches %s to give %s\n", hostname, $_regex, $_class > "/dev/stderr"
if (hostname ~ $_regex) {
#printf ">> %s matches %s to give %s\n", hostname, $_regex, $_class > "/dev/stderr"
class=$_class
break;
}
}
if (match(hostname, /-(\w+)[0-9]+\./, results)) {
#printf "Cluster for host %s found %s \n", hostname, results[1] > "/dev/stderr"
cluster=results[1]
} else {
#printf "cluster not found for %s\n", hostname > "/dev/stderr"
cluster=null
}
printf "METRIC ns=aggregatelogger.start host=%s class=%s cluster=%s\n", hostname, class, cluster > "/dev/stderr"
}
function top_array(result, top, acc) {
delete temp
c = 0
for(i in acc) {
temp[c] = sprintf("%05d %s", acc[i], i)
c += 1
}
n = asort(temp)
startfrom = n < top ? 0 : n-top
ai=0
for(i = startfrom+1;i<=n;i++) {
line = temp[i]
count = substr(line, 1, 6)+0
value = substr(line, 7, length(line)-1)
result[ai][1] = count
result[ai][2] = value
ai += 1
}
}
function print_ua(ts, acc) {
top_array(tops, 15, acc)
for (i in tops) {
ua = tops[i][2]
gsub("\"", "'", ua)
printf "%s ns=fe.access.ua class="%s" cluster="%s" count=%d ua=\"%s\"\n", ts, class, cluster, tops[i][1], ua
}
delete tops
}
function print_errors(ts, acc) {
top_array(tops, 15, acc)
for (i in tops) {
value = tops[i][2]
split(value, values, " ")
code = values[1]+0
uri = values[2]
printf "%s ns=fe.access.errors class="%s" cluster="%s" count=%d error=%d uri=\"%s\"\n", ts, class, cluster, tops[i][1], code, uri
}
delete tops
}
function print_reqs(ts, acc) {
top_array(tops, 15, acc["uri_time"])
for (i in tops) {
value = tops[i][2]
# total = acc["uri_time"][value]
# count = tops[i][1]
total = tops[i][1]
count = acc["reqs"][value]
split(value, values, " ")
code = values[1]+0
uri = values[2]
printf "%s ns=fe.access.slow class="%s" cluster="%s" count=%d total=%d code=%d uri=\"%s\"\n", ts, class, cluster, count, total, code, uri
}
delete tops
top_array(tops, 15, acc["reqs"])
for (i in tops) {
value = tops[i][2]
total = acc["uri_time"][value]
count = tops[i][1]
split(value, values, " ")
code = values[1]+0
uri = values[2]
printf "%s ns=fe.access.count class="%s" cluster="%s" count=%d total=%d code=%d uri=\"%s\"\n", ts, class, cluster, count, total, code, uri
}
delete tops
}
function print_groups(ts, acc) {
for (i in acc["times"]) {
printf "%s ns=fe.access.group class="%s" cluster="%s" group_name=\"%s\" count=%d avg=%.1f max=%d min=%d\n", ts, class, cluster, i, acc["count"][i], acc["times"][i]/acc["count"][i], acc["max"][i], acc["min"][i]
}
}
function print_codes(ts, acc) {
for (i in acc["code"]) {
printf "%s ns=fe.access.bots class="%s" cluster="%s" response_code=%s count=%d bots=%d\n", ts, class, cluster, i, acc["code"][i], acc["bots"][i]
}
}
function print_acc(ts, acc) {
#DEBUG ONLY
#printf "%s times=%s class="%s" cluster="%s" code=%s ua=%s reqs=%s count=%s size=%s\n ", ts, class, cluster, length(acc["times"]), length(acc["code"]), length(acc["ua"]), length(acc["reqs"]), length(acc["count"]), length(acc["size"]) > "/dev/stderr"
# in case we lose the next few bytes if network connection is lost, we just lose empty lines
for (i = 1; i <= 10; i++) {
printf "%s\n", ts
}
if (length(acc["ua"]) > 0) { print_ua(ts, acc["ua"]) }
print_groups(ts, acc)
print_codes(ts, acc)
if (length(acc["errors"]) > 0) { print_errors(ts, acc["errors"]) }
if (length(acc["reqs"]) > 0) { print_reqs(ts, acc) }
print ts > "/dev/stderr" # not 100% sure what this is for. Possibly originally planned to flush buffer but it goes to STDERR which doesn't make sense. Leaving incase removing breaks it. At least it shows that the process is not hung.
#printf "%s times=%s code=%s", ts, length(acc["times"]), length(acc["code"]) > "/dev/stderr"
fflush(stdout)
}
{
# DEBUG ONLY
# printf "line is '%s'\n", $0 > "/dev/stderr"
# Known log formats
# ::ffff:10.251.203.252 - - [15/Mar/2018:11:50:55 +0000] "GET /api/apptopics HTTP/1.1" 200 40331 "http://app-topics.int.mol.dmgt.net/" "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_12_6) AppleWebKit/537.36 (KHTML, like Ge
# 10.251.198.10 - - [2018-03-15T14:46:11.946+0000] "HEAD /home/index.html HTTP/1.1" 200 0 579 "-" "Varnish Health Probe"
# ip ? ? time method url proto code length restime(opt) referrer ua
if (match($0, /([^ ]+)\s([^ ]+)\s([^ ]+)\s\[([^\]]+)\]\s\"(\w+) ([^ ]+)\s([^ ]+)"\s([0-9]+)\s([0-9]+)\s(([0-9]+)\s)?"([^ ]+)"\s"(.*)"/, results)) {
process_line(results)
} else {
printf "Invalid line '%s'\n", $0 > "/dev/stderr";
}
}
function process_line(results) {
_time=results[4]
_url=results[6]
_proto=results[7]
_code=results[8]
_size=results[9]
_duration=results[11]
_ua=results[13]
# Known time formats
#[2018-03-15T14:46:11.946+0000]
#[15/Mar/2018:11:50:55 +0000]
ts = _time
match(_time, /(.*[0-9]{2}:[0-9]{2}):[0-9]{2}/, _time_results); //find string reprepresenting time to nearest min
current_minute = _time_results[1]
# output aggregations if we have passed prior recorded minute
if (current_minute != last_minute) {
if (length(first_timestamp)>0) {
print_acc(first_timestamp, acc)
}
first_timestamp = ts
last_minute = current_minute;
delete acc
}
url = _url
if (gsub("^/textbased/.*", "textbased", url) ||
gsub(".*article-[0-9]*/amp/.*", "amp/articles", url) ||
gsub(".*article-[0-9]*/.*mobile=true.*", "mobile/articles", url) ||
gsub(".*article-[0-9]*/.*", "articles", url) ||
gsub(".*video-[0-9]*/.*mobile=true.*", "mobile/video", url) ||
gsub(".*video-[0-9]*/.*", "video", url) ||
gsub(".*columnist-[0-9]*/.*mobile=true.*", "mobile/columnist", url) ||
gsub(".*columnist-[0-9]*/.*", "columnist", url) ||
gsub(".*/(home|homeus|homeau)/index.html.*mobile=true.*", "mobile/home", url) ||
gsub(".*/(home|homeus|homeau)/index.html.*", "home", url) ||
gsub(".*index.html.*mobile=true.*", "mobile/channels", url) ||
gsub(".*index.html.*", "channels", url) ||
gsub(".*rss.*", "rss", url) ||
gsub(".*registration.*", "registration", url) ||
gsub(".*meta.*", "meta", url) ||
gsub(".*/geolocation/.*", "esi calls", url) ||
gsub(".*/mobile/.*", "mobile feed", url) ||
gsub(".*/api/.*", "api", url) ||
gsub(".*/home/search.html.*", "search", url) ||
gsub(".*/home/sitemap.*.html.*", "sitemap/html", url) ||
gsub(".*sitemap.*.xml.*", "sitemap/xml", url) ||
gsub(".*embed/video/.*", "embedded video", url) ||
gsub(".*videoarchive.*", "video archive", url) ||
gsub(".*c.*/item.cms.*", "cms items", url) ||
gsub(".*/.*.html.*", "topic pages", url) ||
gsub("^/$", "home", url) ||
gsub("^/.*$", "others", url))
{}
acc["code"][_code] +=1
response_time = _duration+0
acc["count"][url] += 1
acc["size"][url] += _size
acc["times"][url] += response_time
if (length(acc["min"][url]) == 0 || acc["min"][url] > response_time) {
acc["min"][url] = response_time
}
if (acc["max"][url] < response_time) {
acc["max"][url] = response_time
}
ua = _ua
acc["ua"][ua] += 1
IGNORECASE = 1
if (match(ua, /bot|google|crawler|spider|robot|crawling|wget|http|slurp|analyzer|sitecon|@/) || ua == "-") {
acc["bots"][_code] += 1
}
code = _code+0
uri = _url
gsub("\\?.*", "", uri)
code_uri = sprintf("%03d %s", code, uri)
acc["reqs"][code_uri] += 1
acc["uri_time"][code_uri] += response_time
if (code >= 400) {
acc["errors"][code_uri] += 1
}
# DEBUG ONLY
# printf "_time=%s _url=%s _proto=%s _code=%s _size=%s _duration=%s ts=%s ua=%s code_uri=%s \n", _time, _url, _proto, _code, _size, _duration, ts, ua, code_uri > "/dev/stderr"
}
END {
print_acc(first_timestamp, acc)
}