aboutsummaryrefslogtreecommitdiffstatshomepage
path: root/mirror-checker.lua
blob: 23c7e332ec4e3bf9d5ced5beb5f517d2a8240c11 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
#!/usr/bin/env luajit


local args = {...}

--[[ TODO - What to do about HTTPS://deb.devuan.org/ redirects.
	    Some mirrors give a 404.
		Sledjhamr gives a 404, coz it's not listening on 443 for deb.devuan.org.
	    Some mirrors give a 200.
		They shouldn't have the proper certificate, but are giving a result anyway.
]]

verbosity = 0
keep = false
-- TODO - Should actually implement this.
fork = true
options =
{
    referenceSite =
	{
	    typ = "string",
	    help = "",
	    value = "pkgmaster.devuan.org",
	},
    tests =
	{
	    typ = "table",
	    help = "",
	    value =
	    {
	        "IPv4",
	        "IPv6",
--	        "ftp",
	        "http",
	        "https",
--	        "rsync",
	        "DNS-RR",
	        "Protocol",
--	        "URL-Sanity",
--	        "Integrity",
--	        "Updated",
	    },
	},
}

local defaultURL = {scheme = "http"}
local downloadLock = "flock -n results/wget-"
local download = "wget --timeout=300 -np -N -r -P results "	-- Note wget has a default read timeout of 900 seconds (15 minutes).
local releases = {"jessie", "ascii", "beowulf", "ceres"}
local releaseFiles =
{
    -- Release file.
    "/Release",
    "/InRelease",
    "/main/binary-all/Packages.gz",
    -- Contents files.
    "/main/Contents-all.gz",
    "/main/Contents-amd64.gz",
    "/main/Contents-arm64.gz",
    "-security/main/Contents-all.gz",
    "-security/main/Contents-amd64.gz",
    "-security/main/Contents-arm64.gz",
}
local notExist =
{
    "ceres-security"	-- This will never exist, it's our code name for the testing suite.
}
local referenceDebs =
{
    -- Debian package.
    "merged/pool/DEBIAN/main/d/dash/dash_0.5.8-2.4_amd64.deb",
    -- Debian security package.  NOTE this one should always be redirected?
    "merged/pool/DEBIAN-SECURITY/updates/main/a/apt/apt-transport-https_1.4.9_amd64.deb",
}
local referenceDevs =
{
    -- Devuan package.  NOTE this one should not get redirected, but that's more a warning than an error.
    "merged/pool/DEVUAN/main/d/desktop-base/desktop-base_2.0.3_all.deb",
--    "merged/pool/DEVUAN/main/u/util-linux/util-linux_2.32.1-0.1+devuan2.1_amd64.deb",
}
local arg = {}
local sendArgs = ""
local logFile


local socket = require 'socket'
local ftp = require 'socket.ftp'
local http = require 'socket.http'
local https = require 'ssl.https'	-- See https://github.com/brunoos/luasec/wiki/LuaSec-0.6 for docs.
local url = require 'socket.url'


-- Use this to dump a table to a string.
dumpTable = function (table, space, name)
    local r = ""
    if "" == space then r = r .. space .. name .. " =\n" else r = r .. space .. "[" .. name .. "] =\n" end
    r = r .. space .. "{\n"
    r = r .. dumpTableSub(table, space .. "  ")
    if "" == space then r = r .. space .. "}\n" else r = r .. space .. "},\n" end
    return r
end
dumpTableSub = function (table, space)
    local r = ""
    for k, v in pairs(table) do 
        if type(k) == "string" then k = '"' .. k .. '"' end
	if type(v) == "table" then
	    r = r .. dumpTable(v, space, k)
	elseif type(v) == "string" then
	    r = r .. space .. "[" .. k .. "] = '" .. v .. "';\n"
	elseif type(v) == "function" then
	    r = r .. space .. "[" .. k .. "] = function ();\n"
	elseif type(v) == "userdata" then
	    r = r .. space .. "userdata " .. "[" .. k .. "];\n"
	elseif type(v) == "boolean" then
	    if (v) then
		r = r .. space .. "[" .. k .. "] = true;\n"
	    else
		r = r .. space .. "[" .. k .. "] = false;\n"
	    end
	else
	    r = r .. space .. "[" .. k .. "] = " .. v .. ";\n"
	end
    end
    return r
end


local log = function(v, t, s)
    if v <= verbosity then
	if 3 <= verbosity then t = os.date() .. " " .. t end
	print(t .. ": " .. s)
    end
    if nil ~= logFile then
	logFile:write(os.date() .. " " .. t .. ": " .. s .. "\n")
	logFile:flush()
    end
end
local D = function(s) log(3,  "DEBUG   ", s) end
local I = function(s) log(2,  "INFO    ", s) end
local W = function(s) log(1,  "WARNING ", s) end
local E = function(s) log(0,  "ERROR   ", s) end
local C = function(s) log(-1, "CRITICAL", s) end

local mirrors = {}

local testing = function(t, host)
    for i, v in pairs(options.tests.value) do
	if t == v then
	    local h = mirrors[host]
	    if nil == h then return true end
	    if true == h["Protocols"][t] then return true else D("Skipping " .. t .. " checks for " .. host) end
	end
    end
    return false
end

local checkExes = function (exe)
    local count = io.popen('ps x | grep "' .. exe .. '" | grep -v " grep " | wc -l'):read("*l")
    D(count .. " " .. exe .. " commands still running.")
    return tonumber(count)
end

local repoExists = function (r)
    r = r:match("([%a-]*)")
    if nil == r then return false end
    for k, v in pairs(notExist) do
	if v == r then return false end
    end
    return true
end

local IP = {}
local gatherIPs = function (host)
    if nil == IP[host] then
        local IPs
	local dig = io.popen('dig +keepopen +noall +nottlid +answer ' .. host .. ' A ' .. host .. ' AAAA ' .. host .. ' CNAME ' .. host .. ' SRV | sort -r | uniq')
	repeat
	    IPs = dig:read("*l")
	    if nil ~= IPs then
		for k, t, v in IPs:gmatch("([%w_%-%.]*)%.%s*IN%s*(%a*)%s*(.*)") do
		    if "." == v:sub(-1, -1) then v = v:sub(1, -2) end
		    if nil == IP[k] then IP[k] = {} end
		    IP[k][v] = t
		end
	    end
	until nil == IPs
    end
end

-- Returns FTP directory listing
local nlst = function (u)
    local t = {}
    local p = url.parse(u)
    p.command = "nlst"
    p.sink = ltn12.sink.table(t)
    local r, e = ftp.get(p)
    return r and table.concat(t), e
end

checkHEAD = function (host, URL, r, retry)
    if nil == r then r = 0 end
    if nil == retry then retry = 0 end
    local check = "Checking file"
    if 0 < r then
	check = "Redirecting to"
	--[[ The hard part here is that we end up throwing ALL of the test files at the redirected location.
	    Not good for deb.debian.org, which we should only be throwing .debs at.
	    What we should do is loop through the DNS entries, and only test the specific protocol & file being tested here.

	    This is what I came up with for checking if we are already testing a specific URL.
	    Still duplicates a tiny bit, but much less than the previous find based method.
	]]
	local pl = url.parse(URL, defaultURL)
	local file = host .. "://" .. pl.path
        local f = io.popen(string.format('if [ ! -f results/%s.check ] ; then touch results/%s.check; echo -n "check"; fi', file:gsub("/", "_"), file:gsub("/", "_") )):read("*a")
	if (nil == f) or ("check" == f) then
	    I("  Now checking redirected host " .. file)
	    checkRedirects(host, host, nil, "redir", pl.path)
	else
	    D("  Already checking " .. file)
	end

    end
    if 0 < retry then
-- TODO - should have a random sleep here before retrying.
	check = "Retry " .. retry .. " " .. check
    end
    if 10 < r then
	E("too many redirects!  " .. check .. " " .. host .. " -> " .. URL)
	return
    end
    if 10 < retry then
	E("too many retries!  " .. check .. " " .. host .. " -> " .. URL)
	return
    end
    local PU = url.parse(URL, defaultURL)
    D(PU.scheme .. " ://  " .. check .. " " .. host .. " -> " .. URL)
    if not testing(PU.scheme, host) then D("Not testing " .. PU.scheme .. " " .. host .. " -> " .. URL);  return end
    -- TODO - Perhaps we should try it anyway, and mark it as a warning if it DOES work?
    if "https" == PU.scheme and "deb.devuan.org" == host then D("Not testing " .. PU.scheme .. " " .. host .. " -> " .. URL .. " mirrors shouldn't have the correct cert.");  return end
    local hd = {Host = host}
    local htp = http;
    if PU.scheme == "https" then htp = https end
    -- NOTE - the docs for lua-sec say that redirect isn't supported is version 0.6, no idea if that means it ignores redirections like we want.
    --		The protocol and options are lua-sec specific arguments.
    local p, c, h, s = htp.request{method = "HEAD", redirect = false, url = URL, headers = hd, protocol = "any", options = "all"}
    if nil == s then s = "" end
    if nil == p then
	E("  " .. c .. " " .. s .. "!   " .. check .. " " .. host .. " -> " .. URL)
	-- So far the only errors are "timeout", "Network is unreachable", and "closed", and I suspect "closed" is due to saturating my bandwidth.
	-- Might be worthwhile retrying those, some number of times.
	if ("closed" == c) or ("Network is unreachable" == c) or ("timeout" == c) then checkHEAD(host, URL, r, retry + 1) end
    else
	if ("4" == tostring(c):sub(1, 1)) or ("5" == tostring(c):sub(1, 1)) then
	    E("  " .. c .. " " .. s .. ".   " .. check .. " " .. host .. " -> " .. URL)
	else
	    I("  " .. c .. " " .. s .. ".   " .. check .. " " .. host .. " -> " .. URL)
	end
	l = h.location
	if nil ~= l then
	    local pu = url.parse(l, defaultURL)
	    if pu.scheme ~= PU.scheme then
		if testing("Protocol") then
		    W("    protocol changed during redirect!  " .. check .. " " .. host .. " -> " .. URL .. " -> " .. l)
		end
	    elseif l == URL then
		E("    redirect loop!  " .. check .. " " .. host .. " -> " .. URL)
	    elseif nil == pu.host then
		W("    no location host!  " .. check .. " " .. host .. " -> " .. URL .. " -> " .. l)
		checkHEAD(host, PU.scheme .. "://" .. PU.host .. l, r + 1)
	    else
		checkHEAD(pu.host, l, r + 1)
	    end
	end
    end
end

local checkPaths = function (host, ip, path, file)
    if nil ~= file then
	if "redirect" == ip then ip = host end
	I("  Checking IP for file " .. host .. " -> " .. ip .. " " .. path .. " " .. file)
	if testing("http", host)  then checkHEAD(host, "http://"  .. ip .. path .. "/" .. file) end
	if testing("https", host) then checkHEAD(host, "https://" .. ip .. path .. "/" .. file) end
    else
	I("  Checking IP " .. host .. " -> " .. ip .. " " .. path)
	for i, s in pairs(referenceDevs) do
	    if testing("http", host)  then checkHEAD(host, "http://"  .. ip .. path .. "/" .. s) end
	    if testing("https", host) then checkHEAD(host, "https://" .. ip .. path .. "/" .. s) end
	end

	for i, s in pairs(releases) do
	    for j, k in pairs(releaseFiles) do
		if repoExists(s .. k) then
		    if testing("http", host)  then checkHEAD(host, "http://"  .. ip .. path .. "/merged/dists/" .. s .. k) end
		    if testing("https", host) then checkHEAD(host, "https://" .. ip .. path .. "/merged/dists/" .. s .. k) end
		end
	    end
	end
    end
end

local execute = function (s)
    D("  executing " .. s)
    os.execute(s)
end

checkRedirects = function (orig, host, path, ip, file)
    if nil == host then host = orig end
    if nil == path then path = "" end
    if nil == file then file = "" end
    local ph = url.parse("http://" .. host)
    if (nil ~= ip) and ("redir" ~= ip) then
	local po = url.parse("http://" .. orig)
	if "" ~= file then
	    D("checking redirected file " .. po.host .. " " .. file)
	    checkPaths(po.host, ip, path, file)
	else
	    checkPaths(po.host, ip, path)
	end
    else
	if orig == host then D("checkRedirects " .. orig .. "" .. file) else D("checkRedirects " .. orig .. " -> " .. host) end
-- TODO - use checkPaths() here ^^^ on the original domain name, coz that's not getting caught yet.  I think.
	gatherIPs(ph.host)
	for k, v in pairs(IP[ph.host]) do
	    D("  DNS record " .. v .. " " .. ph.host .. " -> " .. k)
	    if v == "A" then
    		if testing("IPv4") then execute("ionice -c3 ./mirror-checker.lua " .. sendArgs .. " " .. orig .. path .. " " .. k .. " " .. file .." &") end
	    elseif v == "AAAA" then
		if testing("IPv6") then execute("ionice -c3 ./mirror-checker.lua " .. sendArgs .. " " .. orig .. path .. " [" .. k .. "] " .. file .. " &") end
	    elseif v == "CNAME" then
		checkRedirects(orig, k, path, ip, file)  -- Check the original, with the DNS records from the CNAME.  Do not check the CNAME, it's just a source of IPs.
	    elseif v == "SRV" then
		print("SVR record found, now what do we do?")
	    end
	end
    end
end

local downloads = function (cut, host, URL)
    if 0 ~= cut then cd = " --cut-dirs=" .. cut .. " " else cd = "" end
    if nil == URL then URL = "/" end
    local lock = "%s-" .. host .. ".log "
    local log = " --rejected-log=results/wget-%s_REJECTS-" .. host .. ".log -a results/wget-%s-" .. host .. ".log "
    I("starting file download commands for " .. host .. " " .. URL)
    local cm = "ionice -c3 " .. downloadLock .. lock:format("debs") .. download .. log:format("debs", "debs") .. cd
    for i, s in pairs(referenceDevs) do
	cm = cm .. " https://" .. host .. URL .. "/" .. s
    end
    for i, s in pairs(referenceDebs) do
	cm = cm .. " https://" .. host .. URL .. "/" .. s
    end
    for i, s in pairs(releases) do
	execute(cm .. " &")
	cm = "ionice -c3 " .. downloadLock .. lock:format(s) .. download .. log:format(s, s) .. cd
	if repoExists(s .. k) then
	    for j, k in pairs(releaseFiles) do
		cm = cm .. " https://" .. host .. URL .. "/merged/dists/" .. s .. k
	    end
	end
    end
    execute(cm .. " &")
end

local getMirrors = function ()
    local mirrors = {}
    local host = ""
    local m = {}
    local active = true
    local URL = "https://" .. options.referenceSite.value .. "/mirror_list.txt"
    I("getting mirrors.")
    local p, c, h = http.request(URL)
    if nil == p then E(c .. " fetching " .. URL) else
	for l in p:gmatch("\n*([^\n]+)\n*") do
	    local t, d = l:match("(%a*):%s*(.*)")
	    d = string.lower(d)
	    if "FQDN" == t then
		if "" ~= host then
		    if active then mirrors[host] = m end
		    m = {}
		    active = true
		end
		host = d
		m[t] = d
	    elseif "Protocols" == t then
		local prot = {}
		for w in d:gmatch("(%w+)") do
		    prot[w] = true;
		end
		m[t] = prot
	    elseif "Active" == t and nil == d:find("yes", 1, true) then
		W("Mirror " .. host .. " is not active - " .. d)
		active = false
	    else
		m[t] = d
	    end
	end
	if "" ~= host and active then
	    mirrors[host] = m
	end
    end
    local file, e = io.open("results/mirrors.lua", "w+")
    if nil == file then C("opening mirrors file - " .. e) else
	file:write(dumpTable(mirrors, "", "mirrors") .. "\nreturn mirrors\n")
        file:close()
    end
    return mirrors
end


if 0 ~= #args then
    local option = ""
    for i, a in pairs(args) do
	if ("--help" == a) or ("-h" == a) then
	    print("I should write some docs, huh?  Read README.md for instructions.")
	elseif "--version" == a then
	    print("mirror-checker-lua version 0.1 WIP development version")
	elseif "-v" == a then
	    verbosity = verbosity + 1
	    sendArgs = sendArgs .. a .. " "
	elseif "-q" == a then
	    verbosity = -1
	    sendArgs = sendArgs .. a .. " "
	elseif "-k" == a then
	    keep = true
	elseif "-n" == a then
	    fork = false
	elseif "--" == a:sub(1, 2) then
	    local s, e = a:find("=")
	    if nil == s then e = -1 end
	    option = a:sub(3, e - 1)
	    local o = options[option]
	    if nil == o then
		print("Unknown option --" .. option)
		option = ""
	    else
		option = a
		sendArgs = sendArgs .. a .. " "
		local s, e = a:find("=")
		if nil == s then e = 0 end
		option = a:sub(3, e - 1)
		if "table" == options[option].typ then
		    local result = {}
		    for t in (a:sub(e + 1) .. ","):gmatch("([+%-]?%w*),") do
			local f = t:sub(1, 1)
			local n = t:sub(2, -1)
			if ("+" ~= f) and ("-" ~= f) then
			    table.insert(result, t)
			end
		    end
		    if 0 ~= #result then
			options[option].value = result
		    else
			for t in (a:sub(e + 1) .. ","):gmatch("([+%-]?%w*),") do
			    local f = t:sub(1, 1)
			    local n = t:sub(2, -1)
			    if "+" == f then
				table.insert(options[option].value, n)
			    elseif "-" == f then
				local r = {}
				for i, k in pairs(options[option].value) do
				    if k ~= n then table.insert(r, k) end
				end
				options[option].value = r
			    end
			end
		    end
		else
		    options[option].value = a
		end
		option = ""
	    end
	elseif "-" == a:sub(1, 1) then
	    print("Unknown option " .. a)
	else
	    table.insert(arg, a)
	end
    end
end

--print(dumpTable(options.tests.value, "", "tests"))

execute("mkdir -p results")

if 0 < #arg then
    if "/" == arg[1]:sub(-1, -1) then
	W("slash at end of path!  " .. arg[1])
	arg[1] = arg[1]:sub(1, -2)
    end
    local pu = url.parse("http://" .. arg[1])
    if nil ~= arg[2] then
	logFile, e = io.open("results/mirror-checker-lua_" .. pu.host .. "_" .. arg[2] .. ".log", "a+")
    else
	logFile, e = io.open("results/mirror-checker-lua_" .. pu.host .. ".log", "a+")
    end
    if nil == logFile then C("opening log file - " .. e); return end
    I("Starting tests for " ..arg[1] .. " with these tests - " .. table.concat(options.tests.value, ", "))
    mirrors = loadfile("results/mirrors.lua")()
--print(dumpTable(mirrors, "", "mirrors"))
    if nil ~= arg[2] then I("  Using IP " .. arg[2]) end
    if nil ~= arg[3] then I("  Using file " .. arg[3]); end
    if testing("Integrity") or testing("Updated") then
	if nil == arg[3] then
	    if not keep then execute("rm -fr results/" .. pu.host) end
	    cut = 0
	    for t in arg[1]:gmatch("(/)") do
		cut = cut + 1
	    end
	    downloads(cut, pu.host, pu.path)
	    checkExes("mirror-checker.lua " .. sendArgs)
	    checkExes(downloadLock)
	end
    end
    checkRedirects(pu.host, pu.host, pu.path, arg[2], arg[3])
    logFile:close()
else
    if not keep then os.execute("rm -f results/*.log") end
    os.execute("rm -f results/*.check")
    os.execute("mkdir -p results; touch results/stamp")
    logFile, e = io.open("results/mirror-checker-lua.log", "a+")
    if nil == logFile then C("opening log file - " .. e); return end
    I("Starting tests " .. table.concat(options.tests.value, ", "))
    execute("mkdir -p results")
    mirrors = getMirrors()
--print(dumpTable(mirrors, "", "mirrors"))
    mirrors[options.referenceSite.value] = nil
    checkRedirects(options.referenceSite.value)
--    forkIP(options.referenceSite.value)
    checkRedirects("deb.devuan.org")
--    forkIP("deb.devuan.org")
    for k, m in pairs(mirrors) do
	if "/" == m.BaseURL:sub(-1, -1) then
	    W("slash at end of BaseURL in mirror_list.txt!  " .. m.BaseURL)
	    m.BaseURL = m.BaseURL:sub(1, -2)
	end
	local pu = url.parse("http://" .. m.BaseURL)
	checkRedirects(m.BaseURL)
--	forkIP(m.BaseURL)
        checkExes("mirror-checker.lua " .. sendArgs)
        if testing("Integrity") or testing("Updated") then checkExes(downloadLock) end
    end
    while 1 <= checkExes("mirror-checker.lua " .. sendArgs) do os.execute("sleep 30") end
    if testing("Integrity") or testing("Updated") then
	while 0 < checkExes(downloadLock) do os.execute("sleep 30") end
    end
    os.execute("rm -f results/*.check")
    logFile:close()
end