Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
1N3
GitHub Repository: 1N3/Sn1per
Path: blob/master/bin/waybackurls.py
2960 views
1
import requests
2
import sys
3
import json
4
5
6
def waybackurls(host, with_subs, timeout=30):
    """Fetch the archived URLs known to the Wayback Machine for *host*.

    Queries the web.archive.org CDX search endpoint, asking for JSON output
    restricted to the ``original`` field and collapsed on ``urlkey``.

    Args:
        host: Host (or host/path prefix) interpolated verbatim into the
            ``url=`` query parameter.
        with_subs: When truthy the query pattern is ``*.<host>/*`` so that
            subdomains are matched as well; otherwise it is ``<host>/*``.
        timeout: Seconds handed to ``requests.get``. Without a timeout a
            stalled connection would block the caller indefinitely.

    Returns:
        The decoded JSON payload with its first element removed.
        NOTE(review): per the CDX server docs the first row of JSON output
        is the field-name header, which is presumably why it is dropped.
        An empty payload yields an empty list.

    Raises:
        requests.exceptions.RequestException: on connection failure,
            timeout, or a 4xx/5xx response (via ``raise_for_status``).
        ValueError: if the response body is not valid JSON.
    """
    if with_subs:
        url = 'http://web.archive.org/cdx/search/cdx?url=*.%s/*&output=json&fl=original&collapse=urlkey' % host
    else:
        url = 'http://web.archive.org/cdx/search/cdx?url=%s/*&output=json&fl=original&collapse=urlkey' % host

    r = requests.get(url, timeout=timeout)
    # Fail with a clear HTTP error instead of a JSON decode error on an
    # HTML error page returned by the archive.
    r.raise_for_status()

    results = r.json()
    return results[1:]
14
15
16
if __name__ == '__main__':
    # Command-line entry point:
    #   python3 waybackurls.py <url> [include_subdomains]
    # Looks up archived URLs for <url> and, when any are found, writes them
    # as JSON to "<url>-waybackurls.json" in the current directory.
    argc = len(sys.argv)
    if argc < 2:
        print('Usage:\n\tpython3 waybackurls.py <url> <include_subdomains:optional>')
        sys.exit()

    host = sys.argv[1]
    # The mere presence of a second argument enables subdomain matching.
    # The previous check (argc > 3) required two extra arguments, so the
    # documented single optional flag never took effect.
    with_subs = argc > 2

    urls = waybackurls(host, with_subs)
    if urls:
        filename = '%s-waybackurls.json' % host
        with open(filename, 'w') as f:
            # Serialize only when there is something to save.
            f.write(json.dumps(urls))
        print('[*] Saved results to %s' % filename)
    else:
        print('[-] Found nothing')
36
37