-
-
Notifications
You must be signed in to change notification settings - Fork 30
/
Copy pathwayback.py
80 lines (60 loc) · 2.29 KB
/
wayback.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
#!/usr/bin/env python3
import requests
from datetime import date
class Colors:
RED = '\033[31m'
GREEN = '\033[32m'
CYAN = '\033[36m'
WHITE = '\033[0m'
YELLOW = '\033[33m'
WAYBACK_AVAIL_URL = 'http://archive.org/wayback/available'
WAYBACK_SEARCH_URL = 'http://web.archive.org/cdx/search/cdx'
def print_status(status, color, message):
print(f'{Colors.YELLOW}[!] {Colors.CYAN}{message}', end='') #, flush=True
print(f'{color}[' + '.'.rjust(5, '.') + f' {status} ]{Colors.WHITE}')
def check_wayback_availability(target):
avail_data = {'url': target}
try:
check_rqst = requests.get(WAYBACK_AVAIL_URL, params=avail_data, timeout=10)
check_sc = check_rqst.status_code
if check_sc == 200:
check_data = check_rqst.json()
if check_data['archived_snapshots']:
print_status('Available', Colors.GREEN, 'Checking Availability on Wayback Machine')
return True
else:
print_status('N/A', Colors.RED, 'Checking Availability on Wayback Machine')
else:
print(f'\n{Colors.RED}[-] Status : {Colors.CYAN}{check_sc}{Colors.WHITE}')
except Exception as e:
print(f'\n{Colors.RED}[-] Exception : {Colors.CYAN}{e}{Colors.WHITE}')
return False
def fetch_wayback_links(target):
if not check_wayback_availability(target):
return
print_status('Fetching URLs', Colors.CYAN, 'Fetching URLs')
curr_yr = date.today().year
last_yr = curr_yr - 5
payload = {
'url': f'{target}/*',
'fl': 'original',
'fastLatest': 'true',
'from': str(last_yr),
'to': str(curr_yr)
}
try:
r = requests.get(WAYBACK_SEARCH_URL, params=payload)
r_sc = r.status_code
if r_sc == 200:
r_data = set(r.text.split('\n'))
print_status(len(r_data), Colors.GREEN, f'Fetching URLs')
result = {'links': list(r_data), 'exported': False}
print("\n[Wayback Links]")
for link in r_data:
print(link)
else:
print_status(r_sc, Colors.RED, 'Fetching URLs')
except Exception as e:
print(f'\n{Colors.RED}[-] Exception : {Colors.CYAN}{e}{Colors.WHITE}')
if __name__ == '__main__':
fetch_wayback_links(target='spyboy.in')