-
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathTool-13-Geolocation-Tagger.py
More file actions
230 lines (186 loc) · 7.55 KB
/
Tool-13-Geolocation-Tagger.py
File metadata and controls
230 lines (186 loc) · 7.55 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
import json
import requests
import time
from dotenv import load_dotenv
import os
from datetime import datetime
import socket
# Load API key and rate limit from .env file
load_dotenv(".env")
# ipinfo.io access token; None when IPINFO_API_TOKEN is not set
API_KEY = os.getenv("IPINFO_API_TOKEN")
# Maximum number of ipinfo.io requests per minute used for throttling
RATE_LIMIT = int(os.getenv("IPINFO_RATE_LIMIT", 60))  # Default to 60 if not specified
# Define the input file (JSON object keyed by account id; it is read and
# rewritten in place by the update functions below)
INPUT_FILE = "../Database-Files/Edit-Database/Compromised-Discord-Accounts.json"
CACHE_FILE = "domain_cache.json"  # File to store cached domain results
# Base URL of the lookup endpoint; "<ip>/json" is appended per request
IPINFO_URL = "https://ipinfo.io/"
# Domains that should be automatically set to US
# (no DNS resolution or API request is made for these)
AUTO_US_DOMAINS = {
    "discord.com",
    "discord.gg",
    "steamcommunity.com",
    "funpay.com",
    "mediafire.com",
    "t.me",
    "t.co",
    "telegra.ph",
    "telegram.com",
}
def load_cache():
    """Load the persisted domain -> country cache from ``CACHE_FILE``.

    Returns:
        dict: The cached mapping, or an empty dict when the file is missing,
        is not valid JSON, or does not contain a JSON object.
    """
    try:
        with open(CACHE_FILE, "r", encoding="utf-8") as file:
            cache = json.load(file)
    except (FileNotFoundError, json.JSONDecodeError):
        return {}
    # Callers look up and assign entries by domain, so anything other than a
    # JSON object (e.g. a list or null left behind by a bad edit) is treated
    # like a missing cache instead of failing later in the run.
    if not isinstance(cache, dict):
        return {}
    return cache
def save_cache(cache):
    """Write *cache* to ``CACHE_FILE`` as 4-space-indented JSON, replacing any previous content."""
    with open(CACHE_FILE, "w", encoding="utf-8") as handle:
        handle.write(json.dumps(cache, indent=4))
def log(message):
    """Print *message* prefixed with the current local time in square brackets."""
    now = datetime.now()
    print("{} {}".format(now.strftime("[%Y-%m-%d %H:%M:%S]"), message))
def resolve_ip(domain):
    """Resolve *domain* to an IP address string.

    Args:
        domain: Host name to look up.

    Returns:
        The address returned by ``socket.gethostbyname``, or ``None`` when
        the name cannot be resolved. Failures are logged, never raised.
    """
    try:
        # Resolve the domain to an IP address
        ip_address = socket.gethostbyname(domain)
    except (OSError, UnicodeError) as e:
        # gaierror, herror and timeouts are all OSError subclasses.
        # UnicodeError is raised for names that cannot be IDNA-encoded
        # (empty or over-long labels such as "a..com"). A single bad domain
        # must not abort the whole tagging run.
        log(f"Error resolving {domain} to IP: {e}")
        return None
    log(f"Resolved {domain} to IP: {ip_address}")
    return ip_address
def get_geolocation(domain, cache):
    """Return the country ipinfo.io reports for the host behind *domain*.

    Lookup order: the ``AUTO_US_DOMAINS`` shortcut, then *cache*, then DNS
    resolution followed by an ipinfo.io request.

    Args:
        domain: Host name to geolocate.
        cache: Mutable mapping of domain -> country. It is updated in place
            when the API returns a successful response.

    Returns:
        ``"US"`` for domains in ``AUTO_US_DOMAINS``, the cached value when one
        exists, the ``"country"`` field of the API response, or ``"N/A"``
        when resolution or the request fails or the response has no country.
    """
    if domain in AUTO_US_DOMAINS:
        log(f"Skipping API call for {domain}, setting to US")
        return "US"

    # Check cache first
    if domain in cache:
        log(f"Using cached result for {domain}: {cache[domain]}")
        return cache[domain]

    # Resolve the domain to an IP address
    ip_address = resolve_ip(domain)
    if not ip_address:
        return "N/A"  # Skip to the next domain if IP resolution fails

    try:
        log(f"Querying ipinfo.io for IP: {ip_address}")
        response = requests.get(
            f"{IPINFO_URL}{ip_address}/json",
            params={"token": API_KEY},
            # Without a timeout a stalled connection would block the run forever.
            timeout=10,
        )
        # Treat 4xx/5xx (bad token, rate limiting, outages) as failures so a
        # transient error is not mistaken for "no country" and cached below.
        response.raise_for_status()
        data = response.json()
    except (requests.RequestException, ValueError) as e:
        # ValueError covers a non-JSON body on Requests versions whose JSON
        # decode error is not a RequestException subclass.
        log(f"Error querying {domain} (IP: {ip_address}): {e}")
        return "N/A"

    country = data.get("country", "N/A") if isinstance(data, dict) else "N/A"
    log(f"Received response for {domain} (IP: {ip_address}): {country}")
    # Update cache with new result
    cache[domain] = country
    return country
def count_urls_to_check():
    """Log how many accounts in ``INPUT_FILE`` have a final URL domain.

    Three lines are logged: the total number of accounts with a non-empty
    ``FINAL_URL_DOMAIN``, how many of those are in ``AUTO_US_DOMAINS``, and
    how many remain.
    """
    with open(INPUT_FILE, "r", encoding="utf-8") as handle:
        records = json.load(handle)

    # Only accounts that actually carry a domain are counted.
    domains = [record.get("FINAL_URL_DOMAIN", "") for record in records.values()]
    present = [domain for domain in domains if domain]
    auto_us = sum(1 for domain in present if domain in AUTO_US_DOMAINS)
    remaining = len(present) - auto_us

    log(f"Total URLs to check: {auto_us + remaining}")
    log(f" URLs automatically set to US: {auto_us}")
    log(f" URLs that will be checked: {remaining}")
def update_auto_us_domains(accounts):
    """Tag every account whose final URL domain is in ``AUTO_US_DOMAINS`` as "US".

    Matching entries of *accounts* are modified in place: their
    ``SUSPECTED_REGION_OF_ORIGIN`` becomes ``"US"`` and ``LAST_CHECK`` is set
    to a single UTC timestamp shared by the whole pass. When at least one
    entry changed, *accounts* is written back to ``INPUT_FILE``.
    """
    stamp = datetime.utcnow().isoformat()
    touched = 0

    for case_id, record in accounts.items():
        domain = record.get("FINAL_URL_DOMAIN", "")
        if domain not in AUTO_US_DOMAINS:
            continue
        record["SUSPECTED_REGION_OF_ORIGIN"] = "US"
        record["LAST_CHECK"] = stamp
        touched += 1
        log(f"Updated {case_id}: {domain} -> US | Last Check: {stamp}")

    if touched > 0:
        with open(INPUT_FILE, "w", encoding="utf-8") as handle:
            json.dump(accounts, handle, indent=4)
        log(f"Updated {touched} cases with AUTO_US domains to US")
def update_compromised_accounts(start_from=0):
    """Tag the accounts in ``INPUT_FILE`` with a suspected region of origin.

    Accounts whose domain is in ``AUTO_US_DOMAINS`` are handled first by
    ``update_auto_us_domains`` (for the whole file, regardless of
    *start_from*). Every remaining account with a non-empty
    ``FINAL_URL_DOMAIN`` is then filled in from the domain cache or from
    ``get_geolocation``, and the file is rewritten after each update so an
    interrupted run can be resumed.

    Args:
        start_from: Zero-based position (in file order) of the first account
            to process in the lookup pass. Earlier accounts are skipped.
    """
    # Load cache at start
    domain_cache = load_cache()
    log(f"Loaded {len(domain_cache)} cached domain results")

    with open(INPUT_FILE, "r", encoding="utf-8") as file:
        accounts = json.load(file)

    total_cases = len(accounts)
    updated_count = 0
    unknown_count = 0
    skipped_count = 0
    request_counter = 0
    cached_count = 0
    log(f"Found {total_cases} cases in {INPUT_FILE}")

    # First, update all cases with AUTO_US domains
    update_auto_us_domains(accounts)

    # Then, process the rest with the API
    try:
        for i, (account_id, details) in enumerate(accounts.items()):
            if i < start_from:
                continue
            final_url_domain = details.get("FINAL_URL_DOMAIN", "")
            if not final_url_domain or final_url_domain in AUTO_US_DOMAINS:
                continue

            current_time = datetime.utcnow().isoformat()
            api_answered = False

            if final_url_domain in domain_cache:
                # Check if we have a cached result for this domain
                cached_result = domain_cache[final_url_domain]
                details["SUSPECTED_REGION_OF_ORIGIN"] = cached_result
                details["LAST_CHECK"] = current_time
                cached_count += 1
                log(
                    f"Used cached result for {account_id}: {final_url_domain} -> {cached_result} | Last Check: {current_time}"
                )
            else:
                # No cached result, process normally
                country = get_geolocation(final_url_domain, domain_cache)
                details["SUSPECTED_REGION_OF_ORIGIN"] = country
                details["LAST_CHECK"] = current_time
                if country == "US":
                    skipped_count += 1
                elif country == "N/A":
                    unknown_count += 1
                else:
                    updated_count += 1
                log(
                    f"Updated {account_id}: {final_url_domain} -> {country} | Last Check: {current_time}"
                )
                # get_geolocation stores a domain in the cache only after the
                # API has answered, so "newly cached" is the signal that a
                # request was spent. Testing "not in domain_cache" here, as
                # before, could never be true after a successful lookup and
                # silently disabled the rate limiting below.
                api_answered = final_url_domain in domain_cache

            # Save progress after each update
            with open(INPUT_FILE, "w", encoding="utf-8") as file:
                json.dump(accounts, file, indent=4)

            # Only count the request and throttle if we actually queried the API
            if api_answered:
                request_counter += 1
                if request_counter >= RATE_LIMIT:
                    log(
                        f"Reached API rate limit ({RATE_LIMIT} per minute), sleeping for 60 seconds..."
                    )
                    time.sleep(60)
                    request_counter = 0
                else:
                    time.sleep(60 / RATE_LIMIT)  # Distribute requests evenly
    finally:
        # Persist the cache even when the run is interrupted or fails, so
        # lookups already paid for are not repeated on the next run.
        save_cache(domain_cache)
        log(f"Saved {len(domain_cache)} domain results to cache")

    log(
        f"Update complete: {updated_count} updated, {unknown_count} set to N/A, {skipped_count} auto-set to US, {cached_count} from cache"
    )
if __name__ == "__main__":
    count_urls_to_check()  # Print the count before starting the update

    # Ask the user if they want to process the full file or start from a specific case number
    user_input = (
        input(
            "Do you want to process the full file (F) or start from a specific case number (S)? "
        )
        .strip()
        .lower()
    )
    if user_input == "s":
        # Keep asking until a usable number is entered; a typo here used to
        # end the script with an unhandled ValueError.
        while True:
            raw_start = input("Enter the case number to start from: ").strip()
            try:
                start_from = int(raw_start)
            except ValueError:
                log(f"'{raw_start}' is not a whole number, please try again")
                continue
            if start_from < 0:
                log("The case number cannot be negative, please try again")
                continue
            break
        update_compromised_accounts(start_from)
    else:
        update_compromised_accounts()