nDPI/utils/mining_list_update.py
JH ebb47c9a84
Add auto-updating cryptocurrency mining pool lists (#2891)
Co-authored-by: Ivan Nardi <nardi.ivan@gmail.com>
2025-07-01 20:27:22 +02:00

126 lines
No EOL
3.7 KiB
Python
Executable file

#!/usr/bin/env python3
import os
import requests
import re
from datetime import datetime
import time
import sys
# Configuration
URL = "https://minerstat.com/mining-pool-whitelist.txt"
SCRIPT_DIR = os.path.dirname(os.path.abspath(__file__))
DOMAIN_LIST_PATH = os.path.join(SCRIPT_DIR, "../lists/42_mining_domain.list")
IP_LIST_PATH = os.path.join(SCRIPT_DIR, "../lists/protocols/42_mining_ip.list")
TEMP_FILE = os.path.join(SCRIPT_DIR, "minerstat_temp.txt")
def download_file():
print(f"Downloading file... {URL}...")
start_time = time.time()
try:
response = requests.get(URL, timeout=30)
response.raise_for_status()
with open(TEMP_FILE, "w") as f:
f.write(response.text)
dl_time = time.time() - start_time
print(f"Download completed in {dl_time:.2f}s, saved to {TEMP_FILE}")
return True
except Exception as e:
print(f"Download failed: {str(e)}")
return False
def process_file():
domains = []
ips = set() # IP deduplication
domain_count = 0
ip_count = 0
skip_count = 0
# Precompiled regular expressions improve efficiency
ip_pattern = re.compile(r'^\d{1,3}\.\d{1,3}\.\d{1,3}\.\d{1,3}$')
start_time = time.time()
with open(TEMP_FILE, "r") as f:
for line in f:
line = line.strip()
if not line or line.startswith("#"):
skip_count += 1
continue
parts = line.split(maxsplit=1)
if len(parts) < 2:
skip_count += 1
continue
ip, domain = parts[0], parts[1]
# IP deduplication
if ip_pattern.match(ip):
ips.add(f"{ip}/32")
ip_count += 1
domains.append(domain)
domain_count += 1
proc_time = time.time() - start_time
print(f"(2) Processed {domain_count} domains and {ip_count} IPs in {proc_time:.4f}s")
print(f"Skipped {skip_count} invalid lines")
return domains, ips
def save_lists(domains, ips):
os.makedirs(os.path.dirname(DOMAIN_LIST_PATH), exist_ok=True)
os.makedirs(os.path.dirname(IP_LIST_PATH), exist_ok=True)
# Write to DOMAIN_LIST
start_time = time.time()
with open(DOMAIN_LIST_PATH, "w") as f:
f.write(f"# Generated at {datetime.now().isoformat()}\n")
f.write("\n".join(domains))
domain_time = time.time() - start_time
# Write to IP_LIST
start_time = time.time()
with open(IP_LIST_PATH, "w") as f:
f.write(f"# Generated at {datetime.now().isoformat()}\n")
f.write("\n".join(ips))
ip_time = time.time() - start_time
print(f"(3) Domain list path: {os.path.abspath(DOMAIN_LIST_PATH)}")
print(f"IP list path: {os.path.abspath(IP_LIST_PATH)}")
print(f"Saved {len(domains)} domains in {domain_time:.4f}s")
print(f"Saved {len(ips)} IPs in {ip_time:.4f}s")
def main():
total_start = time.time()
print(f"(1) Starting update at {datetime.now().isoformat()}")
try:
if not download_file():
return 1
domains, ips = process_file()
save_lists(domains, ips)
# Clean up TEMP_FILE
if os.path.exists(TEMP_FILE):
os.remove(TEMP_FILE)
print(f"Removed temporary file: {TEMP_FILE}")
total_time = time.time() - total_start
print(f"Update completed in {total_time:.2f} seconds")
return 0
except Exception as e:
print(f"Error occurred: {str(e)}")
return 1
if __name__ == "__main__":
sys.exit(main())