Replace requests with urllib for HTTP requests in JSON file retrieval, enhancing compatibility and removing the test_regex.py file as it is no longer needed.

This commit is contained in:
2025-07-29 19:18:09 +02:00
parent da4b380b1e
commit c92f583609
2 changed files with 17 additions and 56 deletions

24
main.py
View File

@@ -6,19 +6,25 @@
import sys
import galdPl
import requests
import urllib.request
import urllib.parse
import re
import os
def get_json_files_from_folder(folder):
base_url = "https://git.gald.site/gald/galdistream/src/branch/main/resources/"
url = base_url + folder
r = requests.get(url, timeout=10)
r.raise_for_status()
# Použijeme urllib místo requests
req = urllib.request.Request(url)
req.add_header('User-Agent', 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36')
with urllib.request.urlopen(req, timeout=10) as response:
html_content = response.read().decode('utf-8')
# Hledáme JSON soubory pomocí regex
json_pattern = r'href="(/gald/galdistream/src/branch/main/resources/[^"]*\.json)"'
matches = re.findall(json_pattern, r.text)
matches = re.findall(json_pattern, html_content)
files = []
for match in matches:
@@ -41,11 +47,15 @@ def update_json_db():
url = base_url_raw + file
local_path = "resources/" + file
try:
r = requests.get(url, timeout=10)
r.raise_for_status()
req = urllib.request.Request(url)
req.add_header('User-Agent', 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36')
with urllib.request.urlopen(req, timeout=10) as response:
content = response.read()
os.makedirs(os.path.dirname(local_path), exist_ok=True)
with open(local_path, "wb") as f:
f.write(r.content)
f.write(content)
except Exception as e:
print(f"Chyba při stahování {file}: {e}")