#!/usr/bin/env python3 import os import json import asyncio import aiohttp import tarfile # Получаем ключи и данные из переменных окружения STEAM_KEY = os.environ.get('STEAM_KEY') LINUX_GAMING_API_KEY = os.environ.get('LINUX_GAMING_API_KEY') LINUX_GAMING_API_USERNAME = os.environ.get('LINUX_GAMING_API_USERNAME') # Конфигурация API STEAM_BASE_URL = "https://api.steampowered.com/IStoreService/GetAppList/v1/?" LINUX_GAMING_BASE_URL = "https://linux-gaming.ru" CATEGORY_STEAM = "games" CATEGORY_LINUX_GAMING = "ppdb" LINUX_GAMING_HEADERS = { "Api-Key": LINUX_GAMING_API_KEY, "Api-Username": LINUX_GAMING_API_USERNAME } def normalize_name(s): """ Приведение строки к нормальному виду: - перевод в нижний регистр, - удаление символов ™ и ®, - замена разделителей (-, :, ,) на пробел, - удаление лишних пробелов, - удаление суффиксов 'bin' или 'app' в конце строки, - удаление ключевых слов типа 'ultimate', 'edition' и т.п. """ s = s.lower() for ch in ["™", "®"]: s = s.replace(ch, "") for ch in ["-", ":", ","]: s = s.replace(ch, " ") s = " ".join(s.split()) for suffix in ["bin", "app"]: if s.endswith(suffix): s = s[:-len(suffix)].strip() keywords_to_remove = {"ultimate", "edition", "definitive", "complete", "remastered"} words = s.split() filtered_words = [word for word in words if word not in keywords_to_remove] return " ".join(filtered_words) def process_steam_apps(steam_apps): """ Для каждого приложения из Steam добавляет ключ "normalized_name", содержащий нормализованное значение имени (поле "name"), и удаляет ненужные поля: "name", "last_modified", "price_change_number". """ for app in steam_apps: original = app.get("name", "") if not app.get("normalized_name"): app["normalized_name"] = normalize_name(original) app.pop("name", None) app.pop("last_modified", None) app.pop("price_change_number", None) return steam_apps async def get_app_list(session, last_appid, endpoint): """ Получает часть списка приложений из API Steam. Если last_appid передан, добавляет его к URL для постраничной загрузки. """ url = endpoint if last_appid: url = f"{url}&last_appid={last_appid}" async with session.get(url) as response: response.raise_for_status() return await response.json() async def fetch_games_json(session): """ Загружает JSON с данными из AreWeAntiCheatYet и извлекает поля normalized_name и status. """ url = "https://raw.githubusercontent.com/AreWeAntiCheatYet/AreWeAntiCheatYet/HEAD/games.json" try: async with session.get(url) as response: response.raise_for_status() text = await response.text() data = json.loads(text) return [{"normalized_name": normalize_name(game["name"]), "status": game["status"]} for game in data] except Exception as error: print(f"Ошибка загрузки games.json: {error}") return [] async def get_linux_gaming_topics(session, category_slug): """ Получает все темы из указанной категории linux-gaming.ru. Сохраняет только нормализованное название (normalized_title) и slug. """ page = 0 all_topics = [] while True: page += 1 url = f"{LINUX_GAMING_BASE_URL}/c/{category_slug}/l/latest.json?page={page}" try: async with session.get(url, headers=LINUX_GAMING_HEADERS) as response: response.raise_for_status() data = await response.json() topics = data.get("topic_list", {}).get("topics", []) if not topics: break for topic in topics: all_topics.append({ "normalized_title": normalize_name(topic["title"]), "slug": topic["slug"] }) print(f"Обработано {len(topics)} тем на странице {page}, всего: {len(all_topics)}.") except Exception as error: print(f"Ошибка получения тем для страницы {page}: {error}") break return all_topics async def request_data(): """ Получает данные из Steam, AreWeAntiCheatYet и linux-gaming.ru, обрабатывает их и сохраняет в JSON-файлы и tar.xz архивы. """ # Параметры запроса для Steam game_param = "&include_games=true" dlc_param = "&include_dlc=false" software_param = "&include_software=false" videos_param = "&include_videos=false" hardware_param = "&include_hardware=false" endpoint = ( f"{STEAM_BASE_URL}key={STEAM_KEY}" f"{game_param}{dlc_param}{software_param}{videos_param}{hardware_param}" f"&max_results=50000" ) output_json = [] total_parsed = 0 linux_gaming_topics = [] anticheat_games = [] try: async with aiohttp.ClientSession() as session: # Загружаем данные Steam have_more_results = True last_appid_val = None while have_more_results: app_list = await get_app_list(session, last_appid_val, endpoint) apps = app_list['response']['apps'] apps = process_steam_apps(apps) output_json.extend(apps) total_parsed += len(apps) have_more_results = app_list['response'].get('have_more_results', False) last_appid_val = app_list['response'].get('last_appid') print(f"Обработано {len(apps)} игр Steam, всего: {total_parsed}.") # Загружаем данные AreWeAntiCheatYet anticheat_games = await fetch_games_json(session) # Загружаем данные linux-gaming.ru if LINUX_GAMING_API_KEY and LINUX_GAMING_API_USERNAME: linux_gaming_topics = await get_linux_gaming_topics(session, CATEGORY_LINUX_GAMING) else: print("Предупреждение: LINUX_GAMING_API_KEY или LINUX_GAMING_API_USERNAME не установлены.") except Exception as error: print(f"Ошибка получения данных: {error}") return False repo_root = os.path.abspath(os.path.join(os.path.dirname(__file__), "..")) data_dir = os.path.join(repo_root, "data") os.makedirs(data_dir, exist_ok=True) # Сохранение данных Steam output_json_full = os.path.join(data_dir, f"{CATEGORY_STEAM}_appid.json") output_json_min = os.path.join(data_dir, f"{CATEGORY_STEAM}_appid_min.json") with open(output_json_full, "w", encoding="utf-8") as f: json.dump(output_json, f, ensure_ascii=False, indent=2) with open(output_json_min, "w", encoding="utf-8") as f: json.dump(output_json, f, ensure_ascii=False, separators=(',',':')) # Сохранение данных AreWeAntiCheatYet anticheat_json_full = os.path.join(data_dir, "anticheat_games.json") anticheat_json_min = os.path.join(data_dir, "anticheat_games_min.json") with open(anticheat_json_full, "w", encoding="utf-8") as f: json.dump(anticheat_games, f, ensure_ascii=False, indent=2) with open(anticheat_json_min, "w", encoding="utf-8") as f: json.dump(anticheat_games, f, ensure_ascii=False, separators=(',',':')) # Сохранение данных linux-gaming.ru linux_gaming_json_full = os.path.join(data_dir, "linux_gaming_topics.json") linux_gaming_json_min = os.path.join(data_dir, "linux_gaming_topics_min.json") if linux_gaming_topics: with open(linux_gaming_json_full, "w", encoding="utf-8") as f: json.dump(linux_gaming_topics, f, ensure_ascii=False, indent=2) with open(linux_gaming_json_min, "w", encoding="utf-8") as f: json.dump(linux_gaming_topics, f, ensure_ascii=False, separators=(',',':')) # Упаковка минифицированных JSON в tar.xz архивы # Архив для Steam steam_archive_path = os.path.join(data_dir, f"{CATEGORY_STEAM}_appid.tar.xz") try: with tarfile.open(steam_archive_path, "w:xz", preset=9) as tar: tar.add(output_json_min, arcname=os.path.basename(output_json_min)) print(f"Упаковано минифицированное JSON Steam в архив: {steam_archive_path}") os.remove(output_json_min) except Exception as e: print(f"Ошибка при упаковке архива Steam: {e}") return False # Архив для AreWeAntiCheatYet anticheat_archive_path = os.path.join(data_dir, "anticheat_games.tar.xz") try: with tarfile.open(anticheat_archive_path, "w:xz", preset=9) as tar: tar.add(anticheat_json_min, arcname=os.path.basename(anticheat_json_min)) print(f"Упаковано минифицированное JSON AreWeAntiCheatYet в архив: {anticheat_archive_path}") os.remove(anticheat_json_min) except Exception as e: print(f"Ошибка при упаковке архива AreWeAntiCheatYet: {e}") return False # Архив для linux-gaming.ru if linux_gaming_topics: linux_gaming_archive_path = os.path.join(data_dir, "linux_gaming_topics.tar.xz") try: with tarfile.open(linux_gaming_archive_path, "w:xz", preset=9) as tar: tar.add(linux_gaming_json_min, arcname=os.path.basename(linux_gaming_json_min)) print(f"Упаковано минифицированное JSON linux-gaming.ru в архив: {linux_gaming_archive_path}") os.remove(linux_gaming_json_min) except Exception as e: print(f"Ошибка при упаковке архива linux-gaming.ru: {e}") return False return True async def run(): success = await request_data() if not success: exit(1) if __name__ == "__main__": asyncio.run(run())