leetify-data/src/extract.py

161 lines
3.5 KiB
Python
Raw Normal View History

2024-01-29 10:19:06 -05:00
from .leetify import Leetify
2024-01-28 20:29:19 -05:00
from os import environ as env
2024-01-29 10:19:06 -05:00
from .transform import (
meta_from_profile,
games_from_profile,
player_stats_from_game,
)
import psycopg2 as pg
from typing import Tuple
2024-01-28 20:29:19 -05:00
def connect():
return pg.connect(
dbname=env.get("POSTGRES_DB"),
user=env.get("POSTGRES_USER"),
password=env.get("POSTGRES_PASSWORD"),
host=env.get("POSTGRES_HOST"),
port=env.get("POSTGRES_PORT"),
)
2024-01-29 10:19:06 -05:00
def vals_in_order(data: dict, keys: list):
vals = [data[key] for key in keys]
return vals
def dict_to_col_val(data: dict) -> Tuple[list, list]:
cols = []
vals = []
for k, v in data.items():
cols.append(k)
vals.append(v)
return cols, vals
def dict_to_sql_str(data: dict) -> Tuple[str, str]:
cols, vals = dict_to_col_val(data)
vals = map(str, vals)
cols = ", ".join(cols)
vals = ", ".join(vals)
return cols, vals
def extract_profile_meta(id, api=Leetify(), conn=None):
if not conn:
conn = connect()
2024-01-29 10:44:46 -05:00
cols_api = [
2024-01-29 10:19:06 -05:00
"name",
"steam64Id",
"isCollector",
"isLeetifyStaff",
"isProPlan",
"leetifyUserId",
"faceitNickname",
]
2024-01-29 10:44:46 -05:00
cols_db = [
"name",
"steam64_id",
"is_collector",
"is_leetify_staff",
"is_pro_plan",
"leetify_user_id",
"faceit_nickname",
]
2024-01-29 10:19:06 -05:00
profile = api.get_profile(id)
meta = meta_from_profile(profile)
2024-01-29 10:44:46 -05:00
vals = vals_in_order(meta, cols_api)
2024-01-29 10:19:06 -05:00
with conn.cursor() as curs:
sql = f"""
2024-01-29 10:44:46 -05:00
INSERT INTO data.profile_meta ({', '.join(cols_db)})
VALUES ({', '.join(['%s'] * len(cols_db))});
2024-01-29 10:19:06 -05:00
"""
curs.execute(sql, vals)
conn.commit()
def extract_profile_games(profile, conn=None):
if not conn:
conn = connect()
2024-01-29 10:44:46 -05:00
cols_api = [
2024-01-29 10:19:06 -05:00
"leetifyUserId",
"ctLeetifyRating",
"ctLeetifyRatingRounds",
"dataSource",
"elo",
"gameFinishedAt",
"gameId",
"isCs2",
"mapName",
"matchResult",
"scores",
"skillLevel",
"tLeetifyRating",
"tLeetifyRatingRounds",
"deaths",
"hasBannedPlayer",
"kills",
"partySize",
]
2024-01-29 10:44:46 -05:00
cols_db = [
"leetify_user_id",
"ct_Leetify_rating",
"ct_Leetify_rating_rounds",
"data_source",
"elo",
"game_finished_at",
"game_id",
"is_cs2",
"map_name",
"match_result",
"scores",
"skill_level",
"t_leetify_rating",
"t_leetify_rating_rounds",
"deaths",
"has_banned_player",
"kills",
"party_size",
]
2024-01-29 10:19:06 -05:00
games = games_from_profile(profile)
2024-01-29 10:44:46 -05:00
games = map(lambda game: vals_in_order(game, cols_api), games)
2024-01-29 10:19:06 -05:00
with conn.cursor() as curs:
curs.executemany(
f"""
2024-01-29 10:44:46 -05:00
INSERT into data.profile_game ({', '.join(cols_db)})
VALUES ({', '.join(['%s'] * len(cols_db))});
2024-01-29 10:19:06 -05:00
""",
games,
)
conn.commit()
def extract_player_stats(game, conn=None):
if not conn:
conn = connect()
stats = player_stats_from_game(game)
games = map(dict_to_sql_str, stats)
with conn.cursor() as curs:
for (
cols,
vals,
) in games:
curs.execute(
"""INSERT INTO data.player_stats (%s)
VALUES (%s);""",
(cols, vals),
)
conn.commit()