In [None]:
import zipfile
import os

# Locations of the uploaded archive and of the directory it is unpacked into.
zip_file_path = './Gmail.zip'
extracted_folder_path = './Gmail/'

# Unpack every member of the archive; the context manager closes the
# archive again once extraction has finished.
with zipfile.ZipFile(zip_file_path, mode='r') as archive:
    archive.extractall(path=extracted_folder_path)

# Display the names found in the extraction directory so the data layout
# can be inspected before any file is loaded.
extracted_files = os.listdir(extracted_folder_path)
extracted_files



['2a8cf96c-0842-4f13-9593-cdfba3b0d054.html',
 '2a8cf96c-0842-4f13-9593-cdfba3b0d054_steam.json',
 '2a8cf96c-0842-4f13-9593-cdfba3b0d054_telemetry_f711bb52-736c-11ef-af95-46e4127b3f61.json']

In [None]:
import json

# All extracted files share the same leading identifier, so it is kept in one
# place instead of being repeated inside each path.
# NOTE(review): the second UUID in the telemetry file name is presumably a
# telemetry/asset id -- confirm against the data source.
match_id = '2a8cf96c-0842-4f13-9593-cdfba3b0d054'
telemetry_id = 'f711bb52-736c-11ef-af95-46e4127b3f61'

# Load the Steam JSON file.
# The encoding is given explicitly: without it, open() falls back to the
# platform's locale encoding, which can fail on non-ASCII content on machines
# whose default is not UTF-8.
steam_json_path = os.path.join(extracted_folder_path, f'{match_id}_steam.json')
with open(steam_json_path, 'r', encoding='utf-8') as steam_file:
    steam_data = json.load(steam_file)

# Load the Telemetry JSON file (same explicit-encoding reasoning as above).
telemetry_json_path = os.path.join(
    extracted_folder_path, f'{match_id}_telemetry_{telemetry_id}.json'
)
with open(telemetry_json_path, 'r', encoding='utf-8') as telemetry_file:
    telemetry_data = json.load(telemetry_file)

# Preview the data structures.
# Steam data is indexed by key: keep the first 5 top-level keys.
steam_data_preview = {k: steam_data[k] for k in list(steam_data)[:5]}
# Telemetry may be a list (first 5 items) or a mapping (first 5 keys).
if isinstance(telemetry_data, list):
    telemetry_data_preview = telemetry_data[:5]
else:
    telemetry_data_preview = {k: telemetry_data[k] for k in list(telemetry_data)[:5]}

steam_data_preview, telemetry_data_preview

({'data': {'type': 'match',
   'id': '2a8cf96c-0842-4f13-9593-cdfba3b0d054',
   'attributes': {'titleId': 'bluehole-pubg',
    'tags': None,
    'mapName': 'Baltic_Main',
    'matchType': 'airoyale',
    'duration': 1413,
    'gameMode': 'solo',
    'shardId': 'steam',
    'isCustomMatch': False,
    'seasonState': 'progress',
    'createdAt': '2024-09-15T13:51:40Z',
    'stats': None},
   'relationships': {'rosters': {'data': [{'type': 'roster',
       'id': 'e05c80cb-4dbc-4179-9da7-5c033bac47df'},
      {'type': 'roster', 'id': '9cb0cf8a-89fc-4793-a525-871e8713c41d'},
      {'type': 'roster', 'id': '3b424a86-5895-4f44-9365-ef4304d4e2e3'},
      {'type': 'roster', 'id': 'd130d585-995b-455e-8c27-ccf15037e840'},
      {'type': 'roster', 'id': '0d2d09f8-6f27-4e7e-be2b-7e3df8264483'},
      {'type': 'roster', 'id': 'c147452d-f0fe-4245-8621-8d8857a20057'},
      {'type': 'roster', 'id': 'f5e64542-63b6-420a-920f-71d4eddf2913'},
      {'type': 'roster', 'id': 'e57abdc2-05f3-438a-b660-07d1e1b

In [None]:
# Record which container type the telemetry payload is and keep a small
# sample of it: the first two entries when it is a list, otherwise the
# object itself.
telemetry_data_type = type(telemetry_data)
if isinstance(telemetry_data, list):
    telemetry_data_sample = telemetry_data[:2]
else:
    telemetry_data_sample = telemetry_data

# Look at the Steam data in more detail: collect its top-level keys and the
# values stored under (at most) the first five of them.
steam_data_keys = list(steam_data.keys())
steam_data_sample = dict((name, steam_data[name]) for name in steam_data_keys[:5])

telemetry_data_type, telemetry_data_sample, steam_data_sample

(list,
 [{'MatchId': 'match.bro.airoyale.pc-2018-31.steam.solo.as.2024.09.15.13.2a8cf96c-0842-4f13-9593-cdfba3b0d054',
   'PingQuality': '',
   '_D': '2024-09-15T13:51:41.0087337Z',
   '_T': 'LogMatchDefinition'},
  {'accountId': 'account.598f8d86c13b4b1aad80b8c2ddebf9bf',
   'common': {'isGame': 0},
   '_D': '2024-09-15T13:50:21.057Z',
   '_T': 'LogPlayerLogin'}],
 {'data': {'type': 'match',
   'id': '2a8cf96c-0842-4f13-9593-cdfba3b0d054',
   'attributes': {'titleId': 'bluehole-pubg',
    'tags': None,
    'mapName': 'Baltic_Main',
    'matchType': 'airoyale',
    'duration': 1413,
    'gameMode': 'solo',
    'shardId': 'steam',
    'isCustomMatch': False,
    'seasonState': 'progress',
    'createdAt': '2024-09-15T13:51:40Z',
    'stats': None},
   'relationships': {'rosters': {'data': [{'type': 'roster',
       'id': 'e05c80cb-4dbc-4179-9da7-5c033bac47df'},
      {'type': 'roster', 'id': '9cb0cf8a-89fc-4793-a525-871e8713c41d'},
      {'type': 'roster', 'id': '3b424a86-5895-4f44-9365

In [None]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn.metrics import mean_squared_error, r2_score

# Extract relevant player statistics from the Steam data.
# One record is built per entry of steam_data['included'] whose type is
# 'participant'; each record copies the fields below from that entry's
# attributes -> stats mapping.
stat_fields = [
    'playerId',
    'kills',
    'assists',
    'damageDealt',
    'timeSurvived',
    'walkDistance',
    'weaponsAcquired',
    'winPlace',
]
players_data = [
    {field: entry['attributes']['stats'][field] for field in stat_fields}
    for entry in steam_data['included']
    if entry['type'] == 'participant'
]

# Create DataFrame for analysis
df = pd.DataFrame(players_data)

# Fail early with a clear message: an empty frame has no columns, so the
# column selection below would otherwise raise an opaque KeyError.
if df.empty:
    raise ValueError("No 'participant' entries found in steam_data['included']")

# Define the independent variables (X) and dependent variable (y)
# We will predict 'timeSurvived' using other variables
X = df[['kills', 'assists', 'damageDealt', 'walkDistance', 'weaponsAcquired']]
y = df['timeSurvived']

# Split data into training and testing sets (20% held out for evaluation;
# the fixed random_state makes the split repeatable across runs).
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Initialize and fit the regression model
model = LinearRegression()
model.fit(X_train, y_train)

# Make predictions on the held-out rows
y_pred = model.predict(X_test)

# Evaluate the model on the held-out rows
mse = mean_squared_error(y_test, y_pred)
r2 = r2_score(y_test, y_pred)

# Pair each feature name with its fitted coefficient
coefficients = pd.DataFrame({'Feature': X.columns, 'Coefficient': model.coef_})

# A cell only displays its last expression; ending on the assignment above
# showed nothing, so the coefficients and metrics are surfaced explicitly.
coefficients, mse, r2



A module that was compiled using NumPy 1.x cannot be run in
NumPy 2.1.1 as it may crash. To support both 1.x and 2.x
versions of NumPy, modules must be compiled with NumPy 2.0.
Some module may need to rebuild instead e.g. with 'pybind11>=2.12'.

If you are a user of the module, the easiest solution will be to
downgrade to 'numpy<2' or try to upgrade the affected module.
We expect that some modules will need time to support NumPy 2.

Traceback (most recent call last):  File "/usr/lib/python3.10/runpy.py", line 196, in _run_module_as_main
    return _run_code(code, main_globals, None,
  File "/usr/lib/python3.10/runpy.py", line 86, in _run_code
    exec(code, run_globals)
  File "/home/roina/.local/lib/python3.10/site-packages/ipykernel_launcher.py", line 17, in <module>
    app.launch_new_instance()
  File "/home/roina/.local/lib/python3.10/site-packages/traitlets/config/application.py", line 1043, in launch_instance
    app.start()
  File "/home/roina/.local/lib/python3.10/site-packag

AttributeError: _ARRAY_API not found

ImportError: numpy.core.multiarray failed to import