In [None]:
import os, textwrap

# Project root and the sub-directories (relative to it) that make up the scaffold.
# NOTE(review): the path looks like a Colab Google Drive mount point — confirm the
# drive is mounted before running, otherwise the tree is created on local disk.
base = '/content/drive/MyDrive/DataTour2025-CreditScoring'
folders = [
    'data/raw', 'data/processed',
    'notebooks',
    'src',
    'models',
    'submissions',
    'reports/figures',
    'docs',
]

# The root is created explicitly so it exists even if `folders` is empty;
# exist_ok=True makes the whole cell safe to re-run.
os.makedirs(base, exist_ok=True)
for rel_dir in folders:
    target_dir = os.path.join(base, rel_dir)
    os.makedirs(target_dir, exist_ok=True)

# README body: competition context plus a short description of the dataset.
# dedent() + strip() remove the layout whitespace that the triple-quoted
# literal introduces (leading newline, trailing blank line).
readme = textwrap.dedent("""
# DataTour 2025 - Credit Scoring (Team: GTF)

**Project:** National phase of DataTour 2025 — Credit default prediction based on historical loan data.

## Context
Access to credit is a key lever of economic development. This project aims to build models to predict loan default (flag = 1) vs correct repayment (flag = 0) using customers' credit histories.
Approaches include tabular ML models (LightGBM, CatBoost, XGBoost) and sequential neural models (LSTM/Transformer) on payment sequences.

## Dataset Notes
- Each row = a credit product for a customer.
- Key columns: `id`, `flag`, `rn`, `pre_*` (loan metadata), `enc_paym_*` (payment sequence), categorical encoders like `enc_loans_credit_type`, flags `pclose_flag` / `fclose_flag`, etc.
- Evaluation metric: ROC AUC.
- Submission format: `.parquet` with columns `id`, `target`.

""").strip()

# The text contains a non-ASCII character (the em dash on the "Project" line),
# so the encoding is pinned instead of depending on the platform's locale default.
# Mode 'w' means an existing README.md is overwritten on every run of this cell.
with open(os.path.join(base, 'README.md'), 'w', encoding='utf-8') as readme_file:
    readme_file.write(readme)

# show result
# Print the scaffold as an indented tree. Each directory is printed exactly once,
# at the moment os.walk visits it; its files follow one level deeper, and its
# sub-directories appear when the walk descends into them. (Printing `dirs`
# here as well would list every sub-directory twice.)
for root, dirs, files in os.walk(base):
    # In-place assignment steers the top-down walk: skip git metadata so a re-run
    # after `git init` stays readable, and sort for a stable, reproducible order.
    dirs[:] = sorted(d for d in dirs if d != '.git')
    # os.walk yields paths that start with `base`; slicing off that prefix (rather
    # than str.replace, which would hit every occurrence) gives the depth.
    level = root[len(base):].count(os.sep)
    indent = ' ' * 4 * level
    print(f"{indent}{os.path.basename(root)}/")
    subindent = ' ' * 4 * (level + 1)
    for fn in sorted(files):
        print(f"{subindent}{fn}")


In [2]:
# Make the project root the working directory so the shell commands in the
# following cells run inside it.
# NOTE(review): this repeats the path assigned to `base` in the setup cell — keep the two in sync.
%cd /content/drive/MyDrive/DataTour2025-CreditScoring

/content/drive/MyDrive/DataTour2025-CreditScoring


In [3]:
# Initialise a git repository in the current working directory.
# No branch name is passed, so git falls back to its configured default for the initial branch.
!git init

[33mhint: Using 'master' as the name for the initial branch. This default branch name[m
[33mhint: is subject to change. To configure the initial branch name to use in all[m
[33mhint: [m
[33mhint: 	git config --global init.defaultBranch <name>[m
[33mhint: [m
[33mhint: Names commonly chosen instead of 'master' are 'main', 'trunk' and[m
[33mhint: 'development'. The just-created branch can be renamed via this command:[m
[33mhint: [m
[33mhint: 	git branch -m <name>[m
Initialized empty Git repository in /content/drive/My Drive/DataTour2025-CreditScoring/.git/


In [4]:
# Set the author name and e-mail git records on commits.
# NOTE(review): --global writes to the user-level git config, not this repository's;
# on a hosted runtime that file presumably does not survive a reset — confirm, or
# consider repository-level config instead.
# NOTE(review): a personal e-mail address is stored in the notebook — confirm that is intended.
!git config --global user.name "Connected-Peter"
!git config --global user.email "osuolaleking20@gmail.com"


In [5]:
# Point `origin` at the GitHub repository. `git remote add` fails when the remote
# already exists (e.g. on a re-run of the notebook), so fall back to updating the
# URL of the existing remote; either way the cell ends with origin set as below.
!git remote add origin https://github.com/Connected-Peter/Data-Tour-2025-Credit-Scoring.git 2>/dev/null || git remote set-url origin https://github.com/Connected-Peter/Data-Tour-2025-Credit-Scoring.git

In [6]:
# git does not track empty directories, so drop a placeholder .gitkeep file into
# each empty folder of the scaffold. The .git directory is pruned from the search:
# it contains empty directories of its own (this runs after `git init`), and
# placeholder files must not be written into repository metadata.
!find . -path ./.git -prune -o -type d -empty -exec touch {}/.gitkeep \;