In [3]:
import numpy as np
import pandas as pd

# Build a small synthetic weather / wind-power dataset, show summary
# statistics and the correlation matrix, then save it to CSV.

# Seed NumPy's legacy global RNG so the draws below are reproducible.
# NOTE: the order of the np.random.* calls matters - reordering them changes
# which random numbers each variable receives.
np.random.seed(42)

# Number of rows
n = 300

# 1. Temperature (°C) - float, Gaussian (mean 15, std 7)
temperature = np.random.normal(loc=15, scale=7, size=n)

# 2. Humidity (%) - float, Gaussian (mean 60, std 15) bounded to [0, 100]
humidity = np.random.normal(loc=60, scale=15, size=n)
humidity = np.clip(humidity, 0, 100)

# 3. Wind speed (km/h) - float, Gaussian (mean 25, std 8)
wind_speed = np.random.normal(loc=25, scale=8, size=n)
wind_speed = np.clip(wind_speed, 0, None)  # no negative wind

# 4. Altitude (m) - INTEGER, uniform over [0, 2000) (upper bound is exclusive)
altitude = np.random.randint(low=0, high=2000, size=n)

# 5. Pressure (hPa) - decreases linearly with temperature, plus Gaussian noise
pressure = 1015 - 0.8 * temperature + np.random.normal(loc=0, scale=3, size=n)

# 6. Wind power (kW) - proportional to wind speed, plus Gaussian noise.
# The additive noise can push the value below zero when the wind speed is
# close to 0, so the result is floored at 0 just like the wind speed itself.
wind_power = 4 * wind_speed + np.random.normal(loc=0, scale=5, size=n)
wind_power = np.clip(wind_power, 0, None)  # no negative power

# Assemble the DataFrame (column order is the order written to the CSV)
df = pd.DataFrame({
    "Temperature_C": temperature,
    "Humidity_pct": humidity,
    "Pressure_hPa": pressure,
    "WindSpeed_kmh": wind_speed,
    "Altitude_m": altitude,
    "WindPower_kW": wind_power
})

# Sanity checks on the generated data: fail loudly rather than save a
# malformed dataset.
assert df.shape == (n, 6), "unexpected dataset shape"
assert df.notna().all().all(), "dataset contains missing values"
assert df["Humidity_pct"].between(0, 100).all(), "humidity outside [0, 100]"
assert (df[["WindSpeed_kmh", "WindPower_kW"]] >= 0).all().all(), "negative wind value"

# Quick check: number of rows and columns
print("Shape (lignes, colonnes) :", df.shape)

# Basic statistics (mean, standard deviation, etc.)
display(df.describe())

# Correlation matrix
display(df.corr())

# Save the dataset (index=False: do not write the row index as a column)
df.to_csv("artificial_dataset.csv", index=False)
print("Fichier 'artificial_dataset.csv' sauvegardé.")

Shape (lignes, colonnes) : (300, 6)


Unnamed: 0,Temperature_C,Humidity_pct,Pressure_hPa,WindSpeed_kmh,Altitude_m,WindPower_kW
count,300.0,300.0,300.0,300.0,300.0,300.0
mean,14.96116,59.65704,1003.277517,25.657553,997.15,102.60302
std,6.889356,14.361877,6.33818,7.973412,578.691149,32.570814
min,-7.688871,22.925332,978.042191,3.424907,1.0,6.454844
25%,10.217278,49.433922,998.840256,20.428198,510.5,80.221364
50%,15.414536,59.71853,1003.022234,25.341924,988.0,101.04225
75%,19.386604,69.245063,1007.800703,30.691757,1476.5,124.617101
max,41.96912,100.0,1021.09104,46.059057,1999.0,182.953943


Unnamed: 0,Temperature_C,Humidity_pct,Pressure_hPa,WindSpeed_kmh,Altitude_m,WindPower_kW
Temperature_C,1.0,-0.040302,-0.860832,-0.037822,-0.061704,-0.032746
Humidity_pct,-0.040302,1.0,0.020122,-0.031215,0.092028,-0.033817
Pressure_hPa,-0.860832,0.020122,1.0,0.021668,0.023896,0.017692
WindSpeed_kmh,-0.037822,-0.031215,0.021668,1.0,-0.015999,0.989225
Altitude_m,-0.061704,0.092028,0.023896,-0.015999,1.0,-0.010881
WindPower_kW,-0.032746,-0.033817,0.017692,0.989225,-0.010881,1.0


Fichier 'artificial_dataset.csv' sauvegardé.
