# Feedbacks CERES via SW fluxes

(1) Reconstruire les données à partir des PCs et des EOFs des flux SW.

(2) Régression linéaire multiple des PCs sur les feedbacks pour trouver les coefficients Beta.

(3) Retrouver les PCs des observations CERES. 

(4) Prédire les feedbacks des observations.

# Import des modules

In [1]:
# Computational modules 
%matplotlib inline
import xarray as xr
import glob
import os
import numpy as np
import netCDF4
from netCDF4 import Dataset
import pandas as pd
import re
from array import array
from pylab import *
#import geopandas
from eofs.xarray import Eof
from eofs.multivariate.standard import MultivariateEof

# Plotting modules 
import matplotlib.pyplot as plt
from mpl_toolkits.basemap import Basemap
import pandas.plotting
import matplotlib.ticker as ticker
import seaborn as sns
import cartopy.crs as ccrs
import cartopy.feature as cfeature
from matplotlib.colors import BoundaryNorm

# Scikit-learn
from sklearn import linear_model
from sklearn.linear_model import LassoCV, LassoLarsCV, LassoLarsIC
from sklearn.linear_model import Lasso
from sklearn.metrics import r2_score
from sklearn import preprocessing
from sklearn import tree
from sklearn.ensemble import RandomForestClassifier
from sklearn.metrics import confusion_matrix
from sklearn import metrics
from sklearn.neural_network import MLPRegressor

# Functions definition

In [2]:
import sys
sys.path.append('/data/home/globc/peatier/CNRMppe')
import Fonctions
from Fonctions import get_wavg_budget_df
from Fonctions import wavg 
from Fonctions import plotlines_Xdf
from Fonctions import plotlines_1df
from Fonctions import Deltas_Lambda
from Fonctions import get_3D_budget_xarr
from Fonctions import get_3D_xarr
from Fonctions import get_3D_SW_xarr
from Fonctions import get_3D_LW_xarr

# EOF, pr_mean and PCs

In [7]:
# Mean tas field (presumably the PPE ensemble mean, judging by the file name).
# The file is a pickled pandas object despite its .npy suffix.
Mean = pd.read_pickle('/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_tas_mean.npy')
Mean = Mean.to_xarray().to_array()
# Keep the first entry along 'variable' and expose its label as 'mode'.
Mean = Mean.isel(variable=0).rename({'variable': 'mode'})
Mean

In [8]:
# tas anomaly field (presumably relative to the ensemble mean, judging by the
# file name). The file is a pickled pandas object despite its .npy suffix.
Anom = pd.read_pickle('/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_tas_anom.npy')
Anom = Anom.to_xarray().to_array()
# Keep the first entry along 'variable' and expose its label as 'mode'.
Anom = Anom.isel(variable=0).rename({'variable': 'mode'})
Anom

In [9]:
# Load the five tas EOF maps (pickled pandas objects stored with a .npy
# suffix). Each one is converted to a DataArray, reduced to its first
# 'variable' entry, and that label is exposed as 'mode'.
eofs = [
    pd.read_pickle(eof_file).to_xarray().to_array().isel(variable=0).rename({'variable': 'mode'})
    for eof_file in (
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOFmap1_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOFmap2_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOFmap3_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOFmap4_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOFmap5_tas.npy',
    )
]

# Individual names kept for cells that refer to a single EOF map.
eof1, eof2, eof3, eof4, eof5 = eofs

In [10]:
# Stack the individual EOF maps along a new leading 'eofs' dimension so that
# all of them can be handled as a single DataArray.
eofs_combined = xr.combine_nested(eofs, concat_dim='eofs')
#eofs_combined

In [11]:
# Principal-component series of the first five tas EOFs.
pc1, pc2, pc3, pc4, pc5 = (
    np.load(pc_file)
    for pc_file in (
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOF1pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOF2pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOF3pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOF4pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/PPE2_EOF5pc_tas.npy',
    )
)

# One column per PC. The frame is seeded from pc1 only to get its row index;
# the unnamed seed column (label 0) is dropped once the named columns exist.
PC_df = (
    pd.DataFrame(pc1)
    .assign(pc1=pc1, pc2=pc2, pc3=pc3, pc4=pc4, pc5=pc5)
    .drop(labels=0, axis=1)
)

PC_df

Unnamed: 0,pc1,pc2,pc3,pc4,pc5
0,-1.036253,1.783174,0.132006,-0.607847,-1.941047
1,0.505301,-0.620046,-0.661749,0.071263,1.887987
2,1.550187,0.966963,0.211132,0.490079,-1.081055
3,0.533399,1.637583,-0.720199,1.020989,1.132725
4,0.689388,-0.106142,0.247270,-0.857747,-0.863513
...,...,...,...,...,...
97,1.127269,0.137607,-1.883097,1.363466,0.307337
98,-0.848661,-2.183300,-2.136365,0.161926,0.381609
99,-0.199264,-1.611466,-0.654372,1.134501,0.792408
100,1.703953,-0.374048,-1.039726,1.907782,-0.038282


In [12]:
# PCs stored under the 'official' prefix, one array per EOF.
pc1_official, pc2_official, pc3_official, pc4_official, pc5_official = (
    np.load(pc_file)
    for pc_file in (
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/official_EOF1pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/official_EOF2pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/official_EOF3pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/official_EOF4pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/official_EOF5pc_tas.npy',
    )
)

# PCs stored under the 'p1' prefix, one array per EOF.
pc1_p1, pc2_p1, pc3_p1, pc4_p1, pc5_p1 = (
    np.load(pc_file)
    for pc_file in (
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/p1_EOF1pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/p1_EOF2pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/p1_EOF3pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/p1_EOF4pc_tas.npy',
        '/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/p1_EOF5pc_tas.npy',
    )
)

In [13]:
# Row-wise view of PC_df: one array of (pc1..pc5) values for each of the
# first 102 rows.
PCs = [PC_df.iloc[row].values for row in range(102)]

PCs

[array([-1.036253  ,  1.7831736 ,  0.13200627, -0.60784733, -1.9410472 ],
       dtype=float32),
 array([ 0.50530076, -0.6200461 , -0.6617492 ,  0.07126312,  1.8879869 ],
       dtype=float32),
 array([ 1.5501868 ,  0.9669626 ,  0.2111317 ,  0.49007887, -1.0810546 ],
       dtype=float32),
 array([ 0.53339934,  1.6375835 , -0.7201993 ,  1.0209891 ,  1.1327245 ],
       dtype=float32),
 array([ 0.68938786, -0.10614232,  0.24727042, -0.8577472 , -0.8635134 ],
       dtype=float32),
 array([ 1.5023398 , -0.74393636,  2.0079553 , -0.21552847, -0.4743517 ],
       dtype=float32),
 array([-0.8357379 ,  1.0471958 ,  0.6302444 ,  0.32924467, -1.0607089 ],
       dtype=float32),
 array([ 0.7184881 ,  0.28508833,  1.2267857 , -0.0412975 , -0.7802244 ],
       dtype=float32),
 array([-1.377905  , -0.9671775 ,  1.3043481 , -0.06797209,  0.57332325],
       dtype=float32),
 array([-0.10597194,  1.5969536 ,  2.1264126 , -1.6648977 ,  0.42086658],
       dtype=float32),
 array([-0.99685633, -0.463237

# Trouver U_obs : Reconstruction des données

X_ens = U_ens(pc) * v_ens(eof) 

Compute anomaly : X_obs = X_obs - SW_mean_ens 

X_obs = U_obs * v_ens 

U_obs = X_obs * pinv(v_ens)  (pseudo-inverse : v_ens n'est pas une matrice carrée)

## Get the CMIP6 dataset

In [14]:
def load_monthly_clim(path, filename, variables):
    """Return the climatological annual cycle of *variables* as a DataFrame.

    Every file matching ``path + filename`` is opened as one dataset, the
    requested variables are converted to a DataFrame, and the values are
    averaged over all time steps that share the same calendar month at each
    grid point.

    Parameters
    ----------
    path : str
        Directory prefix. It is concatenated as-is with *filename*, so it
        must end with a path separator.
    filename : str
        File name or glob pattern of the NetCDF files to open.
    variables : list of str
        Names of the dataset variables to keep.

    Returns
    -------
    pandas.DataFrame
        Indexed by (month, lat, lon); one column per remaining data column,
        holding its mean over the time steps of that month.
    """
    # to_dataframe() copies the data into memory, so the files can be closed
    # as soon as the frame has been built.
    with xr.open_mfdataset(path + filename, combine='by_coords') as dataset:
        df = dataset[variables].to_dataframe()

    # Compute the climatological annual cycle.
    df1 = df.reset_index(level=['time', 'lat', 'lon'])
    df1['month'] = pd.DatetimeIndex(df1['time']).month  # calendar month of each time step

    # 'time' is only needed to derive 'month'. Drop it so that mean() is never
    # applied to timestamps: depending on the pandas version that column is
    # either silently discarded or averaged into the result.
    df1 = df1.drop(labels='time', axis=1)
    df_mean = df1.groupby(['month', 'lat', 'lon']).mean()

    return df_mean

In [15]:
# Load the AMIP 'tas' output of seven CMIP6 models and reduce each one to its
# monthly climatology with load_monthly_clim().
# `path` and `filename` are reassigned as the cell goes: a model that does not
# set `filename` reuses the pattern of the previous one.

# CNRM-CM6-1
path = "/data/scratch/globc/peatier/CMIP6/CNRM-CM6-1/CFMIP/amip/"
filename = "*_amip_*.nc"
variables = ['tas']
CNRM_amip = load_monthly_clim(path, filename, variables)

# MRI-ESM2-0 (same file pattern as CNRM-CM6-1)
path = "/data/scratch/globc/peatier/CMIP6/MRI-ESM2-0/amip/"
MRI_amip = load_monthly_clim(path, filename, variables)

# CanESM5
path = "/data/scratch/globc/peatier/CMIP6/CanESM5/amip/"
filename = "standard_*_amip_*regrid.nc"
CAN_amip = load_monthly_clim(path, filename, variables)
CAN_amip

# MIROC6
path = "/data/scratch/globc/peatier/CMIP6/MIROC6/"
filename = "*_amip_*regrid.nc"
MIROC_amip = load_monthly_clim(path, filename, variables)
MIROC_amip

# HadGEM3-GC31-LL
path = "/data/scratch/globc/peatier/CMIP6/HadGEM3-GC31-LL/"
filename = "standard_*_amip_*regrid.nc"
HadGEM3_amip = load_monthly_clim(path, filename, variables)
HadGEM3_amip

# IPSL-CM6A-LR
path = "/data/scratch/globc/peatier/CMIP6/IPSL-CM6A-LR/"
filename = "*_amip_*regrid.nc"
IPSL_amip = load_monthly_clim(path, filename, variables)
IPSL_amip

# BCC-CSM2-MR (last expression of the cell, so this is the frame displayed)
path = "/data/scratch/globc/peatier/CMIP6/BCC-CSM2-MR/"
filename = "standard_*_amip_*regrid.nc"
BCC_amip = load_monthly_clim(path, filename, variables)
BCC_amip

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,tas,height
month,lat,lon,Unnamed: 3_level_1,Unnamed: 4_level_1
1,-88.927735,0.00000,247.238327,2.0
1,-88.927735,1.40625,247.209213,2.0
1,-88.927735,2.81250,247.179489,2.0
1,-88.927735,4.21875,247.150101,2.0
1,-88.927735,5.62500,247.120407,2.0
...,...,...,...,...
12,88.927735,352.96875,246.398361,2.0
12,88.927735,354.37500,246.412842,2.0
12,88.927735,355.78125,246.424255,2.0
12,88.927735,357.18750,246.430847,2.0


In [17]:
# Gather the first requested variable of every model into one frame, one
# column per model. Columns are added one at a time so that the first model
# (CNRM) fixes the row index and the others are aligned onto it.
df_obs = pd.DataFrame()
for _label, _clim in (
    ('CNRM', CNRM_amip),
    ('MRI', MRI_amip),
    ('CAN', CAN_amip),
    ('MIROC', MIROC_amip),
    ('HadGEM3', HadGEM3_amip),
    ('IPSL', IPSL_amip),
    ('BCC', BCC_amip),
):
    df_obs[_label] = _clim[variables[0]]
df_obs

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,CNRM,MRI,CAN,MIROC,HadGEM3,IPSL,BCC
month,lat,lon,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1
1,-88.927735,0.00000,246.359619,248.840958,250.801117,258.720856,251.111130,245.918213,247.238327
1,-88.927735,1.40625,246.359619,248.798264,250.800552,258.696228,251.096207,245.889923,247.209213
1,-88.927735,2.81250,246.359619,248.756699,250.616211,258.671844,251.082642,245.859909,247.179489
1,-88.927735,4.21875,246.359619,248.714081,250.615662,258.646667,251.067566,245.823822,247.150101
1,-88.927735,5.62500,246.359619,248.680939,250.615112,258.620300,251.054047,245.789490,247.120407
...,...,...,...,...,...,...,...,...,...
12,88.927735,352.96875,247.806992,246.397644,245.186737,242.919815,246.128754,246.175323,246.398361
12,88.927735,354.37500,247.806992,246.398926,245.298721,242.933517,246.147369,246.209091,246.412842
12,88.927735,355.78125,247.806992,246.401794,245.299011,242.946350,246.162262,246.229935,246.424255
12,88.927735,357.18750,247.806992,246.404037,245.401749,242.956711,246.173904,246.240448,246.430847


In [18]:
# Collapse the 'month' index level: average every (lat, lon) point over its
# monthly values, then move to a gridded xarray Dataset (one variable per model).
obs = df_obs.groupby(level=['lat', 'lon']).mean()
obs = obs.to_xarray()
obs

## Compute Anomaly

In [19]:
# Anomaly of each model's map with respect to the Mean field.
X_obs = {
    model: obs[model] - Mean
    for model in ('CNRM', 'MRI', 'CAN', 'MIROC', 'HadGEM3', 'IPSL', 'BCC')
}
X_obs

{'CNRM': <xarray.DataArray (lat: 128, lon: 256)>
 array([[-0.71318054, -0.71318054, -0.71318054, ..., -0.71318054,
         -0.71318054, -0.71318054],
        [-1.0500336 , -1.0500336 , -1.0500336 , ..., -1.0500336 ,
         -1.0500336 , -1.0500336 ],
        [-1.1095886 , -1.1095886 , -1.1095886 , ..., -1.0766754 ,
         -1.1095886 , -1.1095886 ],
        ...,
        [ 1.4798889 ,  1.4798889 ,  1.4798889 , ...,  1.3976135 ,
          1.4798889 ,  1.4798889 ],
        [ 1.6473236 ,  1.6473236 ,  1.6473236 , ...,  1.6473236 ,
          1.6473236 ,  1.6473236 ],
        [ 1.5513458 ,  1.5513458 ,  1.5513458 , ...,  1.5513458 ,
          1.5513458 ,  1.5513458 ]], dtype=float32)
 Coordinates:
   * lat      (lat) float64 -88.93 -87.54 -86.14 -84.74 ... 86.14 87.54 88.93
   * lon      (lon) float64 0.0 1.406 2.812 4.219 ... 354.4 355.8 357.2 358.6
     mode     <U7 'tasmean', 'MRI': <xarray.DataArray (lat: 128, lon: 256)>
 array([[ 1.7660522 ,  1.7389221 ,  1.7114105 , ...,  1.8456726 

## Trouver U_obs

In [20]:
# Pseudo-inverse of the EOF maps, taken after reversing their dimension order.
# NOTE(review): np.linalg.pinv treats an input with more than two dimensions
# as a stack of 2-D matrices and inverts each one separately, so the result is
# one pseudo-inverse per leading index, not the pseudo-inverse of the whole
# (grid point x eofs) matrix -- confirm this is what is intended.
eofs_inv = np.linalg.pinv(eofs_combined.T)
eofs_inv

array([[[-7.39513605e-04,  1.78612303e-03, -1.00614980e-03, ...,
         -1.84287447e-02, -2.21062806e-02, -2.68071331e-02],
        [-1.10379308e-02,  3.20899524e-02,  3.75619158e-02, ...,
         -1.05169132e-01, -1.14892744e-01, -1.18121870e-01],
        [-8.58247802e-02, -8.15134868e-02, -7.71081820e-02, ...,
         -2.95622274e-02, -2.40896009e-02, -1.25255752e-02],
        [-7.81158209e-02, -8.52241144e-02, -7.10721016e-02, ...,
         -1.38664432e-02,  2.17541610e-03,  1.91265400e-02],
        [ 1.22099072e-02,  3.85677330e-02,  5.45680672e-02, ...,
          9.61847678e-02,  9.81579795e-02,  8.95520151e-02]],

       [[ 5.08372847e-04,  3.52989510e-03,  6.53401774e-04, ...,
         -1.80690251e-02, -2.19996236e-02, -2.69053206e-02],
        [-1.27066709e-02,  2.94238608e-02,  3.47249471e-02, ...,
         -1.05991013e-01, -1.15492404e-01, -1.18544243e-01],
        [-9.13041979e-02, -8.82859975e-02, -8.35473761e-02, ...,
         -3.41397710e-02, -2.78446674e-02, -1.53615

In [21]:
# Prepend a 'dummy' dimension of length 102 to each anomaly map; the map is
# simply repeated along it.
X_CNRM_bis = X_obs['CNRM'].expand_dims({'dummy': range(102)})
X_MRI_bis = X_obs['MRI'].expand_dims({'dummy': range(102)})
X_CAN_bis = X_obs['CAN'].expand_dims({'dummy': range(102)})
X_MIROC_bis = X_obs['MIROC'].expand_dims({'dummy': range(102)})
X_HadGEM3_bis = X_obs['HadGEM3'].expand_dims({'dummy': range(102)})
X_IPSL_bis = X_obs['IPSL'].expand_dims({'dummy': range(102)})
X_BCC_bis = X_obs['BCC'].expand_dims({'dummy': range(102)})

In [22]:
# Apply the EOF pseudo-inverse to each model's anomaly array.
# For N-D inputs np.dot contracts the last axis of the first argument with the
# second-to-last axis of the second one (here 'lat') and keeps every other
# axis of both operands, so each result is a 4-D array.
# NOTE(review): the 'lon' axes of the two operands are therefore paired in all
# combinations rather than summed over -- confirm this is intended.
U_CNRM = np.dot(eofs_inv,X_CNRM_bis.transpose('lon','lat', 'dummy'))
U_MRI = np.dot(eofs_inv,X_MRI_bis.transpose('lon','lat', 'dummy'))
U_CAN = np.dot(eofs_inv,X_CAN_bis.transpose('lon','lat', 'dummy'))
U_MIROC = np.dot(eofs_inv,X_MIROC_bis.transpose('lon','lat', 'dummy'))
U_HadGEM3 = np.dot(eofs_inv,X_HadGEM3_bis.transpose('lon','lat', 'dummy'))
U_IPSL = np.dot(eofs_inv,X_IPSL_bis.transpose('lon','lat', 'dummy'))
U_BCC = np.dot(eofs_inv,X_BCC_bis.transpose('lon','lat', 'dummy'))


In [23]:
# Recover the EOF coefficients (pseudo-PCs) of each model: the vector U_obs
# such that X_obs ~= U_obs . v_ens in the least-squares sense.
#
# The coefficients used to be read as U[0, :, 0, 0] from the 4-D np.dot
# result. Given how that array is built (per-longitude pseudo-inverses, with
# only 'lat' contracted), that element is the fit obtained from the first
# longitude column alone; the rest of the map never contributed. They are now
# fitted on every grid point of the anomaly map.

# Design matrix of the fit: one row per (lat, lon) grid point, one column per EOF.
_eof_maps = eofs_combined.transpose('eofs', 'lat', 'lon').values
_eofs_pinv = np.linalg.pinv(_eof_maps.reshape(_eof_maps.shape[0], -1).T)  # (eofs, lat*lon)


def _project_on_eofs(anomaly):
    """Return the least-squares EOF coefficients (dim 'eofs') of a (lat, lon) anomaly map."""
    field = anomaly.transpose('lat', 'lon').values
    if field.shape != _eof_maps.shape[1:]:
        raise ValueError(
            'anomaly grid {} does not match the EOF grid {}'.format(
                field.shape, _eof_maps.shape[1:]
            )
        )
    # Same (lat, lon) -> 1-D flattening order as the design matrix above.
    return xr.DataArray(np.dot(_eofs_pinv, field.ravel()), dims=['eofs'])


# The labelled 4-D arrays are kept so that any cell still using them keeps working.
U_CNRM = xr.DataArray(U_CNRM, dims=['lon','eofs','lon2', 'dummy'])
U_CNRM_avg = _project_on_eofs(X_obs['CNRM'])

U_MRI = xr.DataArray(U_MRI, dims=['lon','eofs','lon2', 'dummy'])
U_MRI_avg = _project_on_eofs(X_obs['MRI'])

U_CAN = xr.DataArray(U_CAN, dims=['lon','eofs','lon2', 'dummy'])
U_CAN_avg = _project_on_eofs(X_obs['CAN'])

U_MIROC = xr.DataArray(U_MIROC, dims=['lon','eofs','lon2', 'dummy'])
U_MIROC_avg = _project_on_eofs(X_obs['MIROC'])

U_HadGEM3 = xr.DataArray(U_HadGEM3, dims=['lon','eofs','lon2', 'dummy'])
U_HadGEM3_avg = _project_on_eofs(X_obs['HadGEM3'])

U_IPSL = xr.DataArray(U_IPSL, dims=['lon','eofs','lon2', 'dummy'])
U_IPSL_avg = _project_on_eofs(X_obs['IPSL'])

U_BCC = xr.DataArray(U_BCC, dims=['lon','eofs','lon2', 'dummy'])
U_BCC_avg = _project_on_eofs(X_obs['BCC'])

In [24]:
#Save the U_obs_avg 
np.save('/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/U_CNRM_tas.npy', U_CNRM_avg)
np.save('/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/U_MRI_tas.npy', U_MRI_avg)
np.save('/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/U_CAN_tas.npy', U_CAN_avg)
np.save('/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/U_MIROC_tas.npy', U_MIROC_avg)
np.save('/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/U_HadGEM3_tas.npy', U_HadGEM3_avg)
np.save('/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/U_IPSL_tas.npy', U_IPSL_avg)
np.save('/data/home/globc/peatier/CNRMppe/PPE/ENSEMBLE2/files/npy/U_BCC_tas.npy', U_BCC_avg)