In [53]:
import numpy as np  # linear algebra
import pandas as pd  # data processing, CSV file I/O (e.g. pd.read_csv)
from sklearn import datasets, linear_model,preprocessing
from datetime import datetime
import gc
%matplotlib inline
from IPython.display import display, HTML
from pprint import pprint
import time
import nltk.corpus
from nltk.stem.snowball import SnowballStemmer
from ml_metrics import rmse,rmsle

In [54]:
# Take one CSV, then split it into three frames (train, test1, test2).
class FeatureEngineering:
    """Loads the train/test data and adds engineered features to it.

    The instance keeps up to three DataFrames as attributes: ``train``,
    ``test1`` (rows whose ``Semana`` equals ``ValidationStart``) and ``test2``
    (rows whose ``Semana`` equals ``ValidationEnd``).

    Every ``trainOrTestOrBoth`` argument accepts ``'train'``, ``'test'`` or
    ``'both'``; any other value makes the method skip both halves.

    Constructor arguments
    ---------------------
    ValidationStart, ValidationEnd : week numbers selecting test1 / test2.
    trainHdfPath, trainHdfFile : HDF5 file path and key for the train frame.
    testHdfPath1, testHdfPath2 : HDF5 file paths for test1 and test2.
    testHdfFile : HDF5 key shared by both test files.
    testTypes, trainTypes : dict mapping column name -> dtype; the keys also
        select which CSV columns are read.
    trainCsvPath, testCsvPath : source CSV files.
    maxLag : largest lag used so far; raised automatically by
        AddConfigurableFeaturesToTrain.
    """

    def __init__(self, ValidationStart, ValidationEnd, trainHdfPath, trainHdfFile, testHdfPath1, testHdfPath2,
                 testHdfFile, testTypes, trainTypes, trainCsvPath, testCsvPath, maxLag=0):
        self.ValidationStart = ValidationStart
        self.ValidationEnd = ValidationEnd
        self.maxLag = maxLag
        self.trainHdfPath = trainHdfPath
        self.trainHdfFile = trainHdfFile
        self.testHdfPath1 = testHdfPath1
        self.testHdfPath2 = testHdfPath2
        self.testHdfFile = testHdfFile
        self.testTypes = testTypes
        self.trainTypes = trainTypes
        self.trainCsvPath = trainCsvPath
        self.testCsvPath = testCsvPath

    # ------------------------------------------------------------------
    # Private helpers
    # ------------------------------------------------------------------
    @staticmethod
    def _wantsTrain(trainOrTestOrBoth):
        """Returns True when the selector covers the train frame."""
        return trainOrTestOrBoth in ('train', 'both')

    @staticmethod
    def _wantsTest(trainOrTestOrBoth):
        """Returns True when the selector covers the test1/test2 frames."""
        return trainOrTestOrBoth in ('test', 'both')

    @staticmethod
    def _finishLoading(*frames):
        """Runs the post-load hooks on each frame: index hook first, then the summary."""
        for frame in frames:
            FeatureEngineering.changeIndexTypeToLowerMemory(frame)
        for frame in frames:
            FeatureEngineering.__printDataFrameBasics__(frame)

    def _loadCsv(self, trainOrTestOrBoth, trainRows=None, testRows=None):
        """Reads the CSV files; ``None`` row limits mean 'read everything'."""
        if self._wantsTrain(trainOrTestOrBoth):
            # list(...) so that usecols also gets a real list on Python 3.
            self.train = pd.read_csv(self.trainCsvPath, usecols=list(self.trainTypes.keys()),
                                     dtype=self.trainTypes, nrows=trainRows)
            self._finishLoading(self.train)
        if self._wantsTest(trainOrTestOrBoth):
            tempTest = pd.read_csv(self.testCsvPath, usecols=list(self.testTypes.keys()),
                                   dtype=self.testTypes, nrows=testRows)
            weeks = tempTest.Semana.values
            self.test1 = tempTest.loc[weeks == self.ValidationStart]
            self.test2 = tempTest.loc[weeks == self.ValidationEnd]
            del tempTest, weeks
            self._finishLoading(self.test1, self.test2)

    @staticmethod
    def _mergeGrouped(frame, groupedDataframe, groups):
        """Left-joins the aggregated column onto ``frame`` using ``groups`` as key."""
        return frame.merge(groupedDataframe, left_on=groups, right_index=True,
                           how='left', sort=False, copy=False)

    @staticmethod
    def _fillMissingTarget(frame, targetVariable, name):
        """Copies ``name`` into ``targetVariable`` on the rows where the target is still null."""
        missing = pd.isnull(frame[targetVariable].values)
        frame.loc[missing, targetVariable] = frame.loc[missing, name].values

    # ------------------------------------------------------------------
    # Diagnostics
    # ------------------------------------------------------------------
    @staticmethod
    def __printDataFrameBasics__(data):
        """Displays the first two rows and the info() summary of ``data``."""
        display(data.head(2))
        gc.collect()
        # info() prints its own report and returns None, so wrapping it in
        # print() only added a stray "None" line to the output.
        data.info(memory_usage=True)

    @staticmethod
    def changeIndexTypeToLowerMemory(data):
        """Hook meant to shrink the index dtype; currently only triggers a gc pass.

        The index conversion itself is disabled; the author's note said the
        index was meant to become uint32 (max 2^32 rows) to save memory.
        """
        gc.collect()

    # ------------------------------------------------------------------
    # Loading / saving
    # ------------------------------------------------------------------
    def ReadHdf(self, trainOrTestOrBoth):
        """Reads the selected frames from HDF5 and keeps them on the instance."""
        if self._wantsTrain(trainOrTestOrBoth):
            self.train = pd.read_hdf(self.trainHdfPath, self.trainHdfFile)
            self._finishLoading(self.train)

        if self._wantsTest(trainOrTestOrBoth):
            self.test1 = pd.read_hdf(self.testHdfPath1, self.testHdfFile)
            self.test2 = pd.read_hdf(self.testHdfPath2, self.testHdfFile)
            self._finishLoading(self.test1, self.test2)

    def ReadCsv(self, trainOrTestOrBoth):
        """Reads the selected frames from CSV and keeps them on the instance.

        The test CSV is split into test1 / test2 by ``Semana``.
        """
        self._loadCsv(trainOrTestOrBoth)

    def ReadFirstNRowsOfACsv(self, nrows, trainOrTestOrBoth):
        """Same as ReadCsv but reads only ``nrows`` train rows and ``2 * nrows`` test rows."""
        self._loadCsv(trainOrTestOrBoth, trainRows=nrows, testRows=nrows * 2)

    @staticmethod
    def ConvertCsvToHdf(csvPath, HdfPath, HdfName, ColumnTypeDict):
        """Reads ``csvPath`` with the given column dtypes and writes it to HDF5 in table format."""
        # read_csv has no ``index`` keyword; passing index=False raised TypeError.
        tempDf = pd.read_csv(csvPath, usecols=list(ColumnTypeDict.keys()), dtype=ColumnTypeDict)
        tempDf.to_hdf(HdfPath, HdfName, format='t')
        del tempDf
        gc.collect()
        print("ConvertCsvToHdf is done..")

    def SaveDataFrameToHdf(self, trainOrTestOrBoth):
        """Writes the selected frames to their HDF5 files in table format."""
        # index is a boolean flag; the original passed the (truthy) string "False".
        if self._wantsTrain(trainOrTestOrBoth):
            self.train.to_hdf(self.trainHdfPath, self.trainHdfFile, format='t', index=False)
        if self._wantsTest(trainOrTestOrBoth):
            self.test1.to_hdf(self.testHdfPath1, self.testHdfFile, format='t', index=False)
            self.test2.to_hdf(self.testHdfPath2, self.testHdfFile, format='t', index=False)

    # ------------------------------------------------------------------
    # Feature engineering
    # ------------------------------------------------------------------
    def Preprocess(self, trainOrTestOrBoth, columnFunctionTypeList):
        """Applies a function to whole columns and casts the result.

        columnFunctionTypeList = [ ['C1', Func1, Type], ['C2', Func2, Type], .. ]
        Each function receives the column's 1-D value array.
        """
        for column, func, localType in columnFunctionTypeList:
            # Operate on this instance's frames (the original reached for the
            # global ``FE`` and so ignored ``self``).
            if self._wantsTrain(trainOrTestOrBoth):
                self.train.loc[:, column] = np.apply_along_axis(
                    func, 0, self.train[column].values).astype(localType)
            if self._wantsTest(trainOrTestOrBoth):
                self.test1.loc[:, column] = np.apply_along_axis(
                    func, 0, self.test1[column].values).astype(localType)
                self.test2.loc[:, column] = np.apply_along_axis(
                    func, 0, self.test2[column].values).astype(localType)
        gc.collect()

    def AddDemandaGeneralMean(self, trainOrTestOrBoth):
        """Adds a constant column ``DemandaGeneralMean`` to the selected frames.

        The value is the float32 mean of ``train["Demanda_uni_equil"]``, so
        ``self.train`` must be loaded even when only the test frames are selected.
        """
        meanOfDemanda = self.train["Demanda_uni_equil"].values.mean().astype("float32")

        if self._wantsTrain(trainOrTestOrBoth):
            self.train.loc[:, "DemandaGeneralMean"] = meanOfDemanda
        if self._wantsTest(trainOrTestOrBoth):
            self.test1.loc[:, "DemandaGeneralMean"] = meanOfDemanda
            self.test2.loc[:, "DemandaGeneralMean"] = meanOfDemanda
        gc.collect()

    def AddConfigurableFeaturesToTrain(self, config):
        """Adds grouped aggregates of ``Demanda_uni_equil`` as feature columns.

        ``config`` is a ConfigElements-like object, for example
        ConfigElements(0, [("A", ["Semana", "Agencia_ID"], ["count", "count"]), ...]).

        For every (name, groups, aggregate) entry:
          * train rows up to week ``ValidationEnd - lag`` are grouped by
            ``groups`` and aggregated with ``aggregate[0]``; when the lag is
            non-zero the week number is shifted forward by the lag first;
          * when ``aggregate`` has a second entry, "Semana" is dropped and the
            result is aggregated again over ``groups[1:]`` (this assumes
            "Semana" is the first group key -- TODO confirm with callers);
          * the result is left-joined onto train, test1 and (unless the lag
            is 1) test2 as column ``name``;
          * when ``config.targetVariable`` is set, its still-null rows are
            filled from ``name``, and ``name`` is dropped again when
            ``config.deleteColumns`` is true.
        """
        if config.lag > self.maxLag:
            self.maxLag = config.lag

        tempData = self.train[self.train['Semana'].values <= (self.ValidationEnd - config.lag)]
        if config.lag != 0:
            tempData.loc[:, 'Semana'] = tempData['Semana'].values + config.lag

        targetVariable = config.targetVariable
        # test2 is left untouched for lag 1 throughout this method.
        usesTest2 = config.lag != 1

        # The target column is filled iteratively below; create it only once.
        if targetVariable != "" and targetVariable not in self.train.columns:
            self.train.loc[:, targetVariable] = np.nan
            self.test1.loc[:, targetVariable] = np.nan
            if usesTest2:
                self.test2.loc[:, targetVariable] = np.nan

        for name, groups, aggregate in config.nameAndGroups:
            if name not in self.train.columns:
                print("{} is not in columns..".format(name))

                groupedDataframe = tempData[groups + ['Demanda_uni_equil']].copy().groupby(groups).agg(aggregate[0])
                gc.collect()
                groupedDataframe.columns = [name]

                # Two aggregates: the second is applied to the per-week
                # results after the week key has been removed.
                if len(aggregate) > 1:
                    groupedDataframe.reset_index(inplace=True)
                    groupedDataframe.drop("Semana", axis=1, inplace=True)
                    groups = groups[1:]
                    groupedDataframe = groupedDataframe.groupby(groups).agg(aggregate[1])
                    groupedDataframe.columns = [name]
                    gc.collect()

                display(groupedDataframe.head(2))
                self.train = self._mergeGrouped(self.train, groupedDataframe, groups)
                gc.collect()
                self.test1 = self._mergeGrouped(self.test1, groupedDataframe, groups)
                gc.collect()
                if usesTest2:
                    self.test2 = self._mergeGrouped(self.test2, groupedDataframe, groups)

                del groupedDataframe
                gc.collect()
            else:
                print("{} is in columns..".format(name))

            display(self.train.head(2))
            display(self.test1.head(2))
            display(self.test2.head(2))

            if targetVariable != "":
                self._fillMissingTarget(self.train, targetVariable, name)
                self._fillMissingTarget(self.test1, targetVariable, name)
                if usesTest2:
                    self._fillMissingTarget(self.test2, targetVariable, name)

                count = self.test1[targetVariable].isnull().sum()
                print("Count of missing numbers after {} in validation part 1 in column {} is {}".format(
                    name, targetVariable, str(count)))
                if usesTest2:
                    count = self.test2.loc[:, targetVariable].isnull().sum()
                    print("Count of missing numbers after {} in validation part 2 in column {} is {}".format(
                        name, targetVariable, str(count)))

                # Note: this also drops ``name`` when the column already
                # existed before this call.
                if config.deleteColumns:
                    self.train.drop(name, axis=1, inplace=True)
                    self.test1.drop(name, axis=1, inplace=True)
                    if usesTest2:
                        self.test2.drop(name, axis=1, inplace=True)
                gc.collect()

        del tempData
        display(self.train.head(2))
        display(self.test1.head(2))
        display(self.test2.head(2))
        gc.collect()
        return

    def DeleteLaggedWeeksFromTrain(self, firstWeek=3):
        """Keeps only train rows with ``Semana >= firstWeek + maxLag``.

        ``firstWeek`` defaults to 3, the value that was previously hard-coded.
        """
        self.train = self.train[self.train['Semana'].values >= (firstWeek + self.maxLag)]
        gc.collect()
        display(self.train.head(2))

    # ------------------------------------------------------------------
    # Combining / splitting frames
    # ------------------------------------------------------------------
    def AppendTestToTrain(self, deleteTest=True):
        """Appends test1 and, when present, test2 to train with a fresh index.

        Use when concatenating train and validation before predicting the
        real test set.  With ``deleteTest`` the appended frames are removed
        from the instance afterwards.
        """
        # pd.concat is the supported spelling; DataFrame.append was removed in pandas 2.
        self.train = pd.concat([self.train, self.test1], ignore_index=True)
        gc.collect()
        if deleteTest:
            del self.test1
            gc.collect()

        # test2 is optional: only a missing attribute is tolerated, any other
        # failure now surfaces instead of being silently swallowed.
        test2 = getattr(self, 'test2', None)
        if test2 is None:
            return
        self.train = pd.concat([self.train, test2], ignore_index=True)
        del test2
        gc.collect()
        if deleteTest:
            del self.test2
            gc.collect()

    def SplitTrainToTestUsingValidationStart(self):
        """Splits train into train (< ValidationStart), test1 and test2.

        Peak memory is higher than train alone because test1, test2 and the
        reduced train exist next to the original until it is released.
        (An earlier drop()-based implementation was noted as performing badly.)
        """
        weeks = self.train.Semana.values
        self.test1 = self.train[weeks == self.ValidationStart]
        self.test2 = self.train[weeks == self.ValidationEnd]
        # Use this instance, not the global ``FE`` the original referred to.
        self.train = self.train[weeks < self.ValidationStart]
        del weeks
        gc.collect()
        gc.collect()

In [55]:
class ConfigElements:
    """Describes one batch of grouped features for AddConfigurableFeaturesToTrain.

    lag            -- week offset stored as given.
    nameAndGroups  -- the feature definitions, stored as given.
    targetVariable -- name of a column whose missing values (np.nan) are
                      filled feature by feature; with the default "" every
                      feature is kept as its own column in the DataFrame.
    deleteColumns  -- flag stored as given.
    """

    def __init__(self, lag, nameAndGroups, targetVariable="", deleteColumns = False):
        # What to compute.
        self.nameAndGroups = nameAndGroups
        self.lag = lag
        # What to do with the computed columns.
        self.deleteColumns = deleteColumns
        self.targetVariable = targetVariable

In [56]:
# Explicit dtypes for the columns read from train.csv.
trainColumnTypes = {
    'Semana': np.uint8,
    'Agencia_ID': np.uint16,
    'Canal_ID': np.uint8,
    'Ruta_SAK': np.uint16,
    'Cliente_ID': np.uint32,
    'Producto_ID': np.uint16,
    'Venta_uni_hoy': np.uint16,
    'Venta_hoy': np.float32,
    'Dev_uni_proxima': np.uint32,
    'Dev_proxima': np.float32,
    'Demanda_uni_equil': np.uint32,
}

# Explicit dtypes for the columns read from test.csv.
testColumnTypes = {
    'id': np.uint32,
    'Semana': np.uint8,
    'Agencia_ID': np.uint16,
    'Canal_ID': np.uint8,
    'Ruta_SAK': np.uint16,
    'Cliente_ID': np.uint32,
    'Producto_ID': np.uint16,
}

# Keyword arguments for the FeatureEngineering constructor.
parameterDict = dict(
    ValidationStart=10,
    ValidationEnd=11,
    maxLag=3,
    trainHdfPath='../../input/train_full.h5',
    trainHdfFile="train",
    testHdfPath1="../../input/test1_full.h5",
    testHdfPath2="../../input/test2_full.h5",
    testHdfFile="test",
    trainTypes=trainColumnTypes,
    testTypes=testColumnTypes,
    trainCsvPath='../../input/train.csv',
    testCsvPath='../../input/test.csv',
)

FE = FeatureEngineering(**parameterDict)
# Dump the stored configuration as a sanity check.
print(FE.__dict__)

{'trainCsvPath': '../../input/train.csv', 'maxLag': 3, 'testTypes': {'Cliente_ID': <type 'numpy.uint32'>, 'Ruta_SAK': <type 'numpy.uint16'>, 'Canal_ID': <type 'numpy.uint8'>, 'Producto_ID': <type 'numpy.uint16'>, 'Agencia_ID': <type 'numpy.uint16'>, 'Semana': <type 'numpy.uint8'>, 'id': <type 'numpy.uint32'>}, 'testHdfFile': 'test', 'trainTypes': {'Dev_proxima': <type 'numpy.float32'>, 'Venta_uni_hoy': <type 'numpy.uint16'>, 'Cliente_ID': <type 'numpy.uint32'>, 'Demanda_uni_equil': <type 'numpy.uint32'>, 'Ruta_SAK': <type 'numpy.uint16'>, 'Canal_ID': <type 'numpy.uint8'>, 'Venta_hoy': <type 'numpy.float32'>, 'Producto_ID': <type 'numpy.uint16'>, 'Agencia_ID': <type 'numpy.uint16'>, 'Dev_uni_proxima': <type 'numpy.uint32'>, 'Semana': <type 'numpy.uint8'>}, 'testHdfPath1': '../../input/test1_full.h5', 'ValidationEnd': 11, 'testHdfPath2': '../../input/test2_full.h5', 'testCsvPath': '../../input/test.csv', 'ValidationStart': 10, 'trainHdfFile': 'train', 'trainHdfPath': '../../input/train_f

In [57]:
# Load train.csv into FE.train and test.csv into FE.test1 / FE.test2 (split by Semana).
FE.ReadCsv('both')

Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,Demanda_uni_equil
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,3
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,4


<class 'pandas.core.frame.DataFrame'>
RangeIndex: 74180464 entries, 0 to 74180463
Data columns (total 11 columns):
Semana               uint8
Agencia_ID           uint16
Canal_ID             uint8
Ruta_SAK             uint16
Cliente_ID           uint32
Producto_ID          uint16
Venta_uni_hoy        uint16
Venta_hoy            float32
Dev_uni_proxima      uint32
Dev_proxima          float32
Demanda_uni_equil    uint32
dtypes: float32(2), uint16(4), uint32(3), uint8(2)
memory usage: 2.1 GB
None


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID
2,2,10,2045,1,2831,4549769,32940
7,7,10,1612,1,2837,4414012,35305


<class 'pandas.core.frame.DataFrame'>
Int64Index: 3538385 entries, 2 to 6999247
Data columns (total 7 columns):
id             uint32
Semana         uint8
Agencia_ID     uint16
Canal_ID       uint8
Ruta_SAK       uint16
Cliente_ID     uint32
Producto_ID    uint16
dtypes: uint16(3), uint32(2), uint8(2)
memory usage: 81.0 MB
None


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID
0,0,11,4037,1,2209,4639078,35305
1,1,11,2237,1,1226,4705135,1238


<class 'pandas.core.frame.DataFrame'>
Int64Index: 3460866 entries, 0 to 6999250
Data columns (total 7 columns):
id             uint32
Semana         uint8
Agencia_ID     uint16
Canal_ID       uint8
Ruta_SAK       uint16
Cliente_ID     uint32
Producto_ID    uint16
dtypes: uint16(3), uint32(2), uint8(2)
memory usage: 79.2 MB
None


## Merge town and products..

In [58]:
# Build a small Agencia_ID -> (Town_ID, State_ID) lookup and join it onto all three frames.
townstate = pd.read_csv("../../input/town_state.csv", encoding='utf-8')

# Town_ID is the first four characters of the Town string.
townstate['Town_ID'] = townstate['Town'].str[:4]

# State_ID is a label-encoded version of the State name.
states = townstate['State']
le = preprocessing.LabelEncoder()
townstate['State_ID'] = le.fit_transform(states)

# Only numeric columns remain after dropping the text ones; shrink their dtypes.
townstate = townstate.drop(['Town', 'State'], axis=1).astype('uint16')
townstate['State_ID'] = townstate['State_ID'].astype('uint8')

FE.train = FE.train.merge(townstate, on='Agencia_ID', how='left', sort=False, copy=False)
gc.collect()
FE.test1 = FE.test1.merge(townstate, on='Agencia_ID', how='left', sort=False, copy=False)
gc.collect()
FE.test2 = FE.test2.merge(townstate, on='Agencia_ID', how='left', sort=False, copy=False)
gc.collect()

98

In [59]:
# Derive numeric product features from the free-text product name and join
# them onto all three frames by Producto_ID.
products = pd.read_csv("../../input/producto_tabla.csv")

# Raw strings keep the regex escapes (\D, \s, \d) away from Python's own
# string-escape processing; the patterns themselves are unchanged.
products['short_name'] = products.NombreProducto.str.extract(r'^(\D*)', expand=False)
products['brand'] = products.NombreProducto.str.extract(r'^.+\s(\D+) \d+$', expand=False)
w = products.NombreProducto.str.extract(r'(\d+)(Kg|g)', expand=True)
# Weight in grams: the number times 1000 for "Kg", times 1 for "g".
products['weight'] = w[0].astype('float') * w[1].map({'Kg': 1000, 'g': 1})
products['pieces'] = products.NombreProducto.str.extract(r'(\d+)p ', expand=False).astype('float')

# Load the stopword list once; the original re-read it for every word of
# every product name.
spanishStopwords = set(nltk.corpus.stopwords.words("spanish"))
stemmer = SnowballStemmer("spanish")
# Lower-case, drop Spanish stopwords, then stem each remaining word.
products['short_name_processed'] = products['short_name'].map(
    lambda x: " ".join(stemmer.stem(i) for i in x.lower().split() if i not in spanishStopwords))

le = preprocessing.LabelEncoder()

products['Prod_name_ID'] = le.fit_transform(products['short_name_processed'])
products['Brand_ID'] = le.fit_transform(products['brand'])

products = products.drop(['short_name', 'brand', 'short_name_processed', 'NombreProducto'], axis=1)
# Names without a weight or piece count get 0 for that feature.
products.fillna(value=0, inplace=True)
products[['pieces', 'Brand_ID']] = products[['pieces', 'Brand_ID']].astype('uint8')
products[['Producto_ID', 'weight', 'Prod_name_ID']] = (
    products[['Producto_ID', 'weight', 'Prod_name_ID']].astype('uint16'))

FE.train = pd.merge(FE.train, products, on='Producto_ID', how='left', sort=False, copy=False)
gc.collect()
FE.test1 = pd.merge(FE.test1, products, on='Producto_ID', how='left', sort=False, copy=False)
gc.collect()
FE.test2 = pd.merge(FE.test2, products, on='Producto_ID', how='left', sort=False, copy=False)
gc.collect()

14

## Check NA values here.

In [60]:
# Show every train row that has a null in at least one column.
FE.train[FE.train.isnull().any(axis=1)]

Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,Demanda_uni_equil,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID


In [61]:
# Show every test1 row that has a null in at least one column.
FE.test1[FE.test1.isnull().any(axis=1)]

Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID


In [62]:
# Show every test2 row that has a null in at least one column.
FE.test2[FE.test2.isnull().any(axis=1)]

Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID


## Last State of Train, test1 and test2..

In [63]:
# Preview the first two rows of train, test1 and test2, in that order.
for frame in (FE.train, FE.test1, FE.test2):
    display(frame.head(2))
# Drop the loop variable so it does not keep a frame alive.
del frame

Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,Demanda_uni_equil,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,3,2008,16,120,2,709,4
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,4,2008,16,135,2,712,4


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4


## Convert to Log..

In [64]:
# Replace the demand by log1p(demand) and keep the rounded inverse transform
# in a separate "_original" column.
logDemand = np.log1p(FE.train["Demanda_uni_equil"].values)
FE.train.loc[:, "Demanda_uni_equil"] = logDemand
del logDemand
FE.train.loc[:, "Demanda_uni_equil_original"] = np.round(
    np.expm1(FE.train["Demanda_uni_equil"])
)
gc.collect()

94

## Split Train to test1 test2

In [65]:
#FE.SplitTrainToTestUsingValidationStart()

## Add DemandaNotEqualTheDifferenceOfVentaUniAndDev to model products delivered later..

In [66]:
# Flag rows where the demand is smaller than (units sold - units returned).
# Venta_uni_hoy is uint16 and Dev_uni_proxima is uint32, so subtracting them
# directly wraps around to a huge positive number whenever the returns exceed
# the sales, which wrongly set the flag.  The comparison is rearranged to
# demand + returns < sales; the demand column is floating point, so the sum
# is computed in floating point and cannot wrap.
FE.train.loc[:,"DemandaNotEqualTheDifferenceOfVentaUniAndDev"] = (
    FE.train.Demanda_uni_equil_original.values + FE.train.Dev_uni_proxima.values
) < FE.train.Venta_uni_hoy.values
gc.collect()

7

## Delete Demanda = 0  and Venta = 0

In [67]:
# Drop the rows where both the demand and the units sold are zero.
zeroDemand = FE.train.Demanda_uni_equil_original == 0
zeroSales = FE.train.Venta_uni_hoy == 0
FE.train = FE.train.loc[~(zeroDemand & zeroSales)]
del zeroDemand, zeroSales
gc.collect()

35

In [68]:
# Write train, test1 and test2 to their configured HDF5 files.
FE.SaveDataFrameToHdf('both')

In [69]:
# Reload train, test1 and test2 from the HDF5 files.
FE.ReadHdf('both')

Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,Demanda_uni_equil,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,1.386294,2008,16,120,2,709,4,3.0,False
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,1.609438,2008,16,135,2,712,4,4.0,False


<class 'pandas.core.frame.DataFrame'>
Int64Index: 73877905 entries, 0 to 74180463
Data columns (total 19 columns):
Semana                                          uint8
Agencia_ID                                      uint16
Canal_ID                                        uint8
Ruta_SAK                                        uint16
Cliente_ID                                      uint32
Producto_ID                                     uint16
Venta_uni_hoy                                   uint16
Venta_hoy                                       float32
Dev_uni_proxima                                 uint32
Dev_proxima                                     float32
Demanda_uni_equil                               float64
Town_ID                                         uint16
State_ID                                        uint8
weight                                          uint16
pieces                                          uint8
Prod_name_ID                                    uint16
Brand_

Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23


<class 'pandas.core.frame.DataFrame'>
Int64Index: 3538385 entries, 0 to 3538384
Data columns (total 13 columns):
id              uint32
Semana          uint8
Agencia_ID      uint16
Canal_ID        uint8
Ruta_SAK        uint16
Cliente_ID      uint32
Producto_ID     uint16
Town_ID         uint16
State_ID        uint8
weight          uint16
pieces          uint8
Prod_name_ID    uint16
Brand_ID        uint8
dtypes: uint16(6), uint32(2), uint8(5)
memory usage: 111.4 MB
None


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4


<class 'pandas.core.frame.DataFrame'>
Int64Index: 3460866 entries, 0 to 3460865
Data columns (total 13 columns):
id              uint32
Semana          uint8
Agencia_ID      uint16
Canal_ID        uint8
Ruta_SAK        uint16
Cliente_ID      uint32
Producto_ID     uint16
Town_ID         uint16
State_ID        uint8
weight          uint16
pieces          uint8
Prod_name_ID    uint16
Brand_ID        uint8
dtypes: uint16(6), uint32(2), uint8(5)
memory usage: 108.9 MB
None


## Grouping for Lag0

In [70]:
#FE.train = FE.train.drop(['Lag0'], axis=1)  ## to rebuild Lag0: uncomment and run this once, then comment it out again.

In [71]:
def _buildLag0NameAndGroups():
    """Return the list of (name, columns, aggregations) tuples for the Lag0 config.

    For each of the three key columns (Producto_ID, Prod_name_ID, Brand_ID)
    the same 14 column combinations are emitted, from the most specific
    (key + client + route + agency + channel) down to the key column alone.
    Every tuple is ``(featureName, [keyColumn, ...extraColumns], ["mean"])``.

    Feature names follow the scheme ``"S" + keyCode + columnCodes + "0_mean"``,
    e.g. ``"SPClRACh0_mean"`` or ``"SBSt0_mean"``.

    The order of the entries is kept exactly as it was hand-written; the cell
    output shows the count of missing ``Lag0`` values shrinking after each
    feature, so the order presumably matters to the consumer -- do not sort.
    """
    # Short code used inside the feature name for each non-key column.
    columnCodes = {
        "Cliente_ID": "Cl",
        "Ruta_SAK": "R",
        "Agencia_ID": "A",
        "Canal_ID": "Ch",
        "Town_ID": "T",
        "State_ID": "St",
    }
    # (code used in the feature name, key column), in emission order.
    keyColumns = (
        ("P", "Producto_ID"),
        ("Pn", "Prod_name_ID"),  # product-name block
        ("B", "Brand_ID"),       # brand-id block
    )
    # Columns combined with the key column, most specific first.
    extraColumnSets = (
        ("Cliente_ID", "Ruta_SAK", "Agencia_ID", "Canal_ID"),
        ("Cliente_ID", "Ruta_SAK", "Agencia_ID"),
        ("Cliente_ID", "Ruta_SAK", "Canal_ID"),
        ("Cliente_ID", "Agencia_ID", "Canal_ID"),
        ("Cliente_ID", "Ruta_SAK"),
        ("Cliente_ID", "Agencia_ID"),
        ("Cliente_ID", "Canal_ID"),
        ("Cliente_ID",),
        ("Ruta_SAK",),
        ("Agencia_ID",),
        ("Canal_ID",),
        ("Town_ID",),
        ("State_ID",),
        (),
    )

    nameAndGroups = []
    for keyCode, keyColumn in keyColumns:
        for extraColumns in extraColumnSets:
            suffix = "".join(columnCodes[column] for column in extraColumns)
            featureName = "S" + keyCode + suffix + "0_mean"
            # Fresh list objects per entry, as in the hand-written literal,
            # so no two entries share a mutable list.
            nameAndGroups.append(
                (featureName, [keyColumn] + list(extraColumns), ["mean"]))
    return nameAndGroups


# Lag0 configuration: 3 key columns x 14 column combinations = 42 features.
# The positional arguments (0, entries, "Lag0", True) are passed through
# unchanged; ConfigElements is defined elsewhere in the notebook.
# NOTE(review): the variable name says "DeleteColumnsFalse" while the last
# argument is True -- confirm against ConfigElements' signature.
configLag0Target1DeleteColumnsFalse = ConfigElements(
    0, _buildLag0NameAndGroups(), "Lag0", True)
# Single-argument print(...) behaves the same on Python 2 and Python 3.
print(configLag0Target1DeleteColumnsFalse.__dict__)

{'nameAndGroups': [('SPClRACh0_mean', ['Producto_ID', 'Cliente_ID', 'Ruta_SAK', 'Agencia_ID', 'Canal_ID'], ['mean']), ('SPClRA0_mean', ['Producto_ID', 'Cliente_ID', 'Ruta_SAK', 'Agencia_ID'], ['mean']), ('SPClRCh0_mean', ['Producto_ID', 'Cliente_ID', 'Ruta_SAK', 'Canal_ID'], ['mean']), ('SPClACh0_mean', ['Producto_ID', 'Cliente_ID', 'Agencia_ID', 'Canal_ID'], ['mean']), ('SPClR0_mean', ['Producto_ID', 'Cliente_ID', 'Ruta_SAK'], ['mean']), ('SPClA0_mean', ['Producto_ID', 'Cliente_ID', 'Agencia_ID'], ['mean']), ('SPClCh0_mean', ['Producto_ID', 'Cliente_ID', 'Canal_ID'], ['mean']), ('SPCl0_mean', ['Producto_ID', 'Cliente_ID'], ['mean']), ('SPR0_mean', ['Producto_ID', 'Ruta_SAK'], ['mean']), ('SPA0_mean', ['Producto_ID', 'Agencia_ID'], ['mean']), ('SPCh0_mean', ['Producto_ID', 'Canal_ID'], ['mean']), ('SPT0_mean', ['Producto_ID', 'Town_ID'], ['mean']), ('SPSt0_mean', ['Producto_ID', 'State_ID'], ['mean']), ('SP0_mean', ['Producto_ID'], ['mean']), ('SPnClRACh0_mean', ['Prod_name_ID', 'Clien

In [72]:
# Hand the Lag0 configuration to FE.AddConfigurableFeaturesToTrain (defined
# outside this cell). Per the captured output, each configured feature yields
# a "<name> is not in columns.." line, preview tables, and the count of
# missing Lag0 values in validation parts 1 and 2.
# NOTE(review): FE is presumably a FeatureEngineering instance -- confirm.
FE.AddConfigurableFeaturesToTrain(configLag0Target1DeleteColumnsFalse)

SPClRACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPClRACh0_mean
Producto_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Canal_ID,Unnamed: 5_level_1
41,146030,3303,2281,7,4.069195
41,465617,3306,2281,7,0.0


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPClRACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClRACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClRACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,,


Count of missing numbers after SPClRACh0_mean in validation part 1 in column Lag0 is 624259
Count of missing numbers after SPClRACh0_mean in validation part 2 in column Lag0 is 828166
SPClRA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPClRA0_mean
Producto_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Unnamed: 4_level_1
41,146030,3303,2281,4.069195
41,465617,3306,2281,0.0


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPClRA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClRA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClRA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,,


Count of missing numbers after SPClRA0_mean in validation part 1 in column Lag0 is 624074
Count of missing numbers after SPClRA0_mean in validation part 2 in column Lag0 is 827945
SPClRCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPClRCh0_mean
Producto_ID,Cliente_ID,Ruta_SAK,Canal_ID,Unnamed: 4_level_1
41,146030,3303,7,4.069195
41,465617,3306,7,0.0


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPClRCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClRCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClRCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,,


Count of missing numbers after SPClRCh0_mean in validation part 1 in column Lag0 is 623991
Count of missing numbers after SPClRCh0_mean in validation part 2 in column Lag0 is 827777
SPClACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPClACh0_mean
Producto_ID,Cliente_ID,Agencia_ID,Canal_ID,Unnamed: 4_level_1
41,146030,2281,7,4.069195
41,465617,2281,7,0.0


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPClACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,,


Count of missing numbers after SPClACh0_mean in validation part 1 in column Lag0 is 593162
Count of missing numbers after SPClACh0_mean in validation part 2 in column Lag0 is 780539
SPClR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPClR0_mean
Producto_ID,Cliente_ID,Ruta_SAK,Unnamed: 3_level_1
41,146030,3303,4.069195
41,465617,3306,0.0


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPClR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,,


Count of missing numbers after SPClR0_mean in validation part 1 in column Lag0 is 593162
Count of missing numbers after SPClR0_mean in validation part 2 in column Lag0 is 780539
SPClA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPClA0_mean
Producto_ID,Cliente_ID,Agencia_ID,Unnamed: 3_level_1
41,146030,2281,4.069195
41,465617,2281,0.0


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPClA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,,


Count of missing numbers after SPClA0_mean in validation part 1 in column Lag0 is 592491
Count of missing numbers after SPClA0_mean in validation part 2 in column Lag0 is 779576
SPClCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPClCh0_mean
Producto_ID,Cliente_ID,Canal_ID,Unnamed: 3_level_1
41,146030,7,4.069195
41,465617,7,0.0


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPClCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPClCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,,


Count of missing numbers after SPClCh0_mean in validation part 1 in column Lag0 is 592235
Count of missing numbers after SPClCh0_mean in validation part 2 in column Lag0 is 779154
SPCl0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPCl0_mean
Producto_ID,Cliente_ID,Unnamed: 2_level_1
41,146030,4.069195
41,465617,0.0


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPCl0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPCl0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPCl0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,,


Count of missing numbers after SPCl0_mean in validation part 1 in column Lag0 is 592088
Count of missing numbers after SPCl0_mean in validation part 2 in column Lag0 is 778958
SPR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPR0_mean
Producto_ID,Ruta_SAK,Unnamed: 2_level_1
41,3201,3.069398
41,3301,4.890607


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.546243
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.671644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.355031
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,,1.892663


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.630124
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,,1.011156


Count of missing numbers after SPR0_mean in validation part 1 in column Lag0 is 61632
Count of missing numbers after SPR0_mean in validation part 2 in column Lag0 is 100241
SPA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPA0_mean
Producto_ID,Agencia_ID,Unnamed: 2_level_1
41,1958,3.15745
41,2278,4.890607


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.585812
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.430041


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.527452
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.047667


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.903316
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.020974


Count of missing numbers after SPA0_mean in validation part 1 in column Lag0 is 56956
Count of missing numbers after SPA0_mean in validation part 2 in column Lag0 is 93950
SPCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPCh0_mean
Producto_ID,Canal_ID,Unnamed: 2_level_1
41,7,4.739156
53,4,4.118901


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.515955
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.5201


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.424204
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.069688


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,2.069688
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.196969


Count of missing numbers after SPCh0_mean in validation part 1 in column Lag0 is 1899
Count of missing numbers after SPCh0_mean in validation part 2 in column Lag0 is 23998
SPT0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPT0_mean
Producto_ID,Town_ID,Unnamed: 2_level_1
41,2288,3.15745
41,2381,5.432942


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPT0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.717298
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.546708


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPT0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.527452
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.047667


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPT0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.988828
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.068752


Count of missing numbers after SPT0_mean in validation part 1 in column Lag0 is 1891
Count of missing numbers after SPT0_mean in validation part 2 in column Lag0 is 23980
SPSt0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPSt0_mean
Producto_ID,State_ID,Unnamed: 2_level_1
41,22,4.891297
41,25,3.15745


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPSt0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.392923
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.262543


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPSt0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.418262
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.089995


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPSt0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,2.036969
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.097953


Count of missing numbers after SPSt0_mean in validation part 1 in column Lag0 is 1868
Count of missing numbers after SPSt0_mean in validation part 2 in column Lag0 is 23954
SP0_mean is not in columns..


Unnamed: 0_level_0,SP0_mean
Producto_ID,Unnamed: 1_level_1
41,4.739156
53,4.118901


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SP0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.162178
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.189524


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SP0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.447214
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.083995


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SP0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,2.083995
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.235078


Count of missing numbers after SP0_mean in validation part 1 in column Lag0 is 1809
Count of missing numbers after SP0_mean in validation part 2 in column Lag0 is 23848
SPnClRACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPnClRACh0_mean
Prod_name_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Canal_ID,Unnamed: 5_level_1
0,60,7238,2061,2,4.956561
0,65,7250,2061,2,4.071269


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnClRACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClRACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.589027


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClRACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.700599
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,


Count of missing numbers after SPnClRACh0_mean in validation part 1 in column Lag0 is 1658
Count of missing numbers after SPnClRACh0_mean in validation part 2 in column Lag0 is 23412
SPnClRA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPnClRA0_mean
Prod_name_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Unnamed: 4_level_1
0,60,7238,2061,4.956561
0,65,7250,2061,4.071269


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnClRA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClRA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.589027


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClRA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.700599
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,


Count of missing numbers after SPnClRA0_mean in validation part 1 in column Lag0 is 1658
Count of missing numbers after SPnClRA0_mean in validation part 2 in column Lag0 is 23412
SPnClRCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPnClRCh0_mean
Prod_name_ID,Cliente_ID,Ruta_SAK,Canal_ID,Unnamed: 4_level_1
0,60,7238,2,4.956561
0,65,7250,2,4.071269


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnClRCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClRCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.589027


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClRCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.700599
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,


Count of missing numbers after SPnClRCh0_mean in validation part 1 in column Lag0 is 1657
Count of missing numbers after SPnClRCh0_mean in validation part 2 in column Lag0 is 23412
SPnClACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPnClACh0_mean
Prod_name_ID,Cliente_ID,Agencia_ID,Canal_ID,Unnamed: 4_level_1
0,60,2061,2,4.956561
0,65,2061,2,4.071269


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnClACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.589027


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.700599
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,


Count of missing numbers after SPnClACh0_mean in validation part 1 in column Lag0 is 1657
Count of missing numbers after SPnClACh0_mean in validation part 2 in column Lag0 is 23411
SPnClR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnClR0_mean
Prod_name_ID,Cliente_ID,Ruta_SAK,Unnamed: 3_level_1
0,60,7238,4.956561
0,65,7250,4.071269


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnClR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.589027


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.700599
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,


Count of missing numbers after SPnClR0_mean in validation part 1 in column Lag0 is 1657
Count of missing numbers after SPnClR0_mean in validation part 2 in column Lag0 is 23411
SPnClA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnClA0_mean
Prod_name_ID,Cliente_ID,Agencia_ID,Unnamed: 3_level_1
0,60,2061,4.956561
0,65,2061,4.071269


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnClA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.589027


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.700599
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,


Count of missing numbers after SPnClA0_mean in validation part 1 in column Lag0 is 1657
Count of missing numbers after SPnClA0_mean in validation part 2 in column Lag0 is 23411
SPnClCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnClCh0_mean
Prod_name_ID,Cliente_ID,Canal_ID,Unnamed: 3_level_1
0,60,2,4.956561
0,65,2,4.071269


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnClCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.589027


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnClCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.700599
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,


Count of missing numbers after SPnClCh0_mean in validation part 1 in column Lag0 is 1657
Count of missing numbers after SPnClCh0_mean in validation part 2 in column Lag0 is 23411
SPnCl0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPnCl0_mean
Prod_name_ID,Cliente_ID,Unnamed: 2_level_1
0,60,4.956561
0,65,4.071269


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnCl0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnCl0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.589027


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnCl0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.700599
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,


Count of missing numbers after SPnCl0_mean in validation part 1 in column Lag0 is 1657
Count of missing numbers after SPnCl0_mean in validation part 2 in column Lag0 is 23411
SPnR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPnR0_mean
Prod_name_ID,Ruta_SAK,Unnamed: 2_level_1
0,1,4.026461
0,2,3.944476


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.542243
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.696842


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.357188
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.88037


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.506812
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.004544


Count of missing numbers after SPnR0_mean in validation part 1 in column Lag0 is 1608
Count of missing numbers after SPnR0_mean in validation part 2 in column Lag0 is 21720
SPnA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPnA0_mean
Prod_name_ID,Agencia_ID,Unnamed: 2_level_1
0,1110,1.851679
0,1114,3.610578


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.598989
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.442348


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.527452
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.016902


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.879516
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.020974


Count of missing numbers after SPnA0_mean in validation part 1 in column Lag0 is 1608
Count of missing numbers after SPnA0_mean in validation part 2 in column Lag0 is 21719
SPnCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPnCh0_mean
Prod_name_ID,Canal_ID,Unnamed: 2_level_1
0,1,2.087308
0,2,3.256293


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.497963
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.520939


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.432977
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.053326


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,2.053326
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.189575


Count of missing numbers after SPnCh0_mean in validation part 1 in column Lag0 is 1215
Count of missing numbers after SPnCh0_mean in validation part 2 in column Lag0 is 17825
SPnT0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPnT0_mean
Prod_name_ID,Town_ID,Unnamed: 2_level_1
0,2008,1.851679
0,2011,3.478428


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnT0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.606481
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.510445


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnT0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.527452
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.049042


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnT0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.977842
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.068752


Count of missing numbers after SPnT0_mean in validation part 1 in column Lag0 is 1215
Count of missing numbers after SPnT0_mean in validation part 2 in column Lag0 is 17825
SPnSt0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPnSt0_mean
Prod_name_ID,State_ID,Unnamed: 2_level_1
0,0,3.356161
0,1,2.564422


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPnSt0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.325219
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.204164


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnSt0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.418262
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.127518


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPnSt0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,2.068745
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.097953


Count of missing numbers after SPnSt0_mean in validation part 1 in column Lag0 is 1215
Count of missing numbers after SPnSt0_mean in validation part 2 in column Lag0 is 17824
SPn0_mean is not in columns..


Unnamed: 0_level_0,SPn0_mean
Prod_name_ID,Unnamed: 1_level_1
0,3.036257
1,3.699834


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SPn0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.149752
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.202437


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPn0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.461948
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,2.101496


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SPn0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,2.101496
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.232832


Count of missing numbers after SPn0_mean in validation part 1 in column Lag0 is 1215
Count of missing numbers after SPn0_mean in validation part 2 in column Lag0 is 17824
SBClRACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SBClRACh0_mean
Brand_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Canal_ID,Unnamed: 5_level_1
1,652734,3003,1974,5,0.0
3,1589,3915,2095,11,1.791759


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBClRACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.568451
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.568451


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClRACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.76314
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.447219


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClRACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.179669
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.255255


Count of missing numbers after SBClRACh0_mean in validation part 1 in column Lag0 is 1020
Count of missing numbers after SBClRACh0_mean in validation part 2 in column Lag0 is 1074
SBClRA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SBClRA0_mean
Brand_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Unnamed: 4_level_1
1,652734,3003,1974,0.0
3,1589,3915,2095,1.791759


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBClRA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.568451
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.568451


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClRA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.76314
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.447219


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClRA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.179669
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.255255


Count of missing numbers after SBClRA0_mean in validation part 1 in column Lag0 is 1020
Count of missing numbers after SBClRA0_mean in validation part 2 in column Lag0 is 1074
SBClRCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SBClRCh0_mean
Brand_ID,Cliente_ID,Ruta_SAK,Canal_ID,Unnamed: 4_level_1
1,652734,3003,5,0.0
3,1589,3915,11,1.791759


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBClRCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.568451
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.568451


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClRCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.76314
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.447219


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClRCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.179669
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.255255


Count of missing numbers after SBClRCh0_mean in validation part 1 in column Lag0 is 1020
Count of missing numbers after SBClRCh0_mean in validation part 2 in column Lag0 is 1074
SBClACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SBClACh0_mean
Brand_ID,Cliente_ID,Agencia_ID,Canal_ID,Unnamed: 4_level_1
1,652734,1974,5,0.0
3,1589,2095,11,1.791759


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBClACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.568451
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.568451


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.76314
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.447219


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.179669
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.255255


Count of missing numbers after SBClACh0_mean in validation part 1 in column Lag0 is 277
Count of missing numbers after SBClACh0_mean in validation part 2 in column Lag0 is 387
SBClR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SBClR0_mean
Brand_ID,Cliente_ID,Ruta_SAK,Unnamed: 3_level_1
1,652734,3003,0.0
3,1589,3915,1.791759


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBClR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.568451
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.568451


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.76314
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.447219


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.179669
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.255255


Count of missing numbers after SBClR0_mean in validation part 1 in column Lag0 is 277
Count of missing numbers after SBClR0_mean in validation part 2 in column Lag0 is 387
SBClA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SBClA0_mean
Brand_ID,Cliente_ID,Agencia_ID,Unnamed: 3_level_1
1,652734,1974,0.0
3,1589,2095,1.791759


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBClA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.568451
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.568451


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.76314
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.447219


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.179669
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.255255


Count of missing numbers after SBClA0_mean in validation part 1 in column Lag0 is 276
Count of missing numbers after SBClA0_mean in validation part 2 in column Lag0 is 385
SBClCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SBClCh0_mean
Brand_ID,Cliente_ID,Canal_ID,Unnamed: 3_level_1
1,652734,5,0.0
3,1589,11,1.791759


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBClCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.568451
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.568451


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.76314
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.447219


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBClCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.179669
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.255255


Count of missing numbers after SBClCh0_mean in validation part 1 in column Lag0 is 276
Count of missing numbers after SBClCh0_mean in validation part 2 in column Lag0 is 383
SBCl0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SBCl0_mean
Brand_ID,Cliente_ID,Unnamed: 2_level_1
1,652734,0.0
3,1589,1.791759


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBCl0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.568451
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.568451


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBCl0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.76314
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.447219


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBCl0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.179669
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.255255


Count of missing numbers after SBCl0_mean in validation part 1 in column Lag0 is 276
Count of missing numbers after SBCl0_mean in validation part 2 in column Lag0 is 383
SBR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SBR0_mean
Brand_ID,Ruta_SAK,Unnamed: 2_level_1
1,3003,0.0
3,3001,4.719562


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,2.09989
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,2.09989


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.525921
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.491275


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.324077
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.385531


Count of missing numbers after SBR0_mean in validation part 1 in column Lag0 is 5
Count of missing numbers after SBR0_mean in validation part 2 in column Lag0 is 6
SBA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SBA0_mean
Brand_ID,Agencia_ID,Unnamed: 2_level_1
1,1974,0.0
3,1110,1.372339


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.972305
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.972305


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.594678
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.629122


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.550291
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.374071


Count of missing numbers after SBA0_mean in validation part 1 in column Lag0 is 2
Count of missing numbers after SBA0_mean in validation part 2 in column Lag0 is 3
SBCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SBCh0_mean
Brand_ID,Canal_ID,Unnamed: 2_level_1
1,5,0.0
3,1,1.544594


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.969045
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.969045


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.603549
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.603549


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.603549
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.504742


Count of missing numbers after SBCh0_mean in validation part 1 in column Lag0 is 2
Count of missing numbers after SBCh0_mean in validation part 2 in column Lag0 is 3
SBT0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SBT0_mean
Brand_ID,Town_ID,Unnamed: 2_level_1
1,2252,0.0
3,2008,1.372339


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBT0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.871154
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.871154


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBT0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.599133
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.667866


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBT0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.677514
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.448905


Count of missing numbers after SBT0_mean in validation part 1 in column Lag0 is 2
Count of missing numbers after SBT0_mean in validation part 2 in column Lag0 is 3
SBSt0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SBSt0_mean
Brand_ID,State_ID,Unnamed: 2_level_1
1,0,0.0
3,0,4.220805


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SBSt0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.719031
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.719031


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBSt0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.555944
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.680662


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SBSt0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.692629
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.474373


Count of missing numbers after SBSt0_mean in validation part 1 in column Lag0 is 2
Count of missing numbers after SBSt0_mean in validation part 2 in column Lag0 is 3
SB0_mean is not in columns..


Unnamed: 0_level_0,SB0_mean
Brand_ID,Unnamed: 1_level_1
1,0.0
3,4.474722


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,SB0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,1.569605
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,1.569605


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SB0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.672447
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.672447


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,SB0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.672447
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,1.569605


Count of missing numbers after SB0_mean in validation part 1 in column Lag0 is 2
Count of missing numbers after SB0_mean in validation part 2 in column Lag0 is 3


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,Demanda_uni_equil,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,1.386294,2008,16,120,2,709,4,3.0,False,1.418015
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,1.609438,2008,16,135,2,712,4,4.0,False,1.279644


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


In [73]:
# Replace every remaining NaN with 0, in place, in the train frame and both test frames.
for _frame in (FE.train, FE.test1, FE.test2):
    _frame.fillna(value=0, inplace=True)

In [74]:
# Persist the frames held by FE to HDF storage.
# NOTE(review): 'both' presumably selects train and test, mirroring the
# trainOrTestOrBoth argument accepted by ReadHdf - confirm against SaveDataFrameToHdf.
FE.SaveDataFrameToHdf('both')

In [75]:
# Score the Lag0 feature against the target column on the train frame using
# ml_metrics.rmse.
# NOTE(review): the label says RMSLE although rmse is called; the displayed rows
# suggest Demanda_uni_equil is stored log1p-transformed (1.386294 for an original
# demand of 3.0), in which case RMSE on these columns corresponds to RMSLE on the
# raw demand - confirm.
# Under the Python 2 print statement the parenthesised pair is printed as a tuple,
# which is why the recorded output looks like ('RMSLE Score:', <value>).
print ('RMSLE Score:', rmse(FE.train.Demanda_uni_equil, FE.train.Lag0))
# The test-frame variants are left disabled; the test frames displayed in this
# notebook do not show a Demanda_uni_equil column to score against.
#print ('RMSLE Score:', rmse(FE.test1.Demanda_uni_equil, FE.test1.Lag0))
#print ('RMSLE Score:', rmse(FE.test2.Demanda_uni_equil, FE.test2.Lag0))

('RMSLE Score:', 0.3188228398904745)


In [76]:
def _buildLag1MeanFeatureSpecs():
    """Return the (featureName, groupByColumns, aggregations) triples for the config.

    Feature names are built from abbreviations of the grouping columns:
    "S" (Semana) + product key ("P" = Producto_ID, "Pn" = Prod_name_ID) +
    the abbreviations of any extra grouping columns + "0_mean".
    Every product key is paired with the same 14 column combinations, listed
    from the most specific grouping to the least specific one, giving 28
    triples in total (all Producto_ID entries first, then all Prod_name_ID).
    """
    columnByAbbreviation = {
        "Cl": "Cliente_ID",
        "R": "Ruta_SAK",
        "A": "Agencia_ID",
        "Ch": "Canal_ID",
        "T": "Town_ID",
        "St": "State_ID",
    }
    # Order matters: it is the order in which the features are handed to ConfigElements.
    extraColumnCombos = (
        ("Cl", "R", "A", "Ch"),
        ("Cl", "R", "A"),
        ("Cl", "R", "Ch"),
        ("Cl", "A", "Ch"),
        ("Cl", "R"),
        ("Cl", "A"),
        ("Cl", "Ch"),
        ("Cl",),
        ("R",),
        ("A",),
        ("Ch",),
        ("T",),
        ("St",),
        (),
    )
    productKeys = (
        ("SP", "Producto_ID"),
        ("SPn", "Prod_name_ID"),  # product-name based variants
    )

    specs = []
    for namePrefix, productColumn in productKeys:
        for combo in extraColumnCombos:
            featureName = namePrefix + "".join(combo) + "0_mean"
            groupByColumns = ["Semana", productColumn]
            groupByColumns.extend(columnByAbbreviation[abbr] for abbr in combo)
            # A fresh ["mean"] list per entry, as in a hand-written literal.
            specs.append((featureName, groupByColumns, ["mean"]))
    return specs


# NOTE(review): the variable name says "DeleteColumnsFalse" while the last
# positional argument is True - confirm against the ConfigElements signature.
configLag0Target1DeleteColumnsFalse = ConfigElements(1, _buildLag1MeanFeatureSpecs(), "Lag1", True)
print(configLag0Target1DeleteColumnsFalse.__dict__)

{'nameAndGroups': [('SPClRACh0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Ruta_SAK', 'Agencia_ID', 'Canal_ID'], ['mean']), ('SPClRA0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Ruta_SAK', 'Agencia_ID'], ['mean']), ('SPClRCh0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Ruta_SAK', 'Canal_ID'], ['mean']), ('SPClACh0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Agencia_ID', 'Canal_ID'], ['mean']), ('SPClR0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Ruta_SAK'], ['mean']), ('SPClA0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Agencia_ID'], ['mean']), ('SPClCh0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Canal_ID'], ['mean']), ('SPCl0_mean', ['Semana', 'Producto_ID', 'Cliente_ID'], ['mean']), ('SPR0_mean', ['Semana', 'Producto_ID', 'Ruta_SAK'], ['mean']), ('SPA0_mean', ['Semana', 'Producto_ID', 'Agencia_ID'], ['mean']), ('SPCh0_mean', ['Semana', 'Producto_ID', 'Canal_ID'], ['mean']), ('SPT0_mean', ['Semana', 'Producto_ID', 'Town_ID'], ['mean']), ('SPSt0_mean', ['Se

In [77]:
# Run the feature configuration built in the previous cell against the frames held by FE.
# The call prints, per configured feature, the grouped-mean table, a preview of
# the frames, and a count of values still missing in the Lag1 column.
# NOTE(review): the falling missing-value counts suggest each feature is used to
# fill gaps left in Lag1 by the previous ones - confirm in AddConfigurableFeaturesToTrain.
FE.AddConfigurableFeaturesToTrain(configLag0Target1DeleteColumnsFalse)

SPClRACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,SPClRACh0_mean
Semana,Producto_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Canal_ID,Unnamed: 6_level_1
4,41,681747,3306,2281,7,7.632886
4,41,684023,3303,2281,7,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPClRACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPClRACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPClRACh0_mean in validation part 1 in column Lag1 is 1205795
SPClRA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPClRA0_mean
Semana,Producto_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Unnamed: 5_level_1
4,41,681747,3306,2281,7.632886
4,41,684023,3303,2281,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPClRA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPClRA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPClRA0_mean in validation part 1 in column Lag1 is 1205666
SPClRCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPClRCh0_mean
Semana,Producto_ID,Cliente_ID,Ruta_SAK,Canal_ID,Unnamed: 5_level_1
4,41,681747,3306,7,7.632886
4,41,684023,3303,7,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPClRCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPClRCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPClRCh0_mean in validation part 1 in column Lag1 is 1205489
SPClACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPClACh0_mean
Semana,Producto_ID,Cliente_ID,Agencia_ID,Canal_ID,Unnamed: 5_level_1
4,41,681747,2281,7,7.632886
4,41,684023,2281,7,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPClACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPClACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPClACh0_mean in validation part 1 in column Lag1 is 1202480
SPClR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPClR0_mean
Semana,Producto_ID,Cliente_ID,Ruta_SAK,Unnamed: 4_level_1
4,41,681747,3306,7.632886
4,41,684023,3303,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPClR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPClR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPClR0_mean in validation part 1 in column Lag1 is 1202480
SPClA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPClA0_mean
Semana,Producto_ID,Cliente_ID,Agencia_ID,Unnamed: 4_level_1
4,41,681747,2281,7.632886
4,41,684023,2281,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPClA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPClA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPClA0_mean in validation part 1 in column Lag1 is 1202456
SPClCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPClCh0_mean
Semana,Producto_ID,Cliente_ID,Canal_ID,Unnamed: 4_level_1
4,41,681747,7,7.632886
4,41,684023,7,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPClCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPClCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPClCh0_mean in validation part 1 in column Lag1 is 1202245
SPCl0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPCl0_mean
Semana,Producto_ID,Cliente_ID,Unnamed: 3_level_1
4,41,681747,7.632886
4,41,684023,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPCl0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPCl0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPCl0_mean in validation part 1 in column Lag1 is 1202156
SPR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPR0_mean
Semana,Producto_ID,Ruta_SAK,Unnamed: 3_level_1
4,41,3201,4.037947
4,41,3303,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.25342
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,,1.853309


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPR0_mean in validation part 1 in column Lag1 is 68377
SPA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPA0_mean
Semana,Producto_ID,Agencia_ID,Unnamed: 3_level_1
4,41,2281,5.949871
4,41,23879,4.037947


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.453848
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.08531


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPA0_mean in validation part 1 in column Lag1 is 58235
SPCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPCh0_mean
Semana,Producto_ID,Canal_ID,Unnamed: 3_level_1
4,41,7,5.312563
4,53,4,5.866416


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.414061
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.053539


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPCh0_mean in validation part 1 in column Lag1 is 2017
SPT0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPT0_mean
Semana,Producto_ID,Town_ID,Unnamed: 3_level_1
4,41,2381,5.949871
4,41,2387,4.037947


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPT0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPT0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.453848
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.08531


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPT0_mean in validation part 1 in column Lag1 is 2002
SPSt0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPSt0_mean
Semana,Producto_ID,State_ID,Unnamed: 3_level_1
4,41,22,5.312563
4,53,20,6.135444


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPSt0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPSt0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.422255
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.086532


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPSt0_mean in validation part 1 in column Lag1 is 1951
SP0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SP0_mean
Semana,Producto_ID,Unnamed: 2_level_1
4,41,5.312563
4,53,5.866416


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SP0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SP0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.444566
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.078753


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SP0_mean in validation part 1 in column Lag1 is 1882
SPnClRACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,SPnClRACh0_mean
Semana,Prod_name_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Canal_ID,Unnamed: 6_level_1
4,0,60,7238,2061,2,5.049856
4,0,65,7250,2061,2,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnClRACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnClRACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnClRACh0_mean in validation part 1 in column Lag1 is 1809
SPnClRA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPnClRA0_mean
Semana,Prod_name_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Unnamed: 5_level_1
4,0,60,7238,2061,5.049856
4,0,65,7250,2061,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnClRA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnClRA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnClRA0_mean in validation part 1 in column Lag1 is 1809
SPnClRCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPnClRCh0_mean
Semana,Prod_name_ID,Cliente_ID,Ruta_SAK,Canal_ID,Unnamed: 5_level_1
4,0,60,7238,2,5.049856
4,0,65,7250,2,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnClRCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnClRCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnClRCh0_mean in validation part 1 in column Lag1 is 1808
SPnClACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPnClACh0_mean
Semana,Prod_name_ID,Cliente_ID,Agencia_ID,Canal_ID,Unnamed: 5_level_1
4,0,60,2061,2,5.049856
4,0,65,2061,2,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnClACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnClACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnClACh0_mean in validation part 1 in column Lag1 is 1808
SPnClR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPnClR0_mean
Semana,Prod_name_ID,Cliente_ID,Ruta_SAK,Unnamed: 4_level_1
4,0,60,7238,5.049856
4,0,65,7250,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnClR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnClR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnClR0_mean in validation part 1 in column Lag1 is 1808
SPnClA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPnClA0_mean
Semana,Prod_name_ID,Cliente_ID,Agencia_ID,Unnamed: 4_level_1
4,0,60,2061,5.049856
4,0,65,2061,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnClA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnClA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnClA0_mean in validation part 1 in column Lag1 is 1808
SPnClCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPnClCh0_mean
Semana,Prod_name_ID,Cliente_ID,Canal_ID,Unnamed: 4_level_1
4,0,60,2,5.049856
4,0,65,2,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnClCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnClCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnClCh0_mean in validation part 1 in column Lag1 is 1808
SPnCl0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnCl0_mean
Semana,Prod_name_ID,Cliente_ID,Unnamed: 3_level_1
4,0,60,5.049856
4,0,65,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnCl0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnCl0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnCl0_mean in validation part 1 in column Lag1 is 1808
SPnR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnR0_mean
Semana,Prod_name_ID,Ruta_SAK,Unnamed: 3_level_1
4,0,1,4.259628
4,0,2,4.14477


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.261764
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.850931


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnR0_mean in validation part 1 in column Lag1 is 1674
SPnA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnA0_mean
Semana,Prod_name_ID,Agencia_ID,Unnamed: 3_level_1
4,0,1110,1.94591
4,0,1114,3.503704


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.453848
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.08531


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnA0_mean in validation part 1 in column Lag1 is 1634
SPnCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnCh0_mean
Semana,Prod_name_ID,Canal_ID,Unnamed: 3_level_1
4,0,1,2.129508
4,0,2,3.262566


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.418644
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.05565


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnCh0_mean in validation part 1 in column Lag1 is 1238
SPnT0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnT0_mean
Semana,Prod_name_ID,Town_ID,Unnamed: 3_level_1
4,0,2008,1.94591
4,0,2011,3.684555


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnT0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnT0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.453848
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.12824


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnT0_mean in validation part 1 in column Lag1 is 1238
SPnSt0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnSt0_mean
Semana,Prod_name_ID,State_ID,Unnamed: 3_level_1
4,0,0,3.215217
4,0,1,2.571746


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPnSt0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPnSt0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.422255
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.1277


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPnSt0_mean in validation part 1 in column Lag1 is 1238
SPn0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPn0_mean
Semana,Prod_name_ID,Unnamed: 2_level_1
4,0,3.034794
4,1,3.686628


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,SPn0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,16,120,2,709,4,3.0,False,1.418015,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,16,135,2,712,4,4.0,False,1.279644,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,SPn0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.456359
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,2.10538


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


Count of missing numbers after SPn0_mean in validation part 1 in column Lag1 is 1237


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,2008,16,120,2,709,4,3.0,False,1.418015,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,2008,16,135,2,712,4,4.0,False,1.279644,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156


In [78]:
# Zero-fill every remaining NaN, in place, in the train frame and in both
# test frames held on FE (same order as before: train, test1, test2).
for _frame_attr in ("train", "test1", "test2"):
    getattr(FE, _frame_attr).fillna(value=0, inplace=True)
del _frame_attr  # do not leave the loop variable behind in the notebook namespace

In [79]:
# Persist the frames held on FE through its SaveDataFrameToHdf method.
# NOTE(review): 'both' presumably selects train and test together, mirroring
# ReadHdf's trainOrTestOrBoth argument -- confirm against the method definition.
FE.SaveDataFrameToHdf('both')

In [80]:
configLag0Target1DeleteColumnsFalse = ConfigElements(2,[ ("SPClRACh0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Cliente_ID",
                                                              "Ruta_SAK",
                                                              "Agencia_ID",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                        ("SPClRA0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Cliente_ID",
                                                              "Ruta_SAK",
                                                              "Agencia_ID"],
                                                          ["mean"]),
                                                        ("SPClRCh0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Cliente_ID",
                                                              "Ruta_SAK",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                        ("SPClACh0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Cliente_ID",
                                                              "Agencia_ID",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                        ("SPClR0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Cliente_ID",
                                                              "Ruta_SAK"],
                                                          ["mean"]),
                                                        ("SPClA0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Cliente_ID",
                                                              "Agencia_ID"],
                                                          ["mean"]),
                                                       ("SPClCh0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Cliente_ID",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                       ("SPCl0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Cliente_ID"],
                                                          ["mean"]),
                                                       ("SPR0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Ruta_SAK"],
                                                          ["mean"]),
                                                       ("SPA0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Agencia_ID"],
                                                          ["mean"]),
                                                       ("SPCh0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                       ("SPT0_mean",["Semana",
                                                              "Producto_ID",
                                                              "Town_ID"],
                                                          ["mean"]),
                                                       ("SPSt0_mean",["Semana",
                                                              "Producto_ID",
                                                              "State_ID"],
                                                          ["mean"]),
                                                       ("SP0_mean",["Semana",
                                                              "Producto_ID"],
                                                          ["mean"]),
                                                      ("SPnClRACh0_mean",["Semana",  ##PRODNAMES START
                                                              "Prod_name_ID",
                                                              "Cliente_ID",
                                                              "Ruta_SAK",
                                                              "Agencia_ID",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                        ("SPnClRA0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Cliente_ID",
                                                              "Ruta_SAK",
                                                              "Agencia_ID"],
                                                          ["mean"]),
                                                        ("SPnClRCh0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Cliente_ID",
                                                              "Ruta_SAK",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                        ("SPnClACh0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Cliente_ID",
                                                              "Agencia_ID",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                        ("SPnClR0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Cliente_ID",
                                                              "Ruta_SAK"],
                                                          ["mean"]),
                                                        ("SPnClA0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Cliente_ID",
                                                              "Agencia_ID"],
                                                          ["mean"]),
                                                       ("SPnClCh0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Cliente_ID",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                       ("SPnCl0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Cliente_ID"],
                                                          ["mean"]),
                                                       ("SPnR0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Ruta_SAK"],
                                                          ["mean"]),
                                                       ("SPnA0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Agencia_ID"],
                                                          ["mean"]),
                                                       ("SPnCh0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Canal_ID"],
                                                          ["mean"]),
                                                       ("SPnT0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "Town_ID"],
                                                          ["mean"]),
                                                       ("SPnSt0_mean",["Semana",
                                                              "Prod_name_ID",
                                                              "State_ID"],
                                                          ["mean"]),
                                                       ("SPn0_mean",["Semana",
                                                              "Prod_name_ID"],
                                                          ["mean"])

                                                       
                                                       ], "Lag2", True)
# Dump the config object's attribute dictionary so the feature list and the
# trailing constructor arguments can be checked by eye before the config is used.
# The parenthesised single-argument form behaves the same under the Python 2
# print statement and the Python 3 print function, matching the print(...) calls
# used elsewhere in this notebook.
print(configLag0Target1DeleteColumnsFalse.__dict__)

{'nameAndGroups': [('SPClRACh0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Ruta_SAK', 'Agencia_ID', 'Canal_ID'], ['mean']), ('SPClRA0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Ruta_SAK', 'Agencia_ID'], ['mean']), ('SPClRCh0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Ruta_SAK', 'Canal_ID'], ['mean']), ('SPClACh0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Agencia_ID', 'Canal_ID'], ['mean']), ('SPClR0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Ruta_SAK'], ['mean']), ('SPClA0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Agencia_ID'], ['mean']), ('SPClCh0_mean', ['Semana', 'Producto_ID', 'Cliente_ID', 'Canal_ID'], ['mean']), ('SPCl0_mean', ['Semana', 'Producto_ID', 'Cliente_ID'], ['mean']), ('SPR0_mean', ['Semana', 'Producto_ID', 'Ruta_SAK'], ['mean']), ('SPA0_mean', ['Semana', 'Producto_ID', 'Agencia_ID'], ['mean']), ('SPCh0_mean', ['Semana', 'Producto_ID', 'Canal_ID'], ['mean']), ('SPT0_mean', ['Semana', 'Producto_ID', 'Town_ID'], ['mean']), ('SPSt0_mean', ['Se

In [81]:
# Run the configurable feature step on FE using the config printed above.
# NOTE(review): judging only from the logged output below, the entries of
# config.nameAndGroups appear to be processed in list order, and after each one
# the number of still-missing values in column "Lag2" is reported for the two
# validation parts -- confirm against the method definition.
# NOTE(review): the variable name mentions "Lag0", while the log reports on
# column "Lag2"; verify that the name still describes this config.
FE.AddConfigurableFeaturesToTrain(configLag0Target1DeleteColumnsFalse)

SPClRACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,SPClRACh0_mean
Semana,Producto_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Canal_ID,Unnamed: 6_level_1
5,41,681747,3306,2281,7,7.632886
5,41,684023,3303,2281,7,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPClRACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPClRACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPClRACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,,


Count of missing numbers after SPClRACh0_mean in validation part 1 in column Lag2 is 1775002
Count of missing numbers after SPClRACh0_mean in validation part 2 in column Lag2 is 1738183
SPClRA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPClRA0_mean
Semana,Producto_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Unnamed: 5_level_1
5,41,681747,3306,2281,7.632886
5,41,684023,3303,2281,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPClRA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPClRA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPClRA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,,


Count of missing numbers after SPClRA0_mean in validation part 1 in column Lag2 is 1774803
Count of missing numbers after SPClRA0_mean in validation part 2 in column Lag2 is 1738016
SPClRCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPClRCh0_mean
Semana,Producto_ID,Cliente_ID,Ruta_SAK,Canal_ID,Unnamed: 5_level_1
5,41,681747,3306,7,7.632886
5,41,684023,3303,7,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPClRCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPClRCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPClRCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,,


Count of missing numbers after SPClRCh0_mean in validation part 1 in column Lag2 is 1774497
Count of missing numbers after SPClRCh0_mean in validation part 2 in column Lag2 is 1737658
SPClACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPClACh0_mean
Semana,Producto_ID,Cliente_ID,Agencia_ID,Canal_ID,Unnamed: 5_level_1
5,41,681747,2281,7,7.632886
5,41,684023,2281,7,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPClACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPClACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPClACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,,


Count of missing numbers after SPClACh0_mean in validation part 1 in column Lag2 is 1767070
Count of missing numbers after SPClACh0_mean in validation part 2 in column Lag2 is 1729376
SPClR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPClR0_mean
Semana,Producto_ID,Cliente_ID,Ruta_SAK,Unnamed: 4_level_1
5,41,681747,3306,7.632886
5,41,684023,3303,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPClR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPClR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPClR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,,


Count of missing numbers after SPClR0_mean in validation part 1 in column Lag2 is 1767070
Count of missing numbers after SPClR0_mean in validation part 2 in column Lag2 is 1729376
SPClA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPClA0_mean
Semana,Producto_ID,Cliente_ID,Agencia_ID,Unnamed: 4_level_1
5,41,681747,2281,7.632886
5,41,684023,2281,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPClA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPClA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPClA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,,


Count of missing numbers after SPClA0_mean in validation part 1 in column Lag2 is 1766997
Count of missing numbers after SPClA0_mean in validation part 2 in column Lag2 is 1729295
SPClCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPClCh0_mean
Semana,Producto_ID,Cliente_ID,Canal_ID,Unnamed: 4_level_1
5,41,681747,7,7.632886
5,41,684023,7,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPClCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPClCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPClCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,,


Count of missing numbers after SPClCh0_mean in validation part 1 in column Lag2 is 1766672
Count of missing numbers after SPClCh0_mean in validation part 2 in column Lag2 is 1728948
SPCl0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPCl0_mean
Semana,Producto_ID,Cliente_ID,Unnamed: 3_level_1
5,41,681747,7.632886
5,41,684023,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPCl0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPCl0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPCl0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,,


Count of missing numbers after SPCl0_mean in validation part 1 in column Lag2 is 1766533
Count of missing numbers after SPCl0_mean in validation part 2 in column Lag2 is 1728791
SPR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPR0_mean
Semana,Producto_ID,Ruta_SAK,Unnamed: 3_level_1
5,41,3201,4.037947
5,41,3303,3.433987


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.305682
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,,1.932827


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.599221
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,,0.979642


Count of missing numbers after SPR0_mean in validation part 1 in column Lag2 is 99117
Count of missing numbers after SPR0_mean in validation part 2 in column Lag2 is 112044
SPA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPA0_mean
Semana,Producto_ID,Agencia_ID,Unnamed: 3_level_1
5,41,2281,5.949871
5,41,23879,4.037947


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.429421
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,2.041774


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.910868
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,0.987991


Count of missing numbers after SPA0_mean in validation part 1 in column Lag2 is 82208
Count of missing numbers after SPA0_mean in validation part 2 in column Lag2 is 97121
SPCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPCh0_mean
Semana,Producto_ID,Canal_ID,Unnamed: 3_level_1
5,41,7,5.312563
5,53,4,5.866416


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.409464
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,2.078055


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,2.053539
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,1.168275


Count of missing numbers after SPCh0_mean in validation part 1 in column Lag2 is 57508
Count of missing numbers after SPCh0_mean in validation part 2 in column Lag2 is 24171
SPT0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPT0_mean
Semana,Producto_ID,Town_ID,Unnamed: 3_level_1
5,41,2381,5.949871
5,41,2387,4.037947


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPT0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPT0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.429421
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,2.041774


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPT0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,2.010145
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,1.036383


Count of missing numbers after SPT0_mean in validation part 1 in column Lag2 is 57460
Count of missing numbers after SPT0_mean in validation part 2 in column Lag2 is 24143
SPSt0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPSt0_mean
Semana,Producto_ID,State_ID,Unnamed: 3_level_1
5,41,22,5.312563
5,53,20,6.135444


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPSt0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPSt0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.392985
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,2.090969


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPSt0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,2.064013
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,1.067183


Count of missing numbers after SPSt0_mean in validation part 1 in column Lag2 is 57389
Count of missing numbers after SPSt0_mean in validation part 2 in column Lag2 is 24108
SP0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SP0_mean
Semana,Producto_ID,Unnamed: 2_level_1
5,41,5.312563
5,53,5.866416


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SP0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SP0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.437385
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,2.088343


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SP0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,2.078753
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,1.206758


Count of missing numbers after SP0_mean in validation part 1 in column Lag2 is 57294
Count of missing numbers after SP0_mean in validation part 2 in column Lag2 is 23956
SPnClRACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,SPnClRACh0_mean
Semana,Prod_name_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Canal_ID,Unnamed: 6_level_1
5,0,60,7238,2061,2,5.049856
5,0,65,7250,2061,2,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnClRACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnClRACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnClRACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,


Count of missing numbers after SPnClRACh0_mean in validation part 1 in column Lag2 is 52798
Count of missing numbers after SPnClRACh0_mean in validation part 2 in column Lag2 is 23753
SPnClRA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPnClRA0_mean
Semana,Prod_name_ID,Cliente_ID,Ruta_SAK,Agencia_ID,Unnamed: 5_level_1
5,0,60,7238,2061,5.049856
5,0,65,7250,2061,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnClRA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnClRA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnClRA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,


Count of missing numbers after SPnClRA0_mean in validation part 1 in column Lag2 is 52798
Count of missing numbers after SPnClRA0_mean in validation part 2 in column Lag2 is 23753
SPnClRCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPnClRCh0_mean
Semana,Prod_name_ID,Cliente_ID,Ruta_SAK,Canal_ID,Unnamed: 5_level_1
5,0,60,7238,2,5.049856
5,0,65,7250,2,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnClRCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnClRCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnClRCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,


Count of missing numbers after SPnClRCh0_mean in validation part 1 in column Lag2 is 52797
Count of missing numbers after SPnClRCh0_mean in validation part 2 in column Lag2 is 23753
SPnClACh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,SPnClACh0_mean
Semana,Prod_name_ID,Cliente_ID,Agencia_ID,Canal_ID,Unnamed: 5_level_1
5,0,60,2061,2,5.049856
5,0,65,2061,2,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnClACh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnClACh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnClACh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,


Count of missing numbers after SPnClACh0_mean in validation part 1 in column Lag2 is 52788
Count of missing numbers after SPnClACh0_mean in validation part 2 in column Lag2 is 23753
SPnClR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPnClR0_mean
Semana,Prod_name_ID,Cliente_ID,Ruta_SAK,Unnamed: 4_level_1
5,0,60,7238,5.049856
5,0,65,7250,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnClR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnClR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnClR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,


Count of missing numbers after SPnClR0_mean in validation part 1 in column Lag2 is 52788
Count of missing numbers after SPnClR0_mean in validation part 2 in column Lag2 is 23753
SPnClA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPnClA0_mean
Semana,Prod_name_ID,Cliente_ID,Agencia_ID,Unnamed: 4_level_1
5,0,60,2061,5.049856
5,0,65,2061,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnClA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnClA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnClA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,


Count of missing numbers after SPnClA0_mean in validation part 1 in column Lag2 is 52788
Count of missing numbers after SPnClA0_mean in validation part 2 in column Lag2 is 23753
SPnClCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,SPnClCh0_mean
Semana,Prod_name_ID,Cliente_ID,Canal_ID,Unnamed: 4_level_1
5,0,60,2,5.049856
5,0,65,2,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnClCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnClCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnClCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,


Count of missing numbers after SPnClCh0_mean in validation part 1 in column Lag2 is 52786
Count of missing numbers after SPnClCh0_mean in validation part 2 in column Lag2 is 23753
SPnCl0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnCl0_mean
Semana,Prod_name_ID,Cliente_ID,Unnamed: 3_level_1
5,0,60,5.049856
5,0,65,4.369448


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnCl0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnCl0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.098612
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnCl0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.609438
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,


Count of missing numbers after SPnCl0_mean in validation part 1 in column Lag2 is 52786
Count of missing numbers after SPnCl0_mean in validation part 2 in column Lag2 is 23753
SPnR0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnR0_mean
Semana,Prod_name_ID,Ruta_SAK,Unnamed: 3_level_1
5,0,1,4.259628
5,0,2,4.14477


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnR0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnR0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.30888
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,1.934301


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnR0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.599221
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,0.976249


Count of missing numbers after SPnR0_mean in validation part 1 in column Lag2 is 47749
Count of missing numbers after SPnR0_mean in validation part 2 in column Lag2 is 21976
SPnA0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnA0_mean
Semana,Prod_name_ID,Agencia_ID,Unnamed: 3_level_1
5,0,1110,1.94591
5,0,1114,3.503704


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnA0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnA0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.429421
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,2.041774


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnA0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,1.910489
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,0.987991


Count of missing numbers after SPnA0_mean in validation part 1 in column Lag2 is 47677
Count of missing numbers after SPnA0_mean in validation part 2 in column Lag2 is 21919
SPnCh0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnCh0_mean
Semana,Prod_name_ID,Canal_ID,Unnamed: 3_level_1
5,0,1,2.129508
5,0,2,3.262566


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnCh0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnCh0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.416974
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,2.074462


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnCh0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,2.05565
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,1.158545


Count of missing numbers after SPnCh0_mean in validation part 1 in column Lag2 is 47483
Count of missing numbers after SPnCh0_mean in validation part 2 in column Lag2 is 17853
SPnT0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnT0_mean
Semana,Prod_name_ID,Town_ID,Unnamed: 3_level_1
5,0,2008,1.94591
5,0,2011,3.684555


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnT0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnT0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.429421
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,2.071958


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnT0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,2.019287
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,1.036383


Count of missing numbers after SPnT0_mean in validation part 1 in column Lag2 is 47482
Count of missing numbers after SPnT0_mean in validation part 2 in column Lag2 is 17853
SPnSt0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,SPnSt0_mean
Semana,Prod_name_ID,State_ID,Unnamed: 3_level_1
5,0,0,3.215217
5,0,1,2.571746


Unnamed: 0,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Venta_uni_hoy,Venta_hoy,Dev_uni_proxima,Dev_proxima,...,weight,pieces,Prod_name_ID,Brand_ID,Demanda_uni_equil_original,DemandaNotEqualTheDifferenceOfVentaUniAndDev,Lag0,Lag1,Lag2,SPnSt0_mean
0,3,1110,7,3301,15766,1212,3,25.139999,0,0.0,...,120,2,709,4,3.0,False,1.418015,0.0,,
1,3,1110,7,3301,15766,1216,4,33.52,0,0.0,...,135,2,712,4,4.0,False,1.279644,0.0,,


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag1,Lag2,SPnSt0_mean
0,2,10,2045,1,2831,4549769,32940,2163,14,110,10,678,23,1.098612,1.098612,1.098612,1.392985
1,7,10,1612,1,2837,4414012,35305,2352,30,75,0,45,23,1.892663,1.853309,1.932827,2.121022


Unnamed: 0,id,Semana,Agencia_ID,Canal_ID,Ruta_SAK,Cliente_ID,Producto_ID,Town_ID,State_ID,weight,pieces,Prod_name_ID,Brand_ID,Lag0,Lag2,SPnSt0_mean
0,0,11,4037,1,2209,4639078,35305,2499,28,75,0,45,23,1.609438,1.609438,2.074652
1,1,11,2237,1,1226,4705135,1238,2402,4,140,2,630,4,1.011156,0.979642,1.067183


Count of missing numbers after SPnSt0_mean in validation part 1 in column Lag2 is 47481
Count of missing numbers after SPnSt0_mean in validation part 2 in column Lag2 is 17852
SPn0_mean is not in columns..


Unnamed: 0_level_0,Unnamed: 1_level_0,SPn0_mean
Semana,Prod_name_ID,Unnamed: 2_level_1
5,0,3.034794
5,1,3.686628


MemoryError: 

In [None]:
# Replace every missing value with 0, in place, on each frame held by FE.
# The frames are looked up by attribute name so that no module-level variable
# keeps a reference to the (large) DataFrames after the loop.
for frame_name in ("train", "test1", "test2"):
    getattr(FE, frame_name).fillna(value=0, inplace=True)

In [None]:
# Write the frames held by FE back to HDF storage.
# NOTE(review): 'both' presumably selects the train and the test frames,
# mirroring the 'train'/'both' selector accepted by ReadHdf — confirm against
# SaveDataFrameToHdf.
FE.SaveDataFrameToHdf('both')

In [None]:
def _mean_feature_specs(name_prefix, product_column):
    """Build the (feature name, group-by columns, aggregations) tuples.

    Every tuple groups by ``"Semana"`` and *product_column* plus one of the
    fixed extra key sets listed below, and requests a single ``"mean"``
    aggregation. The feature name is ``name_prefix + suffix + "0_mean"``.

    Args:
        name_prefix: Leading part of each feature name ("SP" or "SPn").
        product_column: Product key column ("Producto_ID" or "Prod_name_ID").

    Returns:
        A list of 14 tuples, ordered from the most specific key set to the
        least specific one.
    """
    extra_keys_by_suffix = [
        ("ClRACh", ["Cliente_ID", "Ruta_SAK", "Agencia_ID", "Canal_ID"]),
        ("ClRA", ["Cliente_ID", "Ruta_SAK", "Agencia_ID"]),
        ("ClRCh", ["Cliente_ID", "Ruta_SAK", "Canal_ID"]),
        ("ClACh", ["Cliente_ID", "Agencia_ID", "Canal_ID"]),
        ("ClR", ["Cliente_ID", "Ruta_SAK"]),
        ("ClA", ["Cliente_ID", "Agencia_ID"]),
        ("ClCh", ["Cliente_ID", "Canal_ID"]),
        ("Cl", ["Cliente_ID"]),
        ("R", ["Ruta_SAK"]),
        ("A", ["Agencia_ID"]),
        ("Ch", ["Canal_ID"]),
        ("T", ["Town_ID"]),
        ("St", ["State_ID"]),
        ("", []),
    ]
    # A fresh column list and a fresh ["mean"] list are created per entry, so
    # no two tuples share a mutable object.
    return [
        (name_prefix + suffix + "0_mean",
         ["Semana", product_column] + extra_keys,
         ["mean"])
        for suffix, extra_keys in extra_keys_by_suffix
    ]


# NOTE(review): the variable name says "Lag0 / Target1 / DeleteColumnsFalse",
# but the values passed are 3, "Lag3" and True. The name is kept because the
# following cell refers to it; confirm the intended meaning against
# ConfigElements. The generated feature names also keep the "0" marker
# ("..0_mean") exactly as before.
configLag0Target1DeleteColumnsFalse = ConfigElements(
    3,
    _mean_feature_specs("SP", "Producto_ID")
    + _mean_feature_specs("SPn", "Prod_name_ID"),  # product-name variants
    "Lag3",
    True,
)
# Parenthesised form prints the same text on Python 2 and is valid Python 3.
print(configLag0Target1DeleteColumnsFalse.__dict__)

In [None]:
# Hand the configuration object built in the previous cell to
# FE.AddConfigurableFeaturesToTrain. Which columns it adds, and to which
# frames, is decided by that method (defined elsewhere in this notebook).
FE.AddConfigurableFeaturesToTrain(configLag0Target1DeleteColumnsFalse)

In [None]:
# Replace every missing value with 0, in place, on each frame held by FE.
# The frames are looked up by attribute name so that no module-level variable
# keeps a reference to the (large) DataFrames after the loop.
for frame_name in ("train", "test1", "test2"):
    getattr(FE, frame_name).fillna(value=0, inplace=True)

In [None]:
# Write the frames held by FE back to HDF storage.
# NOTE(review): 'both' presumably selects the train and the test frames,
# mirroring the 'train'/'both' selector accepted by ReadHdf — confirm against
# SaveDataFrameToHdf.
FE.SaveDataFrameToHdf('both')

In [None]:
# Baseline check: score each lag column of the training frame against the
# target column Demanda_uni_equil, one printed line per lag (Lag0 .. Lag3).
# NOTE(review): the label says RMSLE while plain rmse() is called; presumably
# the compared columns are already log-transformed — confirm.
for lag_column in ("Lag0", "Lag1", "Lag2", "Lag3"):
    print ('RMSLE Score:', rmse(FE.train.Demanda_uni_equil, FE.train[lag_column]))
    # Disabled: the same comparison for the FE.test1 / FE.test2 frames.
    #print ('RMSLE Score:', rmse(FE.test1.Demanda_uni_equil, FE.test1[lag_column]))
    #print ('RMSLE Score:', rmse(FE.test2.Demanda_uni_equil, FE.test2[lag_column]))

In [None]:
def _zero_nonfinite(values):
    """Overwrite NaN and +/-inf entries of a NumPy array with 0 and return the array.

    ``DataFrame.fillna`` only replaces NaN, so an infinity produced by a zero
    divisor would otherwise survive into the saved features.
    """
    values[~np.isfinite(values)] = 0
    return values


def _venta_sum_features(frame, key, prefix, key_dtype):
    """Build per-`key` totals of Venta_hoy / Venta_uni_hoy and their ratio.

    Args:
        frame: DataFrame holding `key`, 'Venta_hoy' and 'Venta_uni_hoy' columns.
        key: name of the grouping column.
        prefix: prefix for the three generated column names.
        key_dtype: dtype the key column is cast to before it is used as merge key.

    Returns:
        DataFrame with columns [key, <prefix>_Venta_hoy, <prefix>_Venta_uni_hoy,
        <prefix>_venta_div_venta_uni]; the three value columns are float32.
    """
    sums = frame.groupby(key, as_index=False)[['Venta_hoy', 'Venta_uni_hoy']].sum()
    # Groups whose unit total is 0 have no defined ratio; they get 0 instead of NaN/inf.
    ratio = _zero_nonfinite(sums['Venta_hoy'].values / sums['Venta_uni_hoy'].values)
    value_columns = [prefix + '_Venta_hoy',
                     prefix + '_Venta_uni_hoy',
                     prefix + '_venta_div_venta_uni']
    sums[value_columns[-1]] = ratio
    sums.columns = [key] + value_columns
    # Assign column by column so the narrower dtype really replaces the column.
    sums[key] = sums[key].astype(key_dtype)
    for _column in value_columns:
        sums[_column] = sums[_column].astype('float32')
    return sums


# --- weight per piece -------------------------------------------------------
# NOTE(review): this notebook uses Python 2 print statements; under Python 2 `/`
# between two integer arrays floor-divides. Confirm that "weight"/"pieces" are
# floats (or that true division is enabled) if a fractional ratio is expected.
for _frame in (FE.train, FE.test1, FE.test2):
    _frame.loc[:, "weightppieces"] = _zero_nonfinite(
        _frame["weight"].values / _frame["pieces"].values)
for _frame in (FE.train, FE.test1, FE.test2):
    _frame.fillna(value=0, inplace=True)
gc.collect()
FE.SaveDataFrameToHdf('both')

# --- Venta totals per client / product name / product ------------------------
# Totals are always computed from the training frame and then attached to the
# train frame (here) and to both test frames (below), in the same key order.
_sum_specs = [('Cliente_ID', 'Client_Sum', 'uint32'),
              ('Prod_name_ID', 'prod_name_sum', 'uint16'),
              ('Producto_ID', 'Producto_sum', 'uint16')]
_sum_frames = []
for _key, _prefix, _key_dtype in _sum_specs:
    _features = _venta_sum_features(FE.train, _key, _prefix, _key_dtype)
    FE.train = pd.merge(FE.train, _features, on=_key, how='left', sort=False, copy=False)
    _sum_frames.append((_key, _features))
    gc.collect()

# Keep the per-key feature tables available under their established names.
client_sum, prod_name_sum, Producto_sum = [_features for _key, _features in _sum_frames]

for _key, _features in _sum_frames:
    FE.test1 = pd.merge(FE.test1, _features, on=_key, how='left', sort=False, copy=False)
    FE.test2 = pd.merge(FE.test2, _features, on=_key, how='left', sort=False, copy=False)

# Keys that never occur in train have no totals after the left merge; use 0 for them.
for _frame in (FE.train, FE.test1, FE.test2):
    _frame.fillna(value=0, inplace=True)
gc.collect()
FE.SaveDataFrameToHdf('both')

In [None]:
Feature1 = FE.train[["Producto_ID","Demanda_uni_equil","Venta_uni_hoy"]].copy()
gc.collect()
display(Feature1.head(2))
print "Venta_Uni_Hoy = 0: " ,((Feature1.Venta_uni_hoy == 0).sum())
print "Shape of New Dataframe..: ", str((Feature1.shape[0]))
gc.collect()
Feature1 = Feature1[Feature1.Venta_uni_hoy != 0]
print "Shape of New Dataframe after deleting Venta_Uni_Hoy = 0..: ",(Feature1.shape[0])
gc.collect()
Feature1.loc[:,"Demanda_uni_equil"] = np.round( np.expm1(Feature1["Demanda_uni_equil"].values) )
display(Feature1[Feature1.Demanda_uni_equil.values != Feature1.Venta_uni_hoy.values].head(10))
Feature1 = Feature1.groupby("Producto_ID").sum()
gc.collect()
Feature1.loc[:,"Producto_ID_sum_demanda_divide_sum_venta_uni"] = Feature1.Demanda_uni_equil.values / Feature1.Venta_uni_hoy.values
Feature1 = pd.DataFrame(Feature1["Producto_ID_sum_demanda_divide_sum_venta_uni"])
gc.collect()
print Feature1.mean()
display(Feature1.head(10))
FE.train = FE.train.merge( Feature1, left_on="Producto_ID",
                    right_index=True, how='left', sort=False,copy=False)
FE.test1 = FE.test1.merge( Feature1, left_on="Producto_ID",
                    right_index=True, how='left', sort=False,copy=False)
FE.test2 = FE.test2.merge( Feature1, left_on="Producto_ID",
                    right_index=True, how='left', sort=False,copy=False)
display(FE.train.head(2))
display(FE.test1.head(2))
display(FE.test2.head(2))

In [None]:
Feature1 = FE.train[["Prod_name_ID","Demanda_uni_equil","Venta_uni_hoy"]].copy()
gc.collect()
display(Feature1.head(2))
print "Venta_Uni_Hoy = 0: " ,((Feature1.Venta_uni_hoy == 0).sum())
print "Shape of New Dataframe..: ", str((Feature1.shape[0]))
gc.collect()
Feature1 = Feature1[Feature1.Venta_uni_hoy != 0]
print "Shape of New Dataframe after deleting Venta_Uni_Hoy = 0..: ",(Feature1.shape[0])
gc.collect()
Feature1.loc[:,"Demanda_uni_equil"] = np.round( np.expm1(Feature1["Demanda_uni_equil"].values) )
display(Feature1[Feature1.Demanda_uni_equil.values != Feature1.Venta_uni_hoy.values].head(10))
Feature1 = Feature1.groupby("Prod_name_ID").sum()
gc.collect()
Feature1.loc[:,"Prod_name_ID_sum_demanda_divide_sum_venta_uni"] = Feature1.Demanda_uni_equil.values / Feature1.Venta_uni_hoy.values
Feature1 = pd.DataFrame(Feature1["Prod_name_ID_sum_demanda_divide_sum_venta_uni"])
gc.collect()
print Feature1.mean()
display(Feature1.head(10))
FE.train = FE.train.merge( Feature1, left_on="Prod_name_ID",
                    right_index=True, how='left', sort=False,copy=False)
FE.test1 = FE.test1.merge( Feature1, left_on="Prod_name_ID",
                    right_index=True, how='left', sort=False,copy=False)
FE.test2 = FE.test2.merge( Feature1, left_on="Prod_name_ID",
                    right_index=True, how='left', sort=False,copy=False)
display(FE.train.head(2))
display(FE.test1.head(2))
display(FE.test2.head(2))

In [None]:
Feature1 = FE.train[["Cliente_ID","Demanda_uni_equil","Venta_uni_hoy"]].copy()
gc.collect()
display(Feature1.head(2))
print "Venta_Uni_Hoy = 0: " ,((Feature1.Venta_uni_hoy == 0).sum())
print "Shape of New Dataframe..: ", str((Feature1.shape[0]))
gc.collect()
Feature1 = Feature1[Feature1.Venta_uni_hoy != 0]
print "Shape of New Dataframe after deleting Venta_Uni_Hoy = 0..: ",(Feature1.shape[0])
gc.collect()
Feature1.loc[:,"Demanda_uni_equil"] = np.round( np.expm1(Feature1["Demanda_uni_equil"].values) )
display(Feature1[Feature1.Demanda_uni_equil.values != Feature1.Venta_uni_hoy.values].head(10))
Feature1 = Feature1.groupby("Cliente_ID").sum()
gc.collect()
Feature1.loc[:,"Cliente_ID_sum_demanda_divide_sum_venta_uni"] = Feature1.Demanda_uni_equil.values / Feature1.Venta_uni_hoy.values
Feature1 = pd.DataFrame(Feature1["Cliente_ID_sum_demanda_divide_sum_venta_uni"])
gc.collect()
print Feature1.mean()
display(Feature1.head(10))
FE.train = FE.train.merge( Feature1, left_on="Cliente_ID",
                    right_index=True, how='left', sort=False,copy=False)
FE.test1 = FE.test1.merge( Feature1, left_on="Cliente_ID",
                    right_index=True, how='left', sort=False,copy=False)
FE.test2 = FE.test2.merge( Feature1, left_on="Cliente_ID",
                    right_index=True, how='left', sort=False,copy=False)
display(FE.train.head(2))
display(FE.test1.head(2))
display(FE.test2.head(2))

In [None]:
# Zero-fill the NaNs left in the train frame and both test frames, then checkpoint.
for _frame in (FE.train, FE.test1, FE.test2):
    _frame.fillna(value=0, inplace=True)
gc.collect()
FE.SaveDataFrameToHdf('both')

In [None]:
_RETURN_FLAG = 'DemandaNotEqualTheDifferenceOfVentaUniAndDev'


def _return_rate_features(frame, key, out_columns):
    """Aggregate the return flag per `key` into sum, count and rate columns.

    Args:
        frame: DataFrame holding `key` and the _RETURN_FLAG column.
        key: name of the grouping column.
        out_columns: names for the [sum, count, rate] columns, in that order.

    Returns:
        DataFrame with columns [key] + out_columns, one row per distinct key.
    """
    flag_sum = frame.groupby(key, as_index=False)[_RETURN_FLAG].sum()
    flag_count = frame.groupby(key, as_index=False)[_RETURN_FLAG].count()
    # Both sides carry the flag column, so the merge suffixes them with _x / _y.
    features = pd.merge(flag_sum, flag_count, on=key, how='left', sort=False, copy=False)
    # count() is always an integer; true_divide keeps the rate fractional even when
    # the summed flag is an integer too (plain `/` floor-divides integer arrays
    # under Python 2 classic division).
    features.loc[:, out_columns[-1]] = np.true_divide(
        features[_RETURN_FLAG + '_x'].values,
        features[_RETURN_FLAG + '_y'].values)
    features.columns = [key] + list(out_columns)
    return features


def _merge_on_column(fe, features, key):
    """Left-merge `features` on column `key` into fe.train, fe.test1 and fe.test2."""
    for _split in ('train', 'test1', 'test2'):
        setattr(fe, _split, pd.merge(getattr(fe, _split), features, on=key,
                                     how='left', sort=False, copy=False))


def _zero_fill_all(fe):
    """Replace NaN with 0 in place in all three frames, then run the collector."""
    for _frame in (fe.train, fe.test1, fe.test2):
        _frame.fillna(value=0, inplace=True)
    gc.collect()


# --- number of distinct clients per town -------------------------------------
# First collapse to one row per (town, client) pair, then count the pairs per town.
# "Lag0" only serves as a payload column for the first count.
clientPerTown = FE.train[["Town_ID", "Cliente_ID", "Lag0"]].groupby(["Town_ID", "Cliente_ID"]).count()
gc.collect()
clientPerTown.reset_index(inplace=True)
clientPerTown = clientPerTown.groupby("Town_ID").count()
clientPerTown = pd.DataFrame({"ClientPerTown": clientPerTown.Cliente_ID})
gc.collect()

# clientPerTown is indexed by Town_ID, hence left_on / right_index.
for _split in ('train', 'test1', 'test2'):
    setattr(FE, _split, getattr(FE, _split).merge(
        clientPerTown, left_on="Town_ID", right_index=True,
        how='left', sort=False, copy=False))
for _split in ('train', 'test1', 'test2'):
    display(getattr(FE, _split).head(2))
_zero_fill_all(FE)

# --- return rate per client / product / product name --------------------------
# Every table is computed from the training frame and merged into all three frames;
# keys unseen in train end up as 0 through the zero fill after each merge.
client_return = _return_rate_features(
    FE.train, 'Cliente_ID',
    ['client_return_sum', 'client_return_count', 'Client_return_rate'])
_merge_on_column(FE, client_return, 'Cliente_ID')
_zero_fill_all(FE)

producto_return = _return_rate_features(
    FE.train, 'Producto_ID',
    ['producto_return_sum', 'producto_return_count', 'producto_return_rate'])
_merge_on_column(FE, producto_return, 'Producto_ID')
_zero_fill_all(FE)

# Kept under its own name so the product table above is not overwritten.
prod_name_return = _return_rate_features(
    FE.train, 'Prod_name_ID',
    ['prod_name_return_sum', 'prod_name_return_count', 'prod_name_return_rate'])
_merge_on_column(FE, prod_name_return, 'Prod_name_ID')
_zero_fill_all(FE)

FE.SaveDataFrameToHdf('both')
gc.collect()