# Problem Statement

The data scientists at BigMart have collected 2013 sales data for 1559 products across 10 stores in different cities. Also, certain attributes of each product and store have been defined. The aim is to build a predictive model and find out the sales of each product at a particular store.

Using this model, BigMart will try to understand the properties of products and stores which play a key role in increasing sales.

 
Please note that the data may have missing values as some stores might not report all the data due to technical glitches. Hence, it will be required to treat them accordingly.

### importing libraries

In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

In [2]:
df_train = pd.read_csv('Train.csv')
df_test = pd.read_csv('Test.csv')

In [3]:
df_train.head()

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type,Item_Outlet_Sales
0,FDA15,9.3,Low Fat,0.016047,Dairy,249.8092,OUT049,1999,Medium,Tier 1,Supermarket Type1,3735.138
1,DRC01,5.92,Regular,0.019278,Soft Drinks,48.2692,OUT018,2009,Medium,Tier 3,Supermarket Type2,443.4228
2,FDN15,17.5,Low Fat,0.01676,Meat,141.618,OUT049,1999,Medium,Tier 1,Supermarket Type1,2097.27
3,FDX07,19.2,Regular,0.0,Fruits and Vegetables,182.095,OUT010,1998,,Tier 3,Grocery Store,732.38
4,NCD19,8.93,Low Fat,0.0,Household,53.8614,OUT013,1987,High,Tier 3,Supermarket Type1,994.7052


In [4]:
df_test.head()

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
0,FDW58,20.75,Low Fat,0.007565,Snack Foods,107.8622,OUT049,1999,Medium,Tier 1,Supermarket Type1
1,FDW14,8.3,reg,0.038428,Dairy,87.3198,OUT017,2007,,Tier 2,Supermarket Type1
2,NCN55,14.6,Low Fat,0.099575,Others,241.7538,OUT010,1998,,Tier 3,Grocery Store
3,FDQ58,7.315,Low Fat,0.015388,Snack Foods,155.034,OUT017,2007,,Tier 2,Supermarket Type1
4,FDY38,,Regular,0.118599,Dairy,234.23,OUT027,1985,Medium,Tier 3,Supermarket Type3


In [5]:
df_train.shape

(8523, 12)

In [6]:
df_test.shape

(5681, 11)

In [7]:
df_train2 = df_train.drop('Item_Outlet_Sales',axis=1)

In [8]:
combined = df_train2.append(df_test)

In [9]:
combined.head()

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
0,FDA15,9.3,Low Fat,0.016047,Dairy,249.8092,OUT049,1999,Medium,Tier 1,Supermarket Type1
1,DRC01,5.92,Regular,0.019278,Soft Drinks,48.2692,OUT018,2009,Medium,Tier 3,Supermarket Type2
2,FDN15,17.5,Low Fat,0.01676,Meat,141.618,OUT049,1999,Medium,Tier 1,Supermarket Type1
3,FDX07,19.2,Regular,0.0,Fruits and Vegetables,182.095,OUT010,1998,,Tier 3,Grocery Store
4,NCD19,8.93,Low Fat,0.0,Household,53.8614,OUT013,1987,High,Tier 3,Supermarket Type1


In [10]:
combined.tail()

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
5676,FDB58,10.5,Regular,0.013496,Snack Foods,141.3154,OUT046,1997,Small,Tier 1,Supermarket Type1
5677,FDD47,7.6,Regular,0.142991,Starchy Foods,169.1448,OUT018,2009,Medium,Tier 3,Supermarket Type2
5678,NCO17,10.0,Low Fat,0.073529,Health and Hygiene,118.744,OUT045,2002,,Tier 2,Supermarket Type1
5679,FDJ26,15.3,Regular,0.0,Canned,214.6218,OUT017,2007,,Tier 2,Supermarket Type1
5680,FDU37,9.5,Regular,0.10472,Canned,79.796,OUT045,2002,,Tier 2,Supermarket Type1


In [11]:
combined.reset_index(inplace=True)

In [12]:
combined.drop('index',inplace=True, axis=1)

In [13]:
combined.tail()

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
14199,FDB58,10.5,Regular,0.013496,Snack Foods,141.3154,OUT046,1997,Small,Tier 1,Supermarket Type1
14200,FDD47,7.6,Regular,0.142991,Starchy Foods,169.1448,OUT018,2009,Medium,Tier 3,Supermarket Type2
14201,NCO17,10.0,Low Fat,0.073529,Health and Hygiene,118.744,OUT045,2002,,Tier 2,Supermarket Type1
14202,FDJ26,15.3,Regular,0.0,Canned,214.6218,OUT017,2007,,Tier 2,Supermarket Type1
14203,FDU37,9.5,Regular,0.10472,Canned,79.796,OUT045,2002,,Tier 2,Supermarket Type1


In [14]:
combined.columns

Index(['Item_Identifier', 'Item_Weight', 'Item_Fat_Content', 'Item_Visibility',
       'Item_Type', 'Item_MRP', 'Outlet_Identifier',
       'Outlet_Establishment_Year', 'Outlet_Size', 'Outlet_Location_Type',
       'Outlet_Type'],
      dtype='object')

In [15]:
combined['Item_Fat_Content'].value_counts()

Low Fat    8485
Regular    4824
LF          522
reg         195
low fat     178
Name: Item_Fat_Content, dtype: int64

In [16]:
fat_content = {'Low Fat':0, 'LF':0, 'low fat':0, 'Regular':1, 'reg':1}
combined['Item_Fat_Content'] = combined['Item_Fat_Content'].map(fat_content)

In [17]:
combined.head()

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
0,FDA15,9.3,0,0.016047,Dairy,249.8092,OUT049,1999,Medium,Tier 1,Supermarket Type1
1,DRC01,5.92,1,0.019278,Soft Drinks,48.2692,OUT018,2009,Medium,Tier 3,Supermarket Type2
2,FDN15,17.5,0,0.01676,Meat,141.618,OUT049,1999,Medium,Tier 1,Supermarket Type1
3,FDX07,19.2,1,0.0,Fruits and Vegetables,182.095,OUT010,1998,,Tier 3,Grocery Store
4,NCD19,8.93,0,0.0,Household,53.8614,OUT013,1987,High,Tier 3,Supermarket Type1


In [18]:
combined.isnull().sum()

Item_Identifier                 0
Item_Weight                  2439
Item_Fat_Content                0
Item_Visibility                 0
Item_Type                       0
Item_MRP                        0
Outlet_Identifier               0
Outlet_Establishment_Year       0
Outlet_Size                  4016
Outlet_Location_Type            0
Outlet_Type                     0
dtype: int64

In [19]:
combined.tail()

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
14199,FDB58,10.5,1,0.013496,Snack Foods,141.3154,OUT046,1997,Small,Tier 1,Supermarket Type1
14200,FDD47,7.6,1,0.142991,Starchy Foods,169.1448,OUT018,2009,Medium,Tier 3,Supermarket Type2
14201,NCO17,10.0,0,0.073529,Health and Hygiene,118.744,OUT045,2002,,Tier 2,Supermarket Type1
14202,FDJ26,15.3,1,0.0,Canned,214.6218,OUT017,2007,,Tier 2,Supermarket Type1
14203,FDU37,9.5,1,0.10472,Canned,79.796,OUT045,2002,,Tier 2,Supermarket Type1


In [20]:
combined.loc[combined['Item_Identifier'] == 'NCO17']

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
182,NCO17,,0,0.128478,Health and Hygiene,117.944,OUT019,1985,Small,Tier 1,Grocery Store
361,NCO17,10.0,0,0.07338,Health and Hygiene,118.244,OUT046,1997,Small,Tier 1,Supermarket Type1
892,NCO17,,0,0.073024,Health and Hygiene,121.844,OUT027,1985,Medium,Tier 3,Supermarket Type3
968,NCO17,10.0,0,0.0,Health and Hygiene,120.644,OUT035,2004,Small,Tier 2,Supermarket Type1
2076,NCO17,10.0,0,0.073795,Health and Hygiene,121.444,OUT017,2007,,Tier 2,Supermarket Type1
6916,NCO17,10.0,0,0.073494,Health and Hygiene,118.344,OUT049,1999,Medium,Tier 1,Supermarket Type1
7193,NCO17,10.0,0,0.073679,Health and Hygiene,120.944,OUT018,2009,Medium,Tier 3,Supermarket Type2
11573,NCO17,10.0,0,0.0,Health and Hygiene,118.744,OUT013,1987,High,Tier 3,Supermarket Type1
14201,NCO17,10.0,0,0.073529,Health and Hygiene,118.744,OUT045,2002,,Tier 2,Supermarket Type1


In [21]:
import math
dic = {}

for i in combined['Item_Identifier']:
    a = (combined['Item_Identifier'] == i)
    b = combined[a == True]
    c = b['Item_Weight'].unique()
    for j in c:
        if math.isnan(j):
            continue
        else:
            dic[i] = j


# dic = {}
# for i in alldata['Item_Identifier']:
#     a = (alldata['Item_Identifier']==i)
#     b = alldata[a==True]
#     c = b['Item_Weight'].unique()
#     dic[i] = c



In [22]:
for i in dic:
    combined['Item_Weight'].loc[combined['Item_Identifier'] == i] = dic[i]

A value is trying to be set on a copy of a slice from a DataFrame

See the caveats in the documentation: http://pandas.pydata.org/pandas-docs/stable/indexing.html#indexing-view-versus-copy
  self._setitem_with_indexer(indexer, value)


In [25]:
combined.isnull().sum()

Item_Identifier                 0
Item_Weight                     0
Item_Fat_Content                0
Item_Visibility                 0
Item_Type                       0
Item_MRP                        0
Outlet_Identifier               0
Outlet_Establishment_Year       0
Outlet_Size                  4016
Outlet_Location_Type            0
Outlet_Type                     0
dtype: int64

In [45]:
pd.crosstab(combined['Outlet_Size'], combined['Outlet_Type'], dropna=False, margins=True)

Outlet_Type,Grocery Store,Supermarket Type1,Supermarket Type2,Supermarket Type3,All
Outlet_Size,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
High,0,1553,0,0,1553
Medium,0,1550,1546,1559,4655
Small,1805,3100,0,0,4905
All,1805,9294,1546,1559,14204


In [None]:
pd.crosstab(combined['Outlet_Size'], combined['Outlet_Type'], dropna=False, margins=True)

In [44]:
combined['Outlet_Size'].isnull().sum()

3091

In [53]:
combined['Outlet_Size'].value_counts()

Small     4905
Medium    4655
High      1553
Name: Outlet_Size, dtype: int64

In [36]:
combined['Outlet_Type'].value_counts()

Supermarket Type1    9294
Grocery Store        1805
Supermarket Type3    1559
Supermarket Type2    1546
Name: Outlet_Type, dtype: int64

In [51]:
combined.groupby('Outlet_Type').Outlet_Size.value_counts()

Outlet_Type        Outlet_Size
Grocery Store      Small          1805
Supermarket Type1  Small          3100
                   High           1553
                   Medium         1550
Supermarket Type2  Medium         1546
Supermarket Type3  Medium         1559
Name: Outlet_Size, dtype: int64

In [52]:
combined.groupby('Outlet_Size').Outlet_Type.value_counts()

Outlet_Size  Outlet_Type      
High         Supermarket Type1    1553
Medium       Supermarket Type3    1559
             Supermarket Type1    1550
             Supermarket Type2    1546
Small        Supermarket Type1    3100
             Grocery Store        1805
Name: Outlet_Type, dtype: int64

In [56]:
combined['Outlet_Size'].fillna('Medium', inplace=True)

In [57]:
pd.crosstab(combined['Outlet_Size'], combined['Outlet_Type'], dropna=False, margins=True)

Outlet_Type,Grocery Store,Supermarket Type1,Supermarket Type2,Supermarket Type3,All
Outlet_Size,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1
High,0,1553,0,0,1553
Medium,0,4641,1546,1559,7746
Small,1805,3100,0,0,4905
All,1805,9294,1546,1559,14204


In [58]:
pd.crosstab(combined['Outlet_Size'], combined['Outlet_Location_Type'], dropna=False, margins=True)

Outlet_Location_Type,Tier 1,Tier 2,Tier 3,All
Outlet_Size,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
High,0,0,1553,1553
Medium,1550,3091,3105,7746
Small,2430,1550,925,4905
All,3980,4641,5583,14204


In [59]:
pd.crosstab(combined['Outlet_Type'], combined['Outlet_Location_Type'], dropna=False, margins=True)

Outlet_Location_Type,Tier 1,Tier 2,Tier 3,All
Outlet_Type,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
Grocery Store,880,0,925,1805
Supermarket Type1,3100,4641,1553,9294
Supermarket Type2,0,0,1546,1546
Supermarket Type3,0,0,1559,1559
All,3980,4641,5583,14204


In [60]:
combined.isnull().sum()

Item_Identifier              0
Item_Weight                  0
Item_Fat_Content             0
Item_Visibility              0
Item_Type                    0
Item_MRP                     0
Outlet_Identifier            0
Outlet_Establishment_Year    0
Outlet_Size                  0
Outlet_Location_Type         0
Outlet_Type                  0
dtype: int64

In [61]:
combined.loc[combined['Outlet_Type']=='Grocery Store', 'Outlet_Size'] = 'Small'

In [62]:
combined.isnull().sum()

Item_Identifier              0
Item_Weight                  0
Item_Fat_Content             0
Item_Visibility              0
Item_Type                    0
Item_MRP                     0
Outlet_Identifier            0
Outlet_Establishment_Year    0
Outlet_Size                  0
Outlet_Location_Type         0
Outlet_Type                  0
dtype: int64

In [63]:
combined

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
0,FDA15,9.300,0,0.016047,Dairy,249.8092,OUT049,1999,Medium,Tier 1,Supermarket Type1
1,DRC01,5.920,1,0.019278,Soft Drinks,48.2692,OUT018,2009,Medium,Tier 3,Supermarket Type2
2,FDN15,17.500,0,0.016760,Meat,141.6180,OUT049,1999,Medium,Tier 1,Supermarket Type1
3,FDX07,19.200,1,0.000000,Fruits and Vegetables,182.0950,OUT010,1998,Small,Tier 3,Grocery Store
4,NCD19,8.930,0,0.000000,Household,53.8614,OUT013,1987,High,Tier 3,Supermarket Type1
5,FDP36,10.395,1,0.000000,Baking Goods,51.4008,OUT018,2009,Medium,Tier 3,Supermarket Type2
6,FDO10,13.650,1,0.012741,Snack Foods,57.6588,OUT013,1987,High,Tier 3,Supermarket Type1
7,FDP10,19.000,0,0.127470,Snack Foods,107.7622,OUT027,1985,Medium,Tier 3,Supermarket Type3
8,FDH17,16.200,1,0.016687,Frozen Foods,96.9726,OUT045,2002,Medium,Tier 2,Supermarket Type1
9,FDU28,19.200,1,0.094450,Frozen Foods,187.8214,OUT017,2007,Medium,Tier 2,Supermarket Type1


In [64]:
import datetime

combined['Outlet_Establishment_Year'] = datetime.datetime.now().year - combined['Outlet_Establishment_Year']

In [65]:
combined

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
0,FDA15,9.300,0,0.016047,Dairy,249.8092,OUT049,20,Medium,Tier 1,Supermarket Type1
1,DRC01,5.920,1,0.019278,Soft Drinks,48.2692,OUT018,10,Medium,Tier 3,Supermarket Type2
2,FDN15,17.500,0,0.016760,Meat,141.6180,OUT049,20,Medium,Tier 1,Supermarket Type1
3,FDX07,19.200,1,0.000000,Fruits and Vegetables,182.0950,OUT010,21,Small,Tier 3,Grocery Store
4,NCD19,8.930,0,0.000000,Household,53.8614,OUT013,32,High,Tier 3,Supermarket Type1
5,FDP36,10.395,1,0.000000,Baking Goods,51.4008,OUT018,10,Medium,Tier 3,Supermarket Type2
6,FDO10,13.650,1,0.012741,Snack Foods,57.6588,OUT013,32,High,Tier 3,Supermarket Type1
7,FDP10,19.000,0,0.127470,Snack Foods,107.7622,OUT027,34,Medium,Tier 3,Supermarket Type3
8,FDH17,16.200,1,0.016687,Frozen Foods,96.9726,OUT045,17,Medium,Tier 2,Supermarket Type1
9,FDU28,19.200,1,0.094450,Frozen Foods,187.8214,OUT017,12,Medium,Tier 2,Supermarket Type1


In [66]:
combined['Item_MRP'] -= combined['Item_MRP'].min()

In [67]:
combined['Item_MRP'] /= combined['Item_MRP'].max()

In [68]:
combined

Unnamed: 0,Item_Identifier,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
0,FDA15,9.300,0,0.016047,Dairy,0.927507,OUT049,20,Medium,Tier 1,Supermarket Type1
1,DRC01,5.920,1,0.019278,Soft Drinks,0.072068,OUT018,10,Medium,Tier 3,Supermarket Type2
2,FDN15,17.500,0,0.016760,Meat,0.468288,OUT049,20,Medium,Tier 1,Supermarket Type1
3,FDX07,19.200,1,0.000000,Fruits and Vegetables,0.640093,OUT010,21,Small,Tier 3,Grocery Store
4,NCD19,8.930,0,0.000000,Household,0.095805,OUT013,32,High,Tier 3,Supermarket Type1
5,FDP36,10.395,1,0.000000,Baking Goods,0.085361,OUT018,10,Medium,Tier 3,Supermarket Type2
6,FDO10,13.650,1,0.012741,Snack Foods,0.111923,OUT013,32,High,Tier 3,Supermarket Type1
7,FDP10,19.000,0,0.127470,Snack Foods,0.324587,OUT027,34,Medium,Tier 3,Supermarket Type3
8,FDH17,16.200,1,0.016687,Frozen Foods,0.278791,OUT045,17,Medium,Tier 2,Supermarket Type1
9,FDU28,19.200,1,0.094450,Frozen Foods,0.664399,OUT017,12,Medium,Tier 2,Supermarket Type1


In [69]:
combined['Item_Weight'] -= combined['Item_Weight'].min()
combined['Item_Weight'] /= combined['Item_Weight'].max()

In [98]:
combined.shape

(14204, 11)

In [99]:
df_train.shape

(8523, 12)

In [100]:
df_test.shape

(5681, 11)

In [103]:
combined2 = combined

In [104]:
combined2.shape

(14204, 11)

In [105]:
combined2.columns

Index(['Item_Identifier', 'Item_Weight', 'Item_Fat_Content', 'Item_Visibility',
       'Item_Type', 'Item_MRP', 'Outlet_Identifier',
       'Outlet_Establishment_Year', 'Outlet_Size', 'Outlet_Location_Type',
       'Outlet_Type'],
      dtype='object')

In [107]:
combined2.drop('Item_Identifier', inplace=True, axis=1)

In [108]:
combined2.shape

(14204, 10)

In [109]:
idx = combined.columns

In [115]:
idx = combined[['Item_Weight', 'Item_Fat_Content', 'Item_Visibility', 'Item_Type',
       'Item_MRP', 'Outlet_Identifier', 'Outlet_Establishment_Year',
       'Outlet_Size', 'Outlet_Location_Type', 'Outlet_Type']]

In [116]:
idx

Unnamed: 0,Item_Weight,Item_Fat_Content,Item_Visibility,Item_Type,Item_MRP,Outlet_Identifier,Outlet_Establishment_Year,Outlet_Size,Outlet_Location_Type,Outlet_Type
0,0.282525,0,0.016047,Dairy,0.927507,OUT049,20,Medium,Tier 1,Supermarket Type1
1,0.081274,1,0.019278,Soft Drinks,0.072068,OUT018,10,Medium,Tier 3,Supermarket Type2
2,0.770765,0,0.016760,Meat,0.468288,OUT049,20,Medium,Tier 1,Supermarket Type1
3,0.871986,1,0.000000,Fruits and Vegetables,0.640093,OUT010,21,Small,Tier 3,Grocery Store
4,0.260494,0,0.000000,Household,0.095805,OUT013,32,High,Tier 3,Supermarket Type1
5,0.347723,1,0.000000,Baking Goods,0.085361,OUT018,10,Medium,Tier 3,Supermarket Type2
6,0.541530,1,0.012741,Snack Foods,0.111923,OUT013,32,High,Tier 3,Supermarket Type1
7,0.860077,0,0.127470,Snack Foods,0.324587,OUT027,34,Medium,Tier 3,Supermarket Type3
8,0.693361,1,0.016687,Frozen Foods,0.278791,OUT045,17,Medium,Tier 2,Supermarket Type1
9,0.871986,1,0.094450,Frozen Foods,0.664399,OUT017,12,Medium,Tier 2,Supermarket Type1


In [117]:
combined2 = pd.get_dummies(idx)

In [118]:
combined2.shape

(14204, 41)

In [120]:
train = combined2[:8523]
test = combined2[8523:]
target = df_train['Item_Outlet_Sales']

In [121]:
from sklearn.linear_model import LinearRegression
model = LinearRegression()

model.fit(train,target)

LinearRegression(copy_X=True, fit_intercept=True, n_jobs=None, normalize=False)

In [122]:
print(model.intercept_)

-223.15761682391394


In [123]:
y_pred = model.predict(test)

In [125]:
y_pred.shape

(5681,)

In [126]:
df = pd.DataFrame(y_pred)

In [127]:
df

Unnamed: 0,0
0,1840.369113
1,1528.576040
2,1882.082328
3,2578.201918
4,5136.377185
5,1951.976282
6,596.409071
7,2783.708630
8,1489.150029
9,3088.631617


In [131]:
test_cases=pd.read_csv('Test.csv')
df['Item_Identifier'] = test_cases['Item_Identifier']
df['Outlet_Identifier'] = test_cases['Outlet_Identifier']
df['Item_Outlet_Sales'] = df[0]

In [133]:
df[['Item_Identifier', 'Outlet_Identifier', 'Item_Outlet_Sales']].to_csv('Result.csv',index=False)