In [13]:
import numpy as np
import pandas as pd
from yaml import safe_load
import os
from tqdm import tqdm

In [14]:
# Set the path to the data directory
data_path = os.path.join('..', 'data')

# Collect filenames from the data directory
filenames = [os.path.join(data_path, file) for file in os.listdir(data_path)]

In [15]:
filenames[0:5]

['..\\data\\1075986.yaml',
 '..\\data\\1075987.yaml',
 '..\\data\\1075988.yaml',
 '..\\data\\1075989.yaml',
 '..\\data\\1075990.yaml']

In [17]:
# Initialize an empty list to store DataFrames
data_frames = []
counter = 1

# Process each file
for file in tqdm(filenames):
    try:
        with open(file, 'r') as f:
            df = pd.json_normalize(safe_load(f))
            df['match_id'] = counter
            data_frames.append(df)
            counter += 1
    except FileNotFoundError:
        print(f"File not found: {file}. Skipping...")
        continue
    except Exception as e:
        print(f"Error processing {file}: {e}")
        continue

# Concatenate all DataFrames into a single DataFrame
final_df = pd.concat(data_frames, ignore_index=True)

final_df

  0%|          | 0/148 [00:00<?, ?it/s]

100%|██████████| 148/148 [04:20<00:00,  1.76s/it]


Error processing ..\data\desktop.ini: expected '<document start>', but found '<scalar>'
  in "..\data\desktop.ini", line 2, column 1
Error processing ..\data\README.txt: 


Unnamed: 0,innings,meta.data_version,meta.created,meta.revision,info.competition,info.dates,info.gender,info.match_type,info.neutral_venue,info.outcome.by.wickets,...,info.teams,info.toss.decision,info.toss.winner,info.umpires,info.venue,match_id,info.outcome.by.runs,info.outcome.result,info.city,info.outcome.eliminator
0,"[{'1st innings': {'team': 'Peshawar Zalmi', 'd...",0.9,2017-05-04,1,Pakistan Super League,[2017-02-09],male,T20,1.0,7.0,...,"[Islamabad United, Peshawar Zalmi]",field,Islamabad United,"[Ahsan Raza, Shozab Raza]",Dubai International Cricket Stadium,1,,,,
1,"[{'1st innings': {'team': 'Quetta Gladiators',...",0.9,2017-05-06,2,Pakistan Super League,[2017-02-10],male,T20,1.0,,...,"[Lahore Qalandars, Quetta Gladiators]",field,Lahore Qalandars,"[Rashid Riaz, Shozab Raza]",Dubai International Cricket Stadium,2,8.0,,,
2,"[{'1st innings': {'team': 'Karachi Kings', 'de...",0.9,2017-05-05,1,Pakistan Super League,[2017-02-10],male,T20,1.0,7.0,...,"[Karachi Kings, Peshawar Zalmi]",field,Peshawar Zalmi,"[Ahmed Shahab, Ahsan Raza]",Dubai International Cricket Stadium,3,,,,
3,"[{'1st innings': {'team': 'Islamabad United', ...",0.9,2017-05-06,1,Pakistan Super League,[2017-02-11],male,T20,1.0,6.0,...,"[Islamabad United, Lahore Qalandars]",field,Lahore Qalandars,"[Asif Yaqoob, Shozab Raza]",Dubai International Cricket Stadium,4,,,,
4,"[{'1st innings': {'team': 'Karachi Kings', 'de...",0.9,2017-05-05,2,Pakistan Super League,[2017-02-11],male,T20,1.0,7.0,...,"[Karachi Kings, Quetta Gladiators]",field,Quetta Gladiators,"[Aleem Dar, Rashid Riaz]",Dubai International Cricket Stadium,5,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
141,"[{'1st innings': {'team': 'Lahore Qalandars', ...",0.9,2020-08-17,1,Pakistan Super League,[2016-02-17],male,T20,,5.0,...,"[Lahore Qalandars, Islamabad United]",field,Islamabad United,"[JS Wilson, Aleem Dar]",Dubai International Cricket Stadium,142,,,,
142,"[{'1st innings': {'team': 'Quetta Gladiators',...",0.9,2020-08-17,1,Pakistan Super League,[2016-02-19],male,T20,,,...,"[Quetta Gladiators, Peshawar Zalmi]",field,Peshawar Zalmi,"[Shozab Raza, Aleem Dar]",Dubai International Cricket Stadium,143,1.0,,,
143,"[{'1st innings': {'team': 'Karachi Kings', 'de...",0.9,2020-08-17,1,Pakistan Super League,[2016-02-20],male,T20,,9.0,...,"[Karachi Kings, Islamabad United]",field,Islamabad United,"[Aleem Dar, Ahsan Raza]",Dubai International Cricket Stadium,144,,,,
144,"[{'1st innings': {'team': 'Islamabad United', ...",0.9,2020-08-17,1,Pakistan Super League,[2016-02-21],male,T20,,,...,"[Islamabad United, Peshawar Zalmi]",field,Peshawar Zalmi,"[JS Wilson, Aleem Dar]",Dubai International Cricket Stadium,145,50.0,,,


In [18]:
backup = final_df.copy()

In [19]:
final_df

Unnamed: 0,innings,meta.data_version,meta.created,meta.revision,info.competition,info.dates,info.gender,info.match_type,info.neutral_venue,info.outcome.by.wickets,...,info.teams,info.toss.decision,info.toss.winner,info.umpires,info.venue,match_id,info.outcome.by.runs,info.outcome.result,info.city,info.outcome.eliminator
0,"[{'1st innings': {'team': 'Peshawar Zalmi', 'd...",0.9,2017-05-04,1,Pakistan Super League,[2017-02-09],male,T20,1.0,7.0,...,"[Islamabad United, Peshawar Zalmi]",field,Islamabad United,"[Ahsan Raza, Shozab Raza]",Dubai International Cricket Stadium,1,,,,
1,"[{'1st innings': {'team': 'Quetta Gladiators',...",0.9,2017-05-06,2,Pakistan Super League,[2017-02-10],male,T20,1.0,,...,"[Lahore Qalandars, Quetta Gladiators]",field,Lahore Qalandars,"[Rashid Riaz, Shozab Raza]",Dubai International Cricket Stadium,2,8.0,,,
2,"[{'1st innings': {'team': 'Karachi Kings', 'de...",0.9,2017-05-05,1,Pakistan Super League,[2017-02-10],male,T20,1.0,7.0,...,"[Karachi Kings, Peshawar Zalmi]",field,Peshawar Zalmi,"[Ahmed Shahab, Ahsan Raza]",Dubai International Cricket Stadium,3,,,,
3,"[{'1st innings': {'team': 'Islamabad United', ...",0.9,2017-05-06,1,Pakistan Super League,[2017-02-11],male,T20,1.0,6.0,...,"[Islamabad United, Lahore Qalandars]",field,Lahore Qalandars,"[Asif Yaqoob, Shozab Raza]",Dubai International Cricket Stadium,4,,,,
4,"[{'1st innings': {'team': 'Karachi Kings', 'de...",0.9,2017-05-05,2,Pakistan Super League,[2017-02-11],male,T20,1.0,7.0,...,"[Karachi Kings, Quetta Gladiators]",field,Quetta Gladiators,"[Aleem Dar, Rashid Riaz]",Dubai International Cricket Stadium,5,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
141,"[{'1st innings': {'team': 'Lahore Qalandars', ...",0.9,2020-08-17,1,Pakistan Super League,[2016-02-17],male,T20,,5.0,...,"[Lahore Qalandars, Islamabad United]",field,Islamabad United,"[JS Wilson, Aleem Dar]",Dubai International Cricket Stadium,142,,,,
142,"[{'1st innings': {'team': 'Quetta Gladiators',...",0.9,2020-08-17,1,Pakistan Super League,[2016-02-19],male,T20,,,...,"[Quetta Gladiators, Peshawar Zalmi]",field,Peshawar Zalmi,"[Shozab Raza, Aleem Dar]",Dubai International Cricket Stadium,143,1.0,,,
143,"[{'1st innings': {'team': 'Karachi Kings', 'de...",0.9,2020-08-17,1,Pakistan Super League,[2016-02-20],male,T20,,9.0,...,"[Karachi Kings, Islamabad United]",field,Islamabad United,"[Aleem Dar, Ahsan Raza]",Dubai International Cricket Stadium,144,,,,
144,"[{'1st innings': {'team': 'Islamabad United', ...",0.9,2020-08-17,1,Pakistan Super League,[2016-02-21],male,T20,,,...,"[Islamabad United, Peshawar Zalmi]",field,Peshawar Zalmi,"[JS Wilson, Aleem Dar]",Dubai International Cricket Stadium,145,50.0,,,


In [20]:
final_df.columns

Index(['innings', 'meta.data_version', 'meta.created', 'meta.revision',
       'info.competition', 'info.dates', 'info.gender', 'info.match_type',
       'info.neutral_venue', 'info.outcome.by.wickets', 'info.outcome.method',
       'info.outcome.winner', 'info.overs', 'info.player_of_match',
       'info.teams', 'info.toss.decision', 'info.toss.winner', 'info.umpires',
       'info.venue', 'match_id', 'info.outcome.by.runs', 'info.outcome.result',
       'info.city', 'info.outcome.eliminator'],
      dtype='object')

In [21]:
final_df['info.city']

0      NaN
1      NaN
2      NaN
3      NaN
4      NaN
      ... 
141    NaN
142    NaN
143    NaN
144    NaN
145    NaN
Name: info.city, Length: 146, dtype: object

In [22]:
final_df.columns

Index(['innings', 'meta.data_version', 'meta.created', 'meta.revision',
       'info.competition', 'info.dates', 'info.gender', 'info.match_type',
       'info.neutral_venue', 'info.outcome.by.wickets', 'info.outcome.method',
       'info.outcome.winner', 'info.overs', 'info.player_of_match',
       'info.teams', 'info.toss.decision', 'info.toss.winner', 'info.umpires',
       'info.venue', 'match_id', 'info.outcome.by.runs', 'info.outcome.result',
       'info.city', 'info.outcome.eliminator'],
      dtype='object')

In [23]:
final_df.drop(columns=[
    'meta.data_version',
    'info.dates',
    'info.gender',
    'info.match_type',
    'meta.created',
    'meta.revision',
    'info.outcome.eliminator',
    'info.outcome.result',
    'info.outcome.method',
    'info.neutral_venue',
    'info.outcome.by.runs',
    'info.outcome.by.wickets'
],inplace=True)

In [24]:
final_df

Unnamed: 0,innings,info.competition,info.outcome.winner,info.overs,info.player_of_match,info.teams,info.toss.decision,info.toss.winner,info.umpires,info.venue,match_id,info.city
0,"[{'1st innings': {'team': 'Peshawar Zalmi', 'd...",Pakistan Super League,Islamabad United,20,[BJ Haddin],"[Islamabad United, Peshawar Zalmi]",field,Islamabad United,"[Ahsan Raza, Shozab Raza]",Dubai International Cricket Stadium,1,
1,"[{'1st innings': {'team': 'Quetta Gladiators',...",Pakistan Super League,Quetta Gladiators,20,[Hassan Khan],"[Lahore Qalandars, Quetta Gladiators]",field,Lahore Qalandars,"[Rashid Riaz, Shozab Raza]",Dubai International Cricket Stadium,2,
2,"[{'1st innings': {'team': 'Karachi Kings', 'de...",Pakistan Super League,Peshawar Zalmi,20,[EJG Morgan],"[Karachi Kings, Peshawar Zalmi]",field,Peshawar Zalmi,"[Ahmed Shahab, Ahsan Raza]",Dubai International Cricket Stadium,3,
3,"[{'1st innings': {'team': 'Islamabad United', ...",Pakistan Super League,Lahore Qalandars,20,[JJ Roy],"[Islamabad United, Lahore Qalandars]",field,Lahore Qalandars,"[Asif Yaqoob, Shozab Raza]",Dubai International Cricket Stadium,4,
4,"[{'1st innings': {'team': 'Karachi Kings', 'de...",Pakistan Super League,Quetta Gladiators,20,[RR Rossouw],"[Karachi Kings, Quetta Gladiators]",field,Quetta Gladiators,"[Aleem Dar, Rashid Riaz]",Dubai International Cricket Stadium,5,
...,...,...,...,...,...,...,...,...,...,...,...,...
141,"[{'1st innings': {'team': 'Lahore Qalandars', ...",Pakistan Super League,Islamabad United,20,[Mohammad Irfan],"[Lahore Qalandars, Islamabad United]",field,Islamabad United,"[JS Wilson, Aleem Dar]",Dubai International Cricket Stadium,142,
142,"[{'1st innings': {'team': 'Quetta Gladiators',...",Pakistan Super League,Quetta Gladiators,20,[Mohammad Nawaz (3)],"[Quetta Gladiators, Peshawar Zalmi]",field,Peshawar Zalmi,"[Shozab Raza, Aleem Dar]",Dubai International Cricket Stadium,143,
143,"[{'1st innings': {'team': 'Karachi Kings', 'de...",Pakistan Super League,Islamabad United,20,[Mohammad Sami],"[Karachi Kings, Islamabad United]",field,Islamabad United,"[Aleem Dar, Ahsan Raza]",Dubai International Cricket Stadium,144,
144,"[{'1st innings': {'team': 'Islamabad United', ...",Pakistan Super League,Islamabad United,20,[Sharjeel Khan],"[Islamabad United, Peshawar Zalmi]",field,Peshawar Zalmi,"[JS Wilson, Aleem Dar]",Dubai International Cricket Stadium,145,


In [25]:
final_df.columns

Index(['innings', 'info.competition', 'info.outcome.winner', 'info.overs',
       'info.player_of_match', 'info.teams', 'info.toss.decision',
       'info.toss.winner', 'info.umpires', 'info.venue', 'match_id',
       'info.city'],
      dtype='object')

In [26]:
final_df['info.overs'].value_counts()

info.overs
20    146
Name: count, dtype: int64

In [28]:
import pickle
model_path = os.path.join('..', 'model')
pickle.dump(final_df,open(model_path+'\psl_dataset_1.pkl','wb'))

  pickle.dump(final_df,open(model_path+'\psl_dataset_1.pkl','wb'))


In [30]:
matches = pickle.load(open(model_path+'\psl_dataset_1.pkl','rb'))
#ball by ball data
matches.iloc[0]['innings'][0]['1st innings']['deliveries']

  matches = pickle.load(open(model_path+'\psl_dataset_1.pkl','rb'))


[{0.1: {'batsman': 'Mohammad Hafeez',
   'bowler': 'Mohammad Irfan',
   'non_striker': 'DJ Malan',
   'runs': {'batsman': 0, 'extras': 0, 'total': 0},
   'wicket': {'fielders': ['Sharjeel Khan'],
    'kind': 'caught',
    'player_out': 'Mohammad Hafeez'}}},
 {0.2: {'batsman': 'Kamran Akmal',
   'bowler': 'Mohammad Irfan',
   'non_striker': 'DJ Malan',
   'runs': {'batsman': 1, 'extras': 0, 'total': 1}}},
 {0.3: {'batsman': 'DJ Malan',
   'bowler': 'Mohammad Irfan',
   'non_striker': 'Kamran Akmal',
   'runs': {'batsman': 0, 'extras': 0, 'total': 0}}},
 {0.4: {'batsman': 'DJ Malan',
   'bowler': 'Mohammad Irfan',
   'non_striker': 'Kamran Akmal',
   'runs': {'batsman': 0, 'extras': 0, 'total': 0}}},
 {0.5: {'batsman': 'DJ Malan',
   'bowler': 'Mohammad Irfan',
   'non_striker': 'Kamran Akmal',
   'runs': {'batsman': 0, 'extras': 0, 'total': 0}}},
 {0.6: {'batsman': 'DJ Malan',
   'bowler': 'Mohammad Irfan',
   'non_striker': 'Kamran Akmal',
   'runs': {'batsman': 0, 'extras': 0, 'total'

In [33]:
count = 1
delivery_df = pd.DataFrame()
for index, row in matches.iterrows():
    if count in [75,108,150,180,268,360,443,458,584,748,982,1052,1111,1226,1345]:
        count+=1
        continue
    count+=1
    ball_of_match = []
    batsman = []
    bowler = []
    runs = []
    player_of_dismissed = []
    teams = []
    batting_team = []
    match_id = []
    city = []
    venue = []
    for ball in row['innings'][0]['1st innings']['deliveries']:
        for key in ball.keys():
            match_id.append(count)
            batting_team.append(row['innings'][0]['1st innings']['team'])
            teams.append(row['info.teams'])
            ball_of_match.append(key)
            batsman.append(ball[key]['batsman'])
            bowler.append(ball[key]['bowler'])
            runs.append(ball[key]['runs']['total'])
            city.append(row['info.city'])
            venue.append(row['info.venue'])
            try:
                player_of_dismissed.append(ball[key]['wicket']['player_out'])
            except:
                player_of_dismissed.append('0')
    loop_df = pd.DataFrame({
            'match_id':match_id,
            'teams':teams,
            'batting_team':batting_team,
            'ball':ball_of_match,
            'batsman':batsman,
            'bowler':bowler,
            'runs':runs,
            'player_dismissed':player_of_dismissed,
            'city':city,
            'venue':venue
        })
    delivery_df = pd.concat([delivery_df, loop_df], ignore_index=True)

In [34]:
delivery_df

Unnamed: 0,match_id,teams,batting_team,ball,batsman,bowler,runs,player_dismissed,city,venue
0,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.1,Mohammad Hafeez,Mohammad Irfan,0,Mohammad Hafeez,,Dubai International Cricket Stadium
1,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.2,Kamran Akmal,Mohammad Irfan,1,0,,Dubai International Cricket Stadium
2,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.3,DJ Malan,Mohammad Irfan,0,0,,Dubai International Cricket Stadium
3,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.4,DJ Malan,Mohammad Irfan,0,0,,Dubai International Cricket Stadium
4,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.5,DJ Malan,Mohammad Irfan,0,0,,Dubai International Cricket Stadium
...,...,...,...,...,...,...,...,...,...,...
17322,147,"[Quetta Gladiators, Islamabad United]",Quetta Gladiators,19.2,Anwar Ali,AD Russell,6,0,,Dubai International Cricket Stadium
17323,147,"[Quetta Gladiators, Islamabad United]",Quetta Gladiators,19.3,Anwar Ali,AD Russell,2,0,,Dubai International Cricket Stadium
17324,147,"[Quetta Gladiators, Islamabad United]",Quetta Gladiators,19.4,Anwar Ali,AD Russell,0,Anwar Ali,,Dubai International Cricket Stadium
17325,147,"[Quetta Gladiators, Islamabad United]",Quetta Gladiators,19.5,GD Elliott,AD Russell,0,0,,Dubai International Cricket Stadium


In [35]:
def bowl(row):
    for team in row['teams']:
        if team != row['batting_team']:
            return team

In [36]:
delivery_df['bowling_team'] = delivery_df.apply(bowl,axis=1)

In [37]:
delivery_df

Unnamed: 0,match_id,teams,batting_team,ball,batsman,bowler,runs,player_dismissed,city,venue,bowling_team
0,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.1,Mohammad Hafeez,Mohammad Irfan,0,Mohammad Hafeez,,Dubai International Cricket Stadium,Islamabad United
1,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.2,Kamran Akmal,Mohammad Irfan,1,0,,Dubai International Cricket Stadium,Islamabad United
2,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.3,DJ Malan,Mohammad Irfan,0,0,,Dubai International Cricket Stadium,Islamabad United
3,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.4,DJ Malan,Mohammad Irfan,0,0,,Dubai International Cricket Stadium,Islamabad United
4,2,"[Islamabad United, Peshawar Zalmi]",Peshawar Zalmi,0.5,DJ Malan,Mohammad Irfan,0,0,,Dubai International Cricket Stadium,Islamabad United
...,...,...,...,...,...,...,...,...,...,...,...
17322,147,"[Quetta Gladiators, Islamabad United]",Quetta Gladiators,19.2,Anwar Ali,AD Russell,6,0,,Dubai International Cricket Stadium,Islamabad United
17323,147,"[Quetta Gladiators, Islamabad United]",Quetta Gladiators,19.3,Anwar Ali,AD Russell,2,0,,Dubai International Cricket Stadium,Islamabad United
17324,147,"[Quetta Gladiators, Islamabad United]",Quetta Gladiators,19.4,Anwar Ali,AD Russell,0,Anwar Ali,,Dubai International Cricket Stadium,Islamabad United
17325,147,"[Quetta Gladiators, Islamabad United]",Quetta Gladiators,19.5,GD Elliott,AD Russell,0,0,,Dubai International Cricket Stadium,Islamabad United


In [38]:
delivery_df.drop(columns=['teams'],inplace=True)

In [39]:
delivery_df['batting_team'].unique()

array(['Peshawar Zalmi', 'Quetta Gladiators', 'Karachi Kings',
       'Islamabad United', 'Lahore Qalandars', 'Multan Sultans'],
      dtype=object)

In [40]:
delivery_df

Unnamed: 0,match_id,batting_team,ball,batsman,bowler,runs,player_dismissed,city,venue,bowling_team
0,2,Peshawar Zalmi,0.1,Mohammad Hafeez,Mohammad Irfan,0,Mohammad Hafeez,,Dubai International Cricket Stadium,Islamabad United
1,2,Peshawar Zalmi,0.2,Kamran Akmal,Mohammad Irfan,1,0,,Dubai International Cricket Stadium,Islamabad United
2,2,Peshawar Zalmi,0.3,DJ Malan,Mohammad Irfan,0,0,,Dubai International Cricket Stadium,Islamabad United
3,2,Peshawar Zalmi,0.4,DJ Malan,Mohammad Irfan,0,0,,Dubai International Cricket Stadium,Islamabad United
4,2,Peshawar Zalmi,0.5,DJ Malan,Mohammad Irfan,0,0,,Dubai International Cricket Stadium,Islamabad United
...,...,...,...,...,...,...,...,...,...,...
17322,147,Quetta Gladiators,19.2,Anwar Ali,AD Russell,6,0,,Dubai International Cricket Stadium,Islamabad United
17323,147,Quetta Gladiators,19.3,Anwar Ali,AD Russell,2,0,,Dubai International Cricket Stadium,Islamabad United
17324,147,Quetta Gladiators,19.4,Anwar Ali,AD Russell,0,Anwar Ali,,Dubai International Cricket Stadium,Islamabad United
17325,147,Quetta Gladiators,19.5,GD Elliott,AD Russell,0,0,,Dubai International Cricket Stadium,Islamabad United


In [41]:
#new dataframe 
output = delivery_df[['match_id','batting_team','bowling_team','ball','runs','player_dismissed','city','venue']]

In [42]:
output

Unnamed: 0,match_id,batting_team,bowling_team,ball,runs,player_dismissed,city,venue
0,2,Peshawar Zalmi,Islamabad United,0.1,0,Mohammad Hafeez,,Dubai International Cricket Stadium
1,2,Peshawar Zalmi,Islamabad United,0.2,1,0,,Dubai International Cricket Stadium
2,2,Peshawar Zalmi,Islamabad United,0.3,0,0,,Dubai International Cricket Stadium
3,2,Peshawar Zalmi,Islamabad United,0.4,0,0,,Dubai International Cricket Stadium
4,2,Peshawar Zalmi,Islamabad United,0.5,0,0,,Dubai International Cricket Stadium
...,...,...,...,...,...,...,...,...
17322,147,Quetta Gladiators,Islamabad United,19.2,6,0,,Dubai International Cricket Stadium
17323,147,Quetta Gladiators,Islamabad United,19.3,2,0,,Dubai International Cricket Stadium
17324,147,Quetta Gladiators,Islamabad United,19.4,0,Anwar Ali,,Dubai International Cricket Stadium
17325,147,Quetta Gladiators,Islamabad United,19.5,0,0,,Dubai International Cricket Stadium


In [43]:
model_path = os.path.join('..', 'model')
pickle.dump(output,open(model_path+'\psl_dataset_2.pkl','wb'))

  pickle.dump(output,open(model_path+'\psl_dataset_2.pkl','wb'))
