Text File Processing

In [4]:
# Create (or overwrite) accounts.txt with five sample records.
with open('accounts.txt', mode='w') as accounts:
    # One record per line: account number, name and balance,
    # separated by single spaces.
    for line in ('100 Jones 24.98\n',
                 '200 Doe 354.67\n',
                 '300 White 0.00\n',
                 '400 Stone -42.16\n',
                 '500 Rich 224.62\n'):
        accounts.write(line)
    # Alternative: print can target the file directly, as in:
    #print('100 Jones 24.98', file=accounts)

In [5]:
# Print accounts.txt as a three-column table: account and name are
# left-aligned in 10 characters, balance is right-aligned in 10.
with open('accounts.txt', mode='r') as accounts:
    print(f'{"Account":<10}', f'{"Name":<10}', f'{"Balance":>10}', sep='')
    for record in accounts:
        # Each line holds three whitespace-separated fields.
        account, name, balance = record.split()
        print(f'{account:<10}', f'{name:<10}', f'{balance:>10}', sep='')

Account   Name         Balance
100       Jones          24.98
200       Doe           354.67
300       White           0.00
400       Stone         -42.16
500       Rich          224.62


Updating Text Files

In [6]:
# Updating a text file: copy every record from accounts.txt into
# temp_file.txt, replacing the name on account 300 with 'Williams'.
#
# Both files are opened in a single `with` statement, so if opening
# temp_file.txt fails, the already-open accounts.txt is still closed.
with open('accounts.txt', 'r') as accounts, \
        open('temp_file.txt', 'w') as temp_file:
    for record in accounts:
        account, name, balance = record.split()
        if account != '300':
            # Unchanged record: copy the line as-is (it keeps its newline).
            temp_file.write(record)
        else:
            # Rebuild the record with the new name; split() dropped the
            # trailing newline, so add it back.
            new_record = ' '.join([account, 'Williams', balance])
            temp_file.write(new_record + '\n')


In [7]:
# Show the contents of temp_file.txt as a three-column table.
with open('temp_file.txt', mode='r') as accounts:
    heading = f'{"Account":<10}{"Name":<10}{"Balance":>10}'
    print(heading)
    for record in accounts:
        # Each line holds three whitespace-separated fields.
        account, name, balance = record.split()
        row = f'{account:<10}{name:<10}{balance:>10}'
        print(row)

Account   Name         Balance
100       Jones          24.98
200       Doe           354.67
300       Williams        0.00
400       Stone         -42.16
500       Rich          224.62


In [8]:
import os
# Delete the original accounts.txt from disk.
os.remove('accounts.txt')

In [9]:
# Give the temporary file the name accounts.txt.
os.rename('temp_file.txt', 'accounts.txt')

Serialization with JSON

In [14]:
import json

# A dictionary with one key, 'accounts', mapping to a list of
# per-account dictionaries.
accounts_dict = dict(accounts=[
    dict(account=100, name='Jones', balance=24.98),
    dict(account=200, name='Doe', balance=354.67),
])

# Serialize the dictionary to accounts.json.
with open('accounts.json', 'w') as accounts:
    json.dump(accounts_dict, accounts)

In [15]:
# Deserialize accounts.json back into Python objects.
with open('accounts.json', 'r') as accounts:
    accounts_json = json.load(accounts)

In [16]:
# Display the whole deserialized object.
accounts_json

{'accounts': [{'account': 100, 'name': 'Jones', 'balance': 24.98},
  {'account': 200, 'name': 'Doe', 'balance': 354.67}]}

In [17]:
# The value stored under the 'accounts' key.
accounts_json['accounts']

[{'account': 100, 'name': 'Jones', 'balance': 24.98},
 {'account': 200, 'name': 'Doe', 'balance': 354.67}]

In [18]:
# The first entry under 'accounts'.
accounts_json['accounts'][0]

{'account': 100, 'name': 'Jones', 'balance': 24.98}

In [19]:
# The second entry under 'accounts'.
accounts_json['accounts'][1]

{'account': 200, 'name': 'Doe', 'balance': 354.67}

In [20]:
# Pretty-print accounts.json: load it, then re-serialize with a
# 4-space indent for display.
with open('accounts.json', 'r') as accounts:
    loaded = json.load(accounts)
    print(json.dumps(loaded, indent=4))
    

{
    "accounts": [
        {
            "account": 100,
            "name": "Jones",
            "balance": 24.98
        },
        {
            "account": 200,
            "name": "Doe",
            "balance": 354.67
        }
    ]
}


9.8 Handling Exceptions

In [21]:
# Deliberate error: dividing by zero raises ZeroDivisionError.
10/0

ZeroDivisionError: division by zero

In [22]:
# int() raises ValueError when the entered text is not a valid integer
# literal (e.g. 'hello').
value = int(input('Enter an integer: '))

ValueError: invalid literal for int() with base 10: 'hello'

In [26]:
# dividebyzero.py
"""Simple exception handling example."""

# Keep prompting until both inputs convert to int and the division succeeds.
while True: 
    # attempt to convert and divide values
    try:
        number1 = int(input('Enter numerator: '))
        number2 = int(input('Enter denominator: '))
        result = number1 / number2
    except ValueError: # tried to convert non-numeric value to int
        print('You must enter two integers\n')
    except ZeroDivisionError: # denominator was 0
        print('Attempted to divide by zero\n')
    else: 
        # runs only when the try suite raised no exception
        print(f'{number1:.3f} / {number2:.3f} = {result:.3f}')
        break # terminate the loop


Attempted to divide by zero

You must enter two integers

100.000 / 7.000 = 14.286


finally Clause

In [27]:
# Order of execution when the try suite succeeds: try -> else -> finally.
try:
    print('try suite with no exceptions raised')
except Exception:
    # A bare `except:` would also trap KeyboardInterrupt and SystemExit;
    # catching Exception keeps the demonstration without swallowing those.
    print('this will not execute')
else:
    print('else executes because no exceptions in the try suite')
finally:
    print('finally always executes')

try suite with no exceptions raised
else executes because no exceptions in the try suite
finally always executes


In [28]:
# Order of execution when the try suite raises: try -> except -> finally.
try:
    print('try suite that raises an exception')
    int('hello')  # raises ValueError, so the rest of the try suite is skipped
    print('this will not execute')
except ValueError:
    print('a ValueError occured')
else:
    # skipped because the try suite raised
    print('else will not execute because an exception occured')
finally:
    print('finally always executes')
    

try suite that raises an exception
a ValueError occured
finally always executes


In [29]:
# Deliberate error: opening a file that does not exist raises
# FileNotFoundError (see the recorded output below).
open('gradez.txt')

FileNotFoundError: [Errno 2] No such file or directory: 'gradez.txt'

In [31]:
# Try to list the records in gradez.txt; report a missing file with a
# message instead of a traceback.
try:
    with open('gradez.txt', 'r') as grades:
        heading = f'{"ID":<3}{"Name":<7}{"Grade"}'
        print(heading)
        for record in grades:
            # Each line holds three whitespace-separated fields.
            student_id, name, grade = record.split()
            row = f'{student_id:<3}{name:<7}{grade}'
            print(row)
except FileNotFoundError:
    print('The file name you specified does not exist')

The file name you specified does not exist


Stack Unwinding and Tracebacks

In [32]:
def function1():
    """Call function2; any exception it raises propagates to the caller."""
    function2()

def function2():
    """Unconditionally raise an Exception.

    Raises:
        Exception: always.
    """
    raise Exception('An exception occured')

In [33]:
# function1 calls function2, which raises; nothing catches the exception,
# so it propagates out of both calls.
function1()

Exception: An exception occured

Working with CSV Files

In [34]:
import csv

# Write five account records to accounts.csv, one row each.
# newline='' leaves line-ending handling to the csv module.
with open('accounts.csv', mode='w', newline='') as accounts:
    writer = csv.writer(accounts)
    for row in ([100, 'Jones', 24.98],
                [200, 'Doe', 345.67],
                [300, 'White', 0.00],
                [400, 'Stone', -42.16],
                [500, 'Rich', 224.62]):
        writer.writerow(row)

Reading a CSV File

In [35]:
# Print accounts.csv as a three-column table.
with open('accounts.csv', 'r', newline='') as accounts:
    # The heading uses string literals only. The original formatted the
    # variable `balance` here, which printed a leftover value from an
    # earlier cell and fails with NameError on a fresh kernel.
    print(f'{"Account":<10}{"Name":<10}{"Balance":>10}')
    reader = csv.reader(accounts)
    for record in reader:
        # csv.reader yields each row as a list of strings.
        account, name, balance = record
        print(f'{account:<10}{name:<10}{balance:>10}')

Account   Name          224.62
100       Jones          24.98
200       Doe           345.67
300       White            0.0
400       Stone         -42.16
500       Rich          224.62


In [36]:
import pandas as pd
# accounts.csv has no header row, so the column names are supplied here.
column_names = ['account', 'name', 'balance']
df = pd.read_csv('accounts.csv', names=column_names)

df

Unnamed: 0,account,name,balance
0,100,Jones,24.98
1,200,Doe,345.67
2,300,White,0.0
3,400,Stone,-42.16
4,500,Rich,224.62


In [37]:
# Write the DataFrame to a new CSV file; index=False leaves the row index
# out of the file.
df.to_csv('accounts_from_dataframe.csv', index=False)

In [38]:
# Load the TitanicSurvival dataset straight from its URL; the address is
# split across two adjacent string literals to keep the lines short.
titanic = pd.read_csv(
    'http://vincentarelbundock.github.io/'
    'Rdatasets/csv/carData/TitanicSurvival.csv'
)

In [40]:
# Display the DataFrame (the recorded output elides the middle rows).
titanic

Unnamed: 0.1,Unnamed: 0,survived,sex,age,passengerClass
0,"Allen, Miss. Elisabeth Walton",yes,female,29.0000,1st
1,"Allison, Master. Hudson Trevor",yes,male,0.9167,1st
2,"Allison, Miss. Helen Loraine",no,female,2.0000,1st
3,"Allison, Mr. Hudson Joshua Crei",no,male,30.0000,1st
4,"Allison, Mrs. Hudson J C (Bessi",no,female,25.0000,1st
...,...,...,...,...,...
1304,"Zabour, Miss. Hileni",no,female,14.5000,3rd
1305,"Zabour, Miss. Thamine",no,female,,3rd
1306,"Zakarian, Mr. Mapriededer",no,male,26.5000,3rd
1307,"Zakarian, Mr. Ortin",no,male,27.0000,3rd


In [50]:
# NOTE(review): the recorded output of this cell already shows the renamed
# columns ('name', 'class'), so it appears to have been executed after the
# cell that assigns titanic.columns - confirm the intended cell order.
pd.set_option('display.precision', 2) # display format for floating-point values
titanic.head()

Unnamed: 0,name,survived,sex,age,class
0,"Allen, Miss. Elisabeth Walton",yes,female,29.0,1st
1,"Allison, Master. Hudson Trevor",yes,male,0.92,1st
2,"Allison, Miss. Helen Loraine",no,female,2.0,1st
3,"Allison, Mr. Hudson Joshua Crei",no,male,30.0,1st
4,"Allison, Mrs. Hudson J C (Bessi",no,female,25.0,1st


In [43]:
# Show the last rows of the DataFrame.
titanic.tail()

Unnamed: 0.1,Unnamed: 0,survived,sex,age,passengerClass
1304,"Zabour, Miss. Hileni",no,female,14.5,3rd
1305,"Zabour, Miss. Thamine",no,female,,3rd
1306,"Zakarian, Mr. Mapriededer",no,male,26.5,3rd
1307,"Zakarian, Mr. Ortin",no,male,27.0,3rd
1308,"Zimmerman, Mr. Leo",no,male,29.0,3rd


In [44]:
# Replace the column labels in place; the list supplies five labels, one
# for each existing column, in order.
titanic.columns = ['name', 'survived', 'sex', 'age', 'class']
titanic.head()

Unnamed: 0,name,survived,sex,age,class
0,"Allen, Miss. Elisabeth Walton",yes,female,29.0,1st
1,"Allison, Master. Hudson Trevor",yes,male,0.9167,1st
2,"Allison, Miss. Helen Loraine",no,female,2.0,1st
3,"Allison, Mr. Hudson Joshua Crei",no,male,30.0,1st
4,"Allison, Mrs. Hudson J C (Bessi",no,female,25.0,1st


In [45]:
# Summary statistics; in the recorded output only the 'age' column is
# summarized.
titanic.describe()

Unnamed: 0,age
count,1046.0
mean,29.881135
std,14.4135
min,0.1667
25%,21.0
50%,28.0
75%,39.0
max,80.0


In [46]:
# Compare each 'survived' value with 'yes' and summarize the resulting
# True/False values.
(titanic.survived == 'yes').describe()

count      1309
unique        2
top       False
freq        809
Name: survived, dtype: object

In [1]:
import matplotlib
#%matplotlib

In [2]:
# Requires the `titanic` DataFrame created in the earlier cells. The
# recorded NameError below shows this cell was run in a session where
# `titanic` was not defined - rerun the loading cells first.
histogram = titanic.hist()

NameError: name 'titanic' is not defined