# Reading and Writing Data in Text Format
## read_csv

In [1]:
!cat examples/ex1.csv

a,b,c,d,message
1,2,3,4,hello
5,6,7,8,world
9,10,11,12,foo

In [2]:
import pandas as pd

In [3]:
df = pd.read_csv('examples/ex1.csv')

In [4]:
df

Unnamed: 0,a,b,c,d,message
0,1,2,3,4,hello
1,5,6,7,8,world
2,9,10,11,12,foo


In [5]:
!cat examples/ex2.csv

1,2,3,4,hello
5,6,7,8,world
9,10,11,12,foo

In [6]:
pd.read_csv('examples/ex2.csv')

Unnamed: 0,1,2,3,4,hello
0,5,6,7,8,world
1,9,10,11,12,foo


In [7]:
df2 = pd.read_csv('examples/ex2.csv', header= None)

In [8]:
df2

Unnamed: 0,0,1,2,3,4
0,1,2,3,4,hello
1,5,6,7,8,world
2,9,10,11,12,foo


In [9]:
pd.read_csv('examples/ex2.csv', names= ['a', 'b', 'c', 'd', 'msg'])

Unnamed: 0,a,b,c,d,msg
0,1,2,3,4,hello
1,5,6,7,8,world
2,9,10,11,12,foo


In [10]:
pd.read_csv('examples/ex2.csv', names= ['a', 'b', 'c', 'd', 'msg'], index_col= 'msg')

Unnamed: 0_level_0,a,b,c,d
msg,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1
hello,1,2,3,4
world,5,6,7,8
foo,9,10,11,12


In [11]:
!cat examples/csv_mindex.csv

key1,key2,value1,value2
one,a,1,2
one,b,3,4
one,c,5,6
one,d,7,8
two,a,9,10
two,b,11,12
two,c,13,14
two,d,15,16


In [12]:
pd.read_csv('examples/csv_mindex.csv', index_col= ['key1', 'key2'])

Unnamed: 0_level_0,Unnamed: 1_level_0,value1,value2
key1,key2,Unnamed: 2_level_1,Unnamed: 3_level_1
one,a,1,2
one,b,3,4
one,c,5,6
one,d,7,8
two,a,9,10
two,b,11,12
two,c,13,14
two,d,15,16


In [13]:
!cat examples/ex3.txt

            A         B         C
aaa -0.264438 -1.026059 -0.619500
bbb  0.927272  0.302904 -0.032399
ccc -0.264273 -0.386314 -0.217601
ddd -0.871858 -0.348382  1.100491


In [14]:
# The columns are separated by a variable amount of whitespace, so the delimiter
# is a regular expression. It must be a raw string: '\s' in a normal string
# literal is an invalid escape sequence (SyntaxWarning on Python 3.12+).
result = pd.read_csv('examples/ex3.txt', delimiter= r'\s+')

In [15]:
result

Unnamed: 0,A,B,C
aaa,-0.264438,-1.026059,-0.6195
bbb,0.927272,0.302904,-0.032399
ccc,-0.264273,-0.386314,-0.217601
ddd,-0.871858,-0.348382,1.100491


In [16]:
!cat examples/ex4.csv

# hey!
a,b,c,d,message
# just wanted to make things more difficult for you
# who reads CSV files with computers, anyway?
1,2,3,4,hello
5,6,7,8,world
9,10,11,12,foo


In [17]:
pd.read_csv('examples/ex4.csv', skiprows= [0, 2, 3])

Unnamed: 0,a,b,c,d,message
0,1,2,3,4,hello
1,5,6,7,8,world
2,9,10,11,12,foo


In [18]:
!cat examples/ex5.csv

something,a,b,c,d,message
one,1,2,3,4,NA
two,5,6,,8,world
three,9,10,11,12,foo

In [19]:
df = pd.read_csv('examples/ex5.csv')

In [20]:
df

Unnamed: 0,something,a,b,c,d,message
0,one,1,2,3.0,4,
1,two,5,6,,8,world
2,three,9,10,11.0,12,foo


In [21]:
df.isna()

Unnamed: 0,something,a,b,c,d,message
0,False,False,False,False,False,True
1,False,False,False,True,False,False
2,False,False,False,False,False,False


In [22]:
result2 = pd.read_csv('examples/ex5.csv', keep_default_na= False)

In [23]:
result2

Unnamed: 0,something,a,b,c,d,message
0,one,1,2,3.0,4,
1,two,5,6,,8,world
2,three,9,10,11.0,12,foo


In [24]:
result3 = pd.read_csv('examples/ex5.csv', keep_default_na= False, na_values= ['NA'])

In [25]:
result3

Unnamed: 0,something,a,b,c,d,message
0,one,1,2,3.0,4,
1,two,5,6,,8,world
2,three,9,10,11.0,12,foo


In [26]:
result3.isna()

Unnamed: 0,something,a,b,c,d,message
0,False,False,False,False,False,True
1,False,False,False,False,False,False
2,False,False,False,False,False,False


In [27]:
# Per-column NA sentinels: each key is a column name, each value the list of
# strings to be parsed as missing in that column. With keep_default_na=False
# pandas' built-in NA strings are disabled, so only these values become NaN.
sentinels = {
    'something': ['two'],
    'message': ['foo', 'NA']
}

pd.read_csv('examples/ex5.csv', na_values= sentinels, keep_default_na= False)

Unnamed: 0,something,a,b,c,d,message
0,one,1,2,3.0,4,
1,,5,6,,8,world
2,three,9,10,11.0,12,


## Reading Text Files in Pieces

In [28]:
pd.options.display.max_rows = 10

In [29]:
result = pd.read_csv('examples/ex6.csv')

In [30]:
result

Unnamed: 0,one,two,three,four,key
0,0.467976,-0.038649,-0.295344,-1.824726,L
1,-0.358893,1.404453,0.704965,-0.200638,B
2,-0.501840,0.659254,-0.421691,-0.057688,G
3,0.204886,1.074134,1.388361,-0.982404,R
4,0.354628,-0.133116,0.283763,-0.837063,Q
...,...,...,...,...,...
9995,2.311896,-0.417070,-1.409599,-0.515821,L
9996,-0.479893,-0.650419,0.745152,-0.646038,E
9997,0.523331,0.787112,0.486066,1.093156,K
9998,-0.362559,0.598894,-1.843201,0.887292,G


In [31]:
pd.read_csv('examples/ex6.csv', nrows= 5)

Unnamed: 0,one,two,three,four,key
0,0.467976,-0.038649,-0.295344,-1.824726,L
1,-0.358893,1.404453,0.704965,-0.200638,B
2,-0.50184,0.659254,-0.421691,-0.057688,G
3,0.204886,1.074134,1.388361,-0.982404,R
4,0.354628,-0.133116,0.283763,-0.837063,Q


In [32]:
chunker = pd.read_csv('examples/ex6.csv', chunksize= 1000)

In [33]:
chunker

<pandas.io.parsers.readers.TextFileReader at 0x7d29e73f15d0>

In [34]:
tot = pd.Series([], dtype= 'int64')

In [35]:
# Fold every chunk's per-key counts into the running total. fill_value=0 makes
# a key that is missing on either side count as zero instead of producing NaN.
for chunk in chunker:
    chunk_counts = chunk['key'].value_counts()
    tot = tot.add(chunk_counts, fill_value= 0)

In [36]:
tot.head()

key
0    151.0
1    146.0
2    152.0
3    162.0
4    171.0
dtype: float64

In [37]:
tot = tot.sort_values(ascending= False)

In [38]:
tot.head(10)

key
E    368.0
X    364.0
L    346.0
O    343.0
Q    340.0
M    338.0
J    337.0
F    335.0
K    334.0
H    330.0
dtype: float64

## Writing Data to Text Format

In [39]:
data = pd.read_csv('examples/ex5.csv')

In [40]:
data.to_csv('examples/out.csv')

In [41]:
import sys

In [42]:
data.to_csv(sys.stdout, sep= '|')

|something|a|b|c|d|message
0|one|1|2|3.0|4|
1|two|5|6||8|world
2|three|9|10|11.0|12|foo


In [43]:
data.to_csv(sys.stdout, na_rep= 'NULL')

,something,a,b,c,d,message
0,one,1,2,3.0,4,NULL
1,two,5,6,NULL,8,world
2,three,9,10,11.0,12,foo


In [44]:
data.to_csv(sys.stdout, index= False, header= False)

one,1,2,3.0,4,
two,5,6,,8,world
three,9,10,11.0,12,foo


In [45]:
data.to_csv(sys.stdout, columns= ['a', 'c', 'b'])

,a,c,b
0,1,3.0,2
1,5,,6
2,9,11.0,10


## Working with Other Delimited Formats

In [46]:
!cat examples/ex7.csv

"a","b","c"
"1","2","3"
"1","2","3"


In [47]:
import csv

In [48]:
# newline='' is required by the csv module: it disables Python's universal-newline
# translation so that newlines embedded in quoted fields are parsed correctly.
# The rows are materialised into a list so they remain usable after the file closes.
with open('examples/ex7.csv', newline= '') as f:
    reader: list[list[str]] = list(csv.reader(f))

In [49]:
for line in reader:
  print(line)

['a', 'b', 'c']
['1', '2', '3']
['1', '2', '3']


In [50]:
class my_dialect(csv.Dialect):
    """Semicolon-delimited CSV dialect.

    Rows end with a bare newline and fields are wrapped in double quotes only
    when they need it (csv.QUOTE_MINIMAL).
    """

    quoting: int = csv.QUOTE_MINIMAL
    quotechar: str = '"'
    lineterminator: str = '\n'
    delimiter: str = ';'

In [51]:
# newline='' hands line-ending control to the csv writer. Without it, text-mode
# newline translation would turn the dialect's '\n' terminator into '\r\n' on Windows.
with open('examples/my_data.csv', 'w', newline= '') as f:
    writer = csv.writer(f, dialect= my_dialect)
    # Header row first, then the data rows, written in one call.
    writer.writerows([
        ('one', 'two', 'three'),
        ('1', '2', '3'),
        ('4', '5', '6'),
    ])

## JSON Data

In [52]:
import json

In [53]:
# A JSON document held as a Python string. It contains nested arrays and
# objects, plus a JSON null on the "pet" key.
obj = """
{"name": "Wes",
"cities_lived": ["Akron", "Nashville", "New York", "San Francisco"],
"pet": null,
"siblings": [{"name": "Scott", "age": 34, "hobbies": ["guitars", "soccer"]},
{"name": "Katie", "age": 42, "hobbies": ["diving", "art"]}]
}
"""
# json.loads parses the JSON text into the equivalent Python objects.
result = json.loads(obj)

# Bare last expression so the notebook displays the parsed structure.
result

{'name': 'Wes',
 'cities_lived': ['Akron', 'Nashville', 'New York', 'San Francisco'],
 'pet': None,
 'siblings': [{'name': 'Scott', 'age': 34, 'hobbies': ['guitars', 'soccer']},
  {'name': 'Katie', 'age': 42, 'hobbies': ['diving', 'art']}]}

In [54]:
as_json = json.dumps(result)

In [55]:
as_json

'{"name": "Wes", "cities_lived": ["Akron", "Nashville", "New York", "San Francisco"], "pet": null, "siblings": [{"name": "Scott", "age": 34, "hobbies": ["guitars", "soccer"]}, {"name": "Katie", "age": 42, "hobbies": ["diving", "art"]}]}'

In [56]:
!cat examples/example.json

[{"a": 1, "b": 2, "c": 3},
 {"a": 4, "b": 5, "c": 6},
 {"a": 7, "b": 8, "c": 9}]


In [57]:
data = pd.read_json('examples/example.json')

In [58]:
data

Unnamed: 0,a,b,c
0,1,2,3
1,4,5,6
2,7,8,9


In [59]:
data.to_json(sys.stdout)

{"a":{"0":1,"1":4,"2":7},"b":{"0":2,"1":5,"2":8},"c":{"0":3,"1":6,"2":9}}

In [60]:
data.to_json(sys.stdout, orient= 'records')

[{"a":1,"b":2,"c":3},{"a":4,"b":5,"c":6},{"a":7,"b":8,"c":9}]

## XML and HTML: Web Scraping

In [61]:
tables = pd.read_html('examples/fdic_failed_bank_list.html')

In [62]:
tables

[                             Bank Name             City  ST   CERT  \
 0                          Allied Bank         Mulberry  AR     91   
 1         The Woodbury Banking Company         Woodbury  GA  11297   
 2               First CornerStone Bank  King of Prussia  PA  35312   
 3                   Trust Company Bank          Memphis  TN   9956   
 4           North Milwaukee State Bank        Milwaukee  WI  20364   
 ..                                 ...              ...  ..    ...   
 542                 Superior Bank, FSB         Hinsdale  IL  32646   
 543                Malta National Bank            Malta  OH   6629   
 544    First Alliance Bank & Trust Co.       Manchester  NH  34264   
 545  National State Bank of Metropolis       Metropolis  IL   3815   
 546                   Bank of Honolulu         Honolulu  HI  21029   
 
                    Acquiring Institution        Closing Date  \
 0                           Today's Bank  September 23, 2016   
 1              

In [63]:
failures = tables[0]

In [64]:
failures

Unnamed: 0,Bank Name,City,ST,CERT,Acquiring Institution,Closing Date,Updated Date
0,Allied Bank,Mulberry,AR,91,Today's Bank,"September 23, 2016","November 17, 2016"
1,The Woodbury Banking Company,Woodbury,GA,11297,United Bank,"August 19, 2016","November 17, 2016"
2,First CornerStone Bank,King of Prussia,PA,35312,First-Citizens Bank & Trust Company,"May 6, 2016","September 6, 2016"
3,Trust Company Bank,Memphis,TN,9956,The Bank of Fayette County,"April 29, 2016","September 6, 2016"
4,North Milwaukee State Bank,Milwaukee,WI,20364,First-Citizens Bank & Trust Company,"March 11, 2016","June 16, 2016"
...,...,...,...,...,...,...,...
542,"Superior Bank, FSB",Hinsdale,IL,32646,"Superior Federal, FSB","July 27, 2001","August 19, 2014"
543,Malta National Bank,Malta,OH,6629,North Valley Bank,"May 3, 2001","November 18, 2002"
544,First Alliance Bank & Trust Co.,Manchester,NH,34264,Southern New Hampshire Bank & Trust,"February 2, 2001","February 18, 2003"
545,National State Bank of Metropolis,Metropolis,IL,3815,Banterra Bank of Marion,"December 14, 2000","March 17, 2005"


In [65]:
close_timestamps = pd.to_datetime(failures['Closing Date'])

In [66]:
close_timestamps

0     2016-09-23
1     2016-08-19
2     2016-05-06
3     2016-04-29
4     2016-03-11
         ...    
542   2001-07-27
543   2001-05-03
544   2001-02-02
545   2000-12-14
546   2000-10-13
Name: Closing Date, Length: 547, dtype: datetime64[ns]

In [67]:
close_timestamps.dt.year.value_counts()

Closing Date
2010    157
2009    140
2011     92
2012     51
2008     25
       ... 
2004      4
2001      4
2007      3
2003      3
2000      2
Name: count, Length: 15, dtype: int64

### Parsing XML with lxml.objectify

In [68]:
from lxml import objectify

In [69]:
path = r'datasets/mta_perf/Performance_MNR.xml'

In [71]:
# Open in binary mode so that lxml decodes the bytes itself, using the encoding
# declared in the XML document, rather than Python's platform-dependent default
# text encoding.
with open(path, 'rb') as f:
    parsed = objectify.parse(f)

In [72]:
root = parsed.getroot()

In [73]:
root

<Element PERFORMANCE at 0x7d29e739ffc0>

In [74]:
pd.read_xml(path)

Unnamed: 0,INDICATOR_SEQ,PARENT_SEQ,AGENCY_NAME,INDICATOR_NAME,DESCRIPTION,PERIOD_YEAR,PERIOD_MONTH,CATEGORY,FREQUENCY,DESIRED_CHANGE,INDICATOR_UNIT,DECIMAL_PLACES,YTD_TARGET,YTD_ACTUAL,MONTHLY_TARGET,MONTHLY_ACTUAL
0,28445,,Metro-North Railroad,On-Time Performance (West of Hudson),Percent of commuter trains that arrive at thei...,2008,1,Service Indicators,M,U,%,1,95.00,96.90,95.00,96.90
1,28445,,Metro-North Railroad,On-Time Performance (West of Hudson),Percent of commuter trains that arrive at thei...,2008,2,Service Indicators,M,U,%,1,95.00,96.00,95.00,95.00
2,28445,,Metro-North Railroad,On-Time Performance (West of Hudson),Percent of commuter trains that arrive at thei...,2008,3,Service Indicators,M,U,%,1,95.00,96.30,95.00,96.90
3,28445,,Metro-North Railroad,On-Time Performance (West of Hudson),Percent of commuter trains that arrive at thei...,2008,4,Service Indicators,M,U,%,1,95.00,96.80,95.00,98.30
4,28445,,Metro-North Railroad,On-Time Performance (West of Hudson),Percent of commuter trains that arrive at thei...,2008,5,Service Indicators,M,U,%,1,95.00,96.60,95.00,95.80
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
643,373889,,Metro-North Railroad,Escalator Availability,Percent of the time that escalators are operat...,2011,8,Service Indicators,M,U,%,1,97.00,,97.00,
644,373889,,Metro-North Railroad,Escalator Availability,Percent of the time that escalators are operat...,2011,9,Service Indicators,M,U,%,1,97.00,,97.00,
645,373889,,Metro-North Railroad,Escalator Availability,Percent of the time that escalators are operat...,2011,10,Service Indicators,M,U,%,1,97.00,,97.00,
646,373889,,Metro-North Railroad,Escalator Availability,Percent of the time that escalators are operat...,2011,11,Service Indicators,M,U,%,1,97.00,,97.00,


# Binary Data Formats



## pickle

In [75]:
df = pd.read_csv('examples/ex1.csv')

In [76]:
# Serialise the DataFrame with pickle.
# NOTE(review): the file holds pickle data, so the '.csv' extension is misleading;
# consider renaming it to '.pkl' together with the matching read_pickle call.
df.to_pickle('examples/pickled_data.csv')

In [77]:
pd.read_pickle('examples/pickled_data.csv')

Unnamed: 0,a,b,c,d,message
0,1,2,3,4,hello
1,5,6,7,8,world
2,9,10,11,12,foo


## Excel files

In [78]:
df = pd.read_excel('examples/ex1.xlsx', sheet_name= 'Sheet1', index_col= 0)

In [79]:
df

Unnamed: 0,a,b,c,d,message
0,1,2,3,4,hello
1,5,6,7,8,world
2,9,10,11,12,foo


In [80]:
df.to_excel('examples/ex2.xlsx')

## HDF5 Format

In [82]:
import numpy as np

In [83]:
# 100 standard-normal samples in a single column 'a'. A seeded generator is used
# so that Restart & Run All reproduces the same values on every run.
frame = pd.DataFrame(
    {'a': np.random.default_rng(seed= 12345).standard_normal(100)}
)

In [84]:
frame

Unnamed: 0,a
0,2.268400
1,0.933570
2,2.003999
3,-0.004996
4,0.383031
...,...
95,1.815914
96,0.341166
97,1.073515
98,1.127122


In [85]:
store = pd.HDFStore('examples/mydata.h5')

In [86]:
store

<class 'pandas.io.pytables.HDFStore'>
File path: examples/mydata.h5

In [87]:
store.obj1 = frame

In [88]:
store.obj1

Unnamed: 0,a
0,2.268400
1,0.933570
2,2.003999
3,-0.004996
4,0.383031
...,...
95,1.815914
96,0.341166
97,1.073515
98,1.127122


In [89]:
store.obj1_col = frame.a

In [90]:
store.obj1_col

0     2.268400
1     0.933570
2     2.003999
3    -0.004996
4     0.383031
        ...   
95    1.815914
96    0.341166
97    1.073515
98    1.127122
99   -0.111030
Name: a, Length: 100, dtype: float64

In [91]:
store.put('obj2', frame, format= 'table')

In [92]:
store.select('obj2', where= 'index <= 5')

Unnamed: 0,a
0,2.2684
1,0.93357
2,2.003999
3,-0.004996
4,0.383031
5,-0.490103


In [94]:
store.close()

In [95]:
# Pass `key` by keyword: positional use of arguments after the path is deprecated
# in pandas 2.x and becomes an error in 3.0. format='table' stores the frame in
# the queryable layout that the `where=` filter in the next cell relies on.
frame.to_hdf('examples/mydata.h5', key= 'obj3', format= 'table')

In [96]:
pd.read_hdf('examples/mydata.h5', 'obj3', where= 'index > 5 and index < 10')

Unnamed: 0,a
6,0.054496
7,1.654843
8,0.070731
9,-0.660633


# Interacting with Web APIs

In [97]:
import requests

In [98]:
url = r'https://api.github.com/repos/pandas-dev/pandas/issues'

In [99]:
# Always give network calls a timeout: requests waits indefinitely by default,
# so an unresponsive server would hang the notebook.
resp = requests.get(url, timeout= 30)

In [100]:
resp.raise_for_status()

In [101]:
resp

<Response [200]>

In [102]:
data = resp.json()

In [103]:
data

[{'url': 'https://api.github.com/repos/pandas-dev/pandas/issues/58663',
  'repository_url': 'https://api.github.com/repos/pandas-dev/pandas',
  'labels_url': 'https://api.github.com/repos/pandas-dev/pandas/issues/58663/labels{/name}',
  'comments_url': 'https://api.github.com/repos/pandas-dev/pandas/issues/58663/comments',
  'events_url': 'https://api.github.com/repos/pandas-dev/pandas/issues/58663/events',
  'html_url': 'https://github.com/pandas-dev/pandas/issues/58663',
  'id': 2288613904,
  'node_id': 'I_kwDOAA0YD86IaXoQ',
  'number': 58663,
  'title': 'REF/API: make construct_array_type a non-classmethod',
  'user': {'login': 'jbrockmendel',
   'id': 8078968,
   'node_id': 'MDQ6VXNlcjgwNzg5Njg=',
   'avatar_url': 'https://avatars.githubusercontent.com/u/8078968?v=4',
   'gravatar_id': '',
   'url': 'https://api.github.com/users/jbrockmendel',
   'html_url': 'https://github.com/jbrockmendel',
   'followers_url': 'https://api.github.com/users/jbrockmendel/followers',
   'following_u

In [104]:
data[0]['url']

'https://api.github.com/repos/pandas-dev/pandas/issues/58663'

In [106]:
df = pd.DataFrame(data)

In [107]:
df

Unnamed: 0,url,repository_url,labels_url,comments_url,events_url,html_url,id,node_id,number,title,...,closed_at,author_association,active_lock_reason,body,reactions,timeline_url,performed_via_github_app,state_reason,draft,pull_request
0,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://github.com/pandas-dev/pandas/issues/58663,2288613904,I_kwDOAA0YD86IaXoQ,58663,REF/API: make construct_array_type a non-class...,...,,MEMBER,,### Pandas version checks\n\n- [X] I have chec...,{'url': 'https://api.github.com/repos/pandas-d...,https://api.github.com/repos/pandas-dev/pandas...,,,,
1,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://github.com/pandas-dev/pandas/pull/58662,2288529336,PR_kwDOAA0YD85vCQI5,58662,DOC: Clarify allowed values for on_bad_lines i...,...,,CONTRIBUTOR,,Move the callable options out of the version a...,{'url': 'https://api.github.com/repos/pandas-d...,https://api.github.com/repos/pandas-dev/pandas...,,,False,{'url': 'https://api.github.com/repos/pandas-d...
2,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://github.com/pandas-dev/pandas/pull/58661,2288291196,PR_kwDOAA0YD85vBcgB,58661,DOC: Add examples for pd.read_csv,...,,CONTRIBUTOR,,- [x] closes #58462 \r\n- [ ] [Tests added and...,{'url': 'https://api.github.com/repos/pandas-d...,https://api.github.com/repos/pandas-dev/pandas...,,,False,{'url': 'https://api.github.com/repos/pandas-d...
3,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://github.com/pandas-dev/pandas/pull/58655,2288099934,PR_kwDOAA0YD85vAz1g,58655,CLN: Stopped dtype inference in sanitize_array...,...,,MEMBER,,xref https://github.com/pandas-dev/pandas/pull...,{'url': 'https://api.github.com/repos/pandas-d...,https://api.github.com/repos/pandas-dev/pandas...,,,False,{'url': 'https://api.github.com/repos/pandas-d...
4,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://github.com/pandas-dev/pandas/issues/58654,2287830900,I_kwDOAA0YD86IXYd0,58654,Mac (with M2 chip) install of pandas with Poetry,...,,NONE,,### Installation check\n\n- [X] I have read th...,{'url': 'https://api.github.com/repos/pandas-d...,https://api.github.com/repos/pandas-dev/pandas...,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
25,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://github.com/pandas-dev/pandas/issues/58603,2281902026,I_kwDOAA0YD86IAw_K,58603,BUG: Regression of Index.join() when return_in...,...,,NONE,,### Pandas version checks\n\n- [X] I have chec...,{'url': 'https://api.github.com/repos/pandas-d...,https://api.github.com/repos/pandas-dev/pandas...,,,,
26,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://github.com/pandas-dev/pandas/issues/58602,2281872312,I_kwDOAA0YD86IApu4,58602,BUG: Adding or multiplying a pandas nullable d...,...,,NONE,,### Pandas version checks\n\n- [X] I have chec...,{'url': 'https://api.github.com/repos/pandas-d...,https://api.github.com/repos/pandas-dev/pandas...,,,,
27,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://github.com/pandas-dev/pandas/pull/58601,2281795280,PR_kwDOAA0YD85ur4kQ,58601,BUG: Assignment of pyarrow arrays yield unexpe...,...,,CONTRIBUTOR,,- [x] closes #56994 \r\n- [x] [Tests added and...,{'url': 'https://api.github.com/repos/pandas-d...,https://api.github.com/repos/pandas-dev/pandas...,,,False,{'url': 'https://api.github.com/repos/pandas-d...
28,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://api.github.com/repos/pandas-dev/pandas...,https://github.com/pandas-dev/pandas/pull/58600,2281758396,PR_kwDOAA0YD85urwQb,58600,ENH: Totality validation for merge operation,...,,NONE,,- [x] closes #58547\r\n- [x] [Tests added and ...,{'url': 'https://api.github.com/repos/pandas-d...,https://api.github.com/repos/pandas-dev/pandas...,,,False,{'url': 'https://api.github.com/repos/pandas-d...


# Interacting with Databases

In [135]:
import sqlite3

In [136]:
# DDL for the demo table. IF NOT EXISTS keeps the cell re-runnable: data.sqlite
# persists on disk, so a plain CREATE TABLE fails on the second run with
# "table student already exists".
query = """
    CREATE TABLE IF NOT EXISTS student(
        roll_no INTEGER,
        name TEXT
    );
"""

In [144]:
connector = sqlite3.connect('data.sqlite')

In [145]:
connector.execute(query)
connector.commit()

In [146]:
# Parameterised INSERT: each (roll_no, name) tuple is bound to the two `?`
# placeholders in turn.
insert_sql = """
    INSERT INTO student(roll_no, name)
    VALUES(?, ?);
    """
student_rows = [
    (1, 'Harshit'),
    (2, 'Kushal'),
    (3, 'Ruchi')
]
connector.executemany(insert_sql, student_rows)
# Persist the inserted rows.
connector.commit()

In [147]:
connector.execute(
    """
    SELECT *
    FROM student;
    """
).fetchall()

[(1, 'Harshit'), (2, 'Kushal'), (3, 'Ruchi')]

In [148]:
pd.read_sql('SELECT * FROM student', connector)

Unnamed: 0,roll_no,name
0,1,Harshit
1,2,Kushal
2,3,Ruchi
