In [1]:
from tabledataextractor import Table

Input
=========

* from a file, as .csv or .html
* from a URL (if there is more than one table at the provided URL, select one with the `table_number=` argument)
* from a Python list object


In [2]:
# Path to the example CSV table; the leading './' makes it relative to the
# directory the notebook is run from.
table_path = './tables/table_example.csv'
# Build the Table object from that file path.
table = Table(table_path)

In [3]:
# Use print() to see the table as plain, column-aligned text.
print(table)

                           Rutile      Rutile  Rutile  Anatase     Anatase  Anatase  
                           a = b (Ã…)  c (Ã…)  u       a = b (Ã…)  c (Ã…)   u        
Computational  This study  4.64        2.99    0.305   3.83        9.62     0.208    
Computational  GGA [25]    4.67        2.97    0.305   3.80        9.67     0.207    
Computational  GGA [26]    4.63        2.98    0.305   -           -        -        
Computational  HF [27]     -           -       -       3.76        9.85     0.202    
Experimental   Expt. [23]  4.594       2.958   0.305   3.785       9.514    0.207    




In [4]:
# Alternatively, leave the bare name as the last expression of the cell to
# display the table's full representation, which shows:
# 1. the input table
# 2. the cleaned table
# 3. the section labelling
# 4. the resulting category table
table

Table(./tables/table_example.csv, table_number=1, transposed=False)

                           Rutile      Rutile  Rutile  Anatase     Anatase  Anatase  
                           a = b (Ã…)  c (Ã…)  u       a = b (Ã…)  c (Ã…)   u        
Computational  This study  4.64        2.99    0.305   3.83        9.62     0.208    
Computational  GGA [25]    4.67        2.97    0.305   3.80        9.67     0.207    
Computational  GGA [26]    4.63        2.98    0.305   -           -        -        
Computational  HF [27]     -           -       -       3.76        9.85     0.202    
Experimental   Expt. [23]  4.594       2.958   0.305   3.785       9.514    0.207    

                           Rutile      Rutile     Rutile     Anatase     Anatase    Anatase    
                           a = b (Ã…)  c (Ã…)     u          a = b (Ã…)  c (Ã…)     u          
Computational  This study  4.64        2.99       0.305      3.83        9.62       0.208      
Computational  GGA [25]    4.67        2

In [5]:
# The category table, as a list of lists, can be returned with `category_table`.
# As the output shows, each entry has the form
# [data value, [row header labels], [column header labels]].
table.category_table

[['4.64', ['This study'], ['Rutile', 'a = b (Ã…)']],
 ['2.99', ['This study'], ['Rutile', 'c (Ã…)']],
 ['0.305', ['This study'], ['Rutile', 'u']],
 ['3.83', ['This study'], ['Anatase', 'a = b (Ã…)']],
 ['9.62', ['This study'], ['Anatase', 'c (Ã…)']],
 ['0.208', ['This study'], ['Anatase', 'u']],
 ['4.67', ['GGA [25]'], ['Rutile', 'a = b (Ã…)']],
 ['2.97', ['GGA [25]'], ['Rutile', 'c (Ã…)']],
 ['0.305', ['GGA [25]'], ['Rutile', 'u']],
 ['3.80', ['GGA [25]'], ['Anatase', 'a = b (Ã…)']],
 ['9.67', ['GGA [25]'], ['Anatase', 'c (Ã…)']],
 ['0.207', ['GGA [25]'], ['Anatase', 'u']],
 ['4.63', ['GGA [26]'], ['Rutile', 'a = b (Ã…)']],
 ['2.98', ['GGA [26]'], ['Rutile', 'c (Ã…)']],
 ['0.305', ['GGA [26]'], ['Rutile', 'u']],
 ['-', ['GGA [26]'], ['Anatase', 'a = b (Ã…)']],
 ['-', ['GGA [26]'], ['Anatase', 'c (Ã…)']],
 ['-', ['GGA [26]'], ['Anatase', 'u']],
 ['-', ['HF [27]'], ['Rutile', 'a = b (Ã…)']],
 ['-', ['HF [27]'], ['Rutile', 'c (Ã…)']],
 ['-', ['HF [27]'], ['Rutile', 'u']],
 ['3.76', ['HF 

In [6]:
# Other elements of the parsed table that can be retrieved as attributes:
print(table.title_row)   # title row (prints 0 for this table)
print(table.row_header)  # row header labels
print(table.col_header)  # column header labels
print(table.data)        # data cells

0
[['This study']
 ['GGA [25]']
 ['GGA [26]']
 ['HF [27]']
 ['Expt. [23]']]
[['Rutile' 'Rutile' 'Rutile' 'Anatase' 'Anatase' 'Anatase']
 ['a = b (Ã…)' 'c (Ã…)' 'u' 'a = b (Ã…)' 'c (Ã…)' 'u']]
[['4.64' '2.99' '0.305' '3.83' '9.62' '0.208']
 ['4.67' '2.97' '0.305' '3.80' '9.67' '0.207']
 ['4.63' '2.98' '0.305' '-' '-' '-']
 ['-' '-' '-' '3.76' '9.85' '0.202']
 ['4.594' '2.958' '0.305' '3.785' '9.514' '0.207']]


In [7]:
# The table can be transposed if needed.
# transpose() is called for its side effect: it changes `table` itself (the
# representation displayed next reports transposed=True), so every later cell
# works on the transposed table.
# NOTE(review): re-running this cell presumably transposes the table again -
# confirm before relying on the displayed orientation.
table.transpose()
table

Table(./tables/table_example.csv, table_number=1, transposed=True)

                     Computational  Computational  Computational  Computational  Experimental  
                     This study     GGA [25]       GGA [26]       HF [27]        Expt. [23]    
Rutile   a = b (Ã…)  4.64           4.67           4.63           -              4.594         
Rutile   c (Ã…)      2.99           2.97           2.98           -              2.958         
Rutile   u           0.305          0.305          0.305          -              0.305         
Anatase  a = b (Ã…)  3.83           3.80           -              3.76           3.785         
Anatase  c (Ã…)      9.62           9.67           -              9.85           9.514         
Anatase  u           0.208          0.207          -              0.202          0.207         

                        Computational  Computational  Computational  Computational  Experimental  
                        This study     GGA [25]       GGA [26]  

Output
========

* as a CSV file
* as a pandas DataFrame

In [8]:
from tabledataextractor.output.to_csv import write_to_csv

In [9]:
# Write the table to './saved_table.csv'. Because `table` was transposed in an
# earlier cell, this will now store the transposed table.
# NOTE(review): assumes `raw_table` reflects the transposition - confirm.
write_to_csv(table.raw_table, './saved_table.csv')