# To what extent did the relative frequency materials change from modernism to postmodernism? To better answer this question, we compare the two csv files that we had created (results before 1980 and the results of on and after 1980). 

In [1]:
import pandas as pd

f1 = pd.read_csv('C:/Users/alexa/OneDrive/Documenten/Collecting Data & Tools and Methods/Subquestion1before1980.csv')
f2 = pd.read_csv('C:/Users/alexa/OneDrive/Documenten/Collecting Data & Tools and Methods/Subquestion1onafter1980.csv')

# Note: an important criteria for this comparison was that we could only select words that were present in both the first subset as well as the second subset. Although there was significant overlap between the two subsets (both subsets for example had 'print' as their most frequent material), it is possible that some materials that were used after 1980 but not before 1980, and possibly vice versa, are excluded from this comparison. 

In [2]:
df1 = (f2[f2.word.isin(f1.word)])
df1 = df1.sort_values(["percentage"], ascending=[0])
df2 = (f1[f1.word.isin(f2.word)])

In [3]:
df1

Unnamed: 0.1,Unnamed: 0,word,wordcount,percentage
0,3,print,7936,0.053569
1,10,paper,6083,0.041061
2,509,one,5159,0.034824
3,39,color,4863,0.032826
4,59,lithograph,4669,0.031516
...,...,...,...,...
2659,3211,parquet,1,0.000007
2657,3542,notations,1,0.000007
2654,3219,modified,1,0.000007
2642,3180,mercerized,1,0.000007


In [4]:
df2.head(25)

Unnamed: 0.1,Unnamed: 0,word,wordcount,percentage
0,42,print,26521,0.074192
1,12,silver,23150,0.064762
2,50,lithograph,19429,0.054352
3,11,gelatin,17189,0.048086
4,4,paper,13559,0.037931
5,41,printed,11898,0.033284
6,933,one,11355,0.031765
7,68,etching,9643,0.026976
8,871,book,8189,0.022909
9,8,pencil,8167,0.022847


# Below we show a list of all materials used on and after 1980, but not before 1980. Although the majority of these materials were not used much (the vast majority of the materials in this list were counted less than 10 times), there are some significant exceptions. The most significant are 'archival', 'multichannel', 'dyetransfer' and 'modelling' artworks. Some other interesting exceptions, which came with the advent of time, are 'computergenerated', 'silicone' and 'digitally' artworks, showing the increasing digitial nature of artworks. 

In [7]:
list1 = list(df2.word)
list2 = list(f2.word)
left_out_1 = []

for item in list2:
    if item not in list1:
        left_out_1.append(item)

for item in left_out_1:
    print(f2.loc[f2["word"] == item])
    

    Unnamed: 0       word  wordcount  percentage
16         501  additions       1945    0.013129
     Unnamed: 0      word  wordcount  percentage
133        2430  archival        135    0.000911
     Unnamed: 0        word  wordcount  percentage
138         715  sixtythree        128    0.000864
     Unnamed: 0          word  wordcount  percentage
145        2404  multichannel        119    0.000803
     Unnamed: 0     word  wordcount  percentage
174         498  project         94    0.000635
     Unnamed: 0   word  wordcount  percentage
188        3057  upper         85    0.000574
     Unnamed: 0      word  wordcount  percentage
207        1929  printout         77     0.00052
     Unnamed: 0 word  wordcount  percentage
257        1580  mdf         53    0.000358
     Unnamed: 0   word  wordcount  percentage
265        1893  notes         50    0.000338
     Unnamed: 0    word  wordcount  percentage
267        1832  cprint         49    0.000331
     Unnamed: 0        word  wordcou

969        1582  methacrylate          5    0.000034
     Unnamed: 0  word  wordcount  percentage
976        1598  coal          5    0.000034
     Unnamed: 0        word  wordcount  percentage
978        2254  processing          5    0.000034
     Unnamed: 0    word  wordcount  percentage
987        2193  spread          5    0.000034
     Unnamed: 0         word  wordcount  percentage
990        2300  illustrator          5    0.000034
     Unnamed: 0              word  wordcount  percentage
995        3505  collages\r\n\r\n          5    0.000034
      Unnamed: 0  word  wordcount  percentage
1001        2313  esri          5    0.000034
      Unnamed: 0    word  wordcount  percentage
1006        2314  arcgis          5    0.000034
      Unnamed: 0              word  wordcount  percentage
1007        3508  text\r\n\r\n\r\n          5    0.000034
      Unnamed: 0          word  wordcount  percentage
1008        3067  creamcolored          5    0.000034
      Unnamed: 0     word  word

1356         441  carbonate          3     0.00002
      Unnamed: 0      word  wordcount  percentage
1359         764  bookmark          3     0.00002
      Unnamed: 0        word  wordcount  percentage
1360        2759  fabricated          3     0.00002
      Unnamed: 0      word  wordcount  percentage
1363        1250  backpack          3     0.00002
      Unnamed: 0        word  wordcount  percentage
1366        2728  powerpoint          3     0.00002
      Unnamed: 0       word  wordcount  percentage
1368        3048  \r\nwhite          3     0.00002
      Unnamed: 0  word  wordcount  percentage
1369        1261  kite          3     0.00002
      Unnamed: 0                 word  wordcount  percentage
1370        1262  commerciallyprinted          3     0.00002
      Unnamed: 0      word  wordcount  percentage
1371        2563  deflated          3     0.00002
      Unnamed: 0     word  wordcount  percentage
1373        2252  boundin          3     0.00002
      Unnamed: 0   word  wo

1585        3002  bookseller          2    0.000014
      Unnamed: 0     word  wordcount  percentage
1586        2177  effects          2    0.000014
      Unnamed: 0     word  wordcount  percentage
1587        3094  vehicle          2    0.000014
      Unnamed: 0   word  wordcount  percentage
1591        2323  apple          2    0.000014
      Unnamed: 0        word  wordcount  percentage
1592        3019  photograms          2    0.000014
      Unnamed: 0   word  wordcount  percentage
1594        3022  heart          2    0.000014
      Unnamed: 0        word  wordcount  percentage
1596        2294  conductive          2    0.000014
      Unnamed: 0       word  wordcount  percentage
1598        2203  editioned          2    0.000014
      Unnamed: 0     word  wordcount  percentage
1600        3029  artista          2    0.000014
      Unnamed: 0           word  wordcount  percentage
1601        2291  photovoltaics          2    0.000014
      Unnamed: 0       word  wordcount  percen

1812        1227  vase          2    0.000014
      Unnamed: 0        word  wordcount  percentage
1814        1265  integrated          2    0.000014
      Unnamed: 0      word  wordcount  percentage
1815        3656  receipts          2    0.000014
      Unnamed: 0  word  wordcount  percentage
1816        1225  play          2    0.000014
      Unnamed: 0   word  wordcount  percentage
1818        3654  twill          2    0.000014
      Unnamed: 0  word  wordcount  percentage
1820        1221  cial          2    0.000014
      Unnamed: 0 word  wordcount  percentage
1821        1220  spe          2    0.000014
      Unnamed: 0 word  wordcount  percentage
1823        1217   ie          2    0.000014
      Unnamed: 0         word  wordcount  percentage
1824        3644  workstation          2    0.000014
      Unnamed: 0     word  wordcount  percentage
1825        1348  lectern          2    0.000014
      Unnamed: 0     word  wordcount  percentage
1826        3700  pudding          2   

2056        2737  adapters          1    0.000007
      Unnamed: 0  word  wordcount  percentage
2057        2738  crow          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2058        3874  florida          1    0.000007
      Unnamed: 0    word  wordcount  percentage
2059        3873  loofah          1    0.000007
      Unnamed: 0  word  wordcount  percentage
2063        2750  gown          1    0.000007
      Unnamed: 0    word  wordcount  percentage
2064        3686  helmet          1    0.000007
      Unnamed: 0          word  wordcount  percentage
2066        2996  antiquestyle          1    0.000007
      Unnamed: 0                word  wordcount  percentage
2068        2994  brochuresupplement          1    0.000007
      Unnamed: 0   word  wordcount  percentage
2069        2993  sales          1    0.000007
      Unnamed: 0        word  wordcount  percentage
2070        3688  complexion          1    0.000007
      Unnamed: 0    word  wordcount  percentage
20

2270        3740  washers          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2271         196  ashwood          1    0.000007
      Unnamed: 0   word  wordcount  percentage
2272        2788  ernst          1    0.000007
      Unnamed: 0   word  wordcount  percentage
2273        2913  valve          1    0.000007
      Unnamed: 0      word  wordcount  percentage
2274        2912  solenoid          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2275        3754  coolant          1    0.000007
      Unnamed: 0           word  wordcount  percentage
2276        3073  bibliographic          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2277        3037  jukebox          1    0.000007
      Unnamed: 0    word  wordcount  percentage
2278        3497  safety          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2279        3309  website          1    0.000007
      Unnamed: 0   word  wordcount  percentage
2280        3308  

2438        3435  grayscale          1    0.000007
      Unnamed: 0  word  wordcount  percentage
2439        3440  fair          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2440        3412  thrower          1    0.000007
      Unnamed: 0           word  wordcount  percentage
2441        3441  plasticbacked          1    0.000007
      Unnamed: 0    word  wordcount  percentage
2442        3410  lumber          1    0.000007
      Unnamed: 0    word  wordcount  percentage
2443        3409  cclamp          1    0.000007
      Unnamed: 0        word  wordcount  percentage
2444        3442  emulsionup          1    0.000007
      Unnamed: 0          word  wordcount  percentage
2445        3443  rightreading          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2446        3445  topcoat          1    0.000007
      Unnamed: 0        word  wordcount  percentage
2447        3464  grumichama          1    0.000007
      Unnamed: 0    word  wordcount  percen

2614        3639  boning          1    0.000007
      Unnamed: 0         word  wordcount  percentage
2615        3640  piezography          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2616        3641  paper\\          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2617        3062  missile          1    0.000007
      Unnamed: 0    word  wordcount  percentage
2618        3643  rowing          1    0.000007
      Unnamed: 0      word  wordcount  percentage
2620        3123  students          1    0.000007
      Unnamed: 0  word  wordcount  percentage
2621        3594  0gsm          1    0.000007
      Unnamed: 0               word  wordcount  percentage
2622        3566  constructiongrade          1    0.000007
      Unnamed: 0     word  wordcount  percentage
2623        3556  dresses          1    0.000007
      Unnamed: 0      word  wordcount  percentage
2624        3193  imbedded          1    0.000007
      Unnamed: 0       word  wordcount  percen

      Unnamed: 0 word  wordcount  percentage
2810        1423  dia          1    0.000007
      Unnamed: 0      word  wordcount  percentage
2811         392  acryllic          1    0.000007
      Unnamed: 0        word  wordcount  percentage
2812        1425  foundation          1    0.000007
      Unnamed: 0           word  wordcount  percentage
2813         391  handlaminated          1    0.000007
      Unnamed: 0    word  wordcount  percentage
2814        1427  gleber          1    0.000007
      Unnamed: 0      word  wordcount  percentage
2815        1429  directed          1    0.000007
      Unnamed: 0        word  wordcount  percentage
2818        1431  pellington          1    0.000007
      Unnamed: 0      word  wordcount  percentage
2819        1433  cleaners          1    0.000007
      Unnamed: 0   word  wordcount  percentage
2821        1437  kayak          1    0.000007
      Unnamed: 0       word  wordcount  percentage
2822        1438  staircase          1    0.000007


3002         330  counterweight          1    0.000007
      Unnamed: 0     word  wordcount  percentage
3004        1745  alaskan          1    0.000007
      Unnamed: 0     word  wordcount  percentage
3005        1744  western          1    0.000007
      Unnamed: 0 word  wordcount  percentage
3006         332  cfc          1    0.000007
      Unnamed: 0       word  wordcount  percentage
3007        1741  purrubber          1    0.000007
      Unnamed: 0    word  wordcount  percentage
3008        1740  foamed          1    0.000007
      Unnamed: 0                    word  wordcount  percentage
3010         333  chlorofluorocarbonfree          1    0.000007
      Unnamed: 0        word  wordcount  percentage
3011        1732  disposable          1    0.000007
      Unnamed: 0      word  wordcount  percentage
3012        1730  migraine          1    0.000007
      Unnamed: 0        word  wordcount  percentage
3015        1724  hahnemühle          1    0.000007
      Unnamed: 0   word  

3221        1315  entrails          1    0.000007
      Unnamed: 0              word  wordcount  percentage
3224        1319  carvedandstained          1    0.000007
      Unnamed: 0       word  wordcount  percentage
3226        1322  clothcord          1    0.000007
      Unnamed: 0 word  wordcount  percentage
3227         417  rtm          1    0.000007
      Unnamed: 0       word  wordcount  percentage
3228         419  copolymer          1    0.000007
      Unnamed: 0             word  wordcount  percentage
3231        1328  silverdyebleach          1    0.000007
      Unnamed: 0    word  wordcount  percentage
3235        1244  recipe          1    0.000007
      Unnamed: 0          word  wordcount  percentage
3237        1150  aluminumleaf          1    0.000007
      Unnamed: 0        word  wordcount  percentage
3239        1136  sheets\r\n          1    0.000007
      Unnamed: 0                  word  wordcount  percentage
3241         532  photogravure\r\n\r\n          1    0.0

      Unnamed: 0     word  wordcount  percentage
3448        2520  puppets          1    0.000007
      Unnamed: 0         word  wordcount  percentage
3449        2523  electrotype          1    0.000007
      Unnamed: 0 word  wordcount  percentage
3450        2304  gnu          1    0.000007
      Unnamed: 0  word  wordcount  percentage
3453        2666  pool          1    0.000007
      Unnamed: 0  word  wordcount  percentage
3454        2667  rain          1    0.000007
      Unnamed: 0   word  wordcount  percentage
3455        2668  brook          1    0.000007
      Unnamed: 0  word  wordcount  percentage
3456        2669  lake          1    0.000007
      Unnamed: 0    word  wordcount  percentage
3459        2663  coesnt          1    0.000007
      Unnamed: 0       word  wordcount  percentage
3460        2673  templates          1    0.000007
      Unnamed: 0   word  wordcount  percentage
3461        2674  quote          1    0.000007
      Unnamed: 0     word  wordcount  percen

3629        2074  siliconcoated          1    0.000007
      Unnamed: 0      word  wordcount  percentage
3630        2063  otoblast          1    0.000007
      Unnamed: 0     word  wordcount  percentage
3631        2054  sparkle          1    0.000007
      Unnamed: 0       word  wordcount  percentage
3633        2057  bookshelf          1    0.000007
      Unnamed: 0    word  wordcount  percentage
3634        2058  corian          1    0.000007
      Unnamed: 0          word  wordcount  percentage
3635        2059  polymerbased          1    0.000007
      Unnamed: 0      word  wordcount  percentage
3637        2066  furlined          1    0.000007
      Unnamed: 0   word  wordcount  percentage
3638        2051  robin          1    0.000007
      Unnamed: 0    word  wordcount  percentage
3640        2068  melted          1    0.000007
      Unnamed: 0           word  wordcount  percentage
3641        2069  cinemeccanica          1    0.000007
      Unnamed: 0      word  wordcount  pe

3745        2210  rotationmolded          1    0.000007
      Unnamed: 0 word  wordcount  percentage
3746        2226  hmi          1    0.000007
      Unnamed: 0     word  wordcount  percentage
3747        2230  imovies          1    0.000007
      Unnamed: 0     word  wordcount  percentage
3748        2232  macmini          1    0.000007
      Unnamed: 0        word  wordcount  percentage
3749        2235  cushioning          1    0.000007
      Unnamed: 0    word  wordcount  percentage
3751         281  rubrum          1    0.000007
      Unnamed: 0  word  wordcount  percentage
3752        2212  jeff          1    0.000007
      Unnamed: 0        word  wordcount  percentage
3753        2209  tshirt\r\n          1    0.000007
      Unnamed: 0      word  wordcount  percentage
3755         287  bulkdyed          1    0.000007
      Unnamed: 0  word  wordcount  percentage
3756        2185  imac          1    0.000007
      Unnamed: 0      word  wordcount  percentage
3757        2186  qu

# Below we show a list of all materials used before 1980, but not on or after 1980. Some interesting types of materials that were not used after 1980 are heliogravure, hectrographed, celluloid and paperfaced artworks. 

In [27]:
list3 = list(df1.word)
list4 = list(f1.word)
left_out_2 = []

for item in list4:
    if item not in list3:
        left_out_2.append(item)

for item in left_out_2:
    print(f1.loc[f1['word'] == item])

     Unnamed: 0     word  wordcount  percentage
206        1092  caption        131    0.000366
     Unnamed: 0       word  wordcount  percentage
207        1520  fiftyfive        131    0.000366
     Unnamed: 0      word  wordcount  percentage
209        1116  sixtytwo        126    0.000352
     Unnamed: 0          word  wordcount  percentage
241        2195  heliogravure         96    0.000269
     Unnamed: 0        word  wordcount  percentage
243        1767  ninetyfour         95    0.000266
     Unnamed: 0          word  wordcount  percentage
246        1037  hectographed         93     0.00026
     Unnamed: 0         word  wordcount  percentage
248        1703  seventyfour         92    0.000257
     Unnamed: 0        word  wordcount  percentage
255        1539  eightyfive         87    0.000243
     Unnamed: 0         word  wordcount  percentage
259        1626  eightythree         84    0.000235
     Unnamed: 0       word  wordcount  percentage
260        3225  eightytwo      

791        1408  postertext         10    0.000028
     Unnamed: 0     word  wordcount  percentage
794        2110  staples         10    0.000028
     Unnamed: 0       word  wordcount  percentage
796        1236  rodchenko         10    0.000028
     Unnamed: 0           word  wordcount  percentage
801        1607  justification         10    0.000028
     Unnamed: 0       word  wordcount  percentage
807         409  naugahyde         10    0.000028
     Unnamed: 0  word  wordcount  percentage
808         117  paul         10    0.000028
     Unnamed: 0           word  wordcount  percentage
810        1090  incorporating         10    0.000028
     Unnamed: 0          word  wordcount  percentage
818        1071  carboncopied          9    0.000025
     Unnamed: 0        word  wordcount  percentage
822        2087  autochrome          9    0.000025
     Unnamed: 0      word  wordcount  percentage
826        2127  petersen          9    0.000025
     Unnamed: 0        word  wordcount  p

1088        3506  opening          5    0.000014
      Unnamed: 0     word  wordcount  percentage
1090        3511  striker          5    0.000014
      Unnamed: 0     word  wordcount  percentage
1094        1544  flyleaf          5    0.000014
      Unnamed: 0    word  wordcount  percentage
1096        1885  tusche          5    0.000014
      Unnamed: 0    word  wordcount  percentage
1100        1858  layers          5    0.000014
      Unnamed: 0         word  wordcount  percentage
1102        3248  overlapping          5    0.000014
      Unnamed: 0       word  wordcount  percentage
1105        1807  distemper          5    0.000014
      Unnamed: 0          word  wordcount  percentage
1106        1634  accompanying          5    0.000014
      Unnamed: 0   word  wordcount  percentage
1107         107  diazo          5    0.000014
      Unnamed: 0    word  wordcount  percentage
1109        1654  george          5    0.000014
      Unnamed: 0  word  wordcount  percentage
1111       

1383         734  tinned          3    0.000008
      Unnamed: 0  word  wordcount  percentage
1385         785  bolt          3    0.000008
      Unnamed: 0    word  wordcount  percentage
1386        1776  papier          3    0.000008
      Unnamed: 0   word  wordcount  percentage
1388        1777  mâché          3    0.000008
      Unnamed: 0              word  wordcount  percentage
1389        1834  punchedandpasted          3    0.000008
      Unnamed: 0   word  wordcount  percentage
1393        1778  globe          3    0.000008
      Unnamed: 0        word  wordcount  percentage
1398        2841  dictionary          3    0.000008
      Unnamed: 0     word  wordcount  percentage
1400         766  ferrite          3    0.000008
      Unnamed: 0    word  wordcount  percentage
1404         394  damask          3    0.000008
      Unnamed: 0    word  wordcount  percentage
1407         388  wicker          3    0.000008
      Unnamed: 0        word  wordcount  percentage
1408        23

1541        3497  springmounted          3    0.000008
      Unnamed: 0     word  wordcount  percentage
1543        2579  pennies          3    0.000008
      Unnamed: 0       word  wordcount  percentage
1545        1935  footprint          3    0.000008
      Unnamed: 0   word  wordcount  percentage
1546        4068  \r\nx          3    0.000008
      Unnamed: 0   word  wordcount  percentage
1551        1898  chart          3    0.000008
      Unnamed: 0      word  wordcount  percentage
1553        2872  scissors          3    0.000008
      Unnamed: 0   word  wordcount  percentage
1554         682  sisal          3    0.000008
      Unnamed: 0     word  wordcount  percentage
1555        2283  typeset          3    0.000008
      Unnamed: 0       word  wordcount  percentage
1556        2285  squashing          3    0.000008
      Unnamed: 0     word  wordcount  percentage
1559        3517  tickets          3    0.000008
      Unnamed: 0      word  wordcount  percentage
1560        190

      Unnamed: 0        word  wordcount  percentage
1737        4004  photobusta          2    0.000006
      Unnamed: 0   word  wordcount  percentage
1739        1998  penci          2    0.000006
      Unnamed: 0       word  wordcount  percentage
1740        2997  verso\r\n          2    0.000006
      Unnamed: 0   word  wordcount  percentage
1745          58  gampi          2    0.000006
      Unnamed: 0        word  wordcount  percentage
1748         584  copper\r\n          2    0.000006
      Unnamed: 0   word  wordcount  percentage
1750        2077  allan          2    0.000006
      Unnamed: 0 word  wordcount  percentage
1752        2079    –          2    0.000006
      Unnamed: 0    word  wordcount  percentage
1754        3463  adding          2    0.000006
      Unnamed: 0     word  wordcount  percentage
1756        4117  macramé          2    0.000006
      Unnamed: 0          word  wordcount  percentage
1758        4036  appliqué\r\n          2    0.000006
      Unnamed: 0

1937        1240  breia          2    0.000006
      Unnamed: 0      word  wordcount  percentage
1938         444  austrian          2    0.000006
      Unnamed: 0 word  wordcount  percentage
1939        3376  mit          2    0.000006
      Unnamed: 0    word  wordcount  percentage
1940        2501  kaolin          2    0.000006
      Unnamed: 0       word  wordcount  percentage
1941        1237  tretiakov          2    0.000006
      Unnamed: 0   word  wordcount  percentage
1942        3865  zitar          2    0.000006
      Unnamed: 0       word  wordcount  percentage
1943        2498  framework          2    0.000006
      Unnamed: 0       word  wordcount  percentage
1944        1235  aleksandr          2    0.000006
      Unnamed: 0  word  wordcount  percentage
1945        4070  slor          2    0.000006
      Unnamed: 0       word  wordcount  percentage
1946         439  resistant          2    0.000006
      Unnamed: 0       word  wordcount  percentage
1947        2272  snak

2151        3125  sardine          2    0.000006
      Unnamed: 0      word  wordcount  percentage
2152        1890  ragboard          2    0.000006
      Unnamed: 0  word  wordcount  percentage
2153        1429  dick          2    0.000006
      Unnamed: 0 word  wordcount  percentage
2154        1427    r          2    0.000006
      Unnamed: 0      word  wordcount  percentage
2155        1894  printers          2    0.000006
      Unnamed: 0        word  wordcount  percentage
2156        2798  flashlight          2    0.000006
      Unnamed: 0  word  wordcount  percentage
2157        2869  lock          2    0.000006
      Unnamed: 0  word  wordcount  percentage
2158        1422  dead          2    0.000006
      Unnamed: 0       word  wordcount  percentage
2159         685  mechanism          2    0.000006
      Unnamed: 0     word  wordcount  percentage
2162        3079  alpacca          2    0.000006
      Unnamed: 0   word  wordcount  percentage
2164        1437  still          2

2311        3120  schären          1    0.000003
      Unnamed: 0  word  wordcount  percentage
2312        3305  neck          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2313        3167  tuxedo          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2314        3197  origin          1    0.000003
      Unnamed: 0  word  wordcount  percentage
2315        3180  club          1    0.000003
      Unnamed: 0            word  wordcount  percentage
2317        3183  galvanizediron          1    0.000003
      Unnamed: 0        word  wordcount  percentage
2318        3291  demokratie          1    0.000003
      Unnamed: 0        word  wordcount  percentage
2319        3272  happenings          1    0.000003
      Unnamed: 0     word  wordcount  percentage
2320        3258  gallows          1    0.000003
      Unnamed: 0     word  wordcount  percentage
2322        3293  laundry          1    0.000003
      Unnamed: 0             word  wordcount  percentage
23

2468        3880  area          1    0.000003
      Unnamed: 0         word  wordcount  percentage
2469        3878  nickelplate          1    0.000003
      Unnamed: 0           word  wordcount  percentage
2470        3875  photocopy\r\n          1    0.000003
      Unnamed: 0        word  wordcount  percentage
2471        3874  modacrylic          1    0.000003
      Unnamed: 0        word  wordcount  percentage
2472        3873  felttippen          1    0.000003
      Unnamed: 0              word  wordcount  percentage
2473        3872  vinylimpregnated          1    0.000003
      Unnamed: 0        word  wordcount  percentage
2474        3871  hectograph          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2476        3920  school          1    0.000003
      Unnamed: 0       word  wordcount  percentage
2477        3921  hallwalls          1    0.000003
      Unnamed: 0     word  wordcount  percentage
2478        3922  buffalo          1    0.000003
      Unnamed:

2663        3994  taffeta          1    0.000003
      Unnamed: 0      word  wordcount  percentage
2664        3991  artist\s          1    0.000003
      Unnamed: 0         word  wordcount  percentage
2665        3990  pages\r\nmm          1    0.000003
      Unnamed: 0         word  wordcount  percentage
2667        4011  gravure\r\n          1    0.000003
      Unnamed: 0       word  wordcount  percentage
2668        3987  handscrew          1    0.000003
      Unnamed: 0       word  wordcount  percentage
2669        3986  resinflex          1    0.000003
      Unnamed: 0       word  wordcount  percentage
2670        3984  tiles\r\n          1    0.000003
      Unnamed: 0                  word  wordcount  percentage
2672        3980  electroencephalogram          1    0.000003
      Unnamed: 0            word  wordcount  percentage
2673        3979  electroglazing          1    0.000003
      Unnamed: 0             word  wordcount  percentage
2675        3976  fourteenchannel       

2777        3462  tokyo          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2779        3460  naiqua          1    0.000003
      Unnamed: 0  word  wordcount  percentage
2780        3459  solo          1    0.000003
      Unnamed: 0     word  wordcount  percentage
2781        3458  higgins          1    0.000003
      Unnamed: 0            word  wordcount  percentage
2783        3452  plasticwrapped          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2784        3451  ignite          1    0.000003
      Unnamed: 0  word  wordcount  percentage
2785        3390  ecke          1    0.000003
      Unnamed: 0         word  wordcount  percentage
2786        3389  tamponierte          1    0.000003
      Unnamed: 0       word  wordcount  percentage
2787        3388  zinkkiste          1    0.000003
      Unnamed: 0     word  wordcount  percentage
2788        3329  scheibe          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2789        3

2906        3705  friedman          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2907        3682  winder          1    0.000003
      Unnamed: 0      word  wordcount  percentage
2908        3703  postives          1    0.000003
      Unnamed: 0       word  wordcount  percentage
2912        3697  yardstick          1    0.000003
      Unnamed: 0   word  wordcount  percentage
2915        3691  waves          1    0.000003
      Unnamed: 0 word  wordcount  percentage
2916        3690   fm          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2917        3688  format          1    0.000003
      Unnamed: 0   word  wordcount  percentage
2918        3686  frogs          1    0.000003
      Unnamed: 0      word  wordcount  percentage
2919        3685  indended          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2921        3683  condom          1    0.000003
      Unnamed: 0    word  wordcount  percentage
2922        3625  wallet          

3032        1450  kahn          1    0.000003
      Unnamed: 0    word  wordcount  percentage
3033        1451  little          1    0.000003
      Unnamed: 0   word  wordcount  percentage
3034        1453  shops          1    0.000003
      Unnamed: 0 word  wordcount  percentage
3036        1457  owl          1    0.000003
      Unnamed: 0        word  wordcount  percentage
3037        1444  collectors          1    0.000003
      Unnamed: 0   word  wordcount  percentage
3039        1460  venus          1    0.000003
      Unnamed: 0  word  wordcount  percentage
3041        1462  weed          1    0.000003
      Unnamed: 0   word  wordcount  percentage
3042        1463  tiger          1    0.000003
      Unnamed: 0  word  wordcount  percentage
3043        1464  lamb          1    0.000003
      Unnamed: 0       word  wordcount  percentage
3044        1445  fantastic          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3045        1443  abundant          1    0.000

3159        1629  bon          1    0.000003
      Unnamed: 0    word  wordcount  percentage
3160        1631  tirage          1    0.000003
      Unnamed: 0     word  wordcount  percentage
3161        1632  prinetd          1    0.000003
      Unnamed: 0    word  wordcount  percentage
3163        1653  cabana          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3165        1638  matisses          1    0.000003
      Unnamed: 0        word  wordcount  percentage
3166        1639  annotating          1    0.000003
      Unnamed: 0     word  wordcount  percentage
3167        1641  euroset          1    0.000003
      Unnamed: 0    word  wordcount  percentage
3169        1652  bather          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3170        1684  laureate          1    0.000003
      Unnamed: 0        word  wordcount  percentage
3172        1616  lacourière          1    0.000003
      Unnamed: 0  word  wordcount  percentage
3173        1726 

3262        1543  delaunay          1    0.000003
      Unnamed: 0     word  wordcount  percentage
3263        1556  gouahce          1    0.000003
      Unnamed: 0     word  wordcount  percentage
3264        1547  reverse          1    0.000003
      Unnamed: 0   word  wordcount  percentage
3265        1548  bookw          1    0.000003
      Unnamed: 0 word  wordcount  percentage
3266        1549  ith          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3267        1550  nintysix          1    0.000003
      Unnamed: 0       word  wordcount  percentage
3268        1551  roulettte          1    0.000003
      Unnamed: 0        word  wordcount  percentage
3269        1553  collotypte          1    0.000003
      Unnamed: 0   word  wordcount  percentage
3270        1557  blakc          1    0.000003
      Unnamed: 0  word  wordcount  percentage
3271        1573  tony          1    0.000003
      Unnamed: 0    word  wordcount  percentage
3272        1564  intext      

3407         275  casement          1    0.000003
      Unnamed: 0             word  wordcount  percentage
3408         239  impactresistant          1    0.000003
      Unnamed: 0         word  wordcount  percentage
3409         242  synthesized          1    0.000003
      Unnamed: 0                   word  wordcount  percentage
3411         255  syrenebutadienerubber          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3412         262  hardened          1    0.000003
      Unnamed: 0   word  wordcount  percentage
3413         274  sheer          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3414         277  bleached          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3415         339  european          1    0.000003
      Unnamed: 0              word  wordcount  percentage
3416         290  chromemolybdenum          1    0.000003
      Unnamed: 0       word  wordcount  percentage
3418         305  linen\r\n          1    0

3515         677  fireplace          1    0.000003
      Unnamed: 0               word  wordcount  percentage
3516         666  polypropylene\r\n          1    0.000003
      Unnamed: 0     word  wordcount  percentage
3517         668  hotdrop          1    0.000003
      Unnamed: 0          word  wordcount  percentage
3520         673  differential          1    0.000003
      Unnamed: 0       word  wordcount  percentage
3522         678  surrounds          1    0.000003
      Unnamed: 0           word  wordcount  percentage
3524         679  blackoxidized          1    0.000003
      Unnamed: 0    word  wordcount  percentage
3525         684  taslan          1    0.000003
      Unnamed: 0       word  wordcount  percentage
3527         688  reflector          1    0.000003
      Unnamed: 0     word  wordcount  percentage
3528         693  watered          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3529         696  asbestos          1    0.000003
      Unnamed: 0 

3695        2603  methyl          1    0.000003
      Unnamed: 0   word  wordcount  percentage
3696        2594  crude          1    0.000003
      Unnamed: 0 word  wordcount  percentage
3697        2597  hex          1    0.000003
      Unnamed: 0       word  wordcount  percentage
3698        2598  separated          1    0.000003
      Unnamed: 0     word  wordcount  percentage
3700        2601  metalic          1    0.000003
      Unnamed: 0       word  wordcount  percentage
3701        2602  notarized          1    0.000003
      Unnamed: 0    word  wordcount  percentage
3702        2604  flawed          1    0.000003
      Unnamed: 0   word  wordcount  percentage
3703        2614  geode          1    0.000003
      Unnamed: 0            word  wordcount  percentage
3704        2605  advertisements          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3707        2611  skeletal          1    0.000003
      Unnamed: 0      word  wordcount  percentage
3709        26

3879        1960  boesch          1    0.000003
      Unnamed: 0                    word  wordcount  percentage
3880        1961  cutandpastedandstapled          1    0.000003
      Unnamed: 0  word  wordcount  percentage
3881        1962  rows          1    0.000003
      Unnamed: 0 word  wordcount  percentage
3882        1967   bc          1    0.000003
      Unnamed: 0          word  wordcount  percentage
3883        1984  andballpoint          1    0.000003
      Unnamed: 0         word  wordcount  percentage
3884        1969  paperrelief          1    0.000003
      Unnamed: 0     word  wordcount  percentage
3889        1979  goauche          1    0.000003
      Unnamed: 0        word  wordcount  percentage
3890        2053  threecolor          1    0.000003
      Unnamed: 0          word  wordcount  percentage
3891        2066  doublecoated          1    0.000003
      Unnamed: 0     word  wordcount  percentage
3892        1952  college          1    0.000003
      Unnamed: 0    

3996        1907  paperspencil          1    0.000003
      Unnamed: 0       word  wordcount  percentage
3997        1908  crayonink          1    0.000003
      Unnamed: 0           word  wordcount  percentage
3998        2152  redevelopment          1    0.000003
      Unnamed: 0       word  wordcount  percentage
3999        2155  bleaching          1    0.000003
      Unnamed: 0       word  wordcount  percentage
4000        2487  intensity          1    0.000003
      Unnamed: 0        word  wordcount  percentage
4004        2401  brownblack          1    0.000003
      Unnamed: 0  word  wordcount  percentage
4006        2405  comp          1    0.000003
      Unnamed: 0       word  wordcount  percentage
4008        2408  exhibiton          1    0.000003
      Unnamed: 0     word  wordcount  percentage
4009        2396  grayish          1    0.000003
      Unnamed: 0       word  wordcount  percentage
4010        2409  brochures          1    0.000003
      Unnamed: 0       word  wor

# Since most artworks however are present in both the first subset as well as the second, we will continue with the comparison  (comparing only those countries which were present in either subset).

In [28]:
output2 = list(df1.wordcount)
output3 = list(df1.percentage)

output4 = list(df2.word)
output5 = list(df2.wordcount)
output6 = list(df2.percentage)

dictionary1 = {'wordcount_onafter' : output2, 'percentage_onafter' : output3}

dictionary2 = {'word' : output4, 'wordcount_before' : output5, 'percentage_before' : output6}

df1 = pd.DataFrame(dictionary1)

df2 = pd.DataFrame(dictionary2)



In [29]:
df1

Unnamed: 0,wordcount_onafter,percentage_onafter
0,7936,0.053569
1,6083,0.041061
2,5159,0.034824
3,4863,0.032826
4,4669,0.031516
...,...,...
1812,1,0.000007
1813,1,0.000007
1814,1,0.000007
1815,1,0.000007


In [30]:
df2

Unnamed: 0,word,wordcount_before,percentage_before
0,print,26521,0.074192
1,silver,23150,0.064762
2,lithograph,19429,0.054352
3,gelatin,17189,0.048086
4,paper,13559,0.037931
...,...,...,...
1812,bristle,1,0.000003
1813,sulphur,1,0.000003
1814,engraving\r\n,1,0.000003
1815,butter,1,0.000003


In [31]:
join_df = df2.join(df1)
join_df

Unnamed: 0,word,wordcount_before,percentage_before,wordcount_onafter,percentage_onafter
0,print,26521,0.074192,7936,0.053569
1,silver,23150,0.064762,6083,0.041061
2,lithograph,19429,0.054352,5159,0.034824
3,gelatin,17189,0.048086,4863,0.032826
4,paper,13559,0.037931,4669,0.031516
...,...,...,...,...,...
1812,bristle,1,0.000003,1,0.000007
1813,sulphur,1,0.000003,1,0.000007
1814,engraving\r\n,1,0.000003,1,0.000007
1815,butter,1,0.000003,1,0.000007


# We also add columns 'wordcount_difference', which calculates the difference in wordcounts from before 1970 to on and after 1970, and 'percentage_difference', which calculates the percentage increase or decrease in wordcounts as a percentage of the total from before 1970 to on and after 1970.

In [32]:
join_df['wordcount_difference'] = (join_df['wordcount_onafter'] - join_df['wordcount_before'])

In [33]:
join_df['percentage_difference'] = (join_df['percentage_onafter'] - join_df['percentage_before']) / join_df['percentage_before'] * 100
join_df

Unnamed: 0,word,wordcount_before,percentage_before,wordcount_onafter,percentage_onafter,wordcount_difference,percentage_difference
0,print,26521,0.074192,7936,0.053569,-18585,-27.796493
1,silver,23150,0.064762,6083,0.041061,-17067,-36.596483
2,lithograph,19429,0.054352,5159,0.034824,-14270,-35.928985
3,gelatin,17189,0.048086,4863,0.032826,-12326,-31.734671
4,paper,13559,0.037931,4669,0.031516,-8890,-16.911151
...,...,...,...,...,...,...,...
1812,bristle,1,0.000003,1,0.000007,0,141.294002
1813,sulphur,1,0.000003,1,0.000007,0,141.294002
1814,engraving\r\n,1,0.000003,1,0.000007,0,141.294002
1815,butter,1,0.000003,1,0.000007,0,141.294002


In [34]:
join_df.to_csv('C:/Users/alexa/OneDrive/Documenten/Collecting Data & Tools and Methods/Subquestion1Comparison.csv')