In [1]:
import pandas as pd
from qiime2 import Artifact

In [2]:
# Study 1 -- 'Sci_Rep_2017b' (V4 region):
#   "The salivary microbiome as an indicator of carcinogenesis in patients
#   with oropharyngeal squamous cell carcinoma: A pilot study"
# Load its feature table and its sequences artifact.
table_1, seqs_1 = (
    Artifact.load(qza_path)
    for qza_path in ('Sci_Rep_2017b_table.qza', 'Sci_Rep_2017b_sequences.qza')
)

# Study 2 -- 'PLOS_ONE_2014' (V4 region):
#   "Bacterial alteration in salivary microbiota and their association in
#   oral cancer"
# Load its feature table and its sequences artifact.
table_2, seqs_2 = (
    Artifact.load(qza_path)
    for qza_path in ('PLOS_ONE_2014_table.qza', 'PLOS_ONE_2014_sequences.qza')
)

In [3]:
# View each QIIME 2 artifact as a pandas object:
# the tables become DataFrames, the sequence artifacts become Series.
df_table_1, df_table_2 = (
    table.view(pd.DataFrame) for table in (table_1, table_2)
)
ser_seqs_1, ser_seqs_2 = (
    seqs.view(pd.Series) for seqs in (seqs_1, seqs_2)
)

In [4]:
# Show the feature IDs of table 1, i.e. the column labels of df_table_1.
# Leaving the bare expression as the cell's last line makes the notebook
# render the resulting Index.
df_table_1.columns

Index(['50b0b4cd015999c8222bb021637c8873', '959aeca1a65ce24599aaed29828c33f0',
       '8b84a4ddaedff09de10789670dd8d7ec', '4ac711b46d68011221bfd3afb538a3dc',
       '9f185911874fb5d5b2623b647359f33b', '1ec321d2e2cf3e3a7046ff8def9fdd13',
       '124930655bc445fb3e9523ddaccaf346', 'e8f3058091170164f253d1d57c5f8912',
       '94adac1e5690b5aef26d6014e471f458', 'e4abc7e798dc0de4035299647bedcf1d',
       ...
       '9fa6c62fdf049b5bd9ef0260ed901853', '0e41240b413688989228c6c422ce24e4',
       '795c703d4c16ffeb7508632702c7e01d', '367f90c7332d353f11390a6631091bf7',
       '015e719f3186bfa6b0f44ba0b4cb6209', '564811ed6ce9e86b1a85f41ae6722ce6',
       'b20bb3d72317e7eb86d2286e63e32ba7', 'aa953b4619982e0cc3896ee2146a4cf6',
       'df043a5969cb17682b13a01ee607a5d3', '4707acb19acbcf34a2abdf084bf6d7c4'],
      dtype='object', length=1083)

In [5]:
# Show the feature IDs of table 2, i.e. the column labels of df_table_2.
# Leaving the bare expression as the cell's last line makes the notebook
# render the resulting Index.
df_table_2.columns

Index(['394eda29c886632f514dd94b58381186', '06f825b512d903b9230e1a55d87359ee',
       '32f8fd11d2bee278d609a1d4ab767554', '85c44c83eddc5d3028261a1000b7d0e1',
       '4f5efd25dacb5d639316e7291ff6ff8b', '7d135dfbf857c62673695ef24332b100',
       'ca9c66d47347c03d0343d6fe03ed8636', '923f521b9cf313f1f95c9367e09bbc1c',
       '59f7d8a7f37d6eeec95eb556f33da267', '8674dcf0cfe35939037fa9a5b986866f',
       ...
       '524383798a3b0e7df712be516de32f97', 'd1d4d4a6df36955e6e67d7b32e2fdafe',
       '2804f1abbdde069f3cb78e4669755acc', 'ffde5da5465f6689030a7121d9a38365',
       'b70b98d40ffee4e2b96679f4b8274733', '633e0e06711db8a3ca4bc947e754996c',
       '7440de30b2068eeeb916d98e1e2cde72', '5534a6ae0c0a17d72c63fbfa2ddda79b',
       '898517cda47bf7626cad8ce37fc85d08', '1dca104d96e09a385302f0e0ec8b8553'],
      dtype='object', length=1706)

In [6]:
# Feature IDs that occur in both tables; an empty set means the two
# studies share no feature ID.
set(df_table_1.columns).intersection(df_table_2.columns)

set()

In [7]:
# The elements of ser_seqs_* are skbio.DNA objects, which (per the original
# author's note) are unhashable and so cannot be put into a set directly;
# convert each one to a plain string first.
#
# Iterate over the Series values directly instead of looking each one up
# with an integer key: `series[int]` on a Series whose index is not
# integer-based relies on pandas' deprecated positional fallback (it emits a
# FutureWarning on recent pandas and is scheduled for removal), and would
# silently become a label lookup if the index were integer-valued.
ls_seqs_1 = [str(seq) for seq in ser_seqs_1]
ls_seqs_2 = [str(seq) for seq in ser_seqs_2]

In [8]:
# Sequences (as exact strings) that occur in both studies; an empty set
# means no sequence is shared verbatim.
set(ls_seqs_1).intersection(ls_seqs_2)

set()