# Compare Taxa list with Ecological Categories

In [1]:
import pandas as pd
import numpy as np
import datetime
import matplotlib.pyplot as plt
import glob

# Embed fonts as TrueType (Type 42) in PDF/PS exports so that text stays
# editable when the figures are opened in Adobe Illustrator.
plt.rcParams.update({'pdf.fonttype': 42, 'ps.fonttype': 42})

### Import Taxa list

In [2]:
# Read the deduplicated taxa table and key every row by its full
# seven-rank lineage (Kingdom -> Species).
df = pd.read_csv('../data/Deduplicated_Taxa_list.csv').set_index(
    ['Kingdom', 'Phylum', 'Class', 'Order', 'Family', 'Genus', 'Species']
)
# Keep an independent copy, because `df` is reused as scratch space by later cells.
taxa_list = df.copy()
taxa_list

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,Unnamed: 6_level_0,Total_reads,Total_samples
Kingdom,Phylum,Class,Order,Family,Genus,Species,Unnamed: 7_level_1,Unnamed: 8_level_1
Eukaryota,Chordata,Actinopteri,Alepocephaliformes,Platytroctidae,Holtbyrnia,s_,7361,9
Eukaryota,Chordata,Actinopteri,Alepocephaliformes,Platytroctidae,Sagamichthys,Sagamichthys abei,15304,11
Eukaryota,Chordata,Actinopteri,Anabantiformes,Channidae,g_,s_,72,1
Eukaryota,Chordata,Actinopteri,Argentiniformes,Argentinidae,g_,s_,26340,21
Eukaryota,Chordata,Actinopteri,Argentiniformes,Bathylagidae,Bathylagus,Bathylagus pacificus,170,10
Eukaryota,Chordata,...,...,...,...,...,...,...
Eukaryota,Chordata,Mammalia,Cetacea,Ziphiidae,Ziphius,Ziphius cavirostris,25621,14
Eukaryota,Chordata,Mammalia,Cetacea,Ziphiidae,g_,s_,88,3
Eukaryota,Chordata,Mammalia,Cetacea,unassigned,g_,s_,71,4
Eukaryota,Chordata,Mammalia,unassigned,unassigned,g_,s_,6,1


### Import taxa categories

In [3]:
# Load the manually curated ecological category assigned to each taxon.

file = "../data/metadata/CN19S_Taxa_Categories.csv"
# Species-designation table, indexed by the full seven-rank lineage
# (Kingdom -> Species).
df = pd.read_csv(file).set_index(
    ['Kingdom', 'Phylum', 'Class', 'Order', 'Family', 'Genus', 'Species']
)
# Independent copy, so that reusing `df` later cannot alter the designations.
sp_desig = df.copy()
sp_desig

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,Unnamed: 6_level_0,Common_name,Ecological_Category
Kingdom,Phylum,Class,Order,Family,Genus,Species,Unnamed: 7_level_1,Unnamed: 8_level_1
Eukaryota,Chordata,Actinopteri,Perciformes,Zoarcidae,Melanostigma,Melanostigma atlanticum,Atlantic soft pout,Atlantic species
Eukaryota,Chordata,Actinopteri,unknown,Moronidae,Morone,Morone saxatilis,Striped bass,Atlantic species
Eukaryota,Chordata,Actinopteri,Beryciformes,Melamphaidae,Scopelogadus,s_,ridgeheads,bathypelagic
Eukaryota,Chordata,Actinopteri,Gadiformes,Macrouridae,Coryphaenoides,unassigned,rattails,bathypelagic
Eukaryota,Chordata,Actinopteri,Gadiformes,Macrouridae,Malacocephalus,unassigned,rattails,bathypelagic
Eukaryota,Chordata,Actinopteri,...,...,...,...,...,...
Eukaryota,Chordata,Actinopteri,Pleuronectiformes,Paralichthyidae,Citharichthys,Citharichthys sordidus,Pacific sanddab,nearshore bottom
Eukaryota,Chordata,Actinopteri,Pleuronectiformes,Paralichthyidae,Citharichthys,Citharichthys stigmaeus,Speckeled sanddab,nearshore bottom
Eukaryota,Chordata,Actinopteri,Pleuronectiformes,Paralichthyidae,Paralichthys,s_,large-tooth flounders,nearshore bottom
Eukaryota,Chordata,Actinopteri,unknown,Sciaenidae,Genyonemus,Genyonemus lineatus,White croaker,nearshore bottom


### Merge

In [4]:
# Align the curated categories with the observed taxa on their shared
# seven-rank lineage index. `pd.concat(..., axis=1)` performs an outer join, so:
#   * a lineage present only in `sp_desig` gets NaN in Total_reads/Total_samples
#     (a category was assigned to a taxon that is not in the taxa list);
#   * a lineage present only in `taxa_list` gets NaN in
#     Common_name/Ecological_Category (taxon still needs a category).
# Those NaNs are the mismatches this notebook is meant to surface; they also
# force the integer count columns to float.
df = pd.concat([sp_desig, taxa_list], axis=1)

# Write next to the project's other data files, using a relative path, so the
# notebook runs on any checkout. The original wrote to a user-specific
# absolute path under /Users/..., which fails on every other machine.
df.to_csv('../data/Taxa_list_with_categories.csv')
df

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Unnamed: 5_level_0,Unnamed: 6_level_0,Common_name,Ecological_Category,Total_reads,Total_samples
Kingdom,Phylum,Class,Order,Family,Genus,Species,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1
Eukaryota,Chordata,Actinopteri,Perciformes,Zoarcidae,Melanostigma,Melanostigma atlanticum,Atlantic soft pout,Atlantic species,57.0,4.0
Eukaryota,Chordata,Actinopteri,unknown,Moronidae,Morone,Morone saxatilis,Striped bass,Atlantic species,946.0,4.0
Eukaryota,Chordata,Actinopteri,Beryciformes,Melamphaidae,Scopelogadus,s_,ridgeheads,bathypelagic,14903.0,24.0
Eukaryota,Chordata,Actinopteri,Gadiformes,Macrouridae,Coryphaenoides,unassigned,rattails,bathypelagic,,
Eukaryota,Chordata,Actinopteri,Gadiformes,Macrouridae,Malacocephalus,unassigned,rattails,bathypelagic,89.0,4.0
Eukaryota,Chordata,Actinopteri,...,...,...,...,...,...,...,...
Eukaryota,Chordata,Actinopteri,Pleuronectiformes,Paralichthyidae,Citharichthys,Citharichthys sordidus,Pacific sanddab,nearshore bottom,43499.0,78.0
Eukaryota,Chordata,Actinopteri,Pleuronectiformes,Paralichthyidae,Citharichthys,Citharichthys stigmaeus,Speckeled sanddab,nearshore bottom,2706.0,19.0
Eukaryota,Chordata,Actinopteri,Pleuronectiformes,Paralichthyidae,Paralichthys,s_,large-tooth flounders,nearshore bottom,1.0,1.0
Eukaryota,Chordata,Actinopteri,unknown,Sciaenidae,Genyonemus,Genyonemus lineatus,White croaker,nearshore bottom,12257.0,23.0
