### Prep survival data for ecosystem model
 -- Purpose: Prep survival data for model
 -- By: G Oldford <br>
 -- Date: 2019-2021 <br>
#### Data in:
   **1) Zimmerman et al 2015 / 2020 survival data**
         - StocksList.csv (extracted from master xlsx; edited to add model functional group codes)
         - Coho_survival.csv (extracted from master xlsx)
   **2) DFO Coho Survival data from CWT (via Josh Korman, Carl Walters)**
         - TBD

Local paths: 
   - C:\Users\Greig\Sync\6. SSMSP Model\Model Greig\Data\1. Salmon\Survival Exploitation Rate\CohoSurvival_Zimmermanetal2015
   - C:\Users\Greig\Sync\6. SSMSP Model\Model Greig\Data\1. Salmon\Survival Exploitation Rate\CohoChin_Survival_CW

In [None]:
# to install r packages
#install.packages("magick", repos='http://cran.us.r-project.org')

In [1]:
library(dplyr)
library(tidyverse)
library(plotly)

"package 'dplyr' was built under R version 3.6.3"
Attaching package: 'dplyr'

The following objects are masked from 'package:stats':

    filter, lag

The following objects are masked from 'package:base':

    intersect, setdiff, setequal, union

"package 'tidyverse' was built under R version 3.6.3"-- [1mAttaching packages[22m --------------------------------------- tidyverse 1.3.0 --
[32mv[39m [34mggplot2[39m 3.2.1     [32mv[39m [34mpurrr  [39m 0.3.4
[32mv[39m [34mtibble [39m 2.1.3     [32mv[39m [34mstringr[39m 1.4.0
[32mv[39m [34mtidyr  [39m 1.1.2     [32mv[39m [34mforcats[39m 0.4.0
[32mv[39m [34mreadr  [39m 1.3.1     
"package 'purrr' was built under R version 3.6.3"-- [1mConflicts[22m ------------------------------------------ tidyverse_conflicts() --
[31mx[39m [34mdplyr[39m::[32mfilter()[39m masks [34mstats[39m::filter()
[31mx[39m [34mdplyr[39m::[32mlag()[39m    masks [34mstats[39m::lag()
"package 'plotly' was built under R version 3

In [17]:
surv <- read.csv("Coho Survival CWT Mar2020 Matrix.csv")
stocks <- read.csv("StocksList.csv")


In [18]:
surv

OEY,X1972,X1973,X1974,X1975,X1976,X1977,X1978,X1979,X1980,...,X2008,X2009,X2010,X2011,X2012,X2013,X2014,X2015,X2016,X2017
<fct>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,...,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<dbl>,<int>
BKH,,,,,,,,,,...,,,,,,,,,,
BKW,,,,,,,,,,...,0.099450178,0.024920014,0.033107035,0.065679043,0.05278991,0.041888008,0.007332251,,,
BBW,,,,,,0.102229673,0.14915825,0.23142298,0.143808256,...,0.083653729,0.0129735,0.046567347,0.061523723,0.067822977,0.057912435,0.03855002,0.06676949,,
BGQ,,0.142739026,0.486798367,0.31305546,0.209482612,0.163858018,0.24854052,0.25983277,0.146477695,...,0.006920807,0.008523185,0.012243356,0.017390361,0.009439469,0.00301125,0.001991544,0.00584055,0.003493696,
BCW,,,,,,,,,,...,0.082709768,0.060738295,0.050350164,0.041013327,0.019271758,0.060781412,0.014146971,0.028355459,,
BLW,,,,,,,0.19037926,0.19903702,,...,0.027742061,0.015257842,0.013703382,,,,,,,
CHH,,,,,,,,,,...,,,,,,,,,,
COH,,,,,,,,,,...,,0.006083097,0.005375466,,,,,,,
DEW,,,,,,0.063513744,,0.16710451,0.174809025,...,0.104549725,,,0.018233978,,,0.001934704,,,
DUH,0.02704194,,0.042897398,,,0.044983543,0.07754426,0.08483098,0.102370541,...,0.021320584,0.002207388,0.018553063,,,,,,,


In [19]:
stocks

ï..Stock,StockKey,Location,OUTGROUP,lat,old_long,lon,ORIGIN,WILD
<fct>,<fct>,<fct>,<int>,<dbl>,<dbl>,<dbl>,<fct>,<int>
Baker River (Skagit),BKW,PS,0,48.5394,121.7435,-121.7435,W,1
Baker River (Skagit),BKH,PS,0,48.5394,121.7435,-121.7435,H,0
Bernie Gobin Hatchery (Snohomish),,PS,0,48.093,122.2838,-122.2838,H,0
Big Beef Cr (Hood Canal),BBW,PS,0,47.6518,122.7834,-122.7834,W,1
Big Qualicum,BGQ,SOG,0,49.38195,124.6439,-124.6439,H,0
Bingham Cr (EF Satsop),BCW,CR,1,47.1538,123.4035,-123.4035,W,1
Bingham Fall (EF Satsop),SAH,CR,1,47.1462,123.4004,-123.4004,H,0
Bingham Late Fall (EF Satsop),,CR,1,47.1462,123.4004,-123.4004,H,0
Black,BLW,SOG,0,49.852,125.1,-125.1,W,1
Carnation,,WCVI,1,48.908,125.0,-125.0,W,1


In [20]:
stocks <- stocks %>% rename(StockName = "ï..Stock") 
t <- surv %>% as_tibble(surv)

In [25]:

t2 <- t %>% pivot_longer(cols=starts_with("X"), names_to = "year", values_to = "survival") %>% 
#t2 <- t %>% pivot_longer(cols=-starts_with("OEY"), names_to = "year", values_to = "survival") %>% 
rename(Stock = "OEY") %>%
left_join(stocks, by = c("Stock" = "StockKey")) %>%
mutate(year = substring(year, 2, 5)) %>%
mutate(year = as.numeric(year))

"Column `Stock`/`StockKey` joining factors with different levels, coercing to character vector"

In [26]:
t2

Stock,year,survival,StockName,Location,OUTGROUP,lat,old_long,lon,ORIGIN,WILD
<chr>,<dbl>,<dbl>,<fct>,<fct>,<int>,<dbl>,<dbl>,<dbl>,<fct>,<int>
BKH,1972,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0
BKH,1973,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0
BKH,1974,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0
BKH,1975,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0
BKH,1976,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0
BKH,1977,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0
BKH,1978,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0
BKH,1979,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0
BKH,1980,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0
BKH,1981,,Baker River (Skagit),PS,0,48.5394,121.7435,-121.7435,H,0


In [27]:
 write.csv(t2,'survival_joined_stocks.csv')