From b40b086af4b6049aa0302925c1241e56235bf147 Mon Sep 17 00:00:00 2001 From: Sarah Gaichas Date: Wed, 29 May 2024 10:46:59 -0400 Subject: [PATCH] update scripts for bias corrected full covariate run --- ..._allsurvsANNUAL_lencovSST_ALLinoffsplits.R | 271 --------------- ...te_bfp_allsurvs_lencovSST_ALLinoffsplits.R | 328 ------------------ .../VASTunivariate_macrobenthos_allsurvs.R | 127 ++++--- .../VASTunivariate_megabenthos_allsurvs.R | 130 ++++--- 4 files changed, 125 insertions(+), 731 deletions(-) delete mode 100644 VASTscripts/VASTunivariate_bfp_allsurvsANNUAL_lencovSST_ALLinoffsplits.R delete mode 100644 VASTscripts/VASTunivariate_bfp_allsurvs_lencovSST_ALLinoffsplits.R diff --git a/VASTscripts/VASTunivariate_bfp_allsurvsANNUAL_lencovSST_ALLinoffsplits.R b/VASTscripts/VASTunivariate_bfp_allsurvsANNUAL_lencovSST_ALLinoffsplits.R deleted file mode 100644 index e226133..0000000 --- a/VASTscripts/VASTunivariate_bfp_allsurvsANNUAL_lencovSST_ALLinoffsplits.R +++ /dev/null @@ -1,271 +0,0 @@ -# VAST attempt 2 univariate model as a script -# modified from https://github.com/James-Thorson-NOAA/VAST/wiki/Index-standardization - -# Load packages -library(here) -library(dplyr) -library(VAST) - -#Read in data, separate spring and fall, and rename columns for VAST: - -# this dataset created in SSTmethods.Rmd - -bluepyagg_stn <- readRDS(here::here("fhdat/bluepyagg_stn_all_OISST.rds")) - -# make SST column that uses surftemp unless missing or 0 -# there are 3 surftemp 0 values in the dataset, all with oisst > 15 -bluepyagg_stn <- bluepyagg_stn %>% - dplyr::mutate(sstfill = ifelse((is.na(surftemp)|surftemp==0), oisst, surftemp)) - -#bluepyagg_stn <- bluepyagg_pred_stn - -# filter to assessment years at Tony's suggestion - -# code Vessel as AL=0, HB=1, NEAMAP=2 - -bluepyagg_stn_all <- bluepyagg_stn %>% - #ungroup() %>% - filter(#season_ng == "FALL", # Annual model for MRIP index - year > 1984) %>% - mutate(AreaSwept_km2 = 1, #Elizabeth's code - #declon = -declon already done before neamap merge - Vessel = as.numeric(as.factor(vessel))-1 - ) %>% - dplyr::select(Catch_g = meanbluepywt, #use bluepywt for individuals input in example - Year = year, - Vessel, - AreaSwept_km2, - Lat = declat, - Lon = declon, - meanpisclen, - npiscsp, - #bottemp, #this leaves out many stations for NEFSC - #surftemp, #this leaves out many stations for NEFSC - oisst, - sstfill - ) %>% - na.omit() %>% - as.data.frame() - - -# Make settings (turning off bias.correct to save time for example) -# NEFSC strata limits https://github.com/James-Thorson-NOAA/VAST/issues/302 - -# use only MAB, GB, GOM, SS EPUs -# leave out south of Cape Hatteras at Elizabeth's suggestion -# could also leave out SS? -# CHECK if these EPUs match what we use in SOE - -bfinshore <- c(3020, 3050, 3080, 3110, 3140, 3170, 3200, 3230, - 3260, 3290, 3320, 3350, 3380, 3410, 3440, 3450, 3460) - -bfoffshore <- c(1010, 1730, 1690, 1650, 1050, 1060, 1090, 1100, 1250, 1200, 1190, 1610) - -MAB <- c(1010:1080, 1100:1120, 1600:1750, 3010:3450, 3470, 3500, 3510) -GB <- c(1090, 1130:1210, 1230, 1250, 3460, 3480, 3490, 3520:3550) -GOM <- c(1220, 1240, 1260:1290, 1360:1400, 3560:3830) -SS <- c(1300:1352, 3840:3990) - -MABGBinshore <- c(3010:3450, 3460, 3470, 3480, 3490, 3500, 3510, 3520:3550) - -MABGBoffshore <- c(1010:1080, 1090, 1100:1120,1130:1210, 1230, 1250, 1600:1750) - -coast3nmbuffst <- readRDS(here::here("spatialdat/coast3nmbuffst.rds")) - -MAB2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% MAB) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# MAB state waters -MAB2state <- MAB2 %>% - dplyr::filter(stratum_number2 %% 10 == 1) - -# MAB federal waters -MAB2fed <- MAB2 %>% - dplyr::filter(stratum_number2 %% 10 == 2) - -# Georges Bank EPU -GB2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% GB) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# GB state waters -GB2state <- GB2 %>% - dplyr::filter(stratum_number2 %% 10 == 1) - -#GB federal waters -GB2fed <- GB2 %>% - dplyr::filter(stratum_number2 %% 10 == 2) - -# whole bluefish domain MABG -MABGB2 <- dplyr::bind_rows(MAB2, GB2) - -# MABGB state waters -MABGBstate <- dplyr::bind_rows(MAB2state, GB2state) - -# MABGB federal waters -MABGBfed <- dplyr::bind_rows(MAB2fed, GB2fed) - -# gulf of maine EPU (for SOE) -GOM2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% GOM) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# scotian shelf EPU (for SOE) -SS2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% SS) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# previous bluefish strata -bfinshore2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% bfinshore) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# additional new bluefish strata 2022 -bfoffshore2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% bfoffshore) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# all bluefish strata -bfall2 <- dplyr::bind_rows(bfinshore2, bfoffshore2) - -# albatross inshore strata -albinshore2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% setdiff(MABGBinshore, bfinshore)) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# Albold for WHAM input -albbfinshore <- dplyr::bind_rows(albinshore2, bfinshore2) - -# Albnew for WHAM input -albbfall <- dplyr::bind_rows(albinshore2, bfall2) - -# offshore of all bluefish survey strata -MABGBothoffshore2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% setdiff(MABGBoffshore, bfoffshore)) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# needed to cover the whole northwest atlantic grid -allother2 <- coast3nmbuffst %>% - dplyr::filter(!stratum_number %in% c(MAB, GB, GOM, SS)) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# all epus -allEPU2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% c(MAB, GB, GOM, SS)) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# configs -FieldConfig <- c( - "Omega1" = 0, # number of spatial variation factors (0, 1, AR1) - "Epsilon1" = 0, # number of spatio-temporal factors - "Omega2" = 0, - "Epsilon2" = 0 -) - -# Model selection options, FieldConfig default (all IID) -# Season_knots + suffix below -# _base No vessel overdispersion or length/number covariates (ensure same dataset) -# _len Predator mean length covariate -# _no Number of predator species covariate -# _lenno Predator mean length and number of predator species covariates -# _eta10 Overdispersion (vessel effect) in first linear predictor (prey encounter) -# _eta11 Overdispersion (vessel effect) in both linear predictors (prey wt) - -RhoConfig <- c( - "Beta1" = 0, # temporal structure on years (intercepts) - "Beta2" = 0, - "Epsilon1" = 0, # temporal structure on spatio-temporal variation - "Epsilon2" = 0 -) -# 0 off (fixed effects) -# 1 independent -# 2 random walk -# 3 constant among years (fixed effect) -# 4 AR1 - -OverdispersionConfig <- c("eta1"=0, "eta2"=0) -# eta1 = vessel effects on prey encounter rate -# eta2 = vessel effects on prey weight - -strata.limits <- as.list(c("AllEPU" = allEPU2, - "MABGB" = MABGB2, - "MABGBstate" = MABGBstate, - "MABGBfed" = MABGBfed, - "MAB" = MAB2, - "GB" = GB2, - "GOM" = GOM2, - "bfall" = bfall2, - "bfin" = bfinshore2, - "bfoff" = bfoffshore2, - "MABGBalbinshore" = albinshore2, - "MABGBothoffshore" = MABGBothoffshore2, - "albbfin" = albbfinshore, - "albbfall" = albbfall, - "allother" = allother2)) - -settings = make_settings( n_x = 500, - Region = "northwest_atlantic", - Version = "VAST_v14_0_1", #needed to prevent error from newer dev version number - #strata.limits = list('All_areas' = 1:1e5), full area - strata.limits = strata.limits, - purpose = "index2", - bias.correct = TRUE, - #use_anisotropy = FALSE, - #fine_scale = FALSE, - #FieldConfig = FieldConfig, - #RhoConfig = RhoConfig, - OverdispersionConfig = OverdispersionConfig - ) - - -New_Extrapolation_List <- readRDS(here::here("spatialdat/CustomExtrapolationList.rds")) - -# select dataset and set directory for output - -######################################################### -# Run model annual - -season <- c("annual_500_lennosst_ALLsplit_biascorrect") - -working_dir <- here::here(sprintf("pyindex/allagg_%s/", season)) - -if(!dir.exists(working_dir)) { - dir.create(working_dir) -} - -# subset for faster testing -#bluepyagg_stn_all <- bluepyagg_stn_all %>% filter(Year<1990) - -fit <- fit_model( - settings = settings, - extrapolation_list = New_Extrapolation_List, - Lat_i = bluepyagg_stn_all$Lat, - Lon_i = bluepyagg_stn_all$Lon, - t_i = bluepyagg_stn_all$Year, - b_i = as_units(bluepyagg_stn_all[,'Catch_g'], 'g'), - a_i = rep(1, nrow(bluepyagg_stn_all)), - v_i = bluepyagg_stn_all$Vessel, - Q_ik = as.matrix(bluepyagg_stn_all[,c("npiscsp", - "meanpisclen", - "sstfill" - )]), - #Use_REML = TRUE, - working_dir = paste0(working_dir, "/")) - -saveRDS(fit, file = paste0(working_dir, "/fit.rds")) - -# Plot results -plot( fit, - working_dir = paste0(working_dir, "/")) - diff --git a/VASTscripts/VASTunivariate_bfp_allsurvs_lencovSST_ALLinoffsplits.R b/VASTscripts/VASTunivariate_bfp_allsurvs_lencovSST_ALLinoffsplits.R deleted file mode 100644 index 291341a..0000000 --- a/VASTscripts/VASTunivariate_bfp_allsurvs_lencovSST_ALLinoffsplits.R +++ /dev/null @@ -1,328 +0,0 @@ -# VAST attempt 2 univariate model as a script -# modified from https://github.com/James-Thorson-NOAA/VAST/wiki/Index-standardization - -# Load packages -library(here) -library(dplyr) -library(VAST) - -#Read in data, separate spring and fall, and rename columns for VAST: - -# this dataset created in SSTmethods.Rmd - -bluepyagg_stn <- readRDS(here::here("fhdat/bluepyagg_stn_all_OISST.rds")) - -# make SST column that uses surftemp unless missing or 0 -# there are 3 surftemp 0 values in the dataset, all with oisst > 15 -bluepyagg_stn <- bluepyagg_stn %>% - dplyr::mutate(sstfill = ifelse((is.na(surftemp)|surftemp==0), oisst, surftemp)) - -#bluepyagg_stn <- bluepyagg_pred_stn - -# filter to assessment years at Tony's suggestion - -# code Vessel as AL=0, HB=1, NEAMAP=2 - -bluepyagg_stn_fall <- bluepyagg_stn %>% - #ungroup() %>% - filter(season_ng == "FALL", - year > 1984) %>% - mutate(AreaSwept_km2 = 1, #Elizabeth's code - #declon = -declon already done before neamap merge - Vessel = as.numeric(as.factor(vessel))-1 - ) %>% - dplyr::select(Catch_g = meanbluepywt, #use bluepywt for individuals input in example - Year = year, - Vessel, - AreaSwept_km2, - Lat = declat, - Lon = declon, - meanpisclen, - npiscsp, - #bottemp, #this leaves out many stations for NEFSC - #surftemp, #this leaves out many stations for NEFSC - oisst, - sstfill - ) %>% - na.omit() %>% - as.data.frame() - -bluepyagg_stn_spring <- bluepyagg_stn %>% - filter(season_ng == "SPRING", - year > 1984) %>% - mutate(AreaSwept_km2 =1, #Elizabeth's code - #declon = -declon already done before neamap merge - Vessel = as.numeric(as.factor(vessel))-1 - ) %>% - dplyr::select(Catch_g = meanbluepywt, - Year = year, - Vessel, - AreaSwept_km2, - Lat = declat, - Lon = declon, - meanpisclen, - npiscsp, - #bottemp, #this leaves out many stations for NEFSC - #surftemp, #this leaves out many stations for NEFSC - oisst, - sstfill - ) %>% - na.omit() %>% - as.data.frame() - - -# Make settings (turning off bias.correct to save time for example) -# NEFSC strata limits https://github.com/James-Thorson-NOAA/VAST/issues/302 - -# use only MAB, GB, GOM, SS EPUs -# leave out south of Cape Hatteras at Elizabeth's suggestion -# could also leave out SS? -# CHECK if these EPUs match what we use in SOE - -bfinshore <- c(3020, 3050, 3080, 3110, 3140, 3170, 3200, 3230, - 3260, 3290, 3320, 3350, 3380, 3410, 3440, 3450, 3460) - -bfoffshore <- c(1010, 1730, 1690, 1650, 1050, 1060, 1090, 1100, 1250, 1200, 1190, 1610) - -MAB <- c(1010:1080, 1100:1120, 1600:1750, 3010:3450, 3470, 3500, 3510) -GB <- c(1090, 1130:1210, 1230, 1250, 3460, 3480, 3490, 3520:3550) -GOM <- c(1220, 1240, 1260:1290, 1360:1400, 3560:3830) -SS <- c(1300:1352, 3840:3990) - -MABGBinshore <- c(3010:3450, 3460, 3470, 3480, 3490, 3500, 3510, 3520:3550) - -MABGBoffshore <- c(1010:1080, 1090, 1100:1120,1130:1210, 1230, 1250, 1600:1750) - -coast3nmbuffst <- readRDS(here::here("spatialdat/coast3nmbuffst.rds")) - -MAB2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% MAB) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# MAB state waters -MAB2state <- MAB2 %>% - dplyr::filter(stratum_number2 %% 10 == 1) - -# MAB federal waters -MAB2fed <- MAB2 %>% - dplyr::filter(stratum_number2 %% 10 == 2) - -# Georges Bank EPU -GB2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% GB) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# GB state waters -GB2state <- GB2 %>% - dplyr::filter(stratum_number2 %% 10 == 1) - -#GB federal waters -GB2fed <- GB2 %>% - dplyr::filter(stratum_number2 %% 10 == 2) - -# whole bluefish domain MABG -MABGB2 <- dplyr::bind_rows(MAB2, GB2) - -# MABGB state waters -MABGBstate <- dplyr::bind_rows(MAB2state, GB2state) - -# MABGB federal waters -MABGBfed <- dplyr::bind_rows(MAB2fed, GB2fed) - -# gulf of maine EPU (for SOE) -GOM2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% GOM) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# scotian shelf EPU (for SOE) -SS2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% SS) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# previous bluefish strata -bfinshore2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% bfinshore) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# additional new bluefish strata 2022 -bfoffshore2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% bfoffshore) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# all bluefish strata -bfall2 <- dplyr::bind_rows(bfinshore2, bfoffshore2) - -# albatross inshore strata -albinshore2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% setdiff(MABGBinshore, bfinshore)) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# Albold for WHAM input -albbfinshore <- dplyr::bind_rows(albinshore2, bfinshore2) - -# Albnew for WHAM input -albbfall <- dplyr::bind_rows(albinshore2, bfall2) - -# offshore of all bluefish survey strata -MABGBothoffshore2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% setdiff(MABGBoffshore, bfoffshore)) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# needed to cover the whole northwest atlantic grid -allother2 <- coast3nmbuffst %>% - dplyr::filter(!stratum_number %in% c(MAB, GB, GOM, SS)) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# all epus -allEPU2 <- coast3nmbuffst %>% - dplyr::filter(stratum_number %in% c(MAB, GB, GOM, SS)) %>% - dplyr::select(stratum_number2) %>% - dplyr::distinct() - -# configs -FieldConfig <- c( - "Omega1" = 0, # number of spatial variation factors (0, 1, AR1) - "Epsilon1" = 0, # number of spatio-temporal factors - "Omega2" = 0, - "Epsilon2" = 0 -) - -# Model selection options, FieldConfig default (all IID) -# Season_knots + suffix below -# _base No vessel overdispersion or length/number covariates (ensure same dataset) -# _len Predator mean length covariate -# _no Number of predator species covariate -# _lenno Predator mean length and number of predator species covariates -# _eta10 Overdispersion (vessel effect) in first linear predictor (prey encounter) -# _eta11 Overdispersion (vessel effect) in both linear predictors (prey wt) - -RhoConfig <- c( - "Beta1" = 0, # temporal structure on years (intercepts) - "Beta2" = 0, - "Epsilon1" = 0, # temporal structure on spatio-temporal variation - "Epsilon2" = 0 -) -# 0 off (fixed effects) -# 1 independent -# 2 random walk -# 3 constant among years (fixed effect) -# 4 AR1 - -OverdispersionConfig <- c("eta1"=0, "eta2"=0) -# eta1 = vessel effects on prey encounter rate -# eta2 = vessel effects on prey weight - -strata.limits <- as.list(c("AllEPU" = allEPU2, - "MABGB" = MABGB2, - "MABGBstate" = MABGBstate, - "MABGBfed" = MABGBfed, - "MAB" = MAB2, - "GB" = GB2, - "GOM" = GOM2, - "bfall" = bfall2, - "bfin" = bfinshore2, - "bfoff" = bfoffshore2, - "MABGBalbinshore" = albinshore2, - "MABGBothoffshore" = MABGBothoffshore2, - "albbfin" = albbfinshore, - "albbfall" = albbfall, - "allother" = allother2)) - -settings = make_settings( n_x = 500, - Region = "northwest_atlantic", - Version = "VAST_v14_0_1", #needed to prevent error from newer dev version number - #strata.limits = list('All_areas' = 1:1e5), full area - strata.limits = strata.limits, - purpose = "index2", - bias.correct = TRUE, - #use_anisotropy = FALSE, - #fine_scale = FALSE, - #FieldConfig = FieldConfig, - #RhoConfig = RhoConfig, - OverdispersionConfig = OverdispersionConfig - ) - - -New_Extrapolation_List <- readRDS(here::here("spatialdat/CustomExtrapolationList.rds")) - -# select dataset and set directory for output - -######################################################### -# Run model fall - -season <- c("fall_500_lennosst_ALLsplit_biascorrect") - -working_dir <- here::here(sprintf("pyindex/allagg_%s/", season)) - -if(!dir.exists(working_dir)) { - dir.create(working_dir) -} - -# subset for faster testing -#bluepyagg_stn_fall <- bluepyagg_stn_fall %>% filter(Year<1990) - -fit <- fit_model( - settings = settings, - extrapolation_list = New_Extrapolation_List, - Lat_i = bluepyagg_stn_fall$Lat, - Lon_i = bluepyagg_stn_fall$Lon, - t_i = bluepyagg_stn_fall$Year, - b_i = as_units(bluepyagg_stn_fall[,'Catch_g'], 'g'), - a_i = rep(1, nrow(bluepyagg_stn_fall)), - v_i = bluepyagg_stn_fall$Vessel, - Q_ik = as.matrix(bluepyagg_stn_fall[,c("npiscsp", - "meanpisclen", - "sstfill" - )]), - #Use_REML = TRUE, - working_dir = paste0(working_dir, "/")) - -saveRDS(fit, file = paste0(working_dir, "/fit.rds")) - -# Plot results -plot( fit, - working_dir = paste0(working_dir, "/")) - -###################################################### -# Run model spring - -season <- c("spring_500_lennosst_ALLsplit_biascorrect") - -working_dir <- here::here(sprintf("pyindex/allagg_%s/", season)) - -if(!dir.exists(working_dir)) { - dir.create(working_dir) -} - -# subset for faster testing -#bluepyagg_stn_spring <- bluepyagg_stn_spring %>% filter(Year<1990) - -fit <- fit_model( settings = settings, - extrapolation_list = New_Extrapolation_List, - Lat_i = bluepyagg_stn_spring[,'Lat'], - Lon_i = bluepyagg_stn_spring[,'Lon'], - t_i = bluepyagg_stn_spring[,'Year'], - b_i = as_units(bluepyagg_stn_spring[,'Catch_g'], 'g'), - a_i = rep(1, nrow(bluepyagg_stn_spring)), - v_i = bluepyagg_stn_spring$Vessel, - Q_ik = as.matrix(bluepyagg_stn_spring[,c("npiscsp", - "meanpisclen", - "sstfill" - )]), - # Use_REML = TRUE, - working_dir = paste0(working_dir, "/")) - -saveRDS(fit, file = paste0(working_dir, "/fit.rds")) - -# Plot results -plot( fit, - working_dir = paste0(working_dir, "/")) diff --git a/VASTscripts/VASTunivariate_macrobenthos_allsurvs.R b/VASTscripts/VASTunivariate_macrobenthos_allsurvs.R index 396095e..21824f6 100644 --- a/VASTscripts/VASTunivariate_macrobenthos_allsurvs.R +++ b/VASTscripts/VASTunivariate_macrobenthos_allsurvs.R @@ -8,61 +8,63 @@ library(VAST) #Read in data, separate spring and fall, and rename columns for VAST: -# this dataset created in fhdata/VASTbenthos_ProcessInputDat.R +# this dataset created in SSTmethods.Rmd -macrobenagg_stn <- readRDS(here::here("fhdata/macrobenagg_stn_all.rds")) +macrobenagg_stn <- readRDS(here::here("fhdata/macrobenagg_stn_all_modBT.rds")) # make SST column that uses surftemp unless missing or 0 # there are 3 surftemp 0 values in the dataset, all with oisst > 15 -#macrobenagg_stn <- macrobenagg_stn %>% -# dplyr::mutate(sstfill = ifelse((is.na(surftemp)|surftemp==0), oisst, surftemp)) + +macrobenagg_stn <- macrobenagg_stn %>% + dplyr::mutate(btfill = ifelse((is.na(bottemp)|bottemp==0), mod_bt, bottemp)) # code Vessel as AL=0, HB=1, NEAMAP=2 macrobenagg_stn_fall <- macrobenagg_stn %>% #ungroup() %>% - filter(season_ng == "FALL", + filter(season_ng == "FALL", # Annual model for MRIP index year > 1979) %>% mutate(AreaSwept_km2 = 1, #Elizabeth's code #declon = -declon already done before neamap merge Vessel = as.numeric(as.factor(vessel))-1 - ) %>% - dplyr::select(Catch_g = meanmacrobenpywt, #use bluepywt for individuals input in example - Year = year, - Vessel, - AreaSwept_km2, - Lat = declat, - Lon = declon, - meanbenthivorelen, - nbenthivoresp #, - #bottemp, #this leaves out many stations for NEFSC - #surftemp, #this leaves out many stations for NEFSC - #oisst, - #sstfill - ) %>% + ) %>% + dplyr::select(Catch_g = meanmacrobenpywt, #use megabenwt for individuals input in example + Year = year, + Vessel, + AreaSwept_km2, + Lat = declat, + Lon = declon, + meanbenthivorelen, + nbenthivoresp, + #bottemp, #this leaves out many stations for NEFSC + #surftemp, #this leaves out many stations for NEFSC + mod_bt,#leaves out 2023 NEAMAP, ok for now + btfill + ) %>% na.omit() %>% as.data.frame() macrobenagg_stn_spring <- macrobenagg_stn %>% - filter(season_ng == "SPRING", + #ungroup() %>% + filter(season_ng == "SPRING", # Annual model for MRIP index year > 1979) %>% - mutate(AreaSwept_km2 =1, #Elizabeth's code + mutate(AreaSwept_km2 = 1, #Elizabeth's code #declon = -declon already done before neamap merge Vessel = as.numeric(as.factor(vessel))-1 - ) %>% - dplyr::select(Catch_g = meanmacrobenpywt, - Year = year, - Vessel, - AreaSwept_km2, - Lat = declat, - Lon = declon, - meanbenthivorelen, - nbenthivoresp #, - #bottemp, #this leaves out many stations for NEFSC - #surftemp, #this leaves out many stations for NEFSC - #oisst, - #sstfill - ) %>% + ) %>% + dplyr::select(Catch_g = meanmacrobenpywt, #use megabenwt for individuals input in example + Year = year, + Vessel, + AreaSwept_km2, + Lat = declat, + Lon = declon, + meanbenthivorelen, + nbenthivoresp, + #bottemp, #this leaves out many stations for NEFSC + #surftemp, #this leaves out many stations for NEFSC + mod_bt,#leaves out 2023 NEAMAP, ok for now + btfill + ) %>% na.omit() %>% as.data.frame() @@ -116,21 +118,18 @@ allEPU2 <- FishStatsUtils::northwest_atlantic_grid %>% dplyr::distinct() # configs -FieldConfig <- c( - "Omega1" = 0, # number of spatial variation factors (0, 1, AR1) - "Epsilon1" = 0, # number of spatio-temporal factors - "Omega2" = 0, - "Epsilon2" = 0 -) +# older type, below current, should be functionally the same +# FieldConfig <- c( +# "Omega1" = 0, # number of spatial variation factors (0, 1, AR1) +# "Epsilon1" = 0, # number of spatio-temporal factors +# "Omega2" = 0, +# "Epsilon2" = 0 +# ) + +# all random effects are on +FieldConfig <- matrix( "IID", ncol=2, nrow=3, + dimnames=list(c("Omega","Epsilon","Beta"),c("Component_1","Component_2"))) -# Model selection options, FieldConfig default (all IID) -# Season_knots + suffix below -# _base No vessel overdispersion or length/number covariates (ensure same dataset) -# _len Predator mean length covariate -# _no Number of predator species covariate -# _lenno Predator mean length and number of predator species covariates -# _eta10 Overdispersion (vessel effect) in first linear predictor (prey encounter) -# _eta11 Overdispersion (vessel effect) in both linear predictors (prey wt) RhoConfig <- c( "Beta1" = 0, # temporal structure on years (intercepts) @@ -172,11 +171,11 @@ settings = make_settings( n_x = 500, #strata.limits = list('All_areas' = 1:1e5), full area strata.limits = strata.limits, purpose = "index2", - bias.correct = FALSE, - #use_anisotropy = FALSE, - #fine_scale = FALSE, - #FieldConfig = FieldConfig, - #RhoConfig = RhoConfig, + bias.correct = TRUE, + use_anisotropy = TRUE, + fine_scale = TRUE, + FieldConfig = FieldConfig, + RhoConfig = RhoConfig, OverdispersionConfig = OverdispersionConfig ) @@ -188,7 +187,7 @@ settings = make_settings( n_x = 500, ######################################################### # Run model fall -season <- c("fall_500_test") +season <- c("fall_500_cov") working_dir <- here::here(sprintf("pyindex/macrobenthos_%s/", season)) @@ -205,10 +204,9 @@ fit <- fit_model( b_i = as_units(macrobenagg_stn_fall[,'Catch_g'], 'g'), a_i = rep(1, nrow(macrobenagg_stn_fall)), v_i = macrobenagg_stn_fall$Vessel, - #Q_ik = as.matrix(bluepyagg_stn_fall[,c("npiscsp", - # "meanpisclen", - # "sstfill" - # )]), + Q_ik = as.matrix(macrobenagg_stn_fall[,c("meanbenthivorelen", + "nbenthivoresp", + "btfill")]), #Use_REML = TRUE, working_dir = paste0(working_dir, "/")) @@ -221,7 +219,7 @@ plot( fit, ###################################################### # Run model spring -season <- c("spring_500_test") +season <- c("spring_500_cov") working_dir <- here::here(sprintf("pyindex/macrobenthos_%s/", season)) @@ -237,11 +235,10 @@ fit <- fit_model( settings = settings, b_i = as_units(macrobenagg_stn_spring[,'Catch_g'], 'g'), a_i = rep(1, nrow(macrobenagg_stn_spring)), v_i = macrobenagg_stn_spring$Vessel, - #Q_ik = as.matrix(bluepyagg_stn_spring[,c("npiscsp", - # "meanpisclen", - # "sstfill" - # )]), - # Use_REML = TRUE, + Q_ik = as.matrix(macrobenagg_stn_fall[,c("meanbenthivorelen", + "nbenthivoresp", + "btfill")]), + # Use_REML = TRUE, working_dir = paste0(working_dir, "/")) saveRDS(fit, file = paste0(working_dir, "/fit.rds")) diff --git a/VASTscripts/VASTunivariate_megabenthos_allsurvs.R b/VASTscripts/VASTunivariate_megabenthos_allsurvs.R index 9654ebf..6ec889e 100644 --- a/VASTscripts/VASTunivariate_megabenthos_allsurvs.R +++ b/VASTscripts/VASTunivariate_megabenthos_allsurvs.R @@ -8,72 +8,73 @@ library(VAST) #Read in data, separate spring and fall, and rename columns for VAST: -# this dataset created in fhdata/VASTbenthos_ProcessInputDat.R +# this dataset created in SSTmethods.Rmd -megabenagg_stn <- readRDS(here::here("fhdata/megabenagg_stn_all.rds")) +megabenagg_stn <- readRDS(here::here("fhdata/megabenagg_stn_all_modBT.rds")) # make SST column that uses surftemp unless missing or 0 # there are 3 surftemp 0 values in the dataset, all with oisst > 15 -#megabenagg_stn <- megabenagg_stn %>% -# dplyr::mutate(sstfill = ifelse((is.na(surftemp)|surftemp==0), oisst, surftemp)) +megabenagg_stn <- megabenagg_stn %>% + dplyr::mutate(btfill = ifelse((is.na(bottemp)|bottemp==0), mod_bt, bottemp)) # code Vessel as AL=0, HB=1, NEAMAP=2 megabenagg_stn_fall <- megabenagg_stn %>% #ungroup() %>% - filter(season_ng == "FALL", + filter(season_ng == "FALL", # Annual model for MRIP index year > 1979) %>% mutate(AreaSwept_km2 = 1, #Elizabeth's code #declon = -declon already done before neamap merge Vessel = as.numeric(as.factor(vessel))-1 - ) %>% - dplyr::select(Catch_g = meanmegabenpywt, #use bluepywt for individuals input in example - Year = year, - Vessel, - AreaSwept_km2, - Lat = declat, - Lon = declon, - meanbenthivorelen, - nbenthivoresp #, - #bottemp, #this leaves out many stations for NEFSC - #surftemp, #this leaves out many stations for NEFSC - #oisst, - #sstfill - ) %>% + ) %>% + dplyr::select(Catch_g = meanmegabenpywt, #use megabenwt for individuals input in example + Year = year, + Vessel, + AreaSwept_km2, + Lat = declat, + Lon = declon, + meanbenthivorelen, + nbenthivoresp, + #bottemp, #this leaves out many stations for NEFSC + #surftemp, #this leaves out many stations for NEFSC + mod_bt,#leaves out 2023 NEAMAP, ok for now + btfill + ) %>% na.omit() %>% as.data.frame() megabenagg_stn_spring <- megabenagg_stn %>% - filter(season_ng == "SPRING", + #ungroup() %>% + filter(season_ng == "SPRING", # Annual model for MRIP index year > 1979) %>% - mutate(AreaSwept_km2 =1, #Elizabeth's code + mutate(AreaSwept_km2 = 1, #Elizabeth's code #declon = -declon already done before neamap merge Vessel = as.numeric(as.factor(vessel))-1 - ) %>% - dplyr::select(Catch_g = meanmegabenpywt, - Year = year, - Vessel, - AreaSwept_km2, - Lat = declat, - Lon = declon, - meanbenthivorelen, - nbenthivoresp #, - #bottemp, #this leaves out many stations for NEFSC - #surftemp, #this leaves out many stations for NEFSC - #oisst, - #sstfill - ) %>% + ) %>% + dplyr::select(Catch_g = meanmegabenpywt, #use megabenwt for individuals input in example + Year = year, + Vessel, + AreaSwept_km2, + Lat = declat, + Lon = declon, + meanbenthivorelen, + nbenthivoresp, + #bottemp, #this leaves out many stations for NEFSC + #surftemp, #this leaves out many stations for NEFSC + mod_bt,#leaves out 2023 NEAMAP, ok for now + btfill + ) %>% na.omit() %>% as.data.frame() -# Make settings (turning off bias.correct to save time for example) +# Make settings # NEFSC strata limits https://github.com/James-Thorson-NOAA/VAST/issues/302 # use only MAB, GB, GOM, SS EPUs -# leave out south of Cape Hatteras at Elizabeth's suggestion +# leave out south of Cape Hatteras # could also leave out SS? -# CHECK if these EPUs match what we use in SOE + MAB <- c(1010:1080, 1100:1120, 1600:1750, 3010:3450, 3470, 3500, 3510) GB <- c(1090, 1130:1210, 1230, 1250, 3460, 3480, 3490, 3520:3550) @@ -116,21 +117,18 @@ allEPU2 <- FishStatsUtils::northwest_atlantic_grid %>% dplyr::distinct() # configs -FieldConfig <- c( - "Omega1" = 0, # number of spatial variation factors (0, 1, AR1) - "Epsilon1" = 0, # number of spatio-temporal factors - "Omega2" = 0, - "Epsilon2" = 0 -) +# older type, below current, should be functionally the same +# FieldConfig <- c( +# "Omega1" = 0, # number of spatial variation factors (0, 1, AR1) +# "Epsilon1" = 0, # number of spatio-temporal factors +# "Omega2" = 0, +# "Epsilon2" = 0 +# ) + +# all random effects are on +FieldConfig <- matrix( "IID", ncol=2, nrow=3, + dimnames=list(c("Omega","Epsilon","Beta"),c("Component_1","Component_2"))) -# Model selection options, FieldConfig default (all IID) -# Season_knots + suffix below -# _base No vessel overdispersion or length/number covariates (ensure same dataset) -# _len Predator mean length covariate -# _no Number of predator species covariate -# _lenno Predator mean length and number of predator species covariates -# _eta10 Overdispersion (vessel effect) in first linear predictor (prey encounter) -# _eta11 Overdispersion (vessel effect) in both linear predictors (prey wt) RhoConfig <- c( "Beta1" = 0, # temporal structure on years (intercepts) @@ -172,11 +170,11 @@ settings = make_settings( n_x = 500, #strata.limits = list('All_areas' = 1:1e5), full area strata.limits = strata.limits, purpose = "index2", - bias.correct = FALSE, - #use_anisotropy = FALSE, - fine_scale = FALSE, - #FieldConfig = FieldConfig, - #RhoConfig = RhoConfig, + bias.correct = TRUE, + use_anisotropy = TRUE, + fine_scale = TRUE, + FieldConfig = FieldConfig, + RhoConfig = RhoConfig, OverdispersionConfig = OverdispersionConfig ) @@ -188,7 +186,7 @@ settings = make_settings( n_x = 500, ######################################################### # Run model fall -season <- c("fall_500_test") +season <- c("fall_500_cov") working_dir <- here::here(sprintf("pyindex/megabenthos_%s/", season)) @@ -205,10 +203,9 @@ fit <- fit_model( b_i = as_units(megabenagg_stn_fall[,'Catch_g'], 'g'), a_i = rep(1, nrow(megabenagg_stn_fall)), v_i = megabenagg_stn_fall$Vessel, - #Q_ik = as.matrix(bluepyagg_stn_fall[,c("npiscsp", - # "meanpisclen", - # "sstfill" - # )]), + Q_ik = as.matrix(megabenagg_stn_fall[,c("meanbenthivorelen", + "nbenthivoresp", + "btfill")]), #Use_REML = TRUE, working_dir = paste0(working_dir, "/")) @@ -221,7 +218,7 @@ plot( fit, ###################################################### # Run model spring -season <- c("spring_500_test") +season <- c("spring_500_cov") working_dir <- here::here(sprintf("pyindex/megabenthos_%s/", season)) @@ -237,10 +234,9 @@ fit <- fit_model( settings = settings, b_i = as_units(megabenagg_stn_spring[,'Catch_g'], 'g'), a_i = rep(1, nrow(megabenagg_stn_spring)), v_i = megabenagg_stn_spring$Vessel, - #Q_ik = as.matrix(bluepyagg_stn_spring[,c("npiscsp", - # "meanpisclen", - # "sstfill" - # )]), + Q_ik = as.matrix(megabenagg_stn_spring[,c("meanbenthivorelen", + "nbenthivoresp", + "btfill")]), # Use_REML = TRUE, working_dir = paste0(working_dir, "/"))