Skip to content

Commit

Permalink
code to read in sas7bdat files and save as Rds
Browse files Browse the repository at this point in the history
  • Loading branch information
mle2718 committed Oct 22, 2024
1 parent 1deef9c commit c57c43c
Showing 1 changed file with 126 additions and 0 deletions.
126 changes: 126 additions & 0 deletions R_code/data_extraction_processing/extraction/pull_in_MRIP.R
Original file line number Diff line number Diff line change
@@ -0,0 +1,126 @@

# This code reads in the MRIP sas7bdat files and saves them as Rds files.
# It takes a while to run, which is why it has been split apart from the data processing.

##MRIP data is stored in
#"smb://net/mrfss/products/mrip_estim/Public_data_cal2018"
#Windows, just mount \\net.nefsc.noaa.gov\mrfss to A:\

#A:/products/mrip_estim/Public_data_cal2018


library("here")
library("haven")
library("data.table")
here::i_am("R_code/data_extraction_processing/extraction/pull_in_MRIP.R")

# Folder holding the MRIP SAS files when the network share is mounted as A:.
local_mrip_folder <- file.path(
  "A:", "products", "mrip_estim", "Public_data_cal2018"
)
# The same folder written relative to the network share; defined here but not
# selected below.
network_mrip_folder <- file.path(
  "mrfss", "products", "mrip_estim", "Public_data_cal2018"
)


# Running locally: the reader functions in this script look for their input
# files in this folder.
raw_mrip_folder <- local_mrip_folder


# Empty list; nothing in this script fills it.
len_dataset <- list()

# Years and waves, each held as a one-column character data frame.
year <- data.frame(year = as.character(2021:2024))
waves <- data.frame(waves = as.character(1:6))

# Every year/wave combination; year varies fastest
# (2021 wave 1, 2022 wave 1, ..., 2024 wave 6).
yearly <- expand.grid(
  year = year$year,
  waves = waves$waves,
  KEEP.OUT.ATTRS = FALSE,
  stringsAsFactors = FALSE
)

# File-name suffixes such as "20211" (year followed by wave), stored one per
# list element so they can be handed to lapply().
readins <- as.list(paste0(yearly$year, yearly$waves))

################################################################################
# Size
################################################################################

# Read one MRIP size file from SAS and cache it as an Rds file.
#
# Args:
#   waves: Suffix of the file name as a single string, year followed by wave
#     (for example "20211"). The file read is "size_<waves>.sas7bdat" inside
#     the global `raw_mrip_folder`.
#
# Returns:
#   The data returned by haven::read_sas(), or NULL (invisibly) when the SAS
#   file does not exist, so absent year/wave combinations are skipped.
#
# Side effect:
#   Saves the data to data_folder/raw/size_<waves>.Rds under the project root
#   declared by here::i_am().
readin_size <- function(waves) {
  size_file_in <- file.path(
    raw_mrip_folder,
    paste0("size_", waves, ".sas7bdat")
  )

  # Combinations with no file on disk are skipped silently.
  if (!file.exists(size_file_in)) {
    return(invisible(NULL))
  }

  # Anchor the output to the project root instead of the working directory,
  # and make sure the folder exists before the slow read so the work is not
  # lost to a failed save.
  out_dir <- here::here("data_folder", "raw")
  dir.create(out_dir, recursive = TRUE, showWarnings = FALSE)

  len <- haven::read_sas(size_file_in)
  saveRDS(len, file = file.path(out_dir, paste0("size_", waves, ".Rds")))

  len
}


# Read every year/wave size file (a missing file contributes NULL), then stack
# the results into one table; fill = TRUE pads columns absent from a wave.
size_dataset <- lapply(X = readins, FUN = readin_size)
size_dataset2 <- data.table::rbindlist(size_dataset, fill = TRUE)

################################################################################
# TRIPS
################################################################################
# Read one MRIP trip file from SAS and cache it as an Rds file.
#
# Args:
#   waves: Suffix of the file name as a single string, year followed by wave
#     (for example "20211"). The file read is "trip_<waves>.sas7bdat" inside
#     the global `raw_mrip_folder`.
#
# Returns:
#   The data returned by haven::read_sas(), or NULL (invisibly) when the SAS
#   file does not exist, so absent year/wave combinations are skipped.
#
# Side effect:
#   Saves the data to data_folder/raw/trip_<waves>.Rds under the project root
#   declared by here::i_am().
readin_trips <- function(waves) {
  trips_file_in <- file.path(
    raw_mrip_folder,
    paste0("trip_", waves, ".sas7bdat")
  )

  # Combinations with no file on disk are skipped silently.
  if (!file.exists(trips_file_in)) {
    return(invisible(NULL))
  }

  # Anchor the output to the project root instead of the working directory,
  # and make sure the folder exists before the slow read so the work is not
  # lost to a failed save.
  out_dir <- here::here("data_folder", "raw")
  dir.create(out_dir, recursive = TRUE, showWarnings = FALSE)

  trips <- haven::read_sas(trips_file_in)
  saveRDS(trips, file = file.path(out_dir, paste0("trip_", waves, ".Rds")))

  trips
}


# Read every year/wave trip file (a missing file contributes NULL), then stack
# the results into one table; fill = TRUE pads columns absent from a wave.
trips_dataset <- lapply(X = readins, FUN = readin_trips)

trips_dataset2 <- data.table::rbindlist(trips_dataset, fill = TRUE)




################################################################################
# catch
################################################################################
# Read one MRIP catch file from SAS and cache it as an Rds file.
#
# Args:
#   waves: Suffix of the file name as a single string, year followed by wave
#     (for example "20211"). The file read is "catch_<waves>.sas7bdat" inside
#     the global `raw_mrip_folder`.
#
# Returns:
#   The data returned by haven::read_sas(), or NULL (invisibly) when the SAS
#   file does not exist, so absent year/wave combinations are skipped.
#
# Side effect:
#   Saves the data to data_folder/raw/catch_<waves>.Rds under the project root
#   declared by here::i_am().
readin_catch <- function(waves) {
  catch_file_in <- file.path(
    raw_mrip_folder,
    paste0("catch_", waves, ".sas7bdat")
  )

  # Combinations with no file on disk are skipped silently.
  if (!file.exists(catch_file_in)) {
    return(invisible(NULL))
  }

  # Anchor the output to the project root instead of the working directory,
  # and make sure the folder exists before the slow read so the work is not
  # lost to a failed save.
  out_dir <- here::here("data_folder", "raw")
  dir.create(out_dir, recursive = TRUE, showWarnings = FALSE)

  catch <- haven::read_sas(catch_file_in)
  saveRDS(catch, file = file.path(out_dir, paste0("catch_", waves, ".Rds")))

  catch
}


# Read every year/wave catch file (a missing file contributes NULL), then stack
# the results into one table; fill = TRUE pads columns absent from a wave.
catch_dataset <- lapply(X = readins, FUN = readin_catch)

catch_dataset2 <- data.table::rbindlist(catch_dataset, fill = TRUE)






################################################################################
# SizeB2
################################################################################

# Read one MRIP size_b2 file from SAS and cache it as an Rds file.
#
# Args:
#   waves: Suffix of the file name as a single string, year followed by wave
#     (for example "20211"). The file read is "size_b2_<waves>.sas7bdat"
#     inside the global `raw_mrip_folder`.
#
# Returns:
#   The data returned by haven::read_sas(), or NULL (invisibly) when the SAS
#   file does not exist, so absent year/wave combinations are skipped.
#
# Side effect:
#   Saves the data to data_folder/raw/size_b2_<waves>.Rds under the project
#   root declared by here::i_am().
readin_sizeb2 <- function(waves) {
  size_file_in <- file.path(
    raw_mrip_folder,
    paste0("size_b2_", waves, ".sas7bdat")
  )

  # Combinations with no file on disk are skipped silently.
  if (!file.exists(size_file_in)) {
    return(invisible(NULL))
  }

  # Anchor the output to the project root instead of the working directory,
  # and make sure the folder exists before the slow read so the work is not
  # lost to a failed save.
  out_dir <- here::here("data_folder", "raw")
  dir.create(out_dir, recursive = TRUE, showWarnings = FALSE)

  lenb2 <- haven::read_sas(size_file_in)
  saveRDS(lenb2, file = file.path(out_dir, paste0("size_b2_", waves, ".Rds")))

  lenb2
}


# Read every year/wave size_b2 file (a missing file contributes NULL), then
# stack the results into one table; fill = TRUE pads columns absent from a wave.
sizeb2_dataset <- lapply(X = readins, FUN = readin_sizeb2)
sizeb2_dataset2 <- data.table::rbindlist(sizeb2_dataset, fill = TRUE)







0 comments on commit c57c43c

Please sign in to comment.