select only unique coverage points
# Load necessary libraries
library(dplyr)
Attaching package: 'dplyr'
The following objects are masked from 'package:stats':
filter, lag
The following objects are masked from 'package:base':
intersect, setdiff, setequal, union
select only unique coverage points
library(glue)
library(here)here() starts at /home/tylar/repos/rvc_habitat_cover
select only unique coverage points
pattern <- paste0({params$inputFilePrefix}, "\\d{4}\\.csv")
# List all files matching the pattern
files <- list.files(
path = here("data/01_raw"), pattern = pattern, full.names = TRUE
)
# Initialize an empty list to store data
data_list <- list()
# Loop over the files
for (file in files) {
# Read the CSV file
data <- read.csv(file)
print(glue("reading {file}..."))
# Select the desired columns
selected_data <- data %>%
select(LAT_DEGREES, LON_DEGREES, YEAR, MONTH, DAY, HABITAT_CD) %>%
mutate(date = sprintf("%04d-%02d-%02d", YEAR, MONTH, DAY)) %>%
mutate(`system:time_start` = as.numeric(as.POSIXct(
date, format="%Y-%m-%d", tz="UTC"
)) * 1000) %>%
select( -MONTH, -DAY) %>%
rename(latitude = LAT_DEGREES, longitude = LON_DEGREES)
# Keep only the rows with unique values across the selected columns
unique_data <- selected_data %>%
distinct()
# Append the data to the list
data_list[[length(data_list) + 1]] <- unique_data
}reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_1999.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2000.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2001.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2002.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2003.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2004.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2005.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2006.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2007.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2008.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2009.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2010.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2011.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2012.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2014.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2016.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2018.csv...
reading /home/tylar/repos/rvc_habitat_cover/data/01_raw/FLA_KEYS_2022.csv...
select only unique coverage points
# Combine all data into a single dataframe
combined_data <- do.call(rbind, data_list)

