# Import "California Streams.xls" through 'Import Dataset' before running this
# script; the code below expects the data frame `StreamQuality_all` to exist.

# View the first few rows to make sure that the dataset imported correctly.
head(StreamQuality_all)

# Libraries ----
library(dplyr)
library(tidyr)
library(ggplot2)
library(scales)

# Nitrogen (NTL) trend per EPA region ----

# Mean NTL within each EPA region.
stream_qualityN <- StreamQuality_all %>%
  group_by(EPAREGION) %>%
  summarise(avgNTL = mean(NTL))
stream_qualityN

# Median NTL within each EPA region.
stream_qualityN_median <- StreamQuality_all %>%
  group_by(EPAREGION) %>%
  summarise(medNTL = median(NTL))
stream_qualityN_median

# Box plot of NTL by EPA region on the raw scale; x labels are rotated 90
# degrees so that the region names do not overlap.
p <- ggplot(data = StreamQuality_all, aes(x = EPAREGION, y = NTL)) +
  geom_boxplot() +
  theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
  labs(x = "EPA Region", y = "Nitrogen Total Load (ug/L)")
p

# Print the computed plot data (includes the box plot statistics per region).
ggplot_build(p)

# Same box plot with a log10 y axis.
ggplot(data = StreamQuality_all, aes(x = EPAREGION, y = NTL)) +
  geom_boxplot() +
  scale_y_log10() +
  theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
  labs(x = "EPA Region", y = "Nitrogen Total Load (ug/L)")

# Phosphorus (PTL) trend per EPA region ----

# Mean PTL within each EPA region.
stream_qualityP <- StreamQuality_all %>%
  group_by(EPAREGION) %>%
  summarise(avgPTL = mean(PTL))
stream_qualityP

# Median PTL within each EPA region. The column is named `medPTL` (it was
# previously mislabelled `avgPTL`) to match `medNTL` in the nitrogen summary.
stream_qualityPmedian <- StreamQuality_all %>%
  group_by(EPAREGION) %>%
  summarise(medPTL = median(PTL))
stream_qualityPmedian

# Box plot of PTL by EPA region on the raw scale.
pp <- ggplot(data = StreamQuality_all, aes(x = EPAREGION, y = PTL)) +
  geom_boxplot() +
  theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
  labs(x = "EPA Region", y = "Phosphorous Total Load (ug/L)")
pp

# Print the computed plot data (includes the box plot statistics per region).
ggplot_build(pp)

# Relationship between each nutrient (N, P) and MMI? ----
# Add log10-transformed nutrient columns to the data frame.
# NOTE(review): log10() returns -Inf for zeros and NaN for negatives, which
# would propagate into cor() below -- confirm NTL and PTL are strictly positive.
StreamQuality_all$logNTL <- log10(StreamQuality_all$NTL)
StreamQuality_all$logPTL <- log10(StreamQuality_all$PTL)

# Jittered scatter plot of MMI against log10(NTL) with a straight-line fit.
# `formula = y ~ x` is the default for method = "lm"; it is spelled out so
# that geom_smooth() does not print its "using formula" message.
ggplot(data = StreamQuality_all, aes(x = logNTL, y = MMI_WSABEST)) +
  geom_jitter() +
  geom_smooth(method = "lm", formula = y ~ x, se = FALSE) +
  theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
  labs(x = "NTL (log)", y = "MMI")

# Correlation between log10(NTL) and MMI (cor() defaults to Pearson).
cor(StreamQuality_all$logNTL, StreamQuality_all$MMI_WSABEST)
# Recorded output:
# [1] -0.4190654

# Jittered scatter plot of MMI against log10(PTL) with a straight-line fit.
ggplot(data = StreamQuality_all, aes(x = logPTL, y = MMI_WSABEST)) +
  geom_jitter() +
  geom_smooth(method = "lm", formula = y ~ x, se = FALSE) +
  theme(axis.text.x = element_text(angle = 90, hjust = 1)) +
  labs(x = "PTL (log)", y = "MMI")

# Correlation between log10(PTL) and MMI (cor() defaults to Pearson).
cor(StreamQuality_all$logPTL, StreamQuality_all$MMI_WSABEST)
# Recorded output:
# [1] -0.4207201