LAB 5: Advanced data manipulation

BIO3782: Biologist's Toolkit (Dalhousie University)


Setup of workspace

Make sure all required files are in the working directory:

As in previous labs, we'll try to simulate "real-life" coding, where:

  1. Sometimes you want to type or copy-paste directly into a .r file, using RStudio's script editor, to build a script file that can be run as a whole to accomplish a series of tasks. This file will allow you to save your work so that you can review it (or expand it) at a later date. In the script editor you can execute sections as you type them in, by highlighting them and clicking Run. We'll guide you when to use the script editor by displaying the following before a "code" cell:



  1. Some other times you want to quickly do "one-off" queries or inspections that you do not want to be part of your script file. In this case, type or copy-paste code into RStudio's console and press [enter]. We'll guide you when to use the console by displaying the following before a "code" cell:




Data manipulation

The path between data collection and the final plot or analysis in a publication is, to say the least, complicated and convoluted. Raw data files contain data organized in a way that preserves all the information that was available during collection, often in a format that facilitates data entry. For each different research objective (whether it is to test a hypothesis, make a plot, or run an analysis), the raw data often needs to be filtered, split, joined or merged with other data, reshaped, mutated, summarized, and/or put through many other processes and transformations. All of these intermediate steps, which are necessary to get the raw data into a shape or format suitable for the final analysis, are collectively known as data manipulation.

The tidyverse

The tidyverse package is an "umbrella-package" (or "bundle-package") that installs tidyr, dplyr, and several other packages useful for data analysis, such as ggplot2, tibble, etc.

The tidyverse package tries to address 3 common issues that arise when doing data analysis with some of the built-in functions that come with R:

  1. The results from a base R function sometimes depend on the type of data.

  2. Using R expressions in a non-standard way, which can be confusing for new learners.

  3. Hidden arguments, having default operations that new learners are not aware of.

Here we will only install and load the tidyverse package. In the following sections we will learn how to use many functions from several packages included in the tidyverse.

You probably already have the tidyverse package installed; if so, skip this step.

To install the tidyverse package...
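If you need to install it, a single call from the console does it (one-time, requires an internet connection):

```r
# Download and install tidyverse and all of its dependencies (only needed once)
install.packages("tidyverse")
```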


To load the tidyverse package...
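Loading the bundle makes all of its packages available in the current session:

```r
# Loads dplyr, tidyr, readr, ggplot2, tibble, and friends
library(tidyverse)
```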


You should also download the dplyr cheat sheet for reference as well.

What are dplyr and tidyr?

Both dplyr and tidyr are packages included in the tidyverse package. Both should already be loaded (from when you ran library(tidyverse)) and ready to go...

dplyr is a package for making tabular data manipulation easier. It pairs nicely with tidyr which enables you to swiftly convert between different data formats for plotting and analysis.

The package dplyr provides easy tools for the most common data manipulation tasks. It is built to work directly with data frames, with many common tasks optimized to run very fast (they were written in a compiled language, like C++).

The package tidyr addresses the common problem of wanting to reshape your data for plotting and use by different R functions. Sometimes we want data sets where we have one row per measurement. Sometimes we want a data frame where each measurement type has its own column, and rows are instead more aggregated groups (e.g., a time period, an experimental unit like a plot or a batch number). Moving back and forth between these formats is non-trivial, and tidyr gives you tools for this and more sophisticated data manipulation.

The data

Here we will work with data collected to evaluate the cumulative effects of drought and disease on the silver tree (Leucadendron argenteum). The data includes measured physiological responses of the plant such as photosynthetic oxygen evolution and electrical conductivity.

First, let's download the data.

You should already have the data files Silver Tree Study photosynthetis.csv and Silver tree study conductance.csv inside Desktop/Lab5, and have set up that folder as your working directory. If you haven't, take a look at the beginning of this lab.

First, we'll read in our data using the read_csv() function from the tidyverse package readr.
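A sketch of the read-in step, assuming the two CSV files sit in your working directory under the exact names given above:

```r
# read_csv() comes from readr, loaded as part of the tidyverse
photosynthesis <- read_csv("Silver Tree Study photosynthetis.csv")
conductivity   <- read_csv("Silver tree study conductance.csv")
```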


Let's take a look at the photosynthesis dataset using the head(), tail() and str() functions.
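For example (assuming the data frame is named photosynthesis, as above):

```r
head(photosynthesis)   # first 6 rows by default
tail(photosynthesis)   # last 6 rows
```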




How many rows did the function head() display?



What date was the first row collected on?



What is the function to display the last few rows of a dataframe (opposite of head())?

Now let's take a look at the structure of the data frame.
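The structure is shown with a single call:

```r
# Displays dimensions, column names, column classes, and a preview of values
str(photosynthesis)
```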




How many columns/variables are there in photosynthesis?



What class of variable is Species?



TRUE or FALSE: The function str() shows the structure of the dataframe.

Let's make a plot to quickly assess Photosynthesis as a function of pathogen species.


As you can see, the first bar (i.e. Both Pathogens) shows smaller Photosynthesis than the Control and than trees with only the exotic pathogen or the indigenous pathogen.

Now let's do the same with conductivity.




Take a look at the conductivity datasets using the head(), tail() and str(). Then answer the following questions.






How many observations are in conductivity?



How many columns/variables are there in conductivity?



What class of variable is Conductance?



What is the last value in the Conductance column?

Let's make a plot to assess Conductance as a function of pathogen species.


When looking at conductance, the pattern is even stronger than with photosynthesis. Here too, the first bar (i.e. Both Pathogens) shows smaller conductance than the Control and than trees with only the exotic pathogen or the indigenous pathogen.

Since the experiment was run with two different instruments, we ended up with two different datasets of paired measurements. We can combine both datasets into one more useful dataset.

Combining two or more datasets

There are several functions that allow you to combine multiple datasets. Here we will discuss several join functions and also the merge() function.

Join

Join functions allow you to connect multiple tables based on common variables (columns). There are many types of join functions included in dplyr. Here we'll review a few, but you can see the full list here.

Most join functions follow the basic syntax below:

joinFunctionName(dataFrame1, dataFrame2, by = "variable names")

However, most of the time you will use the "joined" product multiple times; therefore, you probably want to "save" the joined table in a new variable:

newJoinedDataFrame <- joinFunctionName(dataFrame1, dataFrame2, by = "variable names")

left_join

The most useful of the join functions is left_join(), which takes a table (say table 1) and then adds all matching records from table 2. The resulting table will show all records from table 1 (the left-hand table), and matching records from table 2 (the right-hand table).

The specific syntax of left_join() is:

dataFrame3 <- left_join(dataFrame1, dataFrame2, by = "variable names")

Graphically, it would look like this:

However, to make the graphics a bit simpler, we won't save the resulting "joined" data frame into the df3 variable. Instead, we will only show the command run over the resulting joined table. The new, simpler graphic looks like this:

From now on, we will be using the simpler graphics in all the examples below.


About left_join(): note that R will automatically detect which columns the two tables have in common IF they are called the same thing. If not, you have to feed the matching column names into the left_join() function.

We can create a new dataframe with all the information from both photosynthesis and conductivity by joining the two dataframes using the qualifying variables in the columns from "Sample type" to "Obs".
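A sketch of the join. The by list below spells out the shared identifier columns from "Sample type" through "Obs"; the exact names and order are an assumption, so adjust them to match your files:

```r
combined_data <- left_join(photosynthesis, conductivity,
                           by = c("Sample type",
                                  "Days after inoculation",
                                  "Date",
                                  "Trial",
                                  "Treatment",
                                  "Species",
                                  "Plant Number",
                                  "Isolate Number",
                                  "Unique Sample Number",
                                  "Licor",   # assumed to sit between "Sample type" and "Obs"
                                  "Obs"))
```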


Let's look at the combined dataset below using the head() and str() functions:


We can see that left_join combined photosynthesis and conductivity data by all the criteria columns we specified above. We basically get photosynthesis back, but with the addition of variables Conductance and Ci, which are unique to conductivity.




How many observations(rows) does `combined_data` have?



How many columns does `combined_data` have?

inner_join

The inner_join() function returns all rows from dataframe 1 where there are matching values in dataframe 2, and all columns from dataframe 1 and dataframe 2. If there are multiple matches between them, all combinations of the matches are returned. Basically, the result shows only 'matched' records, where there is a matching value in both tables. Instances where there are no matching values are thrown out.



Then,


Notice that we get repeated variables Licor.x and Licor.y. We didn't specify that Licor was a criterion for joining, and since it appears in both datasets, the join creates new variables for it: one from each dataset.



What variables would be duplicated if we ran the following code?

inner_join(photosynthesis, conductivity,
           by = c("Sample type",
                  "Days after inoculation",
                  "Date",
                  "Trial",
                  "Treatment",
                  "Species",
                  "Plant Number",
                  "Isolate Number",
                  "Unique Sample Number"))


full_join

full_join() will return all rows and all columns from both dataframe 1 and dataframe 2. It returns NA for instances where there are no matching values.
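A sketch, using the two data frames from earlier; with no by argument, the join matches on all shared column names:

```r
combined_full <- full_join(photosynthesis, conductivity)
```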






Take a look at combined_full using the head(), tail() and str(). Then answer the following questions.






How many observations/rows does the variable Ci have in the combined_full dataset?



Are the variables (or columns) of combined_full and combined_data the same?

Notice that this returns pretty much the same dataset as the one we created with left_join(). We didn't have to specify any of the variables to join by in this case. We get all variables and rows from both photosynthesis and conductivity.

anti_join

anti_join() returns all rows from dataframe 1 that do not have matching values in dataframe 2; it removes every record that has a match. This basically filters your dataset. Note that anti_join() is essentially the opposite of inner_join().
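A sketch; as with full_join(), omitting by matches on all shared column names:

```r
# Keep only the rows of photosynthesis that have NO match in conductivity
combined_anti <- anti_join(photosynthesis, conductivity)
```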






Take a look at combined_anti using the head(), tail() and str(). Then answer the following questions.






How many variables does combined_anti have?



How many rows does combined_anti have?

Notice that we effectively returned all the variables of photosynthesis without any data! This happened because conductivity had all the same variables, and these measurements were paired with those of photosynthesis (taken from the same sample at the same time). There were no instances where the variables didn't match, so the anti_join() function could not return any observations.

Merge

Another way to combine datasets is to use the function merge(). By default the data frames are merged on the columns with names they both have, but separate specifications of the columns can be given by the by, by.x and by.y arguments. The rows in the two data frames that match on the specified columns are extracted, and joined together. If there is more than one match, all possible matches contribute one row each. This basically merges two datasets horizontally.




Use the function's help file to look at the syntax for merge().




Let's recreate the combined_data dataset using merge instead.
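A minimal sketch; by default, merge() matches on every column name the two data frames share, which is what we want here:

```r
combined_data <- merge(photosynthesis, conductivity)
```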


Now, lets take a look at combined_data





What does the argument "by" in the merge function do?



How many variables does combined_data have?



What extra variable does combined_data have that conductivity does not?



Are the variable classes of combined_data created using left_join and merge the same?




Let us download the task datasets task_data_fox_size.csv and task_data_fox_weight.csv

Using Joins or merge, create a new dataset called fox_data combining data from both task_data_fox_size.csv and task_data_fox_weight.csv






How many rows does fox_data have?



How many columns does fox_data have?



Using the summary() function, what is the median value of avfood?



What class of variable is ID?

Next, we're going to learn some of the most common dplyr functions:


Selecting columns

If we only want to keep certain columns of data, we can use select(). The first argument of this function is the dataset, and the subsequent arguments are the columns to keep. You can read all the details on how to use select() in its help file. However, the basic syntax is:

newSelectedData <- select(data, column names)

Graphically, select() looks like this:


In the following code, we will select the columns Sample type, Photosynthesis, and Conductance.
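A sketch of the call; note that column names containing spaces must be wrapped in backticks:

```r
sml_data <- select(combined_data, `Sample type`, Photosynthesis, Conductance)
```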


Let's take a look at sml_data:


Then,




How many variables (or columns) are in sml_data?

Selecting multiple columns with :

We can also use : to select multiple columns from left to right.
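For example, to keep every column from `Sample type` through Species (the endpoints here are illustrative; use whichever two columns bracket the range you want):

```r
sml_data_select <- select(combined_data, `Sample type`:Species)
```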


Let's take a look at sml_data_select:




How many variables (or columns) are in sml_data_select?

Omitting columns during select

To select all columns except certain ones, put a "-" in front of the variable to exclude it. In the following code, we want to exclude the columns "Licor" and "Obs".
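The exclusion looks like this:

```r
sml_data_omit <- select(combined_data, -Licor, -Obs)
```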


Let's take a look at sml_data_omit:




How many variables (or columns) are in sml_data_omit?



Using the "combined_data" dataset and the "-", what would the code look like to select all columns except Species?

Filtering rows

What if we only want to select the data from one Species? You can also choose rows based on a specific criterion using the filter() function. You can read all the details on how to use filter() in its help file. However, the basic syntax is:

filteredData <- filter(dataset, selection criteria)

Graphically, filter() looks like this:

In the following code, we want to select all data from Indigenous Pathogen Species only.

You could do this following the same approach as above...

Step 1: create a new filtered_data variable:
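A sketch of the first step:

```r
filtered_data <- filter(combined_data, Species == "Indigenous Pathogen")
```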


Step 2: Use the new filtered_data variable:



...or we can skip the intermediate variable and "nest" one function within another (see example below). This is preferable if you are only going to use the "filtered" data once. If you are going to use the filtered data multiple times, it is better to create a separate variable, like filtered_data. We'll talk more about nesting functions in a section below.

For now, let's filter combined_data and take a look, using nested functions:




How many rows are in the original combined_data dataset?



How many rows are in filter(combined_data, Species == "Indigenous Pathogen")?

We can also filter by multiple criteria. Say we want Obs 1 data from the Indigenous Pathogen Species only. We can use the filter() function and expand our selection criteria.
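Comma-separated conditions inside filter() are combined with AND:

```r
filter(combined_data, Species == "Indigenous Pathogen", Obs == 1)
```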




How many rows are in filter(combined_data, Species == "Indigenous Pathogen", Obs ==1)?


Let's take a look at our Species data to see if we can clean up our dataset. We note that Species is a character column, for which the levels() function returns NULL (i.e. empty, or nothing).


Using the function as.factor() we can convert Species entries into factors:
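The conversion overwrites the character column in place:

```r
combined_data$Species <- as.factor(combined_data$Species)
```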


Now, we can use the levels() function to examine the factor levels:


For simplicity, let's create a new object data_filtered and select only rows where Photosynthesis < 200 and Species is not equal to "Both Pathogens". Let's take a look at the first 4 rows.
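A sketch of that filtering step:

```r
data_filtered <- filter(combined_data,
                        Photosynthesis < 200,
                        Species != "Both Pathogens")
head(data_filtered, n = 4)
```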


Now, let's take a look at data_filtered:


Then,


Then,


Note that "Both Pathogens" still appears as a level of Species in data_filtered but all the observations have been removed. Let's compare Photosynthesis vs Conductance between combined_data and data_filtered graphically.


Then,


In data_filtered, outlying data points (Photosynthesis > 200) have been filtered out, making it easier to visualize our data.



What does != in the filter() function mean?



How many levels does Species have in data_filtered?



TRUE or FALSE: "Both Pathogens" in data_filtered has 0 observations because they did not take measurements?




Create a dataset called male_fox_data wherein only data from male foxes are included.






How many rows does male_fox_data have?

Sequential operations

What if you want to select and filter at the same time? In other words, what if you need to do something to your data, get the output and do something else with it, then take that output and do something else with it again...

There are three ways to do this:

  1. use intermediate steps,
  2. use nested functions, or
  3. use pipes

Intermediate steps

This is when you save the output of each intermediate step into a variable, and then feed that intermediate variable as the input of the next step.

Example:

What if we wanted to select only Sample type, Photosynthesis and Conductance from the Control and Indigenous Pathogen Species? We could create multiple objects.

  1. First, filter for species Control and Indigenous Pathogen and save the output to an intermediate variable (i.e. species_filtered)

  2. Then apply select() to the intermediate variable species_filtered to create your final output: species_sml

We can use %in% inside filter() to specify a list of parameters/levels we want to keep.

Graphically, what we want to do would look like this:

The actual code to do it is below:
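A sketch of the two steps, assuming we start from the data_filtered object created earlier:

```r
# Step 1: keep only the Control and Indigenous Pathogen rows
species_filtered <- filter(data_filtered,
                           Species %in% c("Control", "Indigenous Pathogen"))

# Step 2: keep only the columns we need
species_sml <- select(species_filtered,
                      `Sample type`, Photosynthesis, Conductance)
```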


Now, let's take a look at species_sml:


Then,


This is readable, but it is clunky and can clutter up your workspace with lots of small objects that you'd have to keep track of.

Nested functions

Another method would be to use nested functions. This is when you write one function inside of another function, like this:
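The same two steps from the previous section, collapsed into one nested call (a sketch, under the same assumptions):

```r
species_sml <- select(
  filter(data_filtered, Species %in% c("Control", "Indigenous Pathogen")),
  `Sample type`, Photosynthesis, Conductance)
```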


Let's take a look:


Then,


See, same results as above...

R evaluates the expression from the inside out (in this case, filtering, then selecting). I would avoid this method since it makes debugging your code a nightmare! It is also hard to read!

Pipes

A better method is to use pipes. Pipes let you take the output of one function and send it directly to the next, which is useful when you need to do many things to the same dataset. Pipes in R look like %>% and are made available via the magrittr package, installed automatically with dplyr.

If you use RStudio, you can type the pipe with Ctrl + Shift + M if you have a PC or Cmd + Shift + M if you have a Mac.

We will re-create the species_sml dataset using pipes. First, we want to filter data from the data_filtered dataset, keeping rows where Species is either Indigenous Pathogen or Control, then select only the Sample type, Species, Photosynthesis and Conductance columns. We will use the pipe to send the data_filtered dataset through the filter() then select() functions.
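The piped version reads top to bottom, one operation per line:

```r
species_sml <- data_filtered %>%
  filter(Species %in% c("Control", "Indigenous Pathogen")) %>%
  select(`Sample type`, Species, Photosynthesis, Conductance)
```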


You can also use pipes to take a look at your data:


However, I find it simpler to use the "normal" approach:


See, same results as above...

Now, let's make a plot also using pipes:


Since %>% takes the object on its left and passes it as the first argument to the function on its right, we don't need to explicitly include the data frame as an argument to the filter() and select() functions any more.




Using the fox_data dataset, create a new object fox_data_cleaned that contains only the columns ID, Sex, avfood, from female foxes only.






How many rows are there in fox_data_cleaned?



What is the median weight of female foxes in the fox_data_cleaned dataset?


Reshaping dataframes

Useful links:

  1. Pivot tutorial
  2. pivot_longer
  3. pivot_wider

Sometimes you may need to alter the layout of tabular datasets while preserving the values and relationships contained within. This can also be very useful when plotting data from very large datasets with multiple columns. You may have heard of spread() and gather(). These are functions with similar but more limited functionality, and they were replaced by pivot_wider() and pivot_longer().

pivot_wider

pivot_wider() moves rows into columns (long to wide format). Values in the classifier/parameter column (here, Species) become new column names, and their respective values get copied into the reshaped data. Cells with no observations get coded with a value of NA.

Let's use pivot_wider() to turn Species factors into column names by changing the dataset from long to wide format.
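A sketch of the reshape; names_from names the column whose values become new column headers, and values_from names the column whose values fill them:

```r
data_wide <- data_filtered %>%
  pivot_wider(names_from = Species, values_from = Photosynthesis)
```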


Let's take a look at data_wide:



Notice that some columns have NA values. pivot_wider() inserts NA wherever a value doesn't exist in the data.

Let's try to plot the data from the Control, Exotic Pathogen, and Indigenous Pathogen columns by date. In the wide format we will have to create 3 separate plots and use a plotting package like cowplot to achieve what we want. Wide format is nice for people who are not used to seeing data separated into value (i.e. mg/L O2) and classifier/parameter (i.e. oxygen) columns (like what you'll see in a little bit).

First, if you have not yet installed cowplot, you may have to:
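The one-time install:

```r
install.packages("cowplot")
```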


Then, load the cowplot package:
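Loading is one call:

```r
library(cowplot)
```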


Then, do the plot...




How many observations does data_wide have?

pivot_longer

In this situation we are gathering the column names and turning them into a pair of new variables. One variable represents the column names as values, and the other variable contains the values previously associated with the column names.

pivot_longer() moves columns into rows (wide to long format). pivot_longer() takes several arguments, but the most important ones for this exercise are names_to and values_to. names_to creates a new classifier/criteria column, taking its entries from your column names. values_to takes the values from those columns and creates a new column of values classified by the factors created by names_to.

Let's use pivot_longer to transform data_wide back into data_filtered.
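A sketch of the reverse reshape; dropping the NA cells that pivot_wider() created (via values_drop_na) is an assumption made here so the result matches data_filtered:

```r
data_long <- data_wide %>%
  pivot_longer(cols = c(`Control`, `Exotic Pathogen`, `Indigenous Pathogen`),
               names_to = "Species",
               values_to = "Photosynthesis",
               values_drop_na = TRUE)
```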


Let's take a look:



We have basically created a column of values called Photosynthesis and a classifier/parameter column called Species. Let's try and plot Photosynthesis for all three species by date again.


We got a similar graphical result with fewer lines of code! Long format is great when you need to plot data with multiple factor levels.



How many rows does data_long have?



TRUE or FALSE: data_wide and data_long have the same number of observations because pivot_wider fills missing observations with NA?


Mutate

We can use mutate() to create new columns based on the values in existing columns, for example to do unit conversions, or to find the ratio of values in two columns.

For example, we can convert Photosynthesis oxygen measurements from mg/L to ug/L by creating a new column called Photosynthesis_ppb
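Since 1 mg/L = 1000 ug/L, the new column is just the old one scaled:

```r
unit_conversion <- combined_data %>%
  mutate(Photosynthesis_ppb = Photosynthesis * 1000)
```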



Let's take a look at unit_conversion:


Then,


Let's make a plot to make sure it worked. That is, that the relationship between Photosynthesis and Photosynthesis_ppb is linear and with a slope of 1000:


Let's see some summary statistics:


Notice that summary statistics after the mutation are 1000 times the original.

We can also use mutate to change variable level names.

First, let's check original levels:


Now, let's create a new object change_labels with the new level names:


Let's check levels again:


We can also use mutate() to change variable types. Here, we will convert some variables from character to factors:


We can use the function sapply() to see the column variable classes:
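To make the pattern concrete, here it is demonstrated on R's built-in iris dataset; on the lab data you would call sapply(combined_data, class) the same way:

```r
# Apply class() to every column; returns a named character vector
sapply(iris, class)
```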





In fox_data, create a new column called 'Consumption' which will contain values of avfood divided by weight, i.e. Consumption = avfood/weight






What is the mean Consumption?


group_by() and summarize() functions

Many data analysis tasks can be approached using the split-apply-combine paradigm:

  1. split the data into groups
  2. apply some analysis to each group
  3. combine the results.

dplyr makes this very easy through the use of the group_by() function. group_by() takes an existing data frame and converts it into a "grouped" data frame where operations are performed "by group".

group_by() is often used together with summarize(), which collapses each group into a single-row summary of that group. group_by() takes as arguments the column names that contain the categorical variables for which you want to calculate the summary statistics.

In the example below, we compute the mean and standard deviation of Photosynthesis measurements by Treatment.
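A sketch of the grouped summary (na.rm = TRUE guards against missing values):

```r
combined_data %>%
  group_by(Treatment) %>%
  summarize(mean_photo = mean(Photosynthesis, na.rm = TRUE),
            sd_photo   = sd(Photosynthesis, na.rm = TRUE))
```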




What would the code inside the summarise function look like if we wanted to get the mean of Conductance?

Let's take a look at our data graphically. We notice that the solid horizontal lines representing our average Wet and Drought values don't line up with the boxplot median. This indicates that our data might not be normally distributed. We may want to use the median() function to find the midpoint of the data instead.


We can also group by multiple columns.
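Extra grouping columns are simply listed in group_by(); for example, by both Treatment and Species (a sketch using the median, as suggested above):

```r
combined_data %>%
  group_by(Treatment, Species) %>%
  summarize(median_photo = median(Photosynthesis, na.rm = TRUE))
```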





What would the code inside the group_by function look like if we wanted to group by both Date, Treatment and Species?

We can also arrange the values in order of median photosynthesis using the arrange() function. To sort in descending order, we need to add the desc() function.
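A sketch, piping the grouped summary straight into arrange() (median_photo is a placeholder name for the summary column):

```r
combined_data %>%
  group_by(Treatment, Species) %>%
  summarize(median_photo = median(Photosynthesis, na.rm = TRUE)) %>%
  arrange(desc(median_photo))
```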


Here is a table of some useful functions you can use with summarize.



Using the help section, what would your arrange function code look like to arrange median in ascending order?




In fox_data, find the mean weight by sex of the fox population.






What is the mean weight of Male foxes?


Counting observations

When working with data, we often want to know the number of observations found for each factor or combination of factors. For this task, dplyr provides count(). Let's summarise the number of measurements made for each plant on each day.
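A sketch of the count, assuming the plant identifier column is `Plant Number` as in the join criteria earlier:

```r
combined_data %>%
  count(`Plant Number`, Date)
```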


We can also use summarise() and n() with group_by() to attain similar results.
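The equivalent group_by() version (same column-name assumptions as above):

```r
combined_data %>%
  group_by(`Plant Number`, Date) %>%
  summarise(count = n())
```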


There should be at least 10 measurements per plant per day (count >= 10). Say we wanted to see how many plants there were per Treatment and Species; we could use the function n_distinct() to count unique instances and remove duplicates.
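A sketch of the distinct-plant count per Treatment and Species:

```r
combined_data %>%
  group_by(Treatment, Species) %>%
  summarise(n_plants = n_distinct(`Plant Number`))
```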


We can proceed with arrange() to sort the table according to a number of criteria so that we have a better comparison. For instance, we might want to arrange the table above in:

  1. by Treatment and,
  2. in descending order of the count:


Let's see how many samples were taken for each species and treatment for each value of Days after inoculation.




What is the difference between the functions n() and n_distinct()?

Preliminary data examination

Now that we've got the basics down, let's play around with our data.

Mean per plant

Let's take a look at the mean photosynthesis value per plant while keeping our other variables of interest. Here we are calculating an average for each plant. Note that we did not use the same plants every time we took measurements (1DroughtControl1 was only measured on days 9 and 22). We could only measure <30 plants per day, so we randomly selected them from the treatments each time we went to measure.



Each plant is a sampling unit, so we want to conduct our analysis with a single value for each plant. If we include each measurement as a separate observation, we are incorporating pseudoreplication, because the measurements were not independent (10 measurements were made on a single plant; therefore, each measurement is dependent on the plant).

Mean per group

Ok now that we have the means per plant, we can look at the means per trial, treatment, etc.


If there was only one plant in a group, the standard deviation (sd) could not be calculated because there is no variation. Some of the data might be missing, and we would need to address this in a real analysis.

We can plot the mean values from each Species and each Treatment on each day they were measured.


This plot reveals some concerns: only control plants were measured on day 3, and no control plants were measured on day 5. Only one group of plants was measured on day 36. There are lots of errors in the data, demonstrating the importance of exploring your data graphically!

Let's see if we can add estimates of error to our measurements.



Exporting data

Now that you have learned how to use dplyr to extract information from or summarize your raw data, you may want to export these new data sets to share them with your collaborators or for archival.

Similar to the read_csv() function used for reading CSV files into R, there is a write_csv() function that generates CSV files from data frames.

Before using write_csv(), we are going to create a new folder, data_cleaned, in our working directory that will store this generated dataset. We don't want to write generated datasets in the same directory as our raw data; it's good practice to keep them separate. The folder for raw data should only contain the raw, unaltered data, and should be left alone to make sure we don't delete or modify it. In contrast, our script will generate the contents of the data_cleaned directory, so even if the files it contains are deleted, we can always re-generate them.

Let's create a new folder/directory called data_cleaned using the dir.create function.

Now that our dataset and the data_cleaned folder are ready, we can save the dataset as a CSV file in that folder.
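A sketch of both steps; the object and output file names here (data_filtered, data_filtered.csv) are placeholders for whichever dataset you want to export:

```r
# Create the folder (only needed once; warns if it already exists)
dir.create("data_cleaned")

# Write the cleaned dataset as a CSV file inside that folder
write_csv(data_filtered, "data_cleaned/data_filtered.csv")
```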

This is the end of the lab.


Code below is for formatting of this lab. Do not alter!