Skip to content

Commit

Permalink
Merge pull request #10 from waldronlab/sdgamboa/update-vignette
Browse files Browse the repository at this point in the history
Sdgamboa/update vignette
  • Loading branch information
lwaldron committed May 9, 2023
2 parents a0bcb48 + 551444c commit ac03151
Show file tree
Hide file tree
Showing 14 changed files with 2,238 additions and 67 deletions.
1 change: 1 addition & 0 deletions .Rbuildignore
Original file line number Diff line number Diff line change
@@ -1,2 +1,3 @@
^.*\.Rproj$
^\.Rproj\.user$
^html_docs$
1 change: 0 additions & 1 deletion .gitignore
Original file line number Diff line number Diff line change
@@ -1,4 +1,3 @@
*_cache*
*.html
.Rproj.user
.Rhistory
2 changes: 1 addition & 1 deletion DESCRIPTION
Original file line number Diff line number Diff line change
Expand Up @@ -10,7 +10,7 @@ Description: Reproduces analysis from Audrey Renson's and Francesco Beghini's ma
License: Artistic-2.0
Encoding: UTF-8
LazyData: true
RoxygenNote: 6.1.0
RoxygenNote: 7.2.3
Depends:
Biobase,
phyloseq,
Expand Down
35 changes: 28 additions & 7 deletions R/loadQiimeData.R
Original file line number Diff line number Diff line change
@@ -1,12 +1,33 @@
#' Import NYC HANES-II microbiome data as a \code{phyloseq} object.

#' Import
#'
#' \code{loadQiimeData} imports NYC HANES-II microbiome data as a
#' \code{phyloseq} object
#'
#' @return A phyloseq object.
#' @export
loadQiimeData <- function(metadata = sas7bdat::read.sas7bdat("http://nychanes.org/wp-content/uploads/sites/6/2018/01/public_v2_010518.sas7bdat")){

otu_table <- system.file("extdata","otu_table_mc10_w_tax.biom", package="nychanesmicrobiome", mustWork = TRUE)
tree_otu <- system.file("extdata","rep_set.tre", package="nychanesmicrobiome", mustWork = TRUE)
rep_set <- system.file("extdata","rep_set.fna", package="nychanesmicrobiome", mustWork = TRUE)

#'
#' @examples
#'
#' nychanes <- loadQiimeData()
#'
loadQiimeData <- function() {
metadata_fname <- system.file(
'extdata', 'public_v2_010518.sas7bdat', package = 'nychanesmicrobiome'
)
metadata <- sas7bdat::read.sas7bdat(metadata_fname)
otu_table <- system.file(
"extdata", "otu_table_mc10_w_tax.biom",
package = "nychanesmicrobiome", mustWork = TRUE
)
tree_otu <- system.file(
"extdata", "rep_set.tre",
package = "nychanesmicrobiome",
mustWork = TRUE
)
rep_set <- system.file(
"extdata", "rep_set.fna", package = "nychanesmicrobiome", mustWork = TRUE
)
phylo <- import_biom(BIOMfilename = otu_table,
treefilename = read_tree(tree_otu),
refseqfilename = rep_set,
Expand Down

Large diffs are not rendered by default.

Binary file not shown.

Large diffs are not rendered by default.

25 changes: 19 additions & 6 deletions man/get_edgeR_results.Rd

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

16 changes: 12 additions & 4 deletions man/loadQiimeData.Rd

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

22 changes: 17 additions & 5 deletions man/plot_abundance.Rd

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

10 changes: 8 additions & 2 deletions man/plot_alpha_by.Rd

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

15 changes: 12 additions & 3 deletions man/plot_edgeR.Rd

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

10 changes: 8 additions & 2 deletions man/prettytable_autoindent.Rd

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

88 changes: 52 additions & 36 deletions vignettes/smoking.Rmd
Original file line number Diff line number Diff line change
Expand Up @@ -21,37 +21,42 @@ editor_options:
```{r setup, include=FALSE}
knitr::opts_chunk$set(
cache = TRUE,
echo = FALSE,
message = FALSE,
warning = FALSE
)
```

```{r loading, include=FALSE}
suppressPackageStartupMessages({
library(nychanesmicrobiome)
library(dplyr)
})
```{r loading, include=FALSE, message=FALSE}
library(nychanesmicrobiome)
library(dplyr)
scale_palette <- c("#e41a1c","#377eb8","#4daf4a","#984ea3","#ff7f00")
theme_transparent <- ggplot2::theme(axis.title = ggplot2::element_text(colour = "white"),
axis.text = ggplot2::element_text(colour = "white"),
title = ggplot2::element_text(colour = "white"),
legend.text = ggplot2::element_text(colour = "white"),
axis.ticks = ggplot2::element_line(colour = "white"),
panel.border = ggplot2::element_rect(colour = "white"),
panel.background = ggplot2::element_rect(fill = "transparent",colour = NA),
plot.background = ggplot2::element_rect(fill = "transparent",colour = NA),
legend.background = ggplot2::element_rect(fill = "transparent",colour = NA),
legend.key = ggplot2::element_rect(fill = "transparent",colour = NA),
panel.grid = ggplot2::element_blank())
theme_transparent <- ggplot2::theme(
axis.title = ggplot2::element_text(colour = "white"),
axis.text = ggplot2::element_text(colour = "white"),
title = ggplot2::element_text(colour = "white"),
legend.text = ggplot2::element_text(colour = "white"),
axis.ticks = ggplot2::element_line(colour = "white"),
panel.border = ggplot2::element_rect(colour = "white"),
panel.background = ggplot2::element_rect(fill = "transparent",colour = NA),
plot.background = ggplot2::element_rect(fill = "transparent",colour = NA),
legend.background = ggplot2::element_rect(fill = "transparent",colour = NA),
legend.key = ggplot2::element_rect(fill = "transparent",colour = NA),
panel.grid = ggplot2::element_blank()
)
```

```{r Data loading, message=FALSE, warning=FALSE, include=FALSE}
NYC_HANES <- loadQiimeData() %>% annotateFactors(.)
NYC_HANES <- loadQiimeData() %>%
annotateFactors()
# Extract alternative smokers who also smoke cigarettes and remove them
alt_smokers_cigarettes <- sample_data(NYC_HANES) %>% dplyr::filter(smokingstatus == 'Alternative smoker') %>% dplyr::filter(CIGARETTES == 'Yes') %>% dplyr::select(Burklab_ID) %>% t
alt_smokers_cigarettes <- NYC_HANES |>
sample_data() |>
data.frame() |>
dplyr::filter(smokingstatus == 'Alternative smoker') |>
dplyr::filter(CIGARETTES == 'Yes') |>
dplyr::select(Burklab_ID) |>
t()
NYC_HANES <- prune_samples(!(sample_names(NYC_HANES) %in% alt_smokers_cigarettes), NYC_HANES)
sample_data(NYC_HANES)$smokingstatus <- relevel(sample_data(NYC_HANES)$smokingstatus,"Never smoker")
Expand Down Expand Up @@ -326,21 +331,20 @@ plot(
```{r permanova, echo=FALSE, message=FALSE, warning=FALSE, cache=F}
metadata <- as(sample_data(NYC_HANES), "data.frame")
permanova.res <- data.frame()
for (s in combn(levels(metadata$smokingstatus), 2, simplify = FALSE)) {
metadata_2cat <- metadata[metadata$smokingstatus %in% s, ]
distwu_2cat <-
phyloseq::distance(subset_samples(NYC_HANES, smokingstatus %in% s), "wunifrac")
permanova <-
vegan::adonis(
distwu_2cat <- phyloseq::distance(
subset_samples(NYC_HANES, smokingstatus %in% s), "wunifrac"
)
permanova <- vegan::adonis2(
formula = distwu_2cat ~ smokingstatus + OHQ_3 + RACE + GENDER + AGEGRP4C + SR_ACTIVE + EDU3CAT + DBTS_NEW,
data = metadata_2cat
)
)
permanova.res %<>% bind_rows(
data.frame(
contrast = stringr::str_c(s, collapse = " vs "),
r2 = permanova$aov.tab[1, 5],
pvalue = permanova$aov.tab[1, 6]
r2 = permanova[1, 'R2'],
pvalue = permanova[1, 'Pr(>F)']
)
) %>% arrange(pvalue)
}
Expand All @@ -354,7 +358,7 @@ metadata_2cat <- metadata[metadata$smokingstatus %in% s, ]
distwu_2cat <-
phyloseq::distance(subset_samples(NYC_HANES, smokingstatus %in% s), "wunifrac")
permanova <-
vegan::adonis(data = metadata_2cat, distwu_2cat ~ COTININE)
vegan::adonis2(data = metadata_2cat, distwu_2cat ~ COTININE)
permanova
```

Expand All @@ -367,15 +371,15 @@ distwu_3cat <-
NYC_HANES,
smokingstatus %in% c("Cigarette", "Never smoker", "Former smoker")
), "wunifrac")
vegan::adonis(
vegan::adonis2(
distwu_3cat ~ smokingstatus + RACE + GENDER + AGEGRP4C + SR_ACTIVE + EDU3CAT + DBTS_NEW,
metadata_3cat
)
```

#### All categories
```{r permanovaallcat, echo=FALSE, message=FALSE, warning=FALSE}
vegan::adonis(distwu ~ smokingstatus, metadata)
vegan::adonis2(distwu ~ smokingstatus, metadata)
```

# Differential analysis
Expand Down Expand Up @@ -1277,7 +1281,10 @@ epitools::epitab(x)
## Cigarette smokers vs Never smokers
### GSEA
```{r create GSEA objects, echo=FALSE, message=FALSE, warning=FALSE, cache=FALSE, paged.print=FALSE}
full_eset <- ExpressionSet(assayData = otu_table(NYC_HANES), phenoData = new("AnnotatedDataFrame", sample_data(NYC_HANES)))
full_eset <- ExpressionSet(
assayData = microbiome::abundances(NYC_HANES),
phenoData = new("AnnotatedDataFrame", sample_data(NYC_HANES))
)
full_eset$CATCOTININE <- ifelse(full_eset$COTININE < 3,'low','high')
full_annotated_ds <- tax_table(NYC_HANES) %>% as.data.frame %>% bind_cols(data.frame(OTU=rownames(tax_table(NYC_HANES)))) %>% filter(Domain != "Unassigned") %>% left_join(biosis, by = c("Genus"="X1"))
Expand Down Expand Up @@ -1318,7 +1325,8 @@ expr = expr[SummarizedExperiment::rowData(de.sns_eset)$ADJ.PVAL <= 0.05,]
grp = factor(de.sns_eset$GROUP, labels = c('Never smoker','Cigarette'))
expr <- t(scale(t(expr)))
expr <- expr[rownames(expr) %in% unlist(sns.gsea.res$gs$aero), ]
# expr <- expr[rownames(expr) %in% unlist(sns.gsea.res$gs$aero), ]
expr <- expr[rownames(expr) %in% unlist(sns.gsea.res$gs), ]
coll <- c("#B62A84", "#2AB68C")
names(coll) <- levels(grp)
Expand Down Expand Up @@ -1409,15 +1417,23 @@ topTable(sns.nc.fit)
```

```{r Data reloading, message=FALSE, warning=FALSE, include=FALSE}
NYC_HANES <- loadQiimeData() %>% annotateFactors(.)
alt_smokers_cigarettes <- sample_data(NYC_HANES) %>% dplyr::filter(smokingstatus == 'Alternative smoker') %>% dplyr::filter(CIGARETTES == 'Yes') %>% dplyr::select(Burklab_ID) %>% t
NYC_HANES <- loadQiimeData() |>
annotateFactors()
alt_smokers_cigarettes <- NYC_HANES |>
sample_data() |>
data.frame() |>
dplyr::filter(smokingstatus == 'Alternative smoker') |>
dplyr::filter(CIGARETTES == 'Yes') |>
dplyr::select(Burklab_ID) |>
t()
NYC_HANES <- prune_samples(!(sample_names(NYC_HANES) %in% alt_smokers_cigarettes), NYC_HANES)
sample_data(NYC_HANES)$smokingstatus <- relevel(sample_data(NYC_HANES)$smokingstatus,"Never smoker")
NYC_HANES.alt <- subset_samples(NYC_HANES, smokingstatus %in% c("Never smoker", "Alternative smoker"))
levels(sample_data(NYC_HANES.alt)$smokingstatus) <- c('Never','Alternative')
full_eset <- ExpressionSet(assayData = otu_table(NYC_HANES), phenoData = new("AnnotatedDataFrame", sample_data(NYC_HANES)))
full_eset <- ExpressionSet(assayData = microbiome::abundances(NYC_HANES), phenoData = new("AnnotatedDataFrame", sample_data(NYC_HANES)))
full_eset$CATCOTININE <- ifelse(full_eset$COTININE < 3,'low','high')
full_annotated_ds <- tax_table(NYC_HANES) %>% as.data.frame %>% bind_cols(data.frame(OTU=rownames(tax_table(NYC_HANES)))) %>% filter(Domain != "Unassigned") %>% left_join(biosis, by = c("Genus"="X1"))
Expand Down

0 comments on commit ac03151

Please sign in to comment.