0 收听	12 听众	278 主题

dada2物种分类鉴定

发表于 2023-5-11 20:26:12 | 查看: 1197| 回复: 0

本帖最后由生信喵于 2023-5-11 21:02 编辑

物种分类鉴定

#方法一:dada2自带注释函数,官网下载
#https://benjjneb.github.io/dada2/training.html
# taxa <- assignTaxonomy(seqtab.nochim, "MiSeq_SOP/tax/silva_nr99_v138.1_train_set.fa.gz", multithread=12)
# taxa <- addSpecies(taxa, "MiSeq_SOP/tax/silva_species_assignment_v138.1.fa.gz")
#
# taxa.print <- taxa
# rownames(taxa.print) <- NULL
# head(taxa.print)
#方法二： DECIPHER
download.file(url="http://www2.decipher.codes/Classification/TrainingSets/SILVA_SSU_r138_2019.RData", destfile="SILVA_SSU_r138_2019.RData")
#加载CECIPHER SILVA库
load("SILVA_SSU_r138_2019.RData")
#加载DECIPHER
library(DECIPHER)
packageVersion("DECIPHER")
#创建dna序列
dna <- DNAStringSet(getSequences(seqtab.nochim))
ids <- IdTaxa(dna, trainingSet, strand="top", processors=12, verbose=FALSE)
ranks <- c("domain", "phylum", "class", "order", "family", "genus", "species") # ranks of interest
# Convert the output object of class "Taxa" to a matrix analogous to the output from assignTaxonomy
taxid <- t(sapply(ids, function(x) {
m <- match(ranks, x$rank)
taxa <- x$taxon[m]
taxa[startsWith(taxa, "unclassified_")] <- NA
taxa
}))
colnames(taxid) <- ranks
rownames(taxid) <- getSequences(seqtab.nochim)

复制代码

评估结果

unqs.mock <- seqtab.nochim["Mock",]
unqs.mock <- sort(unqs.mock[unqs.mock>0], decreasing=TRUE)
cat("DADA2 inferred", length(unqs.mock), "sample sequences present in the Mock community.\n")
mock.ref <- getSequences(file.path(path, "HMP_MOCK.v35.fasta"))
match.ref <- sum(sapply(names(unqs.mock), function(x) any(grepl(x, mock.ref))))
cat("Of those,", sum(match.ref), "were exact matches to the expected reference sequences.\n")

复制代码

画树

复制代码

		自动登录	找回密码
密码			立即注册