For many of my sequences in my 18S analysis, when i run the classify.otu command I receive a lot of messages like
[WARNING]: M02149_449_000000000-AURT8_1_1101_18396_3602 is not in your taxonomy file. I will not include it in the consensus.
I mean a LOT.
<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<^>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<^>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<^>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
Detected 21788 [WARNING] messages, please review.
<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<^>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<^>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
<<<<<<<<<<<<<<<<<<<<<<<<<<<<<<^>>>>>>>>>>>>>>>>>>>>>>>>>>>>>
As you can see in my command file, I removed the Bacteria, Archaea, and unknowns before the cluster.spilt, so I don’t know why there are sequences in the shared file that aren’t in the taxonomy file. Any ideas?
make.contigs(ffastq=Run3_18S_R1.fastq, rfastq=Run3_18S_R2.fastq, rindex=Run3_18S_I1.fastq, oligos=Run3_18S_oligos.txt, processors=2)
summary.seqs(fasta=Run3_18S_R1.trim.contigs.fasta)
get.groups(fasta=Run3_18S_R1.trim.contigs.fasta, group=Run3_18S_R1.contigs.groups, groups=WED01-WED02-WED03-WED04-WED05-WED06-WED07-WED08-WED09-WED10-WED11-WED12-WED13-WED14-WED15-WED16-WED17-WED18-WED19-WED20-WED21-WED22-WED23-WED24-WED25-WED26-WED27-WED28-WED29-WED30-WED31-WED32)
screen.seqs(fasta=Run3_18S_R1.trim.contigs.pick.fasta, group=Run3_18S_R1.contigs.pick.groups, maxambig=0, maxlength=260, processors=2)
unique.seqs(fasta=Run3_18S_R1.trim.contigs.pick.good.fasta)
count.seqs(name=Run3_18S_R1.trim.contigs.pick.good.names, group=Run3_18S_R1.contigs.pick.good.groups)
summary.seqs(fasta=Run3_18S_R1.trim.contigs.pick.good.unique.fasta, count=Run3_18S_R1.trim.contigs.pick.good.count_table)
align.seqs(processors=2, fasta=Run3_18S_R1.trim.contigs.pick.good.unique.fasta, reference=silva.nr_v132.euk.align)
summary.seqs(processors=2, fasta=Run3_18S_R1.trim.contigs.pick.good.unique.align, count=Run3_18S_R1.trim.contigs.pick.good.count_table)
screen.seqs(fasta=Run3_18S_R1.trim.contigs.pick.good.unique.align, count=Run3_18S_R1.trim.contigs.pick.good.count_table, summary=Run3_18S_R1.trim.contigs.pick.good.unique.summary, start=15794, end=16431, maxhomop=6)
summary.seqs(fasta=Run3_18S_R1.trim.contigs.pick.good.unique.good.align, count=Run3_18S_R1.trim.contigs.pick.good.good.count_table)
filter.seqs(fasta=Run3_18S_R1.trim.contigs.pick.good.unique.good.align, vertical=T, trump=.)
unique.seqs(fasta= Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.fasta, count=Run3_18S_R1.trim.contigs.pick.good.good.count_table)
pre.cluster(processors=1, fasta=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.fasta, count=Run3_18S_R1.trim.contigs.pick.good.good.count_table, diffs=2)
chimera.vsearch(fasta=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.fasta, count=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.count_table, dereplicate=t)
remove.seqs(fasta=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.fasta, accnos=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.denovo.vsearch.accnos)
classify.seqs(fasta=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.fasta, count=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.denovo.vsearch.pick.count_table, reference=silva.nr_v132.euk.align, taxonomy=silva.nr_v132.euk.tax, cutoff=80, processors=2)
remove.lineage(fasta=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.fasta, count=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.denovo.vsearch.pick.count_table, taxonomy=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.euk.wang.taxonomy, taxon=Bacteria-unknown-Archaea)
cluster.split(fasta=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.pick.fasta, count=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.denovo.vsearch.pick.pick.count_table, taxonomy=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.euk.wang.pick.taxonomy, splitmethod=classify, taxlevel=4, cutoff=0.03, processors=2, runsensspec=f)
make.shared(list=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.pick.opti_mcc.unique_list.list, count=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.denovo.vsearch.pick.pick.count_table, label=0.03)
classify.otu(list=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.pick.opti_mcc.unique_list.list, count=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.denovo.vsearch.pick.pick.count_table, taxonomy=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.euk.wang.pick.taxonomy, label=0.03)
count.groups(shared=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.pick.opti_mcc.unique_list.shared)
rarefaction.single(shared=Run3_18S_R1.trim.contigs.pick.good.unique.good.filter.unique.precluster.pick.pick.opti_mcc.unique_list.shared)