for n in *.flow; do o=`basename $n .flow`.oligos; mothur "# trim.flows(flow=$n, oligos=$o, pdiffs=2, bdiffs=1, processors=2, minflows=300, maxflows=450)"; done
for n in *.flow.files; do mothur "# shhh.flows(file=$n, processors=4)"; done
for n in ?????????.shhh.fasta; do o=`basename $n .shhh.fasta`.oligos; m=`basename $n .fasta`.names; mothur "# trim.seqs(fasta=$n, oligos=$o, name=$m, pdiffs=2, bdiffs=1, maxhomop=8, minlength=200)"; done
for n in ?????????.shhh.trim.fasta; do m=`basename $n .fasta`.names; mothur "# unique.seqs(fasta=$n, name=$m)"; done
for n in ?????????.shhh.trim.unique.fasta; do mothur "# align.seqs(fasta=$n, reference=silva.bacteria.fasta, flip=T, processors=4)"; done
for n in ?????????.shhh.trim.unique.align; do mothur "# summary.seqs(fasta=$n)"; done ### bac start 1044 97.5% end by 6111
for n in *.shhh.trim.unique.align; do g=`basename $n .trim.unique.align`.groups; m=`basename $n .align`.names; mothur "#screen.seqs(fasta=$n, name=$m, group=$g, start=1044, processors=4)"; done
for n in *.shhh.trim.unique.good.align; do mothur "#filter.seqs(fasta=$n, vertical=T)"; done
for n in *.shhh.trim.unique.good.filter.fasta; do m=`basename $n .filter.fasta`.names; mothur "#unique.seqs(fasta=$n, name=$m)"; done
for n in *.shhh.trim.unique.good.filter.unique.precluster.fasta; do m=`basename $n .trim.unique.good.filter.unique.precluster.fasta`.trim.unique.good.filter.unique.precluster.names; g=`basename $n .trim.unique.good.filter.unique.precluster.fasta`.good.groups; mothur "#chimera.uchime(fasta=$n, name=$m, group=$g, processors=4)"; done
for n in *.shhh.trim.unique.good.filter.unique.precluster.uchime.accnos; do m=`basename $n .trim.unique.good.filter.unique.precluster.uchime.accnos`.trim.unique.good.filter.unique.precluster.names; f=`basename $n .trim.unique.good.filter.unique.precluster.uchime.accnos`.trim.unique.good.filter.unique.precluster.fasta; g=`basename $n .trim.unique.good.filter.unique.precluster.uchime.accnos`.good.groups; mothur "#remove.seqs(accnos=$n, fasta=$f, name=$m, group=$g)"; done
for n in *.shhh.trim.unique.good.filter.unique.precluster.pick.fasta; do m=`basename $n .trim.unique.good.filter.unique.precluster.pick.fasta`.trim.unique.good.filter.unique.precluster.pick.names; g=`basename $n .trim.unique.good.filter.unique.precluster.pick.fasta`.good.pick.groups; mothur "#classify.seqs(fasta=$n, name=$m, group=$g, template=silva.bacteria.fasta, taxonomy=silva.bacteria.silva.tax, cutoff=50, processors=2)"; done
for n in *.shhh.trim.unique.good.filter.unique.precluster.pick.fasta; do m=`basename $n .trim.unique.good.filter.unique.precluster.pick.fasta`.trim.unique.good.filter.unique.precluster.pick.names; g=`basename $n .trim.unique.good.filter.unique.precluster.pick.fasta`.good.pick.groups; t=`basename $n .trim.unique.good.filter.unique.precluster.pick.fasta`.trim.unique.good.filter.unique.precluster.pick.silva.taxonomy; mothur "#remove.lineage(fasta=$n, name=$m, group=$g, taxonomy=$t, taxon=Mitochondria-Cyanobacteria_Chloroplast-Archaea-Eukarya-unknown)"; done
cat *.pick.pick.names > bc_bac.names
cat *.pick.pick.fasta > bc_bac.fasta
cat *.pick.taxonomy > bc_bac.tax
cat *.pick.pick.groups > bc_bac.groups
#switch to mothur now that I'm down to one set of file
## need to realign because they're not all the same length
align.seqs(fasta=bc_bac.fasta, reference=silva.bacteria.fasta, processors=4)
screen.seqs(fasta=current, name=current, group=bc_bac.groups, start=1044, processors=4)
filter.seqs(fasta=bc_bac.good.align, vertical=T)
cluster.split(fasta=bc_bac.good.align, name=bc_bac.good.names, taxonomy=bc_bac.pick.tax, countends=F, splitmethod=fasta, taxlevel=3, processors=2)