Feature Classifiers for the variable regions of Prokaryotic 16S rRNA genes.
Download SILVA data
qiime rescript get-silva-data --p-version '138' --p-target 'SSURef_NR99' --p-include-species-labels --o-silva-sequences silva-138-ssu-nr99-seqs.qza --o-silva-taxonomy silva-138-ssu-nr99-tax.qza
Remove low quality sequences
qiime rescript cull-seqs --i-sequences silva-138-ssu-nr99-seqs.qza --o-clean-sequences silva-138-ssu-nr99-seqs-cleaned.qza
Remove Eukaryotic taxa
qiime taxa filter-seqs --i-sequences silva-138-ssu-nr99-seqs-cleaned.qza --i-taxonomy silva-138-ssu-nr99-tax.qza --p-exclude 'd__Eukaryota' --p-mode 'contains' --o-filtered-sequences silva138_noEuk_seqs.qza
Filter by length
qiime rescript filter-seqs-length-by-taxon --i-sequences silva138_noEuk_seqs.qza --i-taxonomy silva-138-ssu-nr99-tax.qza --p-labels Archaea Bacteria --p-min-lens 900 1200 --o-filtered-seqs silva138_noEuk_AB_seqs.qza --o-discarded-seqs silva138_noEuk_AB_seqs_discard.qza
Dereplicate
Mode: uniq; rank handles: default (silva)
qiime rescript dereplicate --i-sequences silva138_noEuk_AB_seqs.qza --i-taxa silva-138-ssu-nr99-tax.qza --p-threads 12 --o-dereplicated-sequences silva138_noEuk_AB_seqs_uniq.qza --o-dereplicated-taxa silva138_noEuk_AB_tax_uniq.qza
Dereplicated Sequences: silva138_noEuk_AB_seqs_uniq.qza
Dereplicated Taxa: silva138_noEuk_AB_tax_uniq.qza
Extract the V1-V2 region
qiime feature-classifier extract-reads --i-sequences silva138_noEuk_AB_seqs_uniq.qza --p-f-primer AGAGTTTGATCMTGGCTCAG --p-r-primer TGCTGCCTCCCGTAGGAGT --p-n-jobs 12 --o-reads silva138_AB_V1-V2seqs.qza
Output: silva138_AB_V1-V2seqs.qza
Dereplicate the target region
qiime rescript dereplicate --i-sequences silva138_AB_V1-V2seqs.qza --i-taxa silva138_noEuk_AB_tax_uniq.qza --o-dereplicated-sequences silva138_AB_V1-V2seqs_uniq.qza --o-dereplicated-taxa silva138_AB_V1-V2taxa_uniq.qza
Dereplicated Sequences: silva138_AB_V1-V2seqs_uniq.qza
Dereplicated Taxa: silva138_AB_V1-V2taxa_uniq.qza
Classify & evaluate with RESCRIPt
qiime rescript evaluate-fit-classifier --i-sequences silva138_AB_V1-V2seqs_uniq.qza --i-taxonomy silva138_AB_V1-V2taxa_uniq.qza --o-classifier silva138_AB_V1-V2_classifier.qza --o-observed-taxonomy silva138_AB_V1-V2_predicted_taxonomy.qza --o-evaluation silva138_AB_V1-V2_classifier_eval.qzv
Classifier: silva138_AB_V1-V2_classifier.qza
Predicted Taxonomy: silva138_AB_V1-V2_predicted_taxonomy.qza
Evaluation: silva138_AB_V1-V2_classifier_eval.qzv
Extract the V3 region
qiime feature-classifier extract-reads --i-sequences silva138_noEuk_AB_seqs_uniq.qza --p-f-primer CCTACGGGNGGCWGCAG --p-r-primer GTATTACCGCGGCTGCTGG --p-n-jobs 12 --o-reads silva138_AB_V3seqs.qza
Output: silva138_AB_V3seqs.qza
Dereplicate the target region
qiime rescript dereplicate --i-sequences silva138_AB_V3seqs.qza --i-taxa silva138_noEuk_AB_tax_uniq.qza --o-dereplicated-sequences silva138_AB_V3seqs_uniq.qza --o-dereplicated-taxa silva138_AB_V3taxa_uniq.qza
Dereplicated Sequences: silva138_AB_V3seqs_uniq.qza
Dereplicated Taxa: silva138_AB_V3taxa_uniq.qza
Classify & evaluate with RESCRIPt
qiime rescript evaluate-fit-classifier --i-sequences silva138_AB_V3seqs_uniq.qza --i-taxonomy silva138_AB_V3taxa_uniq.qza --o-classifier silva138_AB_V3_classifier.qza --o-observed-taxonomy silva138_AB_V3_predicted_taxonomy.qza --o-evaluation silva138_AB_V3_classifier_eval.qzv
Classifier: silva138_AB_V3_classifier.qza
Predicted Taxonomy: silva138_AB_V3_predicted_taxonomy.qza
Evaluation: silva138_AB_V3_classifier_eval.qzv
Extract the V3-V4 region
qiime feature-classifier extract-reads --i-sequences silva138_noEuk_AB_seqs_uniq.qza --p-f-primer CCTACGGGNGGCWGCAG --p-r-primer GACTACHVGGGTATCTAATCC --p-n-jobs 12 --o-reads silva138_AB_V3-V4seqs.qza
Output: silva138_AB_V3-V4seqs.qza
Dereplicate the target region
qiime rescript dereplicate --i-sequences silva138_AB_V3-V4seqs.qza --i-taxa silva138_noEuk_AB_tax_uniq.qza --o-dereplicated-sequences silva138_AB_V3-V4seqs_uniq.qza --o-dereplicated-taxa silva138_AB_V3-V4taxa_uniq.qza
Dereplicated Sequences: silva138_AB_V3-V4seqs_uniq.qza
Dereplicated Taxa: silva138_AB_V3-V4taxa_uniq.qza
Classify & evaluate with RESCRIPt
qiime rescript evaluate-fit-classifier --i-sequences silva138_AB_V3-V4seqs_uniq.qza --i-taxonomy silva138_AB_V3-V4taxa_uniq.qza --o-classifier silva138_AB_V3-V4_classifier.qza --o-observed-taxonomy silva138_AB_V3-V4_predicted_taxonomy.qza --o-evaluation silva138_AB_V3-V4_classifier_eval.qzv
Classifier: silva138_AB_V3-V4_classifier.qza
Predicted Taxonomy: silva138_AB_V3-V4_predicted_taxonomy.qza
Evaluation: silva138_AB_V3-V4_classifier_eval.qzv
Extract the V4 region
qiime feature-classifier extract-reads --i-sequences silva138_noEuk_AB_seqs_uniq.qza --p-f-primer GTGYCAGCMGCCGCGGTAA --p-r-primer GGACTACNVGGGTWTCTAAT --p-n-jobs 12 --o-reads silva138_AB_V4seqs.qza
Output: silva138_AB_V4seqs.qza
Dereplicate the target region
qiime rescript dereplicate --i-sequences silva138_AB_V4seqs.qza --i-taxa silva138_noEuk_AB_tax_uniq.qza --o-dereplicated-sequences silva138_AB_V4seqs_uniq.qza --o-dereplicated-taxa silva138_AB_V4taxa-uniq.qza --p-threads 12
Dereplicated Sequences: silva138_AB_V4seqs_uniq.qza
Dereplicated Taxa: silva138_AB_V4taxa-uniq.qza
Classify & evaluate with RESCRIPt
qiime rescript evaluate-fit-classifier --i-sequences silva138_AB_V4seqs_uniq.qza --i-taxonomy silva138_AB_V4taxa-uniq.qza --p-reads-per-batch 10000 --o-classifier silva138_AB_V4_classifier.qza --o-observed-taxonomy silva138_AB_V4_predicted_taxonomy.qza --o-evaluation silva138_AB_V4_classifier_eval.qzv
Classifier: silva138_AB_V4_classifier.qza
Predicted Taxonomy: silva138_AB_V4_predicted_taxonomy.qza
Evaluation: silva138_AB_V4_classifier_eval.qzv
Classifying & evaluating with RESCRIPt
Run with qiime_2023.5 on a Fedora 39 server.
qiime rescript evaluate-fit-classifier --i-sequences silva138_noEuk_AB_seqs_uniq.qza --i-taxonomy silva138_noEuk_AB_tax_uniq.qza --o-classifier silva138_noEuk_AB_classifier.qza --o-observed-taxonomy silva138_noEuk_AB_predicted_taxonomy.qza --o-evaluation silva138_noEuk_AB_classifier_eval.qzv --p-n-jobs 10
Classifier: silva138_noEuk_AB_classifier.qza
Predicted Taxonomy: silva138_noEuk_AB_predicted_taxonomy.qza
Evaluation: silva138_noEuk_AB_classifier_eval.qzv
(Except for the full-length classifier)
tmp: 50GB