#!/bin/bash
#SBATCH -t 4:00:00
#SBATCH --nodes=1 --ntasks-per-node=1
#SBATCH --mem=24g
#SBATCH --export=NONE
#SBATCH --mail-user=mramsey@uri.edu
#SBATCH --mail-type=BEGIN,END,FAIL

module load QIIME2/2019.7

tablein=/data/mramseylab/raw_reads/2018_Serum/Merge_runs/denoise-table-merge.qza
clsdir=/data/mramseylab/classifiers/
metadir=/data/mramseylab/metadata/
visdir=/data/mramseylab/visualizations/
filtdir=/data/mramseylab/proc_reads/
# filter status of input files, "ctrl-filter" is just for taxa belonging to no template controls
fil=ctrl-filter


#must make the directory you are filtering to 1st or else it will error
mkdir $filtdir$fil


qiime feature-table filter-samples \
  --i-table $tablein \
  --m-metadata-file $metadir\Serum5.tsv \
  --p-where "[Source]='Control'" \
  --o-filtered-table $filtdir$fil/$fil-table.qza

qiime taxa collapse \
  --i-table $filtdir$fil/$fil-table.qza \
  --i-taxonomy $clsdir\silva-mod-taxonomy.qza \
  --p-level 6 \
  --o-collapsed-table $filtdir$fil/$fil-collapse-table.qza

qiime feature-table relative-frequency \
  --i-table $filtdir$fil/$fil-collapse-table.qza \
  --o-relative-frequency-table $filtdir$fil/$fil-relative-collapse-table.qza

qiime tools export \
  --input-path $filtdir$fil/$fil-relative-collapse-table.qza \
  --output-path $filtdir$fil/

biom convert \
-i $filtdir$fil/feature-table.biom \
-o $filtdir$fil/$fil-relative-collapse-table.txt \
--header-key “taxonomy” \
--to-tsv

#Use above taxa table to filter out based on taxa present in controls

qiime feature-table filter-features \
  --i-table $tablein \
  --m-metadata-file $filtdir$fil/$fil-collapse-table.qza \
  --o-filtered-table $filtdir$fil/$fil-excluded-table.qza \
  --p-exclude-ids

#Use excluded table to generate barplot for checking

qiime taxa barplot \
  --i-table $filtdir$fil/$fil-excluded-table.qza \
  --i-taxonomy $clsdir\silva-mod-taxonomy.qza \
  --m-metadata-file $metadir\Serum5.tsv \
  --o-visualization $filtdir$fil/$fil-excluded-table.qzv
