#!/bin/bash

#
# Generated at: 2015-12-23T10:39:02
# This file was generated with the following options
#	--workflow	gemini.yml
#

#
# Samples: SAMPLE1, SAMPLE2, SAMPLE3
#
#
# Starting Workflow
#
#
# Global Variables:
#	ROOT: data/raw
#	indir: data/raw
#	outdir: data/processed
#	file_rule: (.vcf)$|(.vcf.gz)$
#

#
#

# Starting bgzip
#



#
# Variables 
# Indir: data/raw
# Outdir: data/processed/bgzip
#

bgzip data/raw/SAMPLE1.vcf && tabix data/raw/SAMPLE1.vcf.gz










wait

#
# Ending bgzip
#


#
#

# Starting normalize_snpeff
#



#
# Variables 
# Indir: {$self->ROOT}
# Outdir: data/processed/normalize_snpeff
# Local Variables:
#	indir: {$self->ROOT}
#	outdir: data/processed/normalize_snpeff
#

bcftools view data/raw/SAMPLE1.vcf.gz | sed 's/ID=AD,Number=./ID=AD,Number=R/' \
    | vt decompose -s - \
    | vt normalize -r $REFGENOME - \
    | java -Xmx4G -jar $SNPEFF/snpEff.jar -c \$SNPEFF/snpEff.config -formatEff -classic GRCh37.75  \
    | bgzip -c > \
    data/processed/normalize_snpeff/SAMPLE1.norm.snpeff.gz && tabix data/processed/normalize_snpeff/SAMPLE1.norm.snpeff.gz


bcftools view data/raw/SAMPLE2.vcf.gz | sed 's/ID=AD,Number=./ID=AD,Number=R/' \
    | vt decompose -s - \
    | vt normalize -r $REFGENOME - \
    | java -Xmx4G -jar $SNPEFF/snpEff.jar -c \$SNPEFF/snpEff.config -formatEff -classic GRCh37.75  \
    | bgzip -c > \
    data/processed/normalize_snpeff/SAMPLE2.norm.snpeff.gz && tabix data/processed/normalize_snpeff/SAMPLE2.norm.snpeff.gz


bcftools view data/raw/SAMPLE3.vcf.gz | sed 's/ID=AD,Number=./ID=AD,Number=R/' \
    | vt decompose -s - \
    | vt normalize -r $REFGENOME - \
    | java -Xmx4G -jar $SNPEFF/snpEff.jar -c \$SNPEFF/snpEff.config -formatEff -classic GRCh37.75  \
    | bgzip -c > \
    data/processed/normalize_snpeff/SAMPLE3.norm.snpeff.gz && tabix data/processed/normalize_snpeff/SAMPLE3.norm.snpeff.gz



wait

#
# Ending normalize_snpeff
#


#
#

# Starting gemini_sqlite
#



#
# Variables 
# Indir: data/processed/normalize_snpeff
# Outdir: data/processed/gemini_sqlite
#

gemini load -v data/processed/normalize_snpeff/SAMPLE1.norm.snpeff.gz \
    --skip-cadd -t snpEff \
   data/processed/gemini_sqlite/SAMPLE1.vcf.db


gemini load -v data/processed/normalize_snpeff/SAMPLE2.norm.snpeff.gz \
    --skip-cadd -t snpEff \
   data/processed/gemini_sqlite/SAMPLE2.vcf.db


gemini load -v data/processed/normalize_snpeff/SAMPLE3.norm.snpeff.gz \
    --skip-cadd -t snpEff \
   data/processed/gemini_sqlite/SAMPLE3.vcf.db



wait

#
# Ending gemini_sqlite
#

#
# Ending Workflow
#