https://github.com/arjunrajlaboratory/RajLabSeqTools
Revision d64c7115b852e3a269ed9e3c069a3485b34bbea5 authored by Eric Sanford on 10 October 2019, 18:04:36 UTC, committed by Eric Sanford on 10 October 2019, 18:04:36 UTC
1 parent c5b88eb
Tip revision: d64c7115b852e3a269ed9e3c069a3485b34bbea5 authored by Eric Sanford on 10 October 2019, 18:04:36 UTC
added location of hg19 reference files as comments to setEnvironmentVariables.sh script
added location of hg19 reference files as comments to setEnvironmentVariables.sh script
Tip revision: d64c711
unzipAndConcatenateZippedFastq.sh
#!/bin/bash
ZIPFILEDIRECTORY=$1
OUTFASTQDIRECTORY=$2
PAIRED_OR_SINGLE_END_FRAGMENTS=$3
echo "you selected the pipeline settings for" $PAIRED_OR_SINGLE_END_FRAGMENTS "end reads"
for dirname in $ZIPFILEDIRECTORY/* ; do
cd $dirname
INPUT=`ls *`
SAMPLE=${INPUT%%_*} # Cuts filename string after first '_'
if [ ! -d $OUTFASTQDIRECTORY/raw ]; then
mkdir $OUTFASTQDIRECTORY/raw
fi
if [ ! -d $OUTFASTQDIRECTORY/raw/$SAMPLE ]; then
mkdir $OUTFASTQDIRECTORY/raw/$SAMPLE
fi
FASTQR1=${SAMPLE}_R1.fastq
FASTQR2=${SAMPLE}_R2.fastq
if [ ! -e $OUTFASTQDIRECTORY/raw/$SAMPLE/$FASTQR1 ]; then
echo Working on $SAMPLE
for i in *.gz; do
gunzip -c $i > ${i%.*}
done
cat ./*R1*fastq > $OUTFASTQDIRECTORY/raw/$SAMPLE/$FASTQR1
rm ./*R1*fastq
if [ $PAIRED_OR_SINGLE_END_FRAGMENTS = "paired" ]; then
cat ./*R2*fastq > $OUTFASTQDIRECTORY/raw/$SAMPLE/$FASTQR2
rm ./*R2*fastq
fi
fi
# compress fastq after concatenation, since STAR can read compressed FASTQ files.
# submit this final compression task to cluster since compression takes a while
bsub gzip $OUTFASTQDIRECTORY/raw/$SAMPLE/$FASTQR1
if [ $PAIRED_OR_SINGLE_END_FRAGMENTS = "paired" ]; then
bsub gzip $OUTFASTQDIRECTORY/raw/$SAMPLE/$FASTQR2
fi
done

Computing file changes ...