https://github.com/arjunrajlaboratory/RajLabSeqTools
Revision f267e82b2edd18a28926b84fc23cb2b55bdbc9c3 authored by Ian Mellis on 05 January 2016, 20:38:56 UTC, committed by Ian Mellis on 05 January 2016, 20:38:56 UTC
1 parent f26732e
Raw File
Tip revision: f267e82b2edd18a28926b84fc23cb2b55bdbc9c3 authored by Ian Mellis on 05 January 2016, 20:38:56 UTC
Updated runHTSeq.sh to call shared version of hg19.gtf, rather than Syd's in CancerSeq repo. Made a note on Rajlabseqtools pipeline doc.
Tip revision: f267e82
unzipAndConcatenateZippedFastq.sh
#!/bin/bash
#
# unzipAndConcatenateZippedFastq.sh
#
# Usage: unzipAndConcatenateZippedFastq.sh ZIPFILEDIRECTORY OUTFASTADIRECTORY
#
# For every sub-directory of ZIPFILEDIRECTORY:
#   1. derive the sample name from the first file matching *001_R1*
#      (everything before the first '_' in that file name);
#   2. decompress each *.gz file next to its archive (the .gz is kept);
#   3. concatenate the decompressed reads, per read direction, into
#        OUTFASTADIRECTORY/raw/<sample>/<sample>_R1.fastq
#        OUTFASTADIRECTORY/raw/<sample>/<sample>_R2.fastq
#
# Exit status: 0 on success, 2 on missing arguments, 1 if any step failed.

ZIPFILEDIRECTORY=$1

OUTFASTADIRECTORY=$2

# Concatenate every file matching <src_dir>/*<read_tag>*fastq into <dest>.
# Arguments: $1 - directory holding the decompressed fastq files
#            $2 - read tag to match in the file name (R1 or R2)
#            $3 - path of the concatenated output file
# Returns:   0 on success, 1 if nothing matched or cat failed.
concat_reads() {
    local src_dir="$1" read_tag="$2" dest="$3"
    local -a parts

    parts=( "$src_dir"/*"$read_tag"*fastq )
    # Without nullglob an unmatched pattern stays literal, so test the first hit.
    if [[ ! -e "${parts[0]}" ]]; then
        printf 'warning: no %s fastq files in %s\n' "$read_tag" "$src_dir" >&2
        # Still create the (empty) output so the output layout is always the same.
        : > "$dest"
        return 1
    fi

    cat -- "${parts[@]}" > "$dest"
}

# Decompress and concatenate the fastq files of every sample directory.
# Arguments: $1 - directory whose sub-directories hold the zipped fastq files
#            $2 - output directory (created if missing)
# Returns:   0 on success, 2 on missing arguments, 1 if any step failed.
unzip_and_concatenate() {
    local zip_dir="$1" out_dir="$2"
    local sample_dir gz first sample dest
    local status=0
    local -a r1_inputs

    if [[ -z "$zip_dir" || -z "$out_dir" ]]; then
        printf 'Usage: %s ZIPFILEDIRECTORY OUTFASTADIRECTORY\n' "${0##*/}" >&2
        return 2
    fi
    if [[ ! -d "$zip_dir" ]]; then
        printf 'error: %s is not a directory\n' "$zip_dir" >&2
        return 1
    fi
    mkdir -p -- "$out_dir/raw" || return 1

    # The trailing slash restricts the glob to directories. Nothing below
    # changes the working directory, so relative arguments stay valid.
    for sample_dir in "$zip_dir"/*/; do
        [[ -d "$sample_dir" ]] || continue
        sample_dir=${sample_dir%/}

        r1_inputs=( "$sample_dir"/*001_R1* )
        if [[ ! -e "${r1_inputs[0]}" ]]; then
            printf 'warning: no *001_R1* file in %s, skipping\n' "$sample_dir" >&2
            status=1
            continue
        fi
        first=${r1_inputs[0]##*/}
        sample=${first%%_*}  # Keeps the file name up to the first '_'

        dest=$out_dir/raw/$sample
        if ! mkdir -p -- "$dest"; then
            status=1
            continue
        fi

        for gz in "$sample_dir"/*.gz; do
            [[ -e "$gz" ]] || continue
            # ${gz%.*} drops the trailing .gz, e.g. reads.fastq.gz -> reads.fastq
            if ! gunzip -c -- "$gz" > "${gz%.*}"; then
                printf 'error: failed to decompress %s\n' "$gz" >&2
                status=1
            fi
        done

        concat_reads "$sample_dir" R1 "$dest/${sample}_R1.fastq" || status=1
        concat_reads "$sample_dir" R2 "$dest/${sample}_R2.fastq" || status=1
    done

    return "$status"
}

unzip_and_concatenate "$ZIPFILEDIRECTORY" "$OUTFASTADIRECTORY"

back to top