Skip to content
Snippets Groups Projects
Commit eb740601 authored by Holger Brandl's avatar Holger Brandl
Browse files

cont helin project

parent 6a530e75
No related branches found
No related tags found
No related merge requests found
## docs
## http://blog.joncairns.com/2013/08/what-you-need-to-know-about-bash-functions/
## create fastq report for all fastq and fastq.gz files in the current directory ## create fastq report for all fastq and fastq.gz files in the current directory
dge_fastqc(){ dge_fastqc(){
...@@ -9,7 +12,7 @@ while getopts "o:" curopt; do ...@@ -9,7 +12,7 @@ while getopts "o:" curopt; do
done done
shift $(($OPTIND - 1)) shift $(($OPTIND - 1))
fastqFiles=$* local fastqFiles=$*
#if [ -z "$fastqFiles" ]; then #if [ -z "$fastqFiles" ]; then
if [ $# -lt 1 ]; then if [ $# -lt 1 ]; then
...@@ -48,21 +51,24 @@ mailme "fastqc done for $outputDir" ...@@ -48,21 +51,24 @@ mailme "fastqc done for $outputDir"
export -f dge_fastqc export -f dge_fastqc
#http://wiki.bash-hackers.org/howto/getopts_tutorial #http://wiki.bash-hackers.org/howto/getopts_tutorial
dge_tophat_se(){ dge_tophat_se(){
# http://stackoverflow.com/questions/18414054/bash-getopts-reading-optarg-for-optional-flags # http://stackoverflow.com/questions/18414054/bash-getopts-reading-optarg-for-optional-flags
echo $*
while getopts "i:" curopt; do while getopts "i:" curopt; do
case $curopt in case $curopt in
i) IGENOME=$OPTARG; i) IGENOME="$OPTARG";
esac esac
done done
shift $(($OPTIND - 1)) shift $(($OPTIND - 1))
fastqFiles=$* local fastqFiles=$*
echo fastq $fastqFiles
echo igenomes "$IGENOME"
if [ -z "$IGENOME" ] || [ -z "$fastqFiles" ]; if [ -z "$IGENOME" ] || [ -z "$fastqFiles" ];
then echo "Usage: dge_tophat_se -i <path to igenome> [<fastq.gz file>]+" >&2 ; return; then echo "Usage: dge_tophat_se -i <path to igenome> [<fastq.gz file>]+" >&2 ; return;
...@@ -84,6 +90,7 @@ fi ...@@ -84,6 +90,7 @@ fi
echo "running tophat using igenome '$IGENOME' for the following files" echo "running tophat using igenome '$IGENOME' for the following files"
ll $fastqFiles
#fastqFiles=$(ls $baseDir/treps_pooled/*fastq.gz) #fastqFiles=$(ls $baseDir/treps_pooled/*fastq.gz)
...@@ -95,12 +102,12 @@ for fastqFile in $fastqFiles ; do ...@@ -95,12 +102,12 @@ for fastqFile in $fastqFiles ; do
outputdir=$fastqBaseName outputdir=$fastqBaseName
## uniquely mapping reads only: http:/seqanswers.com/forums/showthread.php?s=93da11109ae12a773a128a637d69defe&t=3464 ## uniquely mapping reads only: http:/seqanswers.com/forums/showthread.php?s=93da11109ae12a773a128a637d69defe&t=3464
# mysub "${project}__tophat__${fastqBaseName}" " mysub "${project}__tophat__${fastqBaseName}" "
# tophat -p6 -G $gtfFile -g1 -o $outputdir $bowtie_gindex $fastqFile tophat -p6 -G $gtfFile -g1 -o $outputdir $bowtie_gindex $fastqFile
#
# mv $outputdir/accepted_hits.bam $outputdir/$(basename $outputdir).bam mv $outputdir/accepted_hits.bam $outputdir/$(basename $outputdir).bam
# samtools index $outputdir/$(basename $outputdir).bam samtools index $outputdir/$(basename $outputdir).bam
# " -n 5 -R span[hosts=1] -q long | joblist .tophatjobs " -n 5 -R span[hosts=1] -q long | joblist .tophatjobs
done done
wait4jobs .tophatjobs wait4jobs .tophatjobs
...@@ -108,9 +115,53 @@ wait4jobs .tophatjobs ...@@ -108,9 +115,53 @@ wait4jobs .tophatjobs
## create tophat mapping report ## create tophat mapping report
source <(curl https://dl.dropboxusercontent.com/u/113630701/datautils/bash/bioinfo_utils.sh 2>&1 2>/dev/null) source <(curl https://dl.dropboxusercontent.com/u/113630701/datautils/bash/bioinfo_utils.sh 2>&1 2>/dev/null)
TophatMappingReport TophatMappingReport
} }
export -f dge_tophat_se
# dge_tophat_se # dge_tophat_se
# dge_tophat_se -i # dge_tophat_se -i
\ No newline at end of file
dge_cuffdiff(){
local gtfFile=$1
local bamDir=$2
local labels=$3
if [ $# -ne 3 ]; then
echo "Usage: dge_fastqc <gtf_file> <bam directory> <labels>" >&2 ; return;
fi
if [ -z "$(which cuffdiff)" ]; then
>&2 echo "no cuffdiff binary in PATH"; return;
fi
if [ ! -f $gtfFile ]; then
>&2 echo "gtf '$gtfFile' does not exis"; return;
fi
## collect all bam-files and group them
allBams=$(find $bamDir | grep ".bam$" | grep -v "unmapped" | sort)
bamsSplit=""
for label in $(echo $labels | tr ", " " "); do
echo $label
labelBams=$(echo "$allBams" | grep $label | xargs echo -n | tr ' ' ',')
bamsSplit+=$labelBams" "
done
#echo $bamsSplit
## make sure (again that all files are there
echo $gtfFile $bamsSplit | tr "," " " | xargs ls -la
#mysub ${project}_cuffdiff "cuffdiff -L aRGm,aRGp,aRG,bRG,IPC,N -o . -p 8 mm10_ensGene_ccds.gtf $amBams $apBams $aBams $bBams $cBams $dBams 2>&1 | tee cuffdiff.log" -q long -n 8 -R span[hosts=1] | blockScript
cdCmd="cuffdiff -L $labels -o . -p 10 $gtfFile $bamsSplit"
#echo "cmd is: $cdCmd"
mysub ${project}__cuffdiff "$cdCmd" -q long -n 8 -R span[hosts=1] | blockScript
MakeCuffDB $gtfFile "NAN"
}
\ No newline at end of file
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment