https://github.com/sfu-compbio/mrsfast
Revision 6aa8bb74d3d327b01c0f52cee7a271efbaf5abe1 authored by Iman Sarrafi on 16 May 2013, 22:07:04 UTC, committed by Iman Sarrafi on 16 May 2013, 22:07:04 UTC
1 parent 39958d0
Tip revision: 6aa8bb74d3d327b01c0f52cee7a271efbaf5abe1 authored by Iman Sarrafi on 16 May 2013, 22:07:04 UTC
Bug Fix: Quality not reversed in single best mode
Bug Fix: Quality not reversed in single best mode
Tip revision: 6aa8bb7
Common.c
/*
* Copyright (c) <2008 - 2020>, University of Washington, Simon Fraser University
* All rights reserved.
*
* Redistribution and use in source and binary forms, with or without modification,
* are permitted provided that the following conditions are met:
*
* Redistributions of source code must retain the above copyright notice, this list
* of conditions and the following disclaimer.
* - Redistributions in binary form must reproduce the above copyright notice, this
* list of conditions and the following disclaimer in the documentation and/or other
* materials provided with the distribution.
* - Neither the name of the <ORGANIZATION> nor the names of its contributors may be
* used to endorse or promote products derived from this software without specific
* prior written permission.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
* NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
* SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
/*
* Author:
* Faraz Hach (fhach AT cs DOT sfu DOT ca)
* Iman Sarrafi (isarrafi AT cs DOT sfu DOT ca)
*/
#include <stdio.h>
#include <stdlib.h>
#include <sys/time.h>
#include <zlib.h>
#include <string.h>
#include <math.h>
#include "Common.h"
unsigned short SEQ_LENGTH = 0;
unsigned short QUAL_LENGTH = 0;
unsigned short CMP_SEQ_LENGTH = 0;
long long memUsage = 0;
char *alphabet = "ACGTN";
/**********************************************/
FILE *fileOpen(char *fileName, char *mode)
{
FILE *fp;
fp = fopen (fileName, mode);
if (fp == NULL)
{
fprintf(stdout, "Error: Cannot Open the file %s\n", fileName);
fflush(stdout);
exit(0);
}
return fp;
}
/**********************************************/
gzFile fileOpenGZ(char *fileName, char *mode)
{
gzFile gzfp;
gzfp = gzopen (fileName, mode);
if (gzfp == Z_NULL)
{
fprintf(stdout, "Error: Cannot Open the file %s\n", fileName);
fflush(stdout);
exit(0);
}
return gzfp;
}
/**********************************************/
double getTime(void)
{
struct timeval t;
gettimeofday(&t, NULL);
return t.tv_sec+t.tv_usec/1000000.0;
}
/**********************************************/
inline char reverseCompleteChar(char c)
{
char ret;
switch (c)
{
case 'A':
ret = 'T';
break;
case 'T':
ret = 'A';
break;
case 'C':
ret = 'G';
break;
case 'G':
ret = 'C';
break;
default:
ret = 'N';
break;
}
return ret;
}
/**********************************************/
inline void reverseComplete (char *seq, char *rcSeq , int length) // TODO: efficiency check
{
char rc[100];
memset(rc, 'N', 100);
rc['A']='T';
rc['T']='A';
rc['C']='G';
rc['G']='C';
rc['N']='N';
int i;
seq+=length-1;
for (i=0; i<length; i++)
{
rcSeq[i]=rc[*(seq--)];
//rcSeq[i]=reverseCompleteChar (seq[length-1-i]) ;
}
}
pthread_mutex_t _common_lock;
/**********************************************/
void * getMem(size_t size) // TODO: if malloc is unsuccessfull, return an error message
{
pthread_mutex_lock(&_common_lock);
memUsage+=size;
pthread_mutex_unlock(&_common_lock);
return malloc(size);
}
/**********************************************/
void freeMem(void *ptr, size_t size)
{
pthread_mutex_lock(&_common_lock);
memUsage-=size;
pthread_mutex_unlock(&_common_lock);
free(ptr);
}
/**********************************************/
double getMemUsage()
{
return memUsage/1048576.0;
}
/**********************************************/
inline void reverse (char *seq, char *rcSeq , int length)
{
int i;
seq += length-1;
for (i=0; i<length; i++)
{
//rcSeq[i]=seq[length-1-i];
rcSeq[i]=*(seq--);
}
}
/**********************************************/
void stripPath(char *full, char **path, char **fileName)
{
int i;
int pos = -1;
for (i=strlen(full)-1; i>=0; i--)
{
if (full[i]=='/')
{
pos = i;
break;
}
}
if (pos != -1)
{
sprintf(*fileName, "%s%c", (full+pos+1), '\0');
full[pos+1]='\0';
sprintf(*path,"%s%c", full, '\0');
}
else
{
sprintf(*fileName, "%s%c", full, '\0');
sprintf(*path,"%c", '\0');
}
}
/**********************************************/
inline int calculateCompressedLen(int normalLen)
{
return (normalLen / 21) + ((normalLen%21)?1:0);
}
/**********************************************/
void compressSequence(char *seq, int seqLen, CompressedSeq *cseq)
{
CompressedSeq val = 0;
int i = 0, pos = 0;
*cseq = 0;
while (pos < seqLen)
{
*cseq <<= 3;
switch (seq[pos++])
{
case 'A':
break;
case 'C':
*cseq |= 1;
break;
case 'G':
*cseq |= 2;
break;
case 'T':
*cseq |= 3;
break;
case 'N':
*cseq |= 4;
break;
default:
*cseq |= 4;
break;
}
if (++i == 21)
{
i = 0;
cseq++;
if (pos < seqLen) // not to write the adjacent memory in case seqLen % 21 == 0
*cseq = 0;
}
}
if (i > 0)
{
*cseq <<= (3*(21-i));
}
}
/**********************************************/
int hashVal(char *seq)
{
int i=0;
int val=0, numericVal=0;
while(i<WINDOW_SIZE)
{
switch (seq[i])
{
case 'A':
numericVal = 0; break;
case 'C':
numericVal = 1; break;
case 'G' :
numericVal = 2; break;
case 'T':
numericVal = 3; break;
default:
return -1;
break;
}
val = (val << 2)|numericVal;
i++;
}
return val;
}
/**********************************************/
int checkSumVal(char *seq)
{
int i=0;
int val=0, numericVal=0;
while(i<checkSumLength)
{
switch (seq[i])
{
case 'A':
numericVal = 0; break;
case 'C':
numericVal = 1; break;
case 'G' :
numericVal = 2; break;
case 'T':
numericVal = 3; break;
default:
return -1;
break;
}
val = (val << 2)|numericVal;
i++;
}
return val;
}
Computing file changes ...