swh:1:snp:0fa5e44aa9eaf68dc00949be32686577b750591b
Tip revision: 8575912e5aa73fde6ab54bba4fbaeadc7d8267f4 authored by Amin Haghani on 20 November 2024, 18:45:15 UTC
Delete MammalianNetworkAnalysis, Amin Haghani/Supplementary Data directory
Delete MammalianNetworkAnalysis, Amin Haghani/Supplementary Data directory
Tip revision: 8575912
getCoverage.py
# Finds how many CG sites are targeted in each species for a selected set of Infinium 2 probes
import sys
import gzip
from collections import defaultdict
def main():
    """Count, per species, how many of the selected probes list that species.

    Command-line arguments (read from ``sys.argv``):
        1. probes file -- tab-separated text; column index 24 of each row
           holds a comma-separated list of species names.
        2. output file -- receives one ``<species> <count>`` line per
           species, sorted by species name, with ``hg19`` left out.

    Prints a usage message and exits with status 1 when the number of
    arguments is wrong.  Blank lines in the probes file are ignored; a
    non-blank row with fewer than 25 columns still raises ``IndexError``.
    """
    if len(sys.argv) != 3:
        print("Usage: python getCoverage.py <probes file> <output file>")
        # sys.exit rather than the site-provided exit(), which is not
        # guaranteed to exist (e.g. under ``python -S``).
        sys.exit(1)

    speciesCount = defaultdict(int)

    # Both files are opened up front (input first, then output) and are
    # closed by the context manager even if parsing raises.
    with open(sys.argv[1], 'r') as probesFile, open(sys.argv[2], 'w') as oFile:
        for line in probesFile:
            stripped = line.strip()
            if not stripped:
                # A blank (e.g. trailing) line has no column 24; skip it
                # instead of failing with IndexError.
                continue
            splitLine = stripped.split("\t")
            speciesList = splitLine[24].split(",")
            for curSpecies in speciesList:
                # NOTE(review): echoing rows whose species is "A" looks like
                # a leftover debugging aid -- confirm before removing.
                if curSpecies == "A":
                    print(line)
                speciesCount[curSpecies] += 1

        for speciesName in sorted(speciesCount):
            if speciesName != "hg19":
                oFile.write(
                    speciesName + " " + str(speciesCount[speciesName]) + "\n"
                )
# Run the script only when executed directly, so that importing this module
# (e.g. from a test or another tool) does not parse sys.argv or touch files.
if __name__ == "__main__":
    main()