https://github.com/jvivian/one_off_scripts
Tip revision: 3ad04be99cd01e6a047c1b530cc8a1de82bd862e authored by John Vivian on 02 February 2017, 01:31:18 UTC
Refactor SRA pipeline to use faster method than fastq-dump
Refactor SRA pipeline to use faster method than fastq-dump
Tip revision: 3ad04be
convert_files_to_uuid.py
#!/usr/bin/env python2.7
# John Vivian
# 9-18-15
"""
Rename the files in a directory to random UUID4 names.
Write a TSV mapping each original name to its UUID4.
"""
import sys
import uuid
import os
# Defaults used when the script is run from the command line.
project = 'WCDT'
extension = '.fastq.gz'


def convert_files_to_uuid(directory, project=project, extension=extension,
                          tsv_path='name_pair.tsv'):
    """Rename matching files in *directory* to UUID4 names and log the mapping.

    Only regular files whose name ends with *extension* are renamed; other
    files and sub-directories are left alone, so nothing is given a suffix
    that does not describe its contents.

    Args:
        directory: Directory whose files are renamed in place.
        project: Value written to the first column of every TSV row.
        extension: Suffix a file must have to be renamed; it is also
            appended to the new UUID4 file name.
        tsv_path: Path of the TSV to write (opened with 'w', so an existing
            file at that path is overwritten).

    Returns:
        A list of ``(original_name, uuid)`` tuples, one per renamed file, in
        the order the rows were written.

    Raises:
        OSError: If the directory cannot be listed or a rename fails.
        IOError: If the TSV cannot be opened for writing.
    """
    # Sorted so the TSV row order is reproducible; os.listdir order is
    # arbitrary.
    names = sorted(
        name for name in os.listdir(directory)
        if name.endswith(extension)
        and os.path.isfile(os.path.join(directory, name))
    )
    pairs = []
    with open(tsv_path, 'w') as f_out:
        for name in names:
            sample_uuid = str(uuid.uuid4())
            # The recorded name is everything before the first dot.
            original = name.split('.')[0]
            # Record the mapping before renaming so that a failed rename
            # never leaves a renamed file without a TSV entry.
            f_out.write('{}\t{}\t{}\n'.format(project, original, sample_uuid))
            os.rename(os.path.join(directory, name),
                      os.path.join(directory, sample_uuid + extension))
            pairs.append((original, sample_uuid))
    return pairs


def main(argv=None):
    """Command-line entry point; returns the process exit status."""
    argv = sys.argv if argv is None else argv
    if len(argv) < 2:
        sys.stderr.write('usage: {} <directory>\n'.format(argv[0] if argv else 'convert_files_to_uuid.py'))
        return 1
    convert_files_to_uuid(argv[1])
    return 0


if __name__ == '__main__':
    sys.exit(main())