https://github.com/adbar/laclos
Tip revision: e31767041fbb127ccaec5e4a14366c918dd6cc7b authored by Adrien Barbaresi on 20 December 2014, 14:34:19 UTC
general update
general update
Tip revision: e317670
badlistgen.py
#!/usr/bin/python3
### This script is part of LACLOS (https://github.com/adbar/laclos).
### Copyright (C) Adrien Barbaresi, 2013.
### This is free software, licensed under the GNU Lesser General Public License (https://www.gnu.org/licenses/lgpl.html)
# purpose: filter subtitles based on language check results
# Python3 compatible
import argparse
def collect_bad_ids(lines):
    """Return the sorted list of IDs whose statistics fail the thresholds.

    Each element of *lines* is one tab-separated row of the summary file
    (header already removed). The first column is parsed as an integer ID,
    the second and third columns as floats. A row is flagged when its second
    column is greater than 50 or its third column is less than 20.

    Blank lines are ignored so that a trailing newline at the end of the
    summary file does not abort the run.

    Raises:
        ValueError: if a column cannot be converted to a number.
        IndexError: if a non-blank row has fewer than three columns.
    """
    bad_ids = []
    for line in lines:
        if not line.strip():
            continue
        columns = line.split('\t')
        # NOTE: a further check on the fourth column (language code 'de')
        # was disabled in the original script and is still not applied.
        if float(columns[1]) > 50 or float(columns[2]) < 20:
            bad_ids.append(int(columns[0]))
    # sorted() returns a new list; list.sort() returns None and therefore
    # cannot be iterated over directly.
    return sorted(bad_ids)


def main():
    """Parse the command line, filter the summary file, write the bad IDs.

    The output file receives one ID per line, in ascending order.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('-s', '--summary', dest='summary', help='summary of language statistics', required=True)
    # The output path is passed straight to open(), so it has to be present.
    parser.add_argument('-o', '--output', dest='output', help='name of output file', required=True)
    args = parser.parse_args()

    with open(args.summary, 'r') as summaryfh:
        # skip first line (header); the default avoids StopIteration on an empty file
        next(summaryfh, None)
        badones = collect_bad_ids(summaryfh)

    with open(args.output, 'w') as badonesfh:
        for item in badones:
            badonesfh.write(str(item) + '\n')


if __name__ == '__main__':
    main()