Character checking: be more verbose if something fails

This way one can easily debug which file causes problems.
This commit is contained in:
Jan Engelmohr 2018-12-03 12:08:19 +01:00
parent de279168ec
commit 18ef670b05
1 changed file with 8 additions and 4 deletions

View File

@@ -29,14 +29,18 @@ else:
print("### Reading in the following transcript files: ###")
print(inFiles)
allText = set()
for inFile in (inFiles):
with open(inFile, 'r') as csvFile:
reader = csv.reader(csvFile)
for row in reader:
allText |= set(str(row[2]))
csvFile.close()
try:
for row in reader:
allText |= set(str(row[2]))
except IndexError as ie:
print("Your input file",inFile,"is not formatted properly. Check if there are 3 columns with the 3rd containing the transcript")
sys.exit(-1)
finally:
csvFile.close()
print("### The following unique characters were found in your transcripts: ###")
print(list(allText))