Removed 'space' and 'paragraphNum' fields; added 'puncAfter' and 'puncBefore'; periods are now handled by putting them into the appropriate 'puncAfter' fields

This commit is contained in:
2018-11-08 23:59:06 -05:00
parent 59cdc0777d
commit e31d9e6883
5 changed files with 2678 additions and 12 deletions

View File

@@ -10,13 +10,6 @@ class TranscriptConverter:
self.path = path
with open(path, 'r') as fin:
self.words = converters[format_name](json.load(fin))
# wordStart
# wordEnd
# word
# confidence
# index
# space
# alwaysCapitalized
def to_json(self):
    """Return ``self.words`` serialized as a JSON string with 4-space indentation."""
    serialized = json.dumps(self.words, indent=4)
    return serialized