Removed the 'space' and 'paragraphNum' fields and added 'puncAfter' and 'puncBefore'; periods are now handled by putting them into the appropriate 'puncAfter' fields.
This commit is contained in:
@@ -10,13 +10,6 @@ class TranscriptConverter:
|
||||
self.path = path
|
||||
with open(path, 'r') as fin:
|
||||
self.words = converters[format_name](json.load(fin))
|
||||
# wordStart
|
||||
# wordEnd
|
||||
# word
|
||||
# confidence
|
||||
# index
|
||||
# space
|
||||
# alwaysCapitalized
|
||||
|
||||
def to_json(self):
|
||||
return json.dumps(self.words, indent=4)
|
||||
|
||||
Reference in New Issue
Block a user