# process_data.py (481 B)
# Committed by Marcin Wątroba.
# (Page-navigation text from the web file viewer was removed from this header.)
import json
from pathlib import Path
from pprint import pprint

def load_json(path):
    """Parse the JSON document stored at *path* and return the decoded object.

    The file is opened inside a ``with`` block so the handle is always
    closed, and decoded explicitly as UTF-8 instead of relying on the
    platform's default encoding.

    Raises:
        OSError: the path cannot be opened (missing, a directory, no access).
        ValueError: the content is not valid UTF-8 or not valid JSON
            (``UnicodeDecodeError`` and ``json.JSONDecodeError`` are both
            ``ValueError`` subclasses).
    """
    with open(path, 'r', encoding='utf-8') as handle:
        return json.load(handle)


if __name__ == '__main__':
    # sorted() accepts any iterable, so no intermediate list is needed.
    paths = sorted(Path('voicelab_cbiz_testset_20220322_techmo').iterdir())
    # Only the first entry is inspected, as in the original script.
    for path in paths[:1]:
        try:
            data = load_json(path)
        except (OSError, ValueError) as err:
            # Report the offending path together with the reason and carry on;
            # unlike a bare ``except`` this lets KeyboardInterrupt/SystemExit
            # propagate.
            print(f'{path}: {err!r}')
        else:
            pprint(data)
            # Disabled follow-up step kept from the original (presumably
            # flattens each transcription entry to its nested text and writes
            # the file back -- confirm the schema before enabling):
            # data['transcription'] = [seg['text']['text'] for seg in data['transcription']]
            # pprint(data)
            # with open(path, 'w', encoding='utf-8') as out:
            #     json.dump(data, out)