Skip to content
Snippets Groups Projects
dvc.lock 159 KiB
Newer Older
Marcin Wątroba's avatar
Marcin Wątroba committed
schema: '2.0'
stages:
Marcin Wątroba's avatar
Marcin Wątroba committed
  import_dataset_to_relation_manager@0:
    cmd: PYTHONPATH=. python experiment/pl_luna/import_relation_manager.py
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pl_luna/import_relation_manager.py
      md5: 0b72ccf1aa1107d85def09140e76bdf9
      size: 8284
    - path: experiment_data/dataset/pl_luna
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/dataset_relation_manager_data/pl_luna
      md5: 7c6720b017c9fa82bb1c2264239b3b03.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 229007155
      nfiles: 1000
Marcin Wątroba's avatar
Marcin Wątroba committed
  import_dataset_to_relation_manager@1:
    cmd: PYTHONPATH=. python experiment/pl_minds14/import_relation_manager.py
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pl_minds14/import_relation_manager.py
      md5: d83011855f3f1b2ddec96713c3c41177
      size: 438
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/dataset_relation_manager_data/pl_minds14
      md5: b6838bb00cb83d69ae818d8de96a2f18.dir
      size: 3545062
      nfiles: 1124
  import_dataset_to_relation_manager@2:
    cmd: PYTHONPATH=. python experiment/pl_common_voice/import_relation_manager.py
    deps:
    - path: experiment/pl_common_voice/import_relation_manager.py
      md5: 2d0b47d14088c2c5b61a78ddeeff5293
      size: 547
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/dataset_relation_manager_data/pl_common_voice
      md5: fe73df318524dc33331c62b22a7f5237.dir
      size: 21756677
      nfiles: 16310
  process_gold_transcript@1:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_minds14
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/dataset_relation_manager_data/pl_minds14
      md5: b6838bb00cb83d69ae818d8de96a2f18.dir
      size: 3545062
      nfiles: 1124
    outs:
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: 35661dfd20421a6a6068b7194e483eba.dir
      size: 689374
      nfiles: 562
  process_gold_transcript@0:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_luna
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    - path: experiment_data/dataset_relation_manager_data/pl_luna
      md5: 7c6720b017c9fa82bb1c2264239b3b03.dir
      size: 229007155
      nfiles: 1000
    outs:
    - path: experiment_data/pipeline/pl_luna/gold_transcript
      md5: 7e71aa1b181ad75dd08dd7932bc0fc65.dir
      size: 6706925
      nfiles: 500
  process_asr@6:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_minds14
      --asr=wav2vec2
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_minds14
      md5: 8dbd7480f408f284f4b349c02c991afc.dir
      size: 3821899
      nfiles: 2248
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/dataset_relation_manager_data/pl_minds14
      md5: b6838bb00cb83d69ae818d8de96a2f18.dir
      size: 3545062
      nfiles: 1124
    outs:
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__result
      md5: 004f25308b0f5577af589bede338ae9f.dir
      size: 3523907
      nfiles: 562
  process_asr@2:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_luna
      --asr=wav2vec2
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_luna
      md5: 8dd7fbde8090469f4a0e41ea1c873cda.dir
      size: 22986007
      nfiles: 1951
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    - path: experiment_data/dataset_relation_manager_data/pl_luna
      md5: 7c6720b017c9fa82bb1c2264239b3b03.dir
      size: 229007155
      nfiles: 1000
    outs:
    - path: experiment_data/pipeline/pl_luna/wav2vec2__result
      md5: 80994fc18d2cc2a1fa56fd4436c5378b.dir
      size: 20658485
      nfiles: 456
  process_asr@5:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_minds14
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_minds14
      md5: 8dbd7480f408f284f4b349c02c991afc.dir
      size: 3821899
      nfiles: 2248
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/dataset_relation_manager_data/pl_minds14
      md5: b6838bb00cb83d69ae818d8de96a2f18.dir
      size: 3545062
      nfiles: 1124
    outs:
    - path: experiment_data/pipeline/pl_minds14/ajn__result
      md5: b09eb8176b26586b06093384bbaea770.dir
      size: 974727
      nfiles: 559
  process_asr@4:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_minds14
      --asr=google
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_minds14
      md5: 8dbd7480f408f284f4b349c02c991afc.dir
      size: 3821899
      nfiles: 2248
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/dataset_relation_manager_data/pl_minds14
      md5: b6838bb00cb83d69ae818d8de96a2f18.dir
      size: 3545062
      nfiles: 1124
    outs:
    - path: experiment_data/pipeline/pl_minds14/google__result
      md5: 3505364058d488815dd90699e71fd00b.dir
      size: 985004
      nfiles: 562
  process_asr@0:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_luna
      --asr=google
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_luna
      md5: 8dd7fbde8090469f4a0e41ea1c873cda.dir
      size: 22986007
      nfiles: 1951
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    - path: experiment_data/dataset_relation_manager_data/pl_luna
      md5: 7c6720b017c9fa82bb1c2264239b3b03.dir
      size: 229007155
      nfiles: 1000
    outs:
    - path: experiment_data/pipeline/pl_luna/google__result
      md5: 254e060731d669a14f3a5525ccd1fe28.dir
      size: 5346497
      nfiles: 500
  process_asr@1:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_luna
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_luna
      md5: 8dd7fbde8090469f4a0e41ea1c873cda.dir
      size: 22986007
      nfiles: 1951
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    - path: experiment_data/dataset_relation_manager_data/pl_luna
      md5: 7c6720b017c9fa82bb1c2264239b3b03.dir
      size: 229007155
      nfiles: 1000
    outs:
    - path: experiment_data/pipeline/pl_luna/ajn__result
      md5: bca7f2eae18f606867c9880bd0fe1c8d.dir
      size: 6159899
      nfiles: 494
  process_asr@3:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_luna
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_luna
      md5: 8dd7fbde8090469f4a0e41ea1c873cda.dir
      size: 22986007
      nfiles: 1951
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    - path: experiment_data/dataset_relation_manager_data/pl_luna
      md5: 7c6720b017c9fa82bb1c2264239b3b03.dir
      size: 229007155
      nfiles: 1000
    outs:
    - path: experiment_data/pipeline/pl_luna/techmo__result
      md5: 4c6609ab50706ad45f3919eaf902a75e.dir
      size: 9697519
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
  process_asr@7:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_minds14
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_minds14
      md5: 8dbd7480f408f284f4b349c02c991afc.dir
      size: 3821899
      nfiles: 2248
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/dataset_relation_manager_data/pl_minds14
      md5: b6838bb00cb83d69ae818d8de96a2f18.dir
      size: 3545062
      nfiles: 1124
    outs:
    - path: experiment_data/pipeline/pl_minds14/techmo__result
      md5: 13b6f9b23182b9255a802134c47ab4c4.dir
      size: 1336305
      nfiles: 562
  save_wave_files__pl_google_fleurs:
    cmd: PYTHONPATH=. python experiment/pl_google_fleurs/save_wav_files.py
    deps:
    - path: experiment/pl_google_fleurs/save_wav_files.py
      md5: 5fd1d6210a9766c35cf11892a9951266
      size: 610
    outs:
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
  import_dataset_to_relation_manager@3:
    cmd: PYTHONPATH=. python experiment/pl_voicelab_cbiz/import_relation_manager.py
    deps:
    - path: experiment/pl_voicelab_cbiz/import_relation_manager.py
      md5: 8b100b393470511b789ee4bc722f12ea
      size: 2026
    - path: experiment_data/dataset/pl_voicelab_cbiz
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
    outs:
    - path: experiment_data/dataset_relation_manager_data/pl_voicelab_cbiz
      md5: 7ef4be9a4eeef095baf7a4cd765610d0.dir
      size: 110711470
      nfiles: 1600
  import_dataset_to_relation_manager@4:
    cmd: PYTHONPATH=. python experiment/pl_google_fleurs/import_relation_manager.py
    deps:
    - path: experiment/pl_google_fleurs/import_relation_manager.py
      md5: f5547b678bb8fe0542eaaf047d1447aa
      size: 458
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    outs:
    - path: experiment_data/dataset_relation_manager_data/pl_google_fleurs
      md5: 5a5609426d0a70990792c8a8b1854a48.dir
      size: 4991297
      nfiles: 1516
  process_gold_transcript@2:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_common_voice
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/dataset_relation_manager_data/pl_common_voice
      md5: fe73df318524dc33331c62b22a7f5237.dir
      size: 21756677
      nfiles: 16310
    outs:
    - path: experiment_data/pipeline/pl_common_voice/gold_transcript
      md5: 4903cf286f3c1ae49876c4ba52713d3c.dir
      size: 4093545
      nfiles: 8155
  process_gold_transcript@3:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_voicelab_cbiz
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_voicelab_cbiz
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
    - path: experiment_data/dataset_relation_manager_data/pl_voicelab_cbiz
      md5: 7ef4be9a4eeef095baf7a4cd765610d0.dir
      size: 110711470
      nfiles: 1600
    outs:
    - path: experiment_data/pipeline/pl_voicelab_cbiz/gold_transcript
      md5: 3462fc9dea267f7db0e133ced6b5f4e9.dir
      size: 21846798
      nfiles: 800
  process_gold_transcript@4:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_google_fleurs
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    - path: experiment_data/dataset_relation_manager_data/pl_google_fleurs
      md5: 5a5609426d0a70990792c8a8b1854a48.dir
      size: 4991297
      nfiles: 1516
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/gold_transcript
      md5: 7ea17627b30e788f34c81ca9322f2879.dir
      size: 975209
      nfiles: 758
  process_asr@17:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_common_voice
      --asr=wav2vec2
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_common_voice
      md5: 43714b76048ec7311d08a7c48c282146.dir
      size: 20219523
      nfiles: 24453
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/dataset_relation_manager_data/pl_common_voice
      md5: fe73df318524dc33331c62b22a7f5237.dir
      size: 21756677
      nfiles: 16310
    outs:
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__result
      md5: 402f9a70d682d030b8f7b6a36044c651.dir
      size: 19014997
      nfiles: 8154
  process_asr@10:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_google_fleurs
      --asr=wav2vec2
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_google_fleurs
      md5: dfa15d901991d0cc9634192e21a9cc23.dir
      size: 5645552
      nfiles: 3032
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    - path: experiment_data/dataset_relation_manager_data/pl_google_fleurs
      md5: 5a5609426d0a70990792c8a8b1854a48.dir
      size: 4991297
      nfiles: 1516
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/wav2vec2__result
      md5: 88a7ae4e0399446f996c11d6ffef701a.dir
      size: 5137721
      nfiles: 758
  process_asr@8:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_google_fleurs
      --asr=google
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_google_fleurs
      md5: dfa15d901991d0cc9634192e21a9cc23.dir
      size: 5645552
      nfiles: 3032
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    - path: experiment_data/dataset_relation_manager_data/pl_google_fleurs
      md5: 5a5609426d0a70990792c8a8b1854a48.dir
      size: 4991297
      nfiles: 1516
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/google__result
      md5: 9cb6cac07efe8e5d0b33ae7c818c5766.dir
      size: 1377134
      nfiles: 758
  save_audio_files:
    cmd: PYTHONPATH=. python experiment/dataset_specific/pl_google_fleurs/pipeline_save_wav_files.py
    deps:
    - path: experiment/dataset_specific/pl_google_fleurs/pipeline_save_wav_files.py
      md5: 0a386b55f0ad26109f110a4622690066
      size: 735
    outs:
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
  pipeline_prepare_relation_manager@4:
    cmd: PYTHONPATH=. python experiment/dataset_specific/pl_voicelab_cbiz/import_relation_manager.py
    deps:
    - path: experiment/dataset_specific/pl_voicelab_cbiz/import_relation_manager.py
      md5: ca3760c3f051a00575bf015322575d1a
      size: 2075
    - path: experiment_data/dataset/pl_voicelab_cbiz
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
    outs:
    - path: experiment_data/dataset_relation_manager_data/pl_voicelab_cbiz
      md5: d23bd3824dc9e68a649edc94fbec50fb.dir
      size: 110711470
      nfiles: 1600
  pipeline_prepare_relation_manager@3:
    cmd: PYTHONPATH=. python experiment/dataset_specific/pl_minds14/import_relation_manager.py
    deps:
    - path: experiment/dataset_specific/pl_minds14/import_relation_manager.py
      md5: 2deae168760fa019e6d19d0111baca41
      size: 455
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/dataset_relation_manager_data/pl_minds14
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 40bb7d02cc76d5b1093955b5046cc3c4.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 3545062
      nfiles: 1124
  pipeline_prepare_relation_manager@0:
    cmd: PYTHONPATH=. python experiment/dataset_specific/pl_common_voice/import_relation_manager.py
    deps:
    - path: experiment/dataset_specific/pl_common_voice/import_relation_manager.py
      md5: 2d0b47d14088c2c5b61a78ddeeff5293
      size: 547
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/dataset_relation_manager_data/pl_common_voice
      md5: da29f883159b95496c488a3c9c35e632.dir
      size: 21756677
      nfiles: 16310
  pipeline_prepare_relation_manager@1:
    cmd: PYTHONPATH=. python experiment/dataset_specific/pl_google_fleurs/import_relation_manager.py
    deps:
    - path: experiment/dataset_specific/pl_google_fleurs/import_relation_manager.py
      md5: f5547b678bb8fe0542eaaf047d1447aa
      size: 458
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    outs:
    - path: experiment_data/dataset_relation_manager_data/pl_google_fleurs
      md5: ce176e60d7e55945e402d711b22b0c6a.dir
      size: 4991297
      nfiles: 1516
  pipeline_gold_transcript@0:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_common_voice
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/dataset_relation_manager_data/pl_common_voice
      md5: da29f883159b95496c488a3c9c35e632.dir
      size: 21756677
      nfiles: 16310
    outs:
    - path: experiment_data/pipeline/pl_common_voice/gold_transcript
      md5: e77ce22b14cb32594ae9cfcd4d6403b3.dir
      size: 4093545
      nfiles: 8155
  pipeline_prepare_relation_manager@2:
    cmd: PYTHONPATH=. python experiment/dataset_specific/pl_luna/import_relation_manager.py
    deps:
    - path: experiment/dataset_specific/pl_luna/import_relation_manager.py
      md5: 100bd47d6984532b076776702d93fb9f
      size: 8301
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    outs:
    - path: experiment_data/dataset_relation_manager_data/pl_luna
      md5: 95ca6826129400092cdc41365a4f6dcb.dir
      size: 229007155
      nfiles: 1000
  pipeline_gold_transcript@2:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_luna
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_luna
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/dataset_relation_manager_data/pl_luna
      md5: 95ca6826129400092cdc41365a4f6dcb.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 229007155
      nfiles: 1000
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/gold_transcript
      md5: 4c3e09acb7ffac0ef5b117a38515e3a9.dir
      size: 6706925
      nfiles: 500
  pipeline_gold_transcript@3:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_minds14
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/dataset_relation_manager_data/pl_minds14
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 40bb7d02cc76d5b1093955b5046cc3c4.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 3545062
      nfiles: 1124
    outs:
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: d4da8b3a8c5f044af1403d70d8f60fcf.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 689374
      nfiles: 562
  pipeline_gold_transcript@4:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_voicelab_cbiz
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_voicelab_cbiz
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
    - path: experiment_data/dataset_relation_manager_data/pl_voicelab_cbiz
      md5: d23bd3824dc9e68a649edc94fbec50fb.dir
      size: 110711470
      nfiles: 1600
    outs:
    - path: experiment_data/pipeline/pl_voicelab_cbiz/gold_transcript
      md5: ebffd3814a48564f4e33b9a4e0956af3.dir
      size: 21846798
      nfiles: 800
  pipeline_gold_transcript@1:
    cmd: PYTHONPATH=. python experiment/pipeline_process_gold_transcript.py --dataset=pl_google_fleurs
    deps:
    - path: experiment/pipeline_process_gold_transcript.py
      md5: baac4f80dcdfcc5a49806eea6eec832a
      size: 1195
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    - path: experiment_data/dataset_relation_manager_data/pl_google_fleurs
      md5: ce176e60d7e55945e402d711b22b0c6a.dir
      size: 4991297
      nfiles: 1516
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/gold_transcript
      md5: 607f551eca5dabcca0caf31c87bd2ac6.dir
      size: 975209
      nfiles: 758
  pipeline_asr_result@7:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_google_fleurs
      --asr=google
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_google_fleurs/pl_google_fleurs__google
      md5: c740521abae49feebfaf20c2384c8de5.dir
      size: 350126
      nfiles: 758
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/google__result
      md5: 6e0d7eb490eadd8dcc3c5452ba85932b.dir
      size: 1377134
      nfiles: 758
  pipeline_asr_result@3:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_common_voice
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_common_voice/pl_common_voice__ajn
      md5: 873867be79ac82f04d28bd3419fa95f3.dir
      size: 1677089
      nfiles: 8155
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/pipeline/pl_common_voice/ajn__result
      md5: 77d873041fe2952e3c45ee4ac6458061.dir
      size: 6667841
      nfiles: 8155
  pipeline_asr_result@17:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_minds14
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_minds14/pl_minds14__techmo
      md5: 5fd62d52b1a39db98d86ff0a11dcfd52.dir
      size: 612777
      nfiles: 562
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/pipeline/pl_minds14/techmo__result
      md5: 4c43636b4773f2bf9a2153ef3393a558.dir
      size: 1336305
      nfiles: 562
  pipeline_asr_result@13:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_luna
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_luna/pl_luna__techmo
      md5: 033ea7b5434dded73bf869bfdd299462.dir
      size: 4256479
      nfiles: 500
    - path: experiment_data/dataset/pl_luna
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/techmo__result
      md5: 0e596570e1502b38588427bc72dcc006.dir
      size: 9697519
      nfiles: 500
  pipeline_asr_result@15:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_minds14
      --asr=google
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_minds14/pl_minds14__google
      md5: bb1acae0c3070424d635ae9d2c6e14f0.dir
      size: 247940
      nfiles: 562
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/pipeline/pl_minds14/google__result
      md5: 3f7a79298a5156fd2b023e673326e72f.dir
      size: 985004
      nfiles: 562
  pipeline_asr_result@2:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_common_voice
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_common_voice/pl_common_voice__techmo
      md5: 47a9d744ff9f02d0a82a4a30664270b5.dir
      size: 3686716
      nfiles: 8155
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/pipeline/pl_common_voice/techmo__result
      md5: 9030cf3640f2749d9c1b4439687bdc2f.dir
      size: 7761880
      nfiles: 8136
  pipeline_asr_result@6:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_voicelab_cbiz
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_voicelab_cbiz/pl_voicelab_cbiz__techmo
      md5: 6c3b356723d562c978f84e733b91f5d0.dir
      size: 17539259
      nfiles: 800
    - path: experiment_data/dataset/pl_voicelab_cbiz
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
    outs:
    - path: experiment_data/pipeline/pl_voicelab_cbiz/techmo__result
      md5: e544489fc21b6a3e6d4fd68ab8c2c069.dir
      size: 39158267
      nfiles: 800
  pipeline_asr_result@11:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_luna
      --asr=google
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_luna/pl_luna__google
      md5: ac191369daf21c45c48da1bcd3e3a540.dir
      size: 1096697
      nfiles: 500
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    outs:
    - path: experiment_data/pipeline/pl_luna/google__result
      md5: 8e4bf67df4dccd218d4d7c3de69688a4.dir
      size: 5346497
      nfiles: 500
  pipeline_asr_result@1:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_common_voice
      --asr=wav2vec2
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_common_voice/pl_common_voice__wav2vec2
      md5: 8f84125abe861abbcd39499079aa1777.dir
      size: 14830897
      nfiles: 8155
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__result
      md5: b0d0042d77d7adce37890ca63ad40091.dir
      size: 19014997
      nfiles: 8154
  pipeline_asr_result@8:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_google_fleurs
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_google_fleurs/pl_google_fleurs__ajn
      md5: 2218d65c2c73761ce8825015cf79bacd.dir
      size: 343198
      nfiles: 758
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/ajn__result
      md5: 545e63a6daf9c46387c1d7d40b85499f.dir
      size: 1413262
      nfiles: 758
  pipeline_asr_result@5:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_voicelab_cbiz
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_voicelab_cbiz/pl_voicelab_cbiz__ajn
      md5: 0705aafa0969142288cc9baa88d1ed57.dir
      size: 6896694
      nfiles: 800
    - path: experiment_data/dataset/pl_voicelab_cbiz
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
    outs:
    - path: experiment_data/pipeline/pl_voicelab_cbiz/ajn__result
      md5: 7de1137f44fad26766da0fc309720160.dir
      size: 22765926
      nfiles: 800
  pipeline_asr_result@12:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_luna
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_luna/pl_luna__ajn
      md5: 10454ef4568c2023e9d51ad418db2854.dir
      size: 1276562
      nfiles: 495
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    outs:
    - path: experiment_data/pipeline/pl_luna/ajn__result
      md5: 653d65e186a7d05958ce3cbef219038c.dir
      size: 6159899
      nfiles: 494
  pipeline_asr_result@16:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_minds14
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_minds14/pl_minds14__ajn
      md5: 41b35b832b72e132575e1c8bc777682f.dir
      size: 205731
      nfiles: 562
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/pipeline/pl_minds14/ajn__result
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 4094dd4b22895a0a4ce82793cd6a8b0f.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 974727
      nfiles: 559
  pipeline_asr_result@10:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_google_fleurs
      --asr=wav2vec2
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_google_fleurs/pl_google_fleurs__wav2vec2
      md5: 9638746467b0dea972a0be101a7d5c58.dir
      size: 4093001
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 758
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/wav2vec2__result
      md5: bf9c77e34376bcda73dbdb6afee55c8c.dir
      size: 5137721
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 758
  pipeline_asr_result@4:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_voicelab_cbiz
      --asr=google
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_voicelab_cbiz/pl_voicelab_cbiz__google
      md5: 35a79b96887fbf705327937fdd57c0c6.dir
      size: 5651375
      nfiles: 799
    - path: experiment_data/dataset/pl_voicelab_cbiz
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
    outs:
    - path: experiment_data/pipeline/pl_voicelab_cbiz/google__result
      md5: cb6322c8c0c6d3cf557b93bf52efd0dc.dir
      size: 27432599
      nfiles: 799
  pipeline_asr_result@14:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_luna
      --asr=wav2vec2
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_luna/pl_luna__wav2vec2
      md5: 0555f6346ef6332d27fc0979e8ac16f7.dir
      size: 16356269
      nfiles: 456
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    outs:
    - path: experiment_data/pipeline/pl_luna/wav2vec2__result
      md5: 9c63b061ac7763144bca121e163ee7aa.dir
      size: 20658485
      nfiles: 456
  pipeline_asr_result@9:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_google_fleurs
      --asr=techmo
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_google_fleurs/pl_google_fleurs__techmo
      md5: 876e8cff4ebd191617fcd3844e411475.dir
      size: 859227
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 758
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/techmo__result
      md5: 33c60c2b8bd57c3aedd7161256ad8cfa.dir
      size: 1880403
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 758
  pipeline_asr_result@0:
    cmd: PYTHONPATH=. python experiment/pipeline_process_asr.py --dataset=pl_common_voice
      --asr=google
    deps:
    - path: experiment/pipeline_process_asr.py
      md5: efe378505897550fe1a8d423c321ef53
      size: 1403
    - path: experiment_data/cached_asr/pl_common_voice/pl_common_voice__google
      md5: e640b898f723eed2af42b93596eabecd.dir
      size: 1701910
      nfiles: 8143
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    outs:
    - path: experiment_data/pipeline/pl_common_voice/google__result
      md5: afb53476cc93ef4de3591908df41fd2a.dir
      size: 5854366
      nfiles: 8143
  pipeline_word_wer@8:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_google_fleurs
      --asr=ajn
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/ajn__result