Skip to content
Snippets Groups Projects
dvc.lock 96.1 KiB
Newer Older
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 607f551eca5dabcca0caf31c87bd2ac6.dir
      size: 975209
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/techmo__result
      md5: 33c60c2b8bd57c3aedd7161256ad8cfa.dir
      size: 1880403
      nfiles: 758
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/techmo__word_wer_classic_alignment
      md5: 689776c77c4ecaa11578b53480100ecc.dir
      size: 3821036
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/techmo__word_wer_classic_metrics
      md5: 8d0d99fd7d965d4070c0b391cd6fa2b0.dir
      size: 23030
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/techmo__word_wer_embeddings_alignment
      md5: 0ec5fe337bde2254c91146fd16b9c6af.dir
      size: 7995553
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/techmo__word_wer_embeddings_metrics
      md5: 55eb6eb0aacc12e3e2caf224b4b89df1.dir
      size: 53591
      nfiles: 758
  pipeline_word_wer@6:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_google_fleurs
      --asr=google
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/gold_transcript
      md5: 607f551eca5dabcca0caf31c87bd2ac6.dir
      size: 975209
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/google__result
      md5: 6e0d7eb490eadd8dcc3c5452ba85932b.dir
      size: 1377134
      nfiles: 758
Marcin Wątroba's avatar
Marcin Wątroba committed
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_google_fleurs/google__word_wer_classic_alignment
      md5: 9beb57e9be598275ac9d449618da440e.dir
      size: 3818553
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/google__word_wer_classic_metrics
      md5: 984770b57ca48fd793099c9ed67791d0.dir
      size: 23344
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/google__word_wer_embeddings_alignment
      md5: aeb20f1662b696a6fc11bcd39a02a0de.dir
      size: 7984964
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/google__word_wer_embeddings_metrics
      md5: b2626f92231431e163813ef7112c119d.dir
      size: 53916
      nfiles: 758
  pipeline_word_wer@17:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_minds14
      --asr=wav2vec2
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__result
      md5: 5658da01ecdce39ed99156bbc7f2dc62.dir
      size: 3523907
      nfiles: 562
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__word_wer_classic_alignment
      md5: c1d947bbd7bb1dff8d39e03ad4a1d11e.dir
      size: 2811807
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__word_wer_classic_metrics
      md5: a3477ae81fcba4a8e21b044f279425bb.dir
      size: 17073
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__word_wer_embeddings_alignment
      md5: cbdcbfe7157f28d70ca55b787483e26b.dir
      size: 5870633
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__word_wer_embeddings_metrics
      md5: c3395e582b4562a33e97419134363d30.dir
      size: 37892
      nfiles: 562
  pipeline_word_wer@15:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_minds14
      --asr=ajn
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/ajn__result
      md5: 6fd1b042a7cb6d6f200c2eb9a926b7f1.dir
      size: 974727
      nfiles: 559
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    outs:
    - path: experiment_data/pipeline/pl_minds14/ajn__word_wer_classic_alignment
      md5: c03a478840305afb1eadf4752b3a5678.dir
      size: 2851613
      nfiles: 559
    - path: experiment_data/pipeline/pl_minds14/ajn__word_wer_classic_metrics
      md5: 6d6d430e7f3672c67b9c78eb7d0ea296.dir
      size: 15213
      nfiles: 559
    - path: experiment_data/pipeline/pl_minds14/ajn__word_wer_embeddings_alignment
      md5: ae577cd5886aced83d7de4ba47bb4457.dir
      size: 5960904
      nfiles: 559
    - path: experiment_data/pipeline/pl_minds14/ajn__word_wer_embeddings_metrics
      md5: c599599e5935075cd26ac89e0d3b5f1b.dir
      size: 22438
      nfiles: 559
  pipeline_word_wer@12:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_luna
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/gold_transcript
      md5: 4c3e09acb7ffac0ef5b117a38515e3a9.dir
      size: 6706925
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/techmo__result
      md5: 0e596570e1502b38588427bc72dcc006.dir
      size: 9697519
      nfiles: 500
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/techmo__word_wer_classic_alignment
      md5: 5e90722635a811db67a1f0d917707b0a.dir
      size: 21380796
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/techmo__word_wer_classic_metrics
      md5: 4cfbb2830b280084ece14b1ef815b92a.dir
      size: 17298
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/techmo__word_wer_embeddings_alignment
      md5: 74f8be84e1e913050483713fbc945d80.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 44326962
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/techmo__word_wer_embeddings_metrics
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 98a7edeee3b630e8e301acfc578a8393.dir
      size: 34869
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
  pipeline_word_wer@10:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_luna
      --asr=google
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/gold_transcript
      md5: 4c3e09acb7ffac0ef5b117a38515e3a9.dir
      size: 6706925
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/google__result
      md5: 8e4bf67df4dccd218d4d7c3de69688a4.dir
      size: 5346497
      nfiles: 500
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/google__word_wer_classic_alignment
      md5: 5bdee43e646a4e9470310073365ebc37.dir
      size: 19650202
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/google__word_wer_classic_metrics
      md5: 9951fb70382cc8bed9aa48d1185c1c7c.dir
      size: 16989
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/google__word_wer_embeddings_alignment
      md5: a06bd5f0b4c52c679315b6c6d7478084.dir
      size: 40586004
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/google__word_wer_embeddings_metrics
      md5: 351543fb54e2098ac07999482d2280a8.dir
      size: 34530
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
  pipeline_word_wer@13:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_luna
      --asr=wav2vec2
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    - path: experiment_data/pipeline/pl_luna/gold_transcript
      md5: 4c3e09acb7ffac0ef5b117a38515e3a9.dir
      size: 6706925
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/wav2vec2__result
      md5: 9c63b061ac7763144bca121e163ee7aa.dir
      size: 20658485
      nfiles: 456
    outs:
    - path: experiment_data/pipeline/pl_luna/wav2vec2__word_wer_classic_alignment
      md5: 4d4ae25d4fac2a52893e60389fcd2f9e.dir
      size: 18462856
      nfiles: 456
    - path: experiment_data/pipeline/pl_luna/wav2vec2__word_wer_classic_metrics
      md5: f209479afd2482800f1e75bdab9f83b2.dir
      size: 15604
      nfiles: 456
    - path: experiment_data/pipeline/pl_luna/wav2vec2__word_wer_embeddings_alignment
      md5: 41ad4c0923986a90fc9ed12aa6e30f73.dir
      size: 38402586
      nfiles: 456
    - path: experiment_data/pipeline/pl_luna/wav2vec2__word_wer_embeddings_metrics
      md5: df02c1f9d7e26ed10815175de086e0b6.dir
      size: 24633
      nfiles: 456
  pipeline_word_wer@3:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_voicelab_cbiz
      --asr=google
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_voicelab_cbiz
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/gold_transcript
      md5: ebffd3814a48564f4e33b9a4e0956af3.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 21846798
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/google__result
      md5: cb6322c8c0c6d3cf557b93bf52efd0dc.dir
      size: 27432599
      nfiles: 799
    outs:
    - path: experiment_data/pipeline/pl_voicelab_cbiz/google__word_wer_classic_alignment
      md5: 184cdfdd465db609f514891b0330ef67.dir
      size: 83997172
      nfiles: 799
    - path: experiment_data/pipeline/pl_voicelab_cbiz/google__word_wer_classic_metrics
      md5: c12eab8acb3cee0219fc8046691b24ab.dir
      size: 27841
      nfiles: 799
    - path: experiment_data/pipeline/pl_voicelab_cbiz/google__word_wer_embeddings_alignment
      md5: 1e7ef6690d2e36f368eb02a8dcba9ab0.dir
      size: 174732507
      nfiles: 799
    - path: experiment_data/pipeline/pl_voicelab_cbiz/google__word_wer_embeddings_metrics
      md5: c15414f2ec9c0a1ab78199861b0b4ce0.dir
      size: 55765
      nfiles: 799
  pipeline_word_wer@16:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_minds14
      --asr=techmo
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/techmo__result
      md5: 4c43636b4773f2bf9a2153ef3393a558.dir
      size: 1336305
      nfiles: 562
    outs:
    - path: experiment_data/pipeline/pl_minds14/techmo__word_wer_classic_alignment
      md5: bb8b304a25b60f779c27ca4d6c9183ba.dir
      size: 2723010
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/techmo__word_wer_classic_metrics
      md5: b6a4f05d71bd3fbed796d54b1ac2b29d.dir
      size: 17198
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/techmo__word_wer_embeddings_alignment
      md5: 9956c918227d6b76f26ac6540a34e931.dir
      size: 5673712
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/techmo__word_wer_embeddings_metrics
      md5: de8e393488ff05187c7866272675fd8e.dir
      size: 39775
      nfiles: 562
  pipeline_word_wer@11:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_luna
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_luna
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
    - path: experiment_data/pipeline/pl_luna/ajn__result
      md5: 653d65e186a7d05958ce3cbef219038c.dir
      size: 6159899
      nfiles: 494
    - path: experiment_data/pipeline/pl_luna/gold_transcript
      md5: 4c3e09acb7ffac0ef5b117a38515e3a9.dir
      size: 6706925
      nfiles: 500
    outs:
    - path: experiment_data/pipeline/pl_luna/ajn__word_wer_classic_alignment
      md5: e25ae51f8dc1afe55d5c0b44a67ab8ee.dir
      size: 20671277
      nfiles: 494
    - path: experiment_data/pipeline/pl_luna/ajn__word_wer_classic_metrics
      md5: 18605657ff9c7ef3221e27b671a3b4d1.dir
      size: 16835
      nfiles: 494
    - path: experiment_data/pipeline/pl_luna/ajn__word_wer_embeddings_alignment
      md5: 6be0a1c035f4a84a9035bfba1458cdac.dir
      size: 43099546
      nfiles: 494
    - path: experiment_data/pipeline/pl_luna/ajn__word_wer_embeddings_metrics
      md5: 4f368d2ba1c5a54d5e3ab69a7581549e.dir
      size: 19326
      nfiles: 494
  pipeline_word_wer@7:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_google_fleurs
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/ajn__result
      md5: 545e63a6daf9c46387c1d7d40b85499f.dir
      size: 1413262
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/gold_transcript
      md5: 607f551eca5dabcca0caf31c87bd2ac6.dir
      size: 975209
      nfiles: 758
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/ajn__word_wer_classic_alignment
      md5: 6437952d0ab383e44acca5fa70d02e54.dir
      size: 3981739
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/ajn__word_wer_classic_metrics
      md5: a40ae0901f53a33231a4c3dc18708d2c.dir
      size: 22935
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/ajn__word_wer_embeddings_alignment
      md5: 06e64fca6fc73e1cc9e7e86b21eb11f3.dir
      size: 8318047
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/ajn__word_wer_embeddings_metrics
      md5: 68da1ded61389ae5d866bc762c61363c.dir
      size: 33029
      nfiles: 758
  pipeline_word_wer@2:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_common_voice
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_common_voice/gold_transcript
      md5: e77ce22b14cb32594ae9cfcd4d6403b3.dir
      size: 4093545
      nfiles: 8155
    - path: experiment_data/pipeline/pl_common_voice/techmo__result
      md5: 9030cf3640f2749d9c1b4439687bdc2f.dir
      size: 7761880
      nfiles: 8136
    outs:
    - path: experiment_data/pipeline/pl_common_voice/techmo__word_wer_classic_alignment
      md5: 478503dcf96c6162f15466d5455b6271.dir
      size: 15696317
      nfiles: 8136
    - path: experiment_data/pipeline/pl_common_voice/techmo__word_wer_classic_metrics
      md5: 7b60102e7896228777eb92fdc2aaebc2.dir
      size: 223467
      nfiles: 8136
    - path: experiment_data/pipeline/pl_common_voice/techmo__word_wer_embeddings_alignment
      md5: 09126e1594234e97cd10858cbc06f4be.dir
      size: 33111258
      nfiles: 8136
    - path: experiment_data/pipeline/pl_common_voice/techmo__word_wer_embeddings_metrics
      md5: 4fdb7cea64f99b62b20a725929093d4d.dir
      size: 571563
      nfiles: 8136
  pipeline_word_wer@14:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_minds14
      --asr=google
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/google__result
      md5: 3f7a79298a5156fd2b023e673326e72f.dir
      size: 985004
      nfiles: 562
    outs:
    - path: experiment_data/pipeline/pl_minds14/google__word_wer_classic_alignment
      md5: 8469a41c345e0c21accb960782a49e75.dir
      size: 2725626
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/google__word_wer_classic_metrics
      md5: 41621d3845a0035ee77352902c46a186.dir
      size: 15012
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/google__word_wer_embeddings_alignment
      md5: a0e3d4ddda612480de739c898e79bf73.dir
      size: 5686170
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/google__word_wer_embeddings_metrics
      md5: 673f6b46c7735163726f7d9e3b1f2dd4.dir
      size: 40260
      nfiles: 562
  pipeline_word_wer@0:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_common_voice
      --asr=google
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_common_voice/gold_transcript
      md5: e77ce22b14cb32594ae9cfcd4d6403b3.dir
      size: 4093545
      nfiles: 8155
    - path: experiment_data/pipeline/pl_common_voice/google__result
      md5: afb53476cc93ef4de3591908df41fd2a.dir
      size: 5854366
      nfiles: 8143
    outs:
    - path: experiment_data/pipeline/pl_common_voice/google__word_wer_classic_alignment
      md5: 0562ca30a9415b6a568430f34650f063.dir
      size: 15821424
      nfiles: 8143
    - path: experiment_data/pipeline/pl_common_voice/google__word_wer_classic_metrics
      md5: deafb9c70dd9bb48c57dd0802bd8c923.dir
      size: 225225
      nfiles: 8143
    - path: experiment_data/pipeline/pl_common_voice/google__word_wer_embeddings_alignment
      md5: 4b1952cbde7ce121c616f686459ef924.dir
      size: 33384670
      nfiles: 8143
    - path: experiment_data/pipeline/pl_common_voice/google__word_wer_embeddings_metrics
      md5: e2dcce4d029ffe904d363790da375fac.dir
      size: 572632
      nfiles: 8143
  pipeline_word_wer@5:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_voicelab_cbiz
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_voicelab_cbiz
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/gold_transcript
      md5: ebffd3814a48564f4e33b9a4e0956af3.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 21846798
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/techmo__result
      md5: e544489fc21b6a3e6d4fd68ab8c2c069.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 39158267
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
    outs:
    - path: experiment_data/pipeline/pl_voicelab_cbiz/techmo__word_wer_classic_alignment
      md5: 37f0c27869efd72bf3eaedae70e426d5.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 83756423
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/techmo__word_wer_classic_metrics
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 2fe3288abe85e4a385e2aefa0e8cad7e.dir
      size: 27780
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/techmo__word_wer_embeddings_alignment
      md5: 01badff31f4d2f6583481c332fae8abc.dir
      size: 174322727
      nfiles: 800
    - path: experiment_data/pipeline/pl_voicelab_cbiz/techmo__word_wer_embeddings_metrics
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 1fc2985ad4c3cb00d05b1865ad5b22d4.dir
      size: 56182
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
  pipeline_word_wer@1:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_common_voice
      --asr=wav2vec2
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_common_voice/gold_transcript
      md5: e77ce22b14cb32594ae9cfcd4d6403b3.dir
      size: 4093545
      nfiles: 8155
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__result
      md5: b0d0042d77d7adce37890ca63ad40091.dir
      size: 19014997
      nfiles: 8154
    outs:
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__word_wer_classic_alignment
      md5: 59beaa6beb3dc834c555376a5aeca7b4.dir
      size: 15851643
      nfiles: 8154
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__word_wer_classic_metrics
      md5: ccb35fbf94c551765dca2f72babcb7cb.dir
      size: 225545
      nfiles: 8154
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__word_wer_embeddings_alignment
      md5: a49f354af5d3f345fe2f85557f47931b.dir
      size: 33444109
      nfiles: 8154
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__word_wer_embeddings_metrics
      md5: c829268cd43ce5af3f57be7db6d058ce.dir
      size: 573538
      nfiles: 8154
  pipeline_word_wer@9:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_google_fleurs
      --asr=wav2vec2
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/gold_transcript
      md5: 607f551eca5dabcca0caf31c87bd2ac6.dir
      size: 975209
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/wav2vec2__result
      md5: bf9c77e34376bcda73dbdb6afee55c8c.dir
      size: 5137721
      nfiles: 758
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/wav2vec2__word_wer_classic_alignment
      md5: 052fa8f97b2f9d5b8ca4175b4e92dfd1.dir
      size: 3854678
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/wav2vec2__word_wer_classic_metrics
      md5: d9dec56ef7ddb6a3bc03638e37d1c04c.dir
      size: 23168
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/wav2vec2__word_wer_embeddings_alignment
      md5: 069191de9f84f37303bc202968f26766.dir
      size: 8069804
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/wav2vec2__word_wer_embeddings_metrics
      md5: b45390641698e71fdf420fbb2afec7e0.dir
      size: 53351
      nfiles: 758
  pipeline_word_wer@4:
    cmd: PYTHONPATH=. python experiment/pipeline_process_word_wer.py --dataset=pl_voicelab_cbiz
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_word_wer.py
      md5: 98c7d6b43efbe0c2e84b5ad44d01fec9
      size: 2125
    - path: experiment_data/dataset/pl_voicelab_cbiz
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 3c2b18e1f1f89e4c5ad7b254e472b25e.dir
      size: 4803739404
      nfiles: 1600
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/ajn__result
      md5: 7de1137f44fad26766da0fc309720160.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 22765926
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/gold_transcript
      md5: ebffd3814a48564f4e33b9a4e0956af3.dir
      size: 21846798
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
    outs:
    - path: experiment_data/pipeline/pl_voicelab_cbiz/ajn__word_wer_classic_alignment
      md5: 1ed03de918f5373afdbdbb020c6161b5.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 78992762
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/ajn__word_wer_classic_metrics
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: 04f6ccbaf94cf08c34ac201ae079c21c.dir
      size: 25307
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 800
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_voicelab_cbiz/ajn__word_wer_embeddings_alignment
      md5: a67e7a6e8a6e0755ea35a519d9decf86.dir
      size: 128258410
      nfiles: 646
    - path: experiment_data/pipeline/pl_voicelab_cbiz/ajn__word_wer_embeddings_metrics
      md5: c83561c448950860f36037c2287a25f5.dir
      size: 25194
      nfiles: 646
  pipeline_spacy_pos_wer@14:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_minds14
      --asr=wav2vec2
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 3817c96d1d91d2cf2d8ec7fe570f1472
      size: 1469
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__result
      md5: 5658da01ecdce39ed99156bbc7f2dc62.dir
      size: 3523907
      nfiles: 562
Marcin Wątroba's avatar
Marcin Wątroba committed
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__spacy_pos_alignment
      md5: 0d04963621be1dd6a1c81225734de652.dir
      size: 2724276
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__spacy_pos_metrics
      md5: 818882d685785a9d7d9b8d757c4c8e90.dir
      size: 6840
      nfiles: 562
  pipeline_spacy_pos_wer@2:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_common_voice
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 273f598ac14ea7b894189bf0d553a39a
      size: 1469
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_common_voice/gold_transcript
      md5: e77ce22b14cb32594ae9cfcd4d6403b3.dir
      size: 4093545
      nfiles: 8155
    - path: experiment_data/pipeline/pl_common_voice/techmo__result
      md5: 9030cf3640f2749d9c1b4439687bdc2f.dir
      size: 7761880
      nfiles: 8136
    outs:
    - path: experiment_data/pipeline/pl_common_voice/techmo__spacy_pos_alignment
      md5: 1d2f7fbcca280abdbfb91e83f70e9789.dir
      size: 18192387
      nfiles: 8136
    - path: experiment_data/pipeline/pl_common_voice/techmo__spacy_pos_metrics
      md5: 61c69fcd287051f4ab7d1ffcc68a9aca.dir
      size: 96845
      nfiles: 8136
  pipeline_spacy_pos_wer@16:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_minds14
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 3817c96d1d91d2cf2d8ec7fe570f1472
      size: 1469
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/techmo__result
      md5: 4c43636b4773f2bf9a2153ef3393a558.dir
      size: 1336305
      nfiles: 562
    outs:
    - path: experiment_data/pipeline/pl_minds14/techmo__spacy_pos_alignment
      md5: aebbf34f80eb8151d8cf4d1ed840757c.dir
      size: 2640387
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/techmo__spacy_pos_metrics
      md5: 7d555363b27e9c0d0ab7d0e3011c6d13.dir
      size: 6095
      nfiles: 562
  pipeline_spacy_pos_wer@6:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_google_fleurs
      --asr=google
    deps:
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 1475a345757c2c9d699c0d4bc6c194f6
      size: 1734
    - path: experiment_data/dataset/pl_google_fleurs
      md5: dfcb8cf40b4a1e1a62f9ada00468cca9.dir
      size: 236272072
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/gold_transcript
      md5: 607f551eca5dabcca0caf31c87bd2ac6.dir
      size: 975209
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/google__result
      md5: 6e0d7eb490eadd8dcc3c5452ba85932b.dir
      size: 1377134
      nfiles: 758
    outs:
    - path: experiment_data/pipeline/pl_google_fleurs/google__spacy_pos_alignment
      md5: 39ad38a46e1489b88629b8512ca09ea3.dir
      size: 3712618
      nfiles: 758
    - path: experiment_data/pipeline/pl_google_fleurs/google__spacy_pos_metrics
      md5: 56dddb48cea2022b91fd4323efd43a8b.dir
      size: 9213
      nfiles: 758
  pipeline_spacy_pos_wer@0:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_common_voice
      --asr=google
    deps:
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 3817c96d1d91d2cf2d8ec7fe570f1472
      size: 1469
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_common_voice/gold_transcript
      md5: e77ce22b14cb32594ae9cfcd4d6403b3.dir
      size: 4093545
      nfiles: 8155
    - path: experiment_data/pipeline/pl_common_voice/google__result
      md5: afb53476cc93ef4de3591908df41fd2a.dir
      size: 5854366
      nfiles: 8143
    outs:
    - path: experiment_data/pipeline/pl_common_voice/google__spacy_pos_alignment
      md5: d7f32c8741318563bdec3f35679cdc9a.dir
      size: 18316770
      nfiles: 8143
    - path: experiment_data/pipeline/pl_common_voice/google__spacy_pos_metrics
      md5: 117611317774e81fb482ba9c71ec806b.dir
      size: 97235
      nfiles: 8143
  pipeline_spacy_pos_wer@11:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_luna
      --asr=ajn
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 273f598ac14ea7b894189bf0d553a39a
      size: 1469
    - path: experiment_data/dataset/pl_luna
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/ajn__result
      md5: 653d65e186a7d05958ce3cbef219038c.dir
      size: 6159899
      nfiles: 494
    - path: experiment_data/pipeline/pl_luna/gold_transcript
      md5: 4c3e09acb7ffac0ef5b117a38515e3a9.dir
      size: 6706925
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 500
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/ajn__spacy_pos_alignment
      md5: f12f57b3229bbbd18fb6584d6891b5cc.dir
      size: 21936929
      nfiles: 494
    - path: experiment_data/pipeline/pl_luna/ajn__spacy_pos_metrics
      md5: 6c6bb673ea5f64c9d851878c9d8a7c09.dir
      size: 8444
      nfiles: 494
  pipeline_spacy_pos_wer@15:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_minds14
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 1475a345757c2c9d699c0d4bc6c194f6
      size: 1734
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/ajn__result
      md5: 6fd1b042a7cb6d6f200c2eb9a926b7f1.dir
      size: 974727
      nfiles: 559
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    outs:
    - path: experiment_data/pipeline/pl_minds14/ajn__spacy_pos_alignment
      md5: 101ee541a794af147e48dd460afc227f.dir
      size: 3178442
      nfiles: 559
    - path: experiment_data/pipeline/pl_minds14/ajn__spacy_pos_metrics
      md5: 014fbe751a4f357f78f073920890e06d.dir
      size: 7059
      nfiles: 559
  pipeline_spacy_pos_wer@12:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_minds14
      --asr=ajn
    deps:
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 3817c96d1d91d2cf2d8ec7fe570f1472
      size: 1469
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/ajn__result
      md5: 6fd1b042a7cb6d6f200c2eb9a926b7f1.dir
      size: 974727
      nfiles: 559
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    outs:
    - path: experiment_data/pipeline/pl_minds14/ajn__spacy_pos_alignment
      md5: 013fbb68289e1c35986bcaaa773c396c.dir
      size: 3178442
      nfiles: 559
    - path: experiment_data/pipeline/pl_minds14/ajn__spacy_pos_metrics
      md5: 014fbe751a4f357f78f073920890e06d.dir
      size: 7059
      nfiles: 559
  pipeline_spacy_pos_wer@17:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_minds14
      --asr=wav2vec2
    deps:
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 3817c96d1d91d2cf2d8ec7fe570f1472
      size: 1469
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__result
      md5: 5658da01ecdce39ed99156bbc7f2dc62.dir
      size: 3523907
      nfiles: 562
    outs:
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__spacy_pos_alignment
      md5: 0d04963621be1dd6a1c81225734de652.dir
      size: 2724276
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/wav2vec2__spacy_pos_metrics
      md5: 818882d685785a9d7d9b8d757c4c8e90.dir
      size: 6840
      nfiles: 562
  pipeline_spacy_pos_wer@1:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_common_voice
      --asr=wav2vec2
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 3817c96d1d91d2cf2d8ec7fe570f1472
      size: 1469
    - path: experiment_data/dataset/pl_common_voice
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_common_voice/gold_transcript
      md5: e77ce22b14cb32594ae9cfcd4d6403b3.dir
      size: 4093545
      nfiles: 8155
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__result
      md5: b0d0042d77d7adce37890ca63ad40091.dir
      size: 19014997
      nfiles: 8154
Marcin Wątroba's avatar
Marcin Wątroba committed
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__spacy_pos_alignment
      md5: caf518456afa1864c286cd5e15b9e563.dir
      size: 18349138
      nfiles: 8154
    - path: experiment_data/pipeline/pl_common_voice/wav2vec2__spacy_pos_metrics
      md5: 71381fa7fd6c0cdba00f25c17fd6be5e.dir
      size: 97426
      nfiles: 8154
  pipeline_spacy_pos_wer@7:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_luna
      --asr=google
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 3817c96d1d91d2cf2d8ec7fe570f1472
      size: 1469
    - path: experiment_data/dataset/pl_luna
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/gold_transcript
      md5: 4c3e09acb7ffac0ef5b117a38515e3a9.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 6706925
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/google__result
      md5: 8e4bf67df4dccd218d4d7c3de69688a4.dir
      size: 5346497
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 500
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/google__spacy_pos_alignment
      md5: 460edffd716b1f46fb863e5b2b0d949e.dir
      size: 19342263
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/google__spacy_pos_metrics
      md5: a65dd7d74319da06f4ebaca08cde30ce.dir
      size: 8659
Marcin Wątroba's avatar
Marcin Wątroba committed
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
  pipeline_spacy_pos_wer@10:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_luna
      --asr=wav2vec2
Marcin Wątroba's avatar
Marcin Wątroba committed
    deps:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 3817c96d1d91d2cf2d8ec7fe570f1472
      size: 1469
    - path: experiment_data/dataset/pl_luna
Marcin Wątroba's avatar
Marcin Wątroba committed
      md5: d342155b1871e881797cf7da09d5dc3c.dir
      size: 1578358645
      nfiles: 4500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/gold_transcript
      md5: 4c3e09acb7ffac0ef5b117a38515e3a9.dir
Marcin Wątroba's avatar
Marcin Wątroba committed
      size: 6706925
      nfiles: 500
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/wav2vec2__result
      md5: 9c63b061ac7763144bca121e163ee7aa.dir
      size: 20658485
      nfiles: 456
Marcin Wątroba's avatar
Marcin Wątroba committed
    outs:
Marcin Wątroba's avatar
Marcin Wątroba committed
    - path: experiment_data/pipeline/pl_luna/wav2vec2__spacy_pos_alignment
      md5: a791fae1ca5599b9422b94d4c6ce760a.dir
      size: 17967467
      nfiles: 456
    - path: experiment_data/pipeline/pl_luna/wav2vec2__spacy_pos_metrics
      md5: 7848ddff997fd231f3857ff30dfd7154.dir
      size: 7940
      nfiles: 456
  pipeline_spacy_pos_wer@13:
    cmd: PYTHONPATH=. python experiment/pipeline_process_spacy_pos_wer.py --dataset=pl_minds14
      --asr=techmo
    deps:
    - path: experiment/pipeline_process_spacy_pos_wer.py
      md5: 3817c96d1d91d2cf2d8ec7fe570f1472
      size: 1469
    - path: experiment_data/dataset/pl_minds14
      md5: d751713988987e9331980363e24189ce.dir
      size: 0
      nfiles: 0
    - path: experiment_data/pipeline/pl_minds14/gold_transcript
      md5: d2d48495000b3ea7ea6f4212ddb113a5.dir
      size: 689374
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/techmo__result
      md5: 4c43636b4773f2bf9a2153ef3393a558.dir
      size: 1336305
      nfiles: 562
    outs:
    - path: experiment_data/pipeline/pl_minds14/techmo__spacy_pos_alignment
      md5: aebbf34f80eb8151d8cf4d1ed840757c.dir
      size: 2640387
      nfiles: 562
    - path: experiment_data/pipeline/pl_minds14/techmo__spacy_pos_metrics
      md5: 7d555363b27e9c0d0ab7d0e3011c6d13.dir
      size: 6095
      nfiles: 562