schema: '2.0'
stages:
  download_dataset@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/download_dataset.py --dataset_name
      enron_spam --output_dir data/datasets/enron_spam
    deps:
    - path: experiments/scripts/download_dataset.py
      md5: 9eb915fd5b9216965db519f686408a51
      size: 887
    outs:
    - path: data/datasets/enron_spam/
      md5: 66d44efedf37990b1989c81bbee085e0.dir
      size: 53096069
      nfiles: 3
  get_model@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/get_model.py --dataset_name enron_spam
      --output_dir data/models/enron_spam
    deps:
    - path: data/preprocessed/enron_spam
      md5: 30c63efbc615347ddcb5f61e011113bd.dir
      size: 65971374
      nfiles: 3
    - path: experiments/scripts/get_model.py
      md5: 5050f51b4019bba97af47971f6c7cab4
      size: 747
    outs:
    - path: data/models/enron_spam/
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
  classify@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/classify.py --dataset_name enron_spam
      --output_dir data/classification/enron_spam
    deps:
    - path: data/models/enron_spam/
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
    - path: data/preprocessed/enron_spam/
      md5: 30c63efbc615347ddcb5f61e011113bd.dir
      size: 65971374
      nfiles: 3
    - path: experiments/scripts/classify.py
      md5: 6fc1a6a0a11ba6cd99a8b6625a96d9f5
      size: 1181
    outs:
    - path: data/classification/enron_spam
      md5: 5de1a2fcbae0de94f5fbfd2bb747d919.dir
      size: 14585920
      nfiles: 2
  explain@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/explain.py --dataset_name enron_spam
      --output_dir data/explanations/enron_spam
    deps:
    - path: data/models/enron_spam
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
    - path: data/preprocessed/enron_spam
      md5: b75efba1a62182dc8ac32acd1faf92ed.dir
      size: 61709260
      nfiles: 3
    - path: experiments/scripts/explain.py
      md5: afc02ef263a59c911098dea969faa932
      size: 3234
    outs:
    - path: data/explanations/enron_spam/
      md5: 70c3f3d04e0b73fd56eecfda04914bd4.dir
      size: 13589794
      nfiles: 403
  download_dataset@poleval:
    cmd: PYTHONPATH=. python experiments/scripts/download_dataset.py --dataset_name
      poleval --output_dir data/datasets/poleval
    deps:
    - path: experiments/scripts/download_dataset.py
      md5: 9eb915fd5b9216965db519f686408a51
      size: 887
    outs:
    - path: data/datasets/poleval/
      md5: 826f974f794e24efcb5aedb054d1fd55.dir
      size: 1688836
      nfiles: 3
  preprocess_dataset@poleval:
    cmd: PYTHONPATH=. python experiments/scripts/tag_dataset.py --dataset_name poleval
    deps:
    - path: data/datasets/poleval/
      md5: 826f974f794e24efcb5aedb054d1fd55.dir
      size: 1688836
      nfiles: 3
    - path: experiments/scripts/tag_dataset.py
      md5: f73e2203fdb988a00d4e8363a349c617
      size: 3932
    outs:
    - path: data/preprocessed/poleval/
      md5: 9d067db65ba6a27db19effce45b01876.dir
      size: 2541105
      nfiles: 3
  preprocess_dataset@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/tag_dataset.py --dataset_name enron_spam
    deps:
    - path: data/datasets/enron_spam/
      md5: 66d44efedf37990b1989c81bbee085e0.dir
      size: 53096069
      nfiles: 3
    - path: experiments/scripts/tag_dataset.py
      md5: f73e2203fdb988a00d4e8363a349c617
      size: 3932
    outs:
    - path: data/preprocessed/enron_spam/
      md5: 30c63efbc615347ddcb5f61e011113bd.dir
      size: 65971374
      nfiles: 3
  preprocess_dataset@wiki_pl:
    cmd: PYTHONPATH=. python experiments/scripts/tag_dataset.py --dataset_name wiki_pl
    deps:
    - path: data/datasets/wiki_pl/
      md5: abcbccb3e352ed623cace1b95078bd63.dir
      size: 29115538
      nfiles: 3
    - path: experiments/scripts/tag_dataset.py
      md5: f73e2203fdb988a00d4e8363a349c617
      size: 3932
    outs:
    - path: data/preprocessed/wiki_pl/
      md5: 0014b9bb52913cbc9a568d237ea2207b.dir
      size: 65553079
      nfiles: 3
  classify@wiki_pl:
    cmd: PYTHONPATH=. python experiments/scripts/classify.py --dataset_name wiki_pl
      --output_dir data/classification/wiki_pl
    deps:
    - path: data/models/wiki_pl/
      md5: fd453042628fb09c080ef05d34a32cce.dir
      size: 501711136
      nfiles: 7
    - path: data/preprocessed/wiki_pl/
      md5: 0014b9bb52913cbc9a568d237ea2207b.dir
      size: 65553079
      nfiles: 3
    - path: experiments/scripts/classify.py
      md5: 6fc1a6a0a11ba6cd99a8b6625a96d9f5
      size: 1181
    outs:
    - path: data/classification/wiki_pl
      md5: 88c3cea96b2cb3ddda1a82037bf6130a.dir
      size: 44196727
      nfiles: 2
  preprocess_dataset@20_news:
    cmd: PYTHONPATH=. python experiments/scripts/tag_dataset.py --dataset_name 20_news
    deps:
    - path: data/datasets/20_news/
      md5: 999207f1c2c123c9943397b47f2c3b3a.dir
      size: 23460358
      nfiles: 3
    - path: experiments/scripts/tag_dataset.py
      md5: f73e2203fdb988a00d4e8363a349c617
      size: 3932
    outs:
    - path: data/preprocessed/20_news/
      md5: 20da0980e52df537e5b7ca5db0305879.dir
      size: 58582060
      nfiles: 3
  classify@20_news:
    cmd: PYTHONPATH=. python experiments/scripts/classify.py --dataset_name 20_news
      --output_dir data/classification/20_news
    deps:
    - path: data/models/20_news/
      md5: 43d68a67ecb8149bd6bf50db9767cb64.dir
      size: 439008808
      nfiles: 6
    - path: data/preprocessed/20_news/
      md5: 20da0980e52df537e5b7ca5db0305879.dir
      size: 58582060
      nfiles: 3
    - path: experiments/scripts/classify.py
      md5: 6fc1a6a0a11ba6cd99a8b6625a96d9f5
      size: 1181
    outs:
    - path: data/classification/20_news
      md5: b73611443c4189af91b827c083f37e0b.dir
      size: 42897496
      nfiles: 2
  attack_basic@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/attack.py --dataset_name enron_spam
    deps:
    - path: data/models/enron_spam
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
    - path: data/preprocessed/enron_spam
      md5: b75efba1a62182dc8ac32acd1faf92ed.dir
      size: 61709260
      nfiles: 3
    - path: experiments/scripts/attack.py
      md5: 4a2870b5a21b20b0046be0350c55d495
      size: 4714
    outs:
    - path: data/results/attack_basic/enron_spam/
      md5: fc35de09ce5e2aa7043325b2819c0aa0.dir
      size: 4869
      nfiles: 1
  explain@wiki_pl:
    cmd: PYTHONPATH=. python experiments/scripts/explain.py --dataset_name wiki_pl
      --output_dir data/explanations/wiki_pl
    deps:
    - path: data/models/wiki_pl
      md5: fd453042628fb09c080ef05d34a32cce.dir
      size: 501711136
      nfiles: 7
    - path: data/preprocessed/wiki_pl
      md5: 3e9b2e1e0542777e0a751d9d7f7f4241.dir
      size: 55380570
      nfiles: 3
    - path: experiments/scripts/explain.py
      md5: afc02ef263a59c911098dea969faa932
      size: 3234
    outs:
    - path: data/explanations/wiki_pl/
      md5: 5a3b9b069024456412078143e3af15d7.dir
      size: 331450794
      nfiles: 10065
  explain@20_news:
    cmd: PYTHONPATH=. python experiments/scripts/explain.py --dataset_name 20_news
      --output_dir data/explanations/20_news
    deps:
    - path: data/models/20_news
      md5: 43d68a67ecb8149bd6bf50db9767cb64.dir
      size: 439008808
      nfiles: 6
    - path: data/preprocessed/20_news
      md5: 1ed5ef2dabe4bc05f7377175ed11137b.dir
      size: 46845669
      nfiles: 3
    - path: experiments/scripts/explain.py
      md5: afc02ef263a59c911098dea969faa932
      size: 3234
    outs:
    - path: data/explanations/20_news/
      md5: c8ba90f9757a4e3cc4843d3791ef2446.dir
      size: 232912969
      nfiles: 14041
  attack_basic@wiki_pl:
    cmd: PYTHONPATH=. python experiments/scripts/attack.py --dataset_name wiki_pl
      --attack_type attack_basic
    deps:
    - path: data/models/wiki_pl
      md5: fd453042628fb09c080ef05d34a32cce.dir
      size: 501711136
      nfiles: 7
    - path: data/preprocessed/wiki_pl
      md5: 0014b9bb52913cbc9a568d237ea2207b.dir
      size: 65553079
      nfiles: 3
    - path: experiments/scripts/attack.py
      md5: 702997933e5af85d09d8286a14e2cc05
      size: 2486
    outs:
    - path: data/results/attack_basic/wiki_pl/
      md5: f118a41e391b5f713f77611140f2f2cc.dir
      size: 1
      nfiles: 1
  attack_textfooler@enron_spam:
    cmd: 'PYTHONPATH=. python experiments/scripts/attack.py --dataset_name enron_spam
      --attack_type attack_textfooler   '
    deps:
    - path: data/models/enron_spam
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
    - path: data/preprocessed/enron_spam
      md5: 30c63efbc615347ddcb5f61e011113bd.dir
      size: 65971374
      nfiles: 3
    - path: experiments/scripts/attack.py
      md5: b9d9a4d9fcba1cb4dfbb554ecc3e26fb
      size: 10083
    outs:
    - path: data/results/attack_textfooler/enron_spam/
      md5: 10ecd4c940e8df1058465048ffbe78d4.dir
      size: 3291044
      nfiles: 2
  attack_textfooler@20_news:
    cmd: 'PYTHONPATH=. python experiments/scripts/attack.py --dataset_name 20_news
      --attack_type attack_textfooler   '
    deps:
    - path: data/models/20_news
      md5: 43d68a67ecb8149bd6bf50db9767cb64.dir
      size: 439008808
      nfiles: 6
    - path: data/preprocessed/20_news
      md5: 20da0980e52df537e5b7ca5db0305879.dir
      size: 58582060
      nfiles: 3
    - path: experiments/scripts/attack.py
      md5: 4fe9c6210ce0f3be66b54c2565ad2daa
      size: 10132
    outs:
    - path: data/results/attack_textfooler/20_news/
      md5: 007aba16e343ca283180c7bc7b9a0190.dir
      size: 93666157
      nfiles: 2
  attack_textfooler@wiki_pl:
    cmd: 'PYTHONPATH=. python experiments/scripts/attack.py --dataset_name wiki_pl
      --attack_type attack_textfooler   '
    deps:
    - path: data/classification/wiki_pl
      md5: 88c3cea96b2cb3ddda1a82037bf6130a.dir
      size: 44196727
      nfiles: 2
    - path: data/models/wiki_pl
      md5: fd453042628fb09c080ef05d34a32cce.dir
      size: 501711136
      nfiles: 7
    - path: experiments/scripts/attack.py
      md5: 2977363ba8806c393498f98d5733c013
      size: 11497
    outs:
    - path: data/results/attack_textfooler/wiki_pl/
      md5: eccc12b9a5ae383ea02067cd1955753e.dir
      size: 20293404
      nfiles: 2
  attack_textfooler_discard@wiki_pl:
    cmd: PYTHONPATH=. python experiments/scripts/attack.py --dataset_name wiki_pl
      --attack_type attack_textfooler_discard
    deps:
    - path: data/classification/wiki_pl
      md5: 88c3cea96b2cb3ddda1a82037bf6130a.dir
      size: 44196727
      nfiles: 2
    - path: data/models/wiki_pl
      md5: fd453042628fb09c080ef05d34a32cce.dir
      size: 501711136
      nfiles: 7
    - path: experiments/scripts/attack.py
      md5: 2b9ddc1ff1f56855ff667171ba04ed78
      size: 11606
    outs:
    - path: data/results/attack_textfooler_discard/wiki_pl/
      md5: e41122c3cdf76ad1b163aba49acce0f0.dir
      size: 14396685
      nfiles: 2
  attack_textfooler_discard@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/attack.py --dataset_name enron_spam
      --attack_type attack_textfooler_discard
    deps:
    - path: data/classification/enron_spam
      md5: 5de1a2fcbae0de94f5fbfd2bb747d919.dir
      size: 14585920
      nfiles: 2
    - path: data/models/enron_spam
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
    - path: experiments/scripts/attack.py
      md5: 2b9ddc1ff1f56855ff667171ba04ed78
      size: 11606
    outs:
    - path: data/results/attack_textfooler_discard/enron_spam/
      md5: 8a78484bd77916f82021a72338342a44.dir
      size: 2816160
      nfiles: 2
  attack_textfooler_discard@20_news:
    cmd: PYTHONPATH=. python experiments/scripts/attack.py --dataset_name 20_news
      --attack_type attack_textfooler_discard
    deps:
    - path: data/classification/20_news
      md5: b73611443c4189af91b827c083f37e0b.dir
      size: 42897496
      nfiles: 2
    - path: data/models/20_news
      md5: 43d68a67ecb8149bd6bf50db9767cb64.dir
      size: 439008808
      nfiles: 6
    - path: experiments/scripts/attack.py
      md5: 9e913b341cb0993625a41c401d64a30b
      size: 12017
    outs:
    - path: data/results/attack_textfooler_discard/20_news/
      md5: 82d89b00a710e9de0a2157357fed5894.dir
      size: 24977923
      nfiles: 2
  attack_xai@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/attack.py --dataset_name enron_spam
      --attack_type attack_xai
    deps:
    - path: data/classification/enron_spam
      md5: 5de1a2fcbae0de94f5fbfd2bb747d919.dir
      size: 14585920
      nfiles: 2
    - path: data/models/enron_spam
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
    - path: experiments/scripts/attack.py
      md5: 87f54ee4e2a08f1259d9d8b2d01fe1b9
      size: 12061
    outs:
    - path: data/results/attack_xai/enron_spam/
      md5: ad19831866da140de113e64862da0bce.dir
      size: 2860109
      nfiles: 2
  attack_xai@20_news:
    cmd: PYTHONPATH=. python experiments/scripts/attack.py --dataset_name 20_news
      --attack_type attack_xai
    deps:
    - path: data/classification/20_news
      md5: b73611443c4189af91b827c083f37e0b.dir
      size: 42897496
      nfiles: 2
    - path: data/models/20_news
      md5: 43d68a67ecb8149bd6bf50db9767cb64.dir
      size: 439008808
      nfiles: 6
    - path: experiments/scripts/attack.py
      md5: 87f54ee4e2a08f1259d9d8b2d01fe1b9
      size: 12061
    outs:
    - path: data/results/attack_xai/20_news/
      md5: af00c730d4d73a0a8e2a047882c0d9aa.dir
      size: 8739816
      nfiles: 2