Skip to content
Snippets Groups Projects
dvc.lock 3.6 KiB
Newer Older
MGniew's avatar
MGniew committed
schema: '2.0'
stages:
  download_dataset@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/download_dataset.py --dataset_name
      enron_spam --output_dir data/datasets/enron_spam
    deps:
    - path: experiments/scripts/download_dataset.py
MGniew's avatar
MGniew committed
      md5: 9eb915fd5b9216965db519f686408a51
      size: 887
MGniew's avatar
MGniew committed
    outs:
    - path: data/datasets/enron_spam/
MGniew's avatar
MGniew committed
      md5: 66d44efedf37990b1989c81bbee085e0.dir
MGniew's avatar
MGniew committed
      size: 53096069
      nfiles: 3
  get_model@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/get_model.py --dataset_name enron_spam
      --output_dir data/models/enron_spam
    deps:
pwalkow's avatar
pwalkow committed
    - path: data/preprocessed/enron_spam
      md5: b75efba1a62182dc8ac32acd1faf92ed.dir
      size: 61709260
MGniew's avatar
MGniew committed
      nfiles: 3
MGniew's avatar
MGniew committed
    - path: experiments/scripts/get_model.py
      md5: 5050f51b4019bba97af47971f6c7cab4
      size: 747
    outs:
    - path: data/models/enron_spam/
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
  classify@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/classify.py --dataset_name enron_spam
      --output_dir data/classification/enron_spam
    deps:
MGniew's avatar
MGniew committed
    - path: data/models/enron_spam/
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
pwalkow's avatar
pwalkow committed
    - path: data/preprocessed/enron_spam/
      md5: b75efba1a62182dc8ac32acd1faf92ed.dir
      size: 61709260
      nfiles: 3
MGniew's avatar
MGniew committed
    - path: experiments/scripts/classify.py
pwalkow's avatar
pwalkow committed
      md5: ba9284c90847fbbd0f2a6cca414d9636
      size: 1106
MGniew's avatar
MGniew committed
    outs:
    - path: data/classification/enron_spam
pwalkow's avatar
pwalkow committed
      md5: 0450c0b672bc4a5db3cc7be2dac786bd.dir
      size: 10674882
MGniew's avatar
MGniew committed
      nfiles: 2
MGniew's avatar
MGniew committed
  explain@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/explain.py --dataset_name enron_spam
      --output_dir data/explanations/enron_spam
    deps:
MGniew's avatar
MGniew committed
    - path: data/datasets/enron_spam
MGniew's avatar
MGniew committed
      md5: 66d44efedf37990b1989c81bbee085e0.dir
MGniew's avatar
MGniew committed
      size: 53096069
      nfiles: 3
    - path: data/models/enron_spam
      md5: 3e16b22f59532c66beeadea958e0579a.dir
      size: 18505614
      nfiles: 6
MGniew's avatar
MGniew committed
    - path: experiments/scripts/explain.py
      md5: c85cbb774f2682ee39948e701fa0b0ca
      size: 1445
    outs:
    - path: data/explanations/enron_spam/
MGniew's avatar
MGniew committed
      md5: 376bd1619c08b4989564788e74de8e06.dir
      size: 7870394
MGniew's avatar
MGniew committed
      nfiles: 1
pwalkow's avatar
pwalkow committed
  download_dataset@poleval:
    cmd: PYTHONPATH=. python experiments/scripts/download_dataset.py --dataset_name
      poleval --output_dir data/datasets/poleval
    deps:
    - path: experiments/scripts/download_dataset.py
      md5: 9eb915fd5b9216965db519f686408a51
      size: 887
    outs:
    - path: data/datasets/poleval/
      md5: 826f974f794e24efcb5aedb054d1fd55.dir
      size: 1688836
      nfiles: 3
  preprocess_dataset@poleval:
    cmd: PYTHONPATH=. python experiments/scripts/tag_dataset.py --dataset_name poleval
    deps:
    - path: data/datasets/poleval/
      md5: 826f974f794e24efcb5aedb054d1fd55.dir
      size: 1688836
      nfiles: 3
    - path: experiments/scripts/tag_dataset.py
pwalkow's avatar
pwalkow committed
      md5: 2c4e097b3a278c12d19858f988232b44
      size: 3435
pwalkow's avatar
pwalkow committed
    outs:
    - path: data/preprocessed/poleval/
pwalkow's avatar
pwalkow committed
      md5: 854387459b193c5eba6db1273ca5ad23.dir
      size: 2277282
      nfiles: 3
pwalkow's avatar
pwalkow committed
  preprocess_dataset@enron_spam:
    cmd: PYTHONPATH=. python experiments/scripts/tag_dataset.py --dataset_name enron_spam
    deps:
    - path: data/datasets/enron_spam/
      md5: 66d44efedf37990b1989c81bbee085e0.dir
      size: 53096069
      nfiles: 3
    - path: experiments/scripts/tag_dataset.py
pwalkow's avatar
pwalkow committed
      md5: 2c4e097b3a278c12d19858f988232b44
      size: 3435
pwalkow's avatar
pwalkow committed
    outs:
    - path: data/preprocessed/enron_spam/
pwalkow's avatar
pwalkow committed
      md5: b75efba1a62182dc8ac32acd1faf92ed.dir
      size: 61709260
      nfiles: 3