From 2ac1bad229460cafda7d01e9a2f91e761e34c78a Mon Sep 17 00:00:00 2001
From: pwalkow <pwalkow@gpu-server.ws.clarin>
Date: Tue, 14 Mar 2023 18:04:58 +0100
Subject: [PATCH] Add dvc

---
 dvc.lock | 32 ++++++++++++++++----------------
 dvc.yaml |  4 ++--
 2 files changed, 18 insertions(+), 18 deletions(-)

diff --git a/dvc.lock b/dvc.lock
index e3a507e..18c0a65 100644
--- a/dvc.lock
+++ b/dvc.lock
@@ -88,12 +88,12 @@ stages:
       size: 1688836
       nfiles: 3
     - path: experiments/scripts/tag_dataset.py
-      md5: 8e8039b73b8ea3ce39287ed0a304af9b
-      size: 3750
+      md5: f73e2203fdb988a00d4e8363a349c617
+      size: 3932
     outs:
     - path: data/preprocessed/poleval/
-      md5: 854387459b193c5eba6db1273ca5ad23.dir
-      size: 2277282
+      md5: 9d067db65ba6a27db19effce45b01876.dir
+      size: 2541105
       nfiles: 3
   preprocess_dataset@enron_spam:
     cmd: PYTHONPATH=. python experiments/scripts/tag_dataset.py --dataset_name enron_spam
@@ -103,12 +103,12 @@ stages:
       size: 53096069
       nfiles: 3
     - path: experiments/scripts/tag_dataset.py
-      md5: 8e8039b73b8ea3ce39287ed0a304af9b
-      size: 3750
+      md5: f73e2203fdb988a00d4e8363a349c617
+      size: 3932
     outs:
     - path: data/preprocessed/enron_spam/
-      md5: b75efba1a62182dc8ac32acd1faf92ed.dir
-      size: 61709260
+      md5: 30c63efbc615347ddcb5f61e011113bd.dir
+      size: 65971374
       nfiles: 3
   preprocess_dataset@wiki_pl:
     cmd: PYTHONPATH=. python experiments/scripts/tag_dataset.py --dataset_name wiki_pl
@@ -118,12 +118,12 @@ stages:
       size: 29115538
       nfiles: 3
     - path: experiments/scripts/tag_dataset.py
-      md5: 8e8039b73b8ea3ce39287ed0a304af9b
-      size: 3750
+      md5: f73e2203fdb988a00d4e8363a349c617
+      size: 3932
     outs:
     - path: data/preprocessed/wiki_pl/
-      md5: 3e9b2e1e0542777e0a751d9d7f7f4241.dir
-      size: 55380570
+      md5: 0014b9bb52913cbc9a568d237ea2207b.dir
+      size: 65553079
       nfiles: 3
   classify@wiki_pl:
     cmd: PYTHONPATH=. python experiments/scripts/classify.py --dataset_name wiki_pl
@@ -153,12 +153,12 @@ stages:
       size: 23460358
       nfiles: 3
     - path: experiments/scripts/tag_dataset.py
-      md5: 8e8039b73b8ea3ce39287ed0a304af9b
-      size: 3750
+      md5: f73e2203fdb988a00d4e8363a349c617
+      size: 3932
     outs:
     - path: data/preprocessed/20_news/
-      md5: 1ed5ef2dabe4bc05f7377175ed11137b.dir
-      size: 46845669
+      md5: 20da0980e52df537e5b7ca5db0305879.dir
+      size: 58582060
       nfiles: 3
   classify@20_news:
     cmd: PYTHONPATH=. python experiments/scripts/classify.py --dataset_name 20_news
diff --git a/dvc.yaml b/dvc.yaml
index 5115a47..6862a88 100644
--- a/dvc.yaml
+++ b/dvc.yaml
@@ -80,8 +80,8 @@ stages:
   attack_basic:
     foreach:
       - enron_spam
-        #- 20_news
-        #- wiki_pl
+      - 20_news
+      - wiki_pl
     do:
       wdir: .
       cmd: >-
-- 
GitLab