-
Notifications
You must be signed in to change notification settings - Fork 0
/
dvc.lock
48 lines (48 loc) · 1.63 KB
/
dvc.lock
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
# Stage process_accounts: runs src/data/process_accounts.py on
# datasets/accounts.csv; the recorded output is
# datasets/accounts_processed.csv.
process_accounts:
  cmd: python src/data/process_accounts.py datasets/accounts.csv
  # Inputs recorded for this stage, each with its md5 value.
  deps:
  - path: datasets/accounts.csv
    md5: 770de02d407c75b594cf00e69a2f508f
  - path: src/data/process_accounts.py
    md5: 8b8e587cd1405e270bc82c295726f0ce
  # Output recorded for this stage.
  outs:
  - path: datasets/accounts_processed.csv
    md5: d81198e56c0c129cba75c81cba3a0cbe
# Stage download_tweets: runs src/data/download_tweets.py on
# datasets/accounts_processed.csv; the recorded output is the
# datasets/tweets/ directory.
download_tweets:
  cmd: python src/data/download_tweets.py datasets/accounts_processed.csv
  # Inputs recorded for this stage, each with its md5 value.
  deps:
  - path: datasets/accounts_processed.csv
    md5: d81198e56c0c129cba75c81cba3a0cbe
  - path: src/data/download_tweets.py
    md5: d5a087aab1dfa0246efc2f90ae1d6b8b
  outs:
  # NOTE(review): this path carries a trailing slash, while the embed_tweets
  # stage lists the same directory as `datasets/tweets` -- confirm both
  # spellings match dvc.yaml before normalising either one.
  - path: datasets/tweets/
    md5: 02e2ac87b0f8b014abe8f5466312ac15.dir
# Stage visualize_tweets_count: runs
# src/visualization/tweets_data_visualizer.py on
# datasets/accounts_processed.csv; the recorded outputs are two PNG files
# under reports/plots/.
visualize_tweets_count:
  cmd: python src/visualization/tweets_data_visualizer.py datasets/accounts_processed.csv
  # Inputs recorded for this stage, each with its md5 value.
  deps:
  - path: datasets/accounts_processed.csv
    md5: d81198e56c0c129cba75c81cba3a0cbe
  - path: src/visualization/tweets_data_visualizer.py
    md5: 4381b9e60bfaa4e6c6a3608715d39d51
  # Outputs recorded for this stage.
  outs:
  - path: reports/plots/all_replies_count_hist_full.png
    md5: e434b75fc5eb836532728a86022dad66
  - path: reports/plots/all_replies_count_less_than_500_hist.png
    md5: cf5647c72360c2091bd4d3ff67845cff
# Stage embed_tweets: runs src/data/embedding.py with datasets/tweets as
# input; the recorded outputs are the datasets/embeddings directory and
# datasets/embeddings.csv.
embed_tweets:
  # Folded scalar (>-): the lines below are joined with single spaces into
  # one command string with no trailing newline.
  cmd: >-
    python src/data/embedding.py -m herbert -a mean
    -i datasets/tweets -o datasets/embeddings.csv
    -p datasets/embeddings
  # NOTE(review): unlike the other stages in this file, the script itself
  # (src/data/embedding.py) is not listed as a dependency -- confirm against
  # dvc.yaml whether that is intentional.
  deps:
  - path: datasets/tweets
    md5: 02e2ac87b0f8b014abe8f5466312ac15.dir
    size: 820898667
    nfiles: 548
  # Outputs recorded for this stage.
  outs:
  - path: datasets/embeddings
    md5: c31e124bea83f16cbaae48e8f90ce035.dir
    size: 5099252722
    nfiles: 548
  - path: datasets/embeddings.csv
    md5: 71a6487850d8a63c698a9f2ff043ec08
    size: 6829270