-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathveld_step_4_train_glove.yaml
48 lines (44 loc) · 1.46 KB
/
veld_step_4_train_glove.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
x-veld:
chain:
description: "Trains a glove model on the bible and exports its vectors as a dict serialized
into a pkl file. The training data is rather small and the hyperparameteres are simplistic,
in order to demonstrate the reproducibility of this chain rather than claiming any deeper
insight into the data's words context."
topic:
- "ETL"
- "NLP"
- "Machine Learning"
- "Word Embeddings"
- "Bible Studies"
services:
veld_step_4_train_glove:
extends:
file: ./code/veld_code__glove/veld_train.yaml
service: veld_train
volumes:
- ./data/training_data/:/veld/input/
- ./data/models/glove/:/veld/output/
environment:
in_corpus_file: "bible_processed.txt"
out_vocab_file: "m1_vocab.txt"
out_cooccurrence_file: "m1_cooccurrence.bin"
out_cooccurrence_shuf_file: "m1_cooccurrence_shuf.bin"
out_vector_file: "m1_vector"
model_id: "m1"
model_description: "simple bible glove model"
vector_size: 200
max_iter: 50
window_size: 10
veld_step_4_export_glove:
extends:
file: ./code/veld_code__glove/veld_export.yaml
service: veld_export
volumes:
- ./data/models/glove/:/veld/input/
- ./data/vectors/glove/:/veld/output/
environment:
in_vector_file: "m1_vector.txt"
out_vector_file: "m1.pkl"
depends_on:
veld_step_4_train_glove:
condition: service_completed_successfully