forked from hellohaptik/multi-task-NLP
-
Notifications
You must be signed in to change notification settings - Fork 0
/
transform_file.yml
69 lines (61 loc) · 1.35 KB
/
transform_file.yml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
# sample_transform1: pairs the `snips_intent_ner` transform with the three
# SNIPS split files listed below.
# NOTE(review): nesting restored on the assumption that every key down to
# `save_dir` belongs to this stanza - confirm against the consumer's schema.
sample_transform1:
  # Transform identified by name (presumably resolved by the consuming code).
  transform_func: snips_intent_ner
  # Input file names; assumed to be looked up inside `read_dir` - verify.
  read_file_names:
    - snips_train.txt
    - snips_dev.txt
    - snips_test.txt
  read_dir: snips_data
  # Output location for this stanza.
  save_dir: demo_transform
# sample_transform2: pairs the `coNLL_pos_ner` transform with the three
# coNLL split files listed below.
# NOTE(review): nesting restored on the assumption that every key down to
# `save_dir` belongs to this stanza - confirm against the consumer's schema.
sample_transform2:
  # Transform identified by name (presumably resolved by the consuming code).
  transform_func: coNLL_pos_ner
  # Input file names; assumed to be looked up inside `read_dir` - verify.
  read_file_names:
    - coNLL_train.txt
    - coNLL_testa.txt
    - coNLL_testb.txt
  read_dir: coNLL_data
  # Output location for this stanza.
  save_dir: demo_transform
# sample_transform3: pairs the `snli_entailment` transform with the three
# SNLI JSON-lines split files listed below.
# NOTE(review): nesting restored on the assumption that every key down to
# `save_dir` belongs to this stanza - confirm against the consumer's schema.
sample_transform3:
  # Transform identified by name (presumably resolved by the consuming code).
  transform_func: snli_entailment
  # Input file names; assumed to be looked up inside `read_dir` - verify.
  read_file_names:
    - snli_train.jsonl
    - snli_dev.jsonl
    - snli_test.jsonl
  read_dir: snli_data
  # Output location for this stanza.
  save_dir: demo_transform
# sample_transform4: pairs the `bio_ner` transform with the three coNLL split
# files listed below, passing extra options through `transform_params`.
# NOTE(review): only the four option keys are nested under `transform_params`;
# `read_file_names`, `read_dir` and `save_dir` are kept at stanza level because
# stanzas without `transform_params` carry them there - confirm against the
# consumer's schema.
sample_transform4:
  # Transform identified by name (presumably resolved by the consuming code).
  transform_func: bio_ner
  transform_params:
    save_prefix: sample
    # Integer column index of the tag; 0- vs 1-based is not visible here.
    tag_col: 1
    # Single space; double quotes keep the whitespace explicit.
    col_sep: " "
    # Double quotes are required so `\n` is read as a newline escape.
    sen_sep: "\n"
  # Input file names; assumed to be looked up inside `read_dir` - verify.
  read_file_names:
    - coNLL_train.txt
    - coNLL_testa.txt
    - coNLL_testb.txt
  read_dir: coNLL_data
  # Output location for this stanza.
  save_dir: demo_transform
# sample_transform5: pairs the `fragment` transform with the three
# `int_snips_*.tsv` files listed below, passing extra options through
# `transform_params`.
# NOTE(review): only the five option keys are nested under `transform_params`;
# `read_file_names`, `read_dir` and `save_dir` are kept at stanza level because
# stanzas without `transform_params` carry them there - confirm against the
# consumer's schema.
sample_transform5:
  # Transform identified by name (presumably resolved by the consuming code).
  transform_func: fragment
  transform_params:
    # Float fraction; presumably the share of input data to use - verify.
    data_frac: 0.2
    seq_len_right: 3
    seq_len_left: 2
    # Double quotes are required so `\t` is read as a tab escape.
    sep: "\t"
    # Integer column index of the query; 0- vs 1-based is not visible here.
    query_col: 2
  # Input file names; assumed to be looked up inside `read_dir` - verify.
  read_file_names:
    - int_snips_train.tsv
    - int_snips_dev.tsv
    - int_snips_test.tsv
  read_dir: data
  # Output location for this stanza.
  save_dir: demo_transform
# sample_transform6: pairs the `msmarco_query_type` transform with the three
# MS MARCO v2.1 JSON files listed below, passing one option through
# `transform_params`.
# NOTE(review): only `data_frac` is nested under `transform_params`;
# `read_file_names`, `read_dir` and `save_dir` are kept at stanza level because
# stanzas without `transform_params` carry them there - confirm against the
# consumer's schema.
sample_transform6:
  # Transform identified by name (presumably resolved by the consuming code).
  transform_func: msmarco_query_type
  transform_params:
    # Float fraction; presumably the share of input data to use - verify.
    data_frac: 0.2
  # Input file names; assumed to be looked up inside `read_dir` - verify.
  read_file_names:
    - train_v2.1.json
    - dev_v2.1.json
    - eval_v2.1_public.json
  read_dir: msmarco_qna_data
  # Output location for this stanza.
  save_dir: demo_transform