-
Notifications
You must be signed in to change notification settings - Fork 0
/
no-doc-id.yaml
54 lines (49 loc) · 1.16 KB
/
no-doc-id.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
## experiment
# NOTE(review): `name` reads "seq-training-url-last", yet this file also sets
# `sequential: false` and `url_location: no_url` - confirm the name is intended.
experiment:
  name: seq-training-url-last
  output_dir: outputs/experiments/paper
  # NOTE(review): absolute path that looks specific to one user/cluster;
  # override it when running anywhere else.
  cache_dir: /net/nfs.cirrascale/allennlp/muhammadk/cache
## data
data:
  text_data_path: sample-data/biocite-1k/text
  # Document-level augmentation. It is switched off here (`do: false`), so
  # `method` and `n_sample_per_doc` presumably have no effect - TODO confirm.
  augment:
    doc:
      do: false
      method: permute
      n_sample_per_doc: 2
  # NOTE(review): assumed to be a child of `data` (sibling of `augment`);
  # verify against the code that reads this config.
  finetune:
    number_non_attributable_negatives: 0
    neg_create_probability: 0.0
## model
model:
  # Identifier in `org/name` form - presumably a Hugging Face Hub id; verify.
  name: TinyLlama/TinyLlama-1.1B-intermediate-step-1431k-3T
# NOTE(review): `train` is assumed to be a top-level section rather than a
# child of `model` - verify against the code that reads this config.
train:
  url_location: no_url
  pretrain: true
  sequential: false
  # Of the `finetune_*` switches below, only `finetune_q_a` is enabled.
  finetune_q_url_a: false
  repeat_url_across_doc: false
  finetune_q_a_url: false
  finetune_q_a: true
  finetune_q_a_doc_url: false
  q_a_url_predict_url_only: false
  ## loss and attn config
  cross_doc_attention: false
  url_loss_factor: 1.0
  loss_type: mask
  config_template_path: conf/templates/train_config.yaml
  device_eval_batch_size: 40
  device_train_microbatch_size: 2
  eval_first: false
  weight_decay: 0.02
  # Keep the decimal point: YAML 1.1 loaders such as PyYAML only treat
  # exponent notation as a float when the mantissa contains a `.`.
  lr: 8.0e-5
  # Duration with a unit suffix - presumably "10 epochs"; verify with the trainer.
  max_duration: 10ep
  # Explicit null: this file configures no save folder.
  save_folder: null
# Evaluation switches.
# NOTE(review): `eval` is assumed to be a top-level section - verify against
# the code that reads this config.
eval:
  disable_qa_eval: false
  disable_all_eval: false
  disable_attribution_eval: false
  # The only `disable_*` flag set to true in this config.
  disable_non_attrib_eval: true
  icl_eval: false
  ppl_eval: false
  use_ais: false