LLM_deepspeed.yaml 873 Bytes
Newer Older
chenzk's avatar
v1.0  
chenzk committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
# general
seed: 2020
# NOTE(review): presumably the logging level; confirm against the consumer.
state: INFO
use_text: true
reproducibility: true
# Relative path; what it is resolved against is not visible here.
checkpoint_dir: saved
show_progress: true

# wandb logging is switched off; the project name is kept alongside the toggle.
log_wandb: false
wandb_project: REC
# NOTE(review): units of the two limits below (items / tokens / characters)
# are not visible in this file; confirm before changing.
MAX_ITEM_LIST_LENGTH: 50
MAX_TEXT_LENGTH: 64

# dataset path
data_path: ../dataset/
# dataset name
dataset: Pixel200K

# Use absolute path; the value below is a placeholder to be replaced.
text_path: text_path
text_keys:
  - title
  - tag
  - description

# The trailing space inside the quotes is part of the value; keep it quoted.
item_prompt: 'Compress the following sentence into embedding: '
item_emb_token_n: 1

loss: nce

# training settings
epochs: 10
# NOTE(review): whether this is per device or global is not visible here.
train_batch_size: 8
optim_args:
  # Written with an explicit mantissa (1.0e-4 rather than 1e-4): YAML 1.1
  # resolvers such as PyYAML's default load the dot-less form as a string,
  # not a float. The numeric value is unchanged.
  learning_rate: 1.0e-4
  weight_decay: 0.01
scheduler_args:
  type: cosine
  # NOTE(review): presumably a fraction of total training steps; confirm.
  warmup: 0.1

# eval settings
eval_batch_size: 8
# Cutoffs and metric names; valid_metric below pairs one of each (NDCG at 200).
topk: [5, 10, 50, 200]
metrics: [Recall, NDCG]
valid_metric: NDCG@200
metric_decimal_place: 7
# NOTE(review): units of the two step counts below (epochs vs. evaluations)
# are not visible in this file; confirm against the trainer.
eval_step: 1
stopping_step: 5

# Distributed-training backend selection.
strategy: deepspeed
# NOTE(review): presumably bfloat16 mixed precision; confirm the accepted
# spellings against the trainer.
precision: bf16-mixed
# NOTE(review): presumably the DeepSpeed ZeRO stage; confirm against the trainer.
stage: 2