summaryrefslogtreecommitdiff
path: root/configs/review_user.yaml
blob: d2423ee140e447e205c854f89c2c20d90ba22b36 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
# Configuration for the `review` task in the `user` setting.
# String values are quoted explicitly so no loader re-types them.
task: 'review'
setting: 'user'
dataset_config: 'product_review_user'
model_name: 'Qwen/Qwen2.5-1.5B-Instruct'
# NOTE(review): pinned to the second CUDA device; presumably needs
# changing on single-GPU hosts -- confirm with the consuming script.
device: 'cuda:1'

# CVH hyperparameters
# NOTE(review): the meaning of d / alpha / beta / lam is defined by the
# consuming code, which is not visible from this file -- confirm there.
d: 64
alpha: 0.1
beta: 0.05
lam: 0.0001
lr: 0.05
adapt_steps: 30
max_grad_norm: 5.0
basis_seed: 42

# Support set
K: 4

# Generation
# NOTE(review): temperature 0.0 presumably selects greedy decoding, in
# which case top_p may be unused -- TODO confirm against the generator.
max_new_tokens: 512
temperature: 0.0
top_p: 0.9

# Evaluation
# num_eval: -1 means all
num_eval: -1
batch_size: 1

# Blended generation
blend_gamma: 0.5
min_new_tokens: 128