-
Notifications
You must be signed in to change notification settings - Fork 26
Expand file tree
/
Copy patheval_longmemeval.sh
More file actions
44 lines (42 loc) · 1.26 KB
/
eval_longmemeval.sh
File metadata and controls
44 lines (42 loc) · 1.26 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
#!/bin/bash
# Runs main.py with --eval-only on the longmemeval dataset.
#
# Replace every [YOUR_...] / YOUR_API_KEY_* placeholder below with a real
# value before running. The meaning of each flag is defined by main.py, which
# is not part of this script; the flags are passed through verbatim and in
# the order listed.

# Make only GPU index 0 visible to the Python process.
export CUDA_VISIBLE_DEVICES=0

# Arguments are kept in an array so that each one sits on its own line without
# backslash continuations, and so that an optional flag can be left commented
# out in place.
eval_args=(
  # --disable-flash-attn    (optional flag, currently not passed)

  # Cache suffix, run mode, worker counts and top-k settings.
  --memory-cache-suffix 'longmemeval_eval'
  --eval-only
  --inference-workers 4
  --inference-session-workers 1
  --action-top-k 5
  --mem-top-k-eval 20

  # Session mode and chunk sizes.
  --session-mode fixed-length
  --chunk-size 512
  --chunk-overlap 64

  # Checkpoint, dataset and model (placeholders: edit before use).
  --load-checkpoint '[YOUR_CHECKPOINT_PATH]'
  --dataset longmemeval
  --data-file '[YOUR_DATA_PATH]'
  --model '[YOUR_MODEL_NAME]'

  # API access (placeholders: edit before use). Two values follow --api-key.
  --api
  --api-base '[YOUR_API_BASE]'
  --api-key 'YOUR_API_KEY_1' 'YOUR_API_KEY_2'

  # Retriever, designer and remaining hyperparameters, passed as-is.
  --retriever contriever
  --designer-freq 1
  --inner-epochs 100
  --outer-epochs 10
  --batch-size 4
  --encode-batch-size 64
  --ppo-epochs 2
  --new-action-bias-steps 25
  --stage-reward-fraction 0.25
  --designer-reflection-cycles 3
  --mem-top-k 20
  --designer-max-changes 2
  --designer-failure-window-epochs 100
  --designer-failure-pool-size 2000
  --reward-metric llm_judge
  --designer-new-skill-hint
  --device cuda
  --enable-designer
  --skip-load-snapshot-manager

  # Run name and output locations.
  --wandb-run-name eval
  --save-dir ./checkpoints/longmemeval_with_designer
  --out-file ./results/longmemeval_with_designer.json
)

# Last command in the script, so the script's exit status is python's.
python main.py "${eval_args[@]}"