hostfile
|
add SimPO
|
2024-06-24 02:12:20 +00:00 |
train_dpo.py
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |
train_dpo.sh
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |
train_kto.py
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |
train_kto.sh
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |
train_orpo.py
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |
train_orpo.sh
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |
train_rm.py
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |
train_rm.sh
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |
train_sft.py
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |
train_sft.sh
|
refactor evaluation
|
2024-07-22 05:57:39 +00:00 |