.. |
ckpt_convert_mixtral_hf2mcore.sh
|
!1597 新增权重转换ut模板和mixtral用例,支持legacy和mcore互转
|
2024-09-10 07:40:15 +00:00 |
ckpt_convert_mixtral_mg2mg_lora.sh
|
!1911 增加llama2、mixtral的lora权重转换脚本
|
2024-11-25 01:23:41 +00:00 |
data_convert_mixtral_instruction.sh
|
!1817 整改两处公网地址
|
2024-10-29 11:05:59 +00:00 |
data_convert_mixtral_pairwise.sh
|
!1858 dpo、simpo方案特性支持:支持vpp、dpp、ep、cp、断点续训等
|
2024-11-21 03:31:39 +00:00 |
data_convert_mixtral_pretrain.sh
|
!1555 新增 Mixtral 8x22B 预训练、推理和评估
|
2024-09-02 03:43:11 +00:00 |
dpo_mixtral_8x7b_full_ptd.sh
|
!1858 dpo、simpo方案特性支持:支持vpp、dpp、ep、cp、断点续训等
|
2024-11-21 03:31:39 +00:00 |
dpo_mixtral_8x7b_lora_ptd.sh
|
!1858 dpo、simpo方案特性支持:支持vpp、dpp、ep、cp、断点续训等
|
2024-11-21 03:31:39 +00:00 |
evaluate_mixtral_8x7b_ptd.sh
|
!1741 更新llama2-7b,13b,70b性能
|
2024-10-09 02:35:47 +00:00 |
evaluate_mixtral_8x22b_ptd.sh
|
!1555 新增 Mixtral 8x22B 预训练、推理和评估
|
2024-09-02 03:43:11 +00:00 |
generate_mixtral_8x7b_ptd.sh
|
!1741 更新llama2-7b,13b,70b性能
|
2024-10-09 02:35:47 +00:00 |
generate_mixtral_8x22b_ptd.sh
|
!1555 新增 Mixtral 8x22B 预训练、推理和评估
|
2024-09-02 03:43:11 +00:00 |
pretrain_mixtral_8x7b_ptd.sh
|
!1604 增加mixtral_8*7b推理评估
|
2024-09-04 01:05:21 +00:00 |
pretrain_mixtral_8x22b_32k_ptd_C.sh
|
!1613 修复Mixtral预训练加载权重
|
2024-09-05 02:09:37 +00:00 |
pretrain_mixtral_8x22b_32k_ptd.sh
|
!1613 修复Mixtral预训练加载权重
|
2024-09-05 02:09:37 +00:00 |
pretrain_mixtral_8x22b_64k_ptd_C.sh
|
!1613 修复Mixtral预训练加载权重
|
2024-09-05 02:09:37 +00:00 |
tune_mixtral_8x7B_full_ptd.sh
|
!1814 refactor trainer
|
2024-11-06 10:53:02 +00:00 |
tune_mixtral_8x7b_lora_ptd.sh
|
!1814 refactor trainer
|
2024-11-06 10:53:02 +00:00 |