ModelLink2/examples/mcore/mixtral
2024-11-25 01:23:41 +00:00
..
ckpt_convert_mixtral_hf2mcore.sh !1597 新增权重转换ut模板和mixtral用例,支持legacy和mcore互转 2024-09-10 07:40:15 +00:00
ckpt_convert_mixtral_mg2mg_lora.sh !1911 增加llama2、mixtral的lora权重转换脚本 2024-11-25 01:23:41 +00:00
data_convert_mixtral_instruction.sh !1817 整改两处公网地址 2024-10-29 11:05:59 +00:00
data_convert_mixtral_pairwise.sh !1858 dpo、simpo方案特性支持:支持vpp、dpp、ep、cp、断点续训等 2024-11-21 03:31:39 +00:00
data_convert_mixtral_pretrain.sh !1555 新增 Mixtral 8x22B 预训练、推理和评估 2024-09-02 03:43:11 +00:00
dpo_mixtral_8x7b_full_ptd.sh !1858 dpo、simpo方案特性支持:支持vpp、dpp、ep、cp、断点续训等 2024-11-21 03:31:39 +00:00
dpo_mixtral_8x7b_lora_ptd.sh !1858 dpo、simpo方案特性支持:支持vpp、dpp、ep、cp、断点续训等 2024-11-21 03:31:39 +00:00
evaluate_mixtral_8x7b_ptd.sh !1741 更新llama2-7b,13b,70b性能 2024-10-09 02:35:47 +00:00
evaluate_mixtral_8x22b_ptd.sh !1555 新增 Mixtral 8x22B 预训练、推理和评估 2024-09-02 03:43:11 +00:00
generate_mixtral_8x7b_ptd.sh !1741 更新llama2-7b,13b,70b性能 2024-10-09 02:35:47 +00:00
generate_mixtral_8x22b_ptd.sh !1555 新增 Mixtral 8x22B 预训练、推理和评估 2024-09-02 03:43:11 +00:00
pretrain_mixtral_8x7b_ptd.sh !1604 增加mixtral_8*7b推理评估 2024-09-04 01:05:21 +00:00
pretrain_mixtral_8x22b_32k_ptd_C.sh !1613 修复Mixtral预训练加载权重 2024-09-05 02:09:37 +00:00
pretrain_mixtral_8x22b_32k_ptd.sh !1613 修复Mixtral预训练加载权重 2024-09-05 02:09:37 +00:00
pretrain_mixtral_8x22b_64k_ptd_C.sh !1613 修复Mixtral预训练加载权重 2024-09-05 02:09:37 +00:00
tune_mixtral_8x7B_full_ptd.sh !1814 refactor trainer 2024-11-06 10:53:02 +00:00
tune_mixtral_8x7b_lora_ptd.sh !1814 refactor trainer 2024-11-06 10:53:02 +00:00