deepseek_v2


引用自:https://zhuanlan.zhihu.com/p/1890082781461207006
MoE 的三种实现(DeepEPMoE、EPMoE、FusedMoE),根据服务器参数选择:
def get_moe_impl_class():
    """Pick the MoE layer class that matches the enabled server flags.

    Flags are read from ``global_server_args_dict`` and checked in strict
    priority order; the first truthy one decides the result:

    1. ``enable_deepep_moe``     -> ``DeepEPMoE``
    2. ``enable_flashinfer_moe`` -> ``FusedMoE``
    3. ``enable_ep_moe``         -> ``EPMoE``

    When none of the flags is set, ``FusedMoE`` is returned as the default.

    Returns:
        The selected MoE implementation class (the class itself, not an
        instance).
    """
    server_flags = global_server_args_dict

    if server_flags["enable_deepep_moe"]:
        impl_cls = DeepEPMoE
    elif server_flags["enable_flashinfer_moe"]:
        # This test has to precede the EPMoE one: FusedMoE also supports
        # enable_ep_moe, so both flags may be set at the same time.
        impl_cls = FusedMoE
    elif server_flags["enable_ep_moe"]:
        impl_cls = EPMoE
    else:
        impl_cls = FusedMoE

    return impl_cls