mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-11-13 06:11:09 +00:00
[zero] add ZeroTensorShardStrategy (#793)
This commit is contained in:
6
setup.py
6
setup.py
@@ -134,6 +134,12 @@ if build_cuda_ext:
|
||||
'nvcc': append_nvcc_threads(['-O3', '--use_fast_math'] + version_dependent_macros + extra_cuda_flags)
|
||||
})
|
||||
|
||||
ext_modules.append(
|
||||
cuda_ext_helper(name='colossal_zero_comm',
|
||||
sources=['zero_comm.cpp'],
|
||||
extra_cuda_flags=['-DUSE_C10D_NCCL'],
|
||||
extra_cxx_flags=['-DUSE_C10D_NCCL']))
|
||||
|
||||
ext_modules.append(
|
||||
cuda_ext_helper('colossal_C', [
|
||||
'colossal_C_frontend.cpp', 'multi_tensor_sgd_kernel.cu', 'multi_tensor_scale_kernel.cu',
|
||||
|
||||
Reference in New Issue
Block a user