LICENSE
MANIFEST.in
README.md
build.txt
setup.cfg
setup.py
version.txt
accelerator/__init__.py
accelerator/abstract_accelerator.py
accelerator/cuda_accelerator.py
accelerator/real_accelerator.py
benchmarks/__init__.py
benchmarks/communication/__init__.py
benchmarks/communication/all_gather.py
benchmarks/communication/all_reduce.py
benchmarks/communication/all_to_all.py
benchmarks/communication/broadcast.py
benchmarks/communication/constants.py
benchmarks/communication/pt2pt.py
benchmarks/communication/run_all.py
benchmarks/communication/utils.py
benchmarks/inference/bert-bench.py
benchmarks/inference/collect_results.py
benchmarks/inference/gpt-bench.py
bin/deepspeed
bin/deepspeed.pt
bin/ds
bin/ds_bench
bin/ds_elastic
bin/ds_report
bin/ds_ssh
bin/dsr
csrc/adagrad/cpu_adagrad.cpp
csrc/adam/cpu_adam.cpp
csrc/adam/fused_adam_frontend.cpp
csrc/adam/multi_tensor_adam.cu
csrc/adam/multi_tensor_apply.cuh
csrc/aio/common/deepspeed_aio_common.cpp
csrc/aio/common/deepspeed_aio_common.h
csrc/aio/common/deepspeed_aio_types.cpp
csrc/aio/common/deepspeed_aio_types.h
csrc/aio/common/deepspeed_aio_utils.cpp
csrc/aio/common/deepspeed_aio_utils.h
csrc/aio/py_lib/deepspeed_aio_thread.cpp
csrc/aio/py_lib/deepspeed_aio_thread.h
csrc/aio/py_lib/deepspeed_pin_tensor.cpp
csrc/aio/py_lib/deepspeed_pin_tensor.h
csrc/aio/py_lib/deepspeed_py_aio.cpp
csrc/aio/py_lib/deepspeed_py_aio.h
csrc/aio/py_lib/deepspeed_py_aio_handle.cpp
csrc/aio/py_lib/deepspeed_py_aio_handle.h
csrc/aio/py_lib/deepspeed_py_copy.cpp
csrc/aio/py_lib/deepspeed_py_copy.h
csrc/aio/py_lib/py_ds_aio.cpp
csrc/common/custom_cuda_kernel.cu
csrc/includes/StopWatch.h
csrc/includes/Timer.h
csrc/includes/compat.h
csrc/includes/context.h
csrc/includes/conversion_utils.h
csrc/includes/cpu_adagrad.h
csrc/includes/cpu_adam.h
csrc/includes/cublas_wrappers.h
csrc/includes/custom_cuda_layers.h
csrc/includes/dequantization_utils.h
csrc/includes/dropout.h
csrc/includes/ds_kernel_utils.h
csrc/includes/ds_transformer_cuda.h
csrc/includes/feed_forward.h
csrc/includes/gelu.h
csrc/includes/gemm_test.h
csrc/includes/general_kernels.h
csrc/includes/memory_access_utils.h
csrc/includes/normalize_layer.h
csrc/includes/quantization.h
csrc/includes/quantization_utils.h
csrc/includes/quantizer.h
csrc/includes/reduction_utils.h
csrc/includes/simd.h
csrc/includes/softmax.h
csrc/includes/strided_batch_gemm.h
csrc/includes/type_shim.h
csrc/lamb/fused_lamb_cuda.cpp
csrc/lamb/fused_lamb_cuda_kernel.cu
csrc/quantization/dequantize.cu
csrc/quantization/fake_quantizer.cu
csrc/quantization/pt_binding.cpp
csrc/quantization/quantize.cu
csrc/random_ltd/gather_scatter.cu
csrc/random_ltd/pt_binding.cpp
csrc/random_ltd/slice_attn_masks.cu
csrc/random_ltd/token_sort.cu
csrc/sparse_attention/utils.cpp
csrc/spatial/csrc/opt_bias_add.cu
csrc/spatial/csrc/pt_binding.cpp
csrc/spatial/includes/spatial_cuda_layers.h
csrc/transformer/cublas_wrappers.cu
csrc/transformer/dropout_kernels.cu
csrc/transformer/ds_transformer_cuda.cpp
csrc/transformer/gelu_kernels.cu
csrc/transformer/general_kernels.cu
csrc/transformer/normalize_kernels.cu
csrc/transformer/softmax_kernels.cu
csrc/transformer/transform_kernels.cu
csrc/transformer/inference/csrc/apply_rotary_pos_emb.cu
csrc/transformer/inference/csrc/dequantize.cu
csrc/transformer/inference/csrc/gelu.cu
csrc/transformer/inference/csrc/layer_norm.cu
csrc/transformer/inference/csrc/pt_binding.cpp
csrc/transformer/inference/csrc/relu.cu
csrc/transformer/inference/csrc/softmax.cu
csrc/transformer/inference/csrc/transform.cu
csrc/transformer/inference/includes/inference_context.h
csrc/transformer/inference/includes/inference_cublas_wrappers.h
csrc/transformer/inference/includes/inference_cuda_layers.h
csrc/utils/flatten_unflatten.cpp
deepspeed/__init__.py
deepspeed/constants.py
deepspeed/env_report.py
deepspeed/git_version_info.py
deepspeed/git_version_info_installed.py
deepspeed.egg-info/PKG-INFO
deepspeed.egg-info/SOURCES.txt
deepspeed.egg-info/dependency_links.txt
deepspeed.egg-info/entry_points.txt
deepspeed.egg-info/requires.txt
deepspeed.egg-info/top_level.txt
deepspeed/accelerator/__init__.py
deepspeed/accelerator/abstract_accelerator.py
deepspeed/accelerator/cuda_accelerator.py
deepspeed/accelerator/real_accelerator.py
deepspeed/autotuning/__init__.py
deepspeed/autotuning/autotuner.py
deepspeed/autotuning/config.py
deepspeed/autotuning/constants.py
deepspeed/autotuning/scheduler.py
deepspeed/autotuning/utils.py
deepspeed/autotuning/config_templates/template_zero0.json
deepspeed/autotuning/config_templates/template_zero1.json
deepspeed/autotuning/config_templates/template_zero2.json
deepspeed/autotuning/config_templates/template_zero3.json
deepspeed/autotuning/tuner/__init__.py
deepspeed/autotuning/tuner/base_tuner.py
deepspeed/autotuning/tuner/cost_model.py
deepspeed/autotuning/tuner/index_based_tuner.py
deepspeed/autotuning/tuner/model_based_tuner.py
deepspeed/autotuning/tuner/utils.py
deepspeed/checkpoint/__init__.py
deepspeed/checkpoint/constants.py
deepspeed/checkpoint/deepspeed_checkpoint.py
deepspeed/checkpoint/reshape_3d_utils.py
deepspeed/checkpoint/reshape_meg_2d.py
deepspeed/checkpoint/reshape_utils.py
deepspeed/checkpoint/universal_checkpoint.py
deepspeed/checkpoint/utils.py
deepspeed/checkpoint/zero_checkpoint.py
deepspeed/comm/__init__.py
deepspeed/comm/backend.py
deepspeed/comm/comm.py
deepspeed/comm/config.py
deepspeed/comm/constants.py
deepspeed/comm/torch.py
deepspeed/comm/utils.py
deepspeed/compression/__init__.py
deepspeed/compression/basic_layer.py
deepspeed/compression/compress.py
deepspeed/compression/config.py
deepspeed/compression/constants.py
deepspeed/compression/helper.py
deepspeed/compression/scheduler.py
deepspeed/compression/utils.py
deepspeed/elasticity/__init__.py
deepspeed/elasticity/config.py
deepspeed/elasticity/constants.py
deepspeed/elasticity/elastic_agent.py
deepspeed/elasticity/elasticity.py
deepspeed/elasticity/utils.py
deepspeed/inference/__init__.py
deepspeed/inference/config.py
deepspeed/inference/engine.py
deepspeed/launcher/__init__.py
deepspeed/launcher/constants.py
deepspeed/launcher/launch.py
deepspeed/launcher/multinode_runner.py
deepspeed/launcher/runner.py
deepspeed/model_implementations/__init__.py
deepspeed/model_implementations/diffusers/__init__.py
deepspeed/model_implementations/diffusers/unet.py
deepspeed/model_implementations/diffusers/vae.py
deepspeed/model_implementations/features/__init__.py
deepspeed/model_implementations/features/cuda_graph.py
deepspeed/model_implementations/transformers/__init__.py
deepspeed/model_implementations/transformers/clip_encoder.py
deepspeed/model_implementations/transformers/ds_base.py
deepspeed/model_implementations/transformers/ds_bert.py
deepspeed/model_implementations/transformers/ds_bloom.py
deepspeed/model_implementations/transformers/ds_gpt.py
deepspeed/model_implementations/transformers/ds_megatron_gpt.py
deepspeed/model_implementations/transformers/ds_opt.py
deepspeed/model_implementations/transformers/ds_transformer.py
deepspeed/module_inject/__init__.py
deepspeed/module_inject/auto_tp.py
deepspeed/module_inject/inject.py
deepspeed/module_inject/layers.py
deepspeed/module_inject/load_checkpoint.py
deepspeed/module_inject/module_quantize.py
deepspeed/module_inject/policy.py
deepspeed/module_inject/replace_module.py
deepspeed/module_inject/replace_policy.py
deepspeed/module_inject/utils.py
deepspeed/module_inject/containers/__init__.py
deepspeed/module_inject/containers/base.py
deepspeed/module_inject/containers/base_moe.py
deepspeed/module_inject/containers/bert.py
deepspeed/module_inject/containers/bloom.py
deepspeed/module_inject/containers/clip.py
deepspeed/module_inject/containers/distil_bert.py
deepspeed/module_inject/containers/gpt2.py
deepspeed/module_inject/containers/gptj.py
deepspeed/module_inject/containers/gptneo.py
deepspeed/module_inject/containers/gptneox.py
deepspeed/module_inject/containers/megatron_gpt.py
deepspeed/module_inject/containers/megatron_gpt_moe.py
deepspeed/module_inject/containers/opt.py
deepspeed/module_inject/containers/unet.py
deepspeed/module_inject/containers/vae.py
deepspeed/module_inject/containers/features/__init__.py
deepspeed/module_inject/containers/features/megatron.py
deepspeed/module_inject/containers/features/meta_tensor.py
deepspeed/moe/__init__.py
deepspeed/moe/experts.py
deepspeed/moe/layer.py
deepspeed/moe/mappings.py
deepspeed/moe/sharded_moe.py
deepspeed/moe/utils.py
deepspeed/monitor/__init__.py
deepspeed/monitor/config.py
deepspeed/monitor/csv_monitor.py
deepspeed/monitor/monitor.py
deepspeed/monitor/tensorboard.py
deepspeed/monitor/utils.py
deepspeed/monitor/wandb.py
deepspeed/nebula/__init__.py
deepspeed/nebula/config.py
deepspeed/nebula/constants.py
deepspeed/ops/__init__.py
deepspeed/ops/adagrad/__init__.py
deepspeed/ops/adagrad/cpu_adagrad.py
deepspeed/ops/adam/__init__.py
deepspeed/ops/adam/cpu_adam.py
deepspeed/ops/adam/fused_adam.py
deepspeed/ops/adam/multi_tensor_apply.py
deepspeed/ops/aio/__init__.py
deepspeed/ops/csrc/adagrad/cpu_adagrad.cpp
deepspeed/ops/csrc/adam/cpu_adam.cpp
deepspeed/ops/csrc/adam/fused_adam_frontend.cpp
deepspeed/ops/csrc/adam/multi_tensor_adam.cu
deepspeed/ops/csrc/adam/multi_tensor_apply.cuh
deepspeed/ops/csrc/aio/common/deepspeed_aio_common.cpp
deepspeed/ops/csrc/aio/common/deepspeed_aio_common.h
deepspeed/ops/csrc/aio/common/deepspeed_aio_types.cpp
deepspeed/ops/csrc/aio/common/deepspeed_aio_types.h
deepspeed/ops/csrc/aio/common/deepspeed_aio_utils.cpp
deepspeed/ops/csrc/aio/common/deepspeed_aio_utils.h
deepspeed/ops/csrc/aio/py_lib/deepspeed_aio_thread.cpp
deepspeed/ops/csrc/aio/py_lib/deepspeed_aio_thread.h
deepspeed/ops/csrc/aio/py_lib/deepspeed_pin_tensor.cpp
deepspeed/ops/csrc/aio/py_lib/deepspeed_pin_tensor.h
deepspeed/ops/csrc/aio/py_lib/deepspeed_py_aio.cpp
deepspeed/ops/csrc/aio/py_lib/deepspeed_py_aio.h
deepspeed/ops/csrc/aio/py_lib/deepspeed_py_aio_handle.cpp
deepspeed/ops/csrc/aio/py_lib/deepspeed_py_aio_handle.h
deepspeed/ops/csrc/aio/py_lib/deepspeed_py_copy.cpp
deepspeed/ops/csrc/aio/py_lib/deepspeed_py_copy.h
deepspeed/ops/csrc/aio/py_lib/py_ds_aio.cpp
deepspeed/ops/csrc/aio/py_test/single_process_config.json
deepspeed/ops/csrc/common/custom_cuda_kernel.cu
deepspeed/ops/csrc/includes/StopWatch.h
deepspeed/ops/csrc/includes/Timer.h
deepspeed/ops/csrc/includes/compat.h
deepspeed/ops/csrc/includes/context.h
deepspeed/ops/csrc/includes/conversion_utils.h
deepspeed/ops/csrc/includes/cpu_adagrad.h
deepspeed/ops/csrc/includes/cpu_adam.h
deepspeed/ops/csrc/includes/cublas_wrappers.h
deepspeed/ops/csrc/includes/custom_cuda_layers.h
deepspeed/ops/csrc/includes/dequantization_utils.h
deepspeed/ops/csrc/includes/dropout.h
deepspeed/ops/csrc/includes/ds_kernel_utils.h
deepspeed/ops/csrc/includes/ds_transformer_cuda.h
deepspeed/ops/csrc/includes/feed_forward.h
deepspeed/ops/csrc/includes/gelu.h
deepspeed/ops/csrc/includes/gemm_test.h
deepspeed/ops/csrc/includes/general_kernels.h
deepspeed/ops/csrc/includes/memory_access_utils.h
deepspeed/ops/csrc/includes/normalize_layer.h
deepspeed/ops/csrc/includes/quantization.h
deepspeed/ops/csrc/includes/quantization_utils.h
deepspeed/ops/csrc/includes/quantizer.h
deepspeed/ops/csrc/includes/reduction_utils.h
deepspeed/ops/csrc/includes/simd.h
deepspeed/ops/csrc/includes/softmax.h
deepspeed/ops/csrc/includes/strided_batch_gemm.h
deepspeed/ops/csrc/includes/type_shim.h
deepspeed/ops/csrc/lamb/fused_lamb_cuda.cpp
deepspeed/ops/csrc/lamb/fused_lamb_cuda_kernel.cu
deepspeed/ops/csrc/quantization/dequantize.cu
deepspeed/ops/csrc/quantization/fake_quantizer.cu
deepspeed/ops/csrc/quantization/pt_binding.cpp
deepspeed/ops/csrc/quantization/quantize.cu
deepspeed/ops/csrc/random_ltd/gather_scatter.cu
deepspeed/ops/csrc/random_ltd/pt_binding.cpp
deepspeed/ops/csrc/random_ltd/slice_attn_masks.cu
deepspeed/ops/csrc/random_ltd/token_sort.cu
deepspeed/ops/csrc/sparse_attention/utils.cpp
deepspeed/ops/csrc/spatial/csrc/opt_bias_add.cu
deepspeed/ops/csrc/spatial/csrc/pt_binding.cpp
deepspeed/ops/csrc/spatial/includes/spatial_cuda_layers.h
deepspeed/ops/csrc/transformer/cublas_wrappers.cu
deepspeed/ops/csrc/transformer/dropout_kernels.cu
deepspeed/ops/csrc/transformer/ds_transformer_cuda.cpp
deepspeed/ops/csrc/transformer/gelu_kernels.cu
deepspeed/ops/csrc/transformer/general_kernels.cu
deepspeed/ops/csrc/transformer/normalize_kernels.cu
deepspeed/ops/csrc/transformer/softmax_kernels.cu
deepspeed/ops/csrc/transformer/transform_kernels.cu
deepspeed/ops/csrc/transformer/inference/csrc/apply_rotary_pos_emb.cu
deepspeed/ops/csrc/transformer/inference/csrc/dequantize.cu
deepspeed/ops/csrc/transformer/inference/csrc/gelu.cu
deepspeed/ops/csrc/transformer/inference/csrc/layer_norm.cu
deepspeed/ops/csrc/transformer/inference/csrc/pt_binding.cpp
deepspeed/ops/csrc/transformer/inference/csrc/relu.cu
deepspeed/ops/csrc/transformer/inference/csrc/softmax.cu
deepspeed/ops/csrc/transformer/inference/csrc/transform.cu
deepspeed/ops/csrc/transformer/inference/includes/inference_context.h
deepspeed/ops/csrc/transformer/inference/includes/inference_cublas_wrappers.h
deepspeed/ops/csrc/transformer/inference/includes/inference_cuda_layers.h
deepspeed/ops/csrc/utils/flatten_unflatten.cpp
deepspeed/ops/lamb/__init__.py
deepspeed/ops/lamb/fused_lamb.py
deepspeed/ops/op_builder/__init__.py
deepspeed/ops/op_builder/all_ops.py
deepspeed/ops/op_builder/async_io.py
deepspeed/ops/op_builder/builder.py
deepspeed/ops/op_builder/cpu_adagrad.py
deepspeed/ops/op_builder/cpu_adam.py
deepspeed/ops/op_builder/fused_adam.py
deepspeed/ops/op_builder/fused_lamb.py
deepspeed/ops/op_builder/quantizer.py
deepspeed/ops/op_builder/random_ltd.py
deepspeed/ops/op_builder/sparse_attn.py
deepspeed/ops/op_builder/spatial_inference.py
deepspeed/ops/op_builder/stochastic_transformer.py
deepspeed/ops/op_builder/transformer.py
deepspeed/ops/op_builder/transformer_inference.py
deepspeed/ops/op_builder/utils.py
deepspeed/ops/quantizer/__init__.py
deepspeed/ops/quantizer/quantizer.py
deepspeed/ops/random_ltd/__init__.py
deepspeed/ops/random_ltd/dropping_utils.py
deepspeed/ops/sparse_attention/__init__.py
deepspeed/ops/sparse_attention/bert_sparse_self_attention.py
deepspeed/ops/sparse_attention/matmul.py
deepspeed/ops/sparse_attention/softmax.py
deepspeed/ops/sparse_attention/sparse_attention_utils.py
deepspeed/ops/sparse_attention/sparse_self_attention.py
deepspeed/ops/sparse_attention/sparsity_config.py
deepspeed/ops/sparse_attention/trsrc/__init__.py
deepspeed/ops/sparse_attention/trsrc/matmul.tr
deepspeed/ops/sparse_attention/trsrc/softmax_bwd.tr
deepspeed/ops/sparse_attention/trsrc/softmax_fwd.tr
deepspeed/ops/transformer/__init__.py
deepspeed/ops/transformer/transformer.py
deepspeed/ops/transformer/inference/__init__.py
deepspeed/ops/transformer/inference/bias_add.py
deepspeed/ops/transformer/inference/config.py
deepspeed/ops/transformer/inference/diffusers_2d_transformer.py
deepspeed/ops/transformer/inference/diffusers_attention.py
deepspeed/ops/transformer/inference/diffusers_transformer_block.py
deepspeed/ops/transformer/inference/ds_attention.py
deepspeed/ops/transformer/inference/ds_mlp.py
deepspeed/ops/transformer/inference/moe_inference.py
deepspeed/ops/transformer/inference/triton_ops.py
deepspeed/ops/transformer/inference/op_binding/__init__.py
deepspeed/ops/transformer/inference/op_binding/base.py
deepspeed/ops/transformer/inference/op_binding/gelu_gemm.py
deepspeed/ops/transformer/inference/op_binding/linear.py
deepspeed/ops/transformer/inference/op_binding/mlp_gemm.py
deepspeed/ops/transformer/inference/op_binding/qkv_gemm.py
deepspeed/ops/transformer/inference/op_binding/residual_add.py
deepspeed/ops/transformer/inference/op_binding/softmax.py
deepspeed/ops/transformer/inference/op_binding/softmax_context.py
deepspeed/ops/transformer/inference/op_binding/vector_matmul.py
deepspeed/pipe/__init__.py
deepspeed/profiling/__init__.py
deepspeed/profiling/config.py
deepspeed/profiling/constants.py
deepspeed/profiling/flops_profiler/__init__.py
deepspeed/profiling/flops_profiler/profiler.py
deepspeed/runtime/__init__.py
deepspeed/runtime/bf16_optimizer.py
deepspeed/runtime/config.py
deepspeed/runtime/config_utils.py
deepspeed/runtime/constants.py
deepspeed/runtime/dataloader.py
deepspeed/runtime/eigenvalue.py
deepspeed/runtime/engine.py
deepspeed/runtime/lr_schedules.py
deepspeed/runtime/progressive_layer_drop.py
deepspeed/runtime/quantize.py
deepspeed/runtime/sparse_tensor.py
deepspeed/runtime/state_dict_factory.py
deepspeed/runtime/utils.py
deepspeed/runtime/weight_quantizer.py
deepspeed/runtime/activation_checkpointing/__init__.py
deepspeed/runtime/activation_checkpointing/checkpointing.py
deepspeed/runtime/activation_checkpointing/config.py
deepspeed/runtime/checkpoint_engine/__init__.py
deepspeed/runtime/checkpoint_engine/checkpoint_engine.py
deepspeed/runtime/checkpoint_engine/nebula_checkpoint_engine.py
deepspeed/runtime/checkpoint_engine/torch_checkpoint_engine.py
deepspeed/runtime/comm/__init__.py
deepspeed/runtime/comm/coalesced_collectives.py
deepspeed/runtime/comm/mpi.py
deepspeed/runtime/comm/nccl.py
deepspeed/runtime/compression/__init__.py
deepspeed/runtime/compression/cupy.py
deepspeed/runtime/data_pipeline/__init__.py
deepspeed/runtime/data_pipeline/config.py
deepspeed/runtime/data_pipeline/constants.py
deepspeed/runtime/data_pipeline/curriculum_scheduler.py
deepspeed/runtime/data_pipeline/data_routing/__init__.py
deepspeed/runtime/data_pipeline/data_routing/basic_layer.py
deepspeed/runtime/data_pipeline/data_routing/helper.py
deepspeed/runtime/data_pipeline/data_routing/scheduler.py
deepspeed/runtime/data_pipeline/data_routing/utils.py
deepspeed/runtime/data_pipeline/data_sampling/__init__.py
deepspeed/runtime/data_pipeline/data_sampling/data_analyzer.py
deepspeed/runtime/data_pipeline/data_sampling/data_sampler.py
deepspeed/runtime/data_pipeline/data_sampling/indexed_dataset.py
deepspeed/runtime/data_pipeline/data_sampling/utils.py
deepspeed/runtime/fp16/__init__.py
deepspeed/runtime/fp16/fused_optimizer.py
deepspeed/runtime/fp16/loss_scaler.py
deepspeed/runtime/fp16/unfused_optimizer.py
deepspeed/runtime/fp16/onebit/__init__.py
deepspeed/runtime/fp16/onebit/adam.py
deepspeed/runtime/fp16/onebit/lamb.py
deepspeed/runtime/fp16/onebit/zoadam.py
deepspeed/runtime/pipe/__init__.py
deepspeed/runtime/pipe/engine.py
deepspeed/runtime/pipe/module.py
deepspeed/runtime/pipe/p2p.py
deepspeed/runtime/pipe/schedule.py
deepspeed/runtime/pipe/topology.py
deepspeed/runtime/swap_tensor/__init__.py
deepspeed/runtime/swap_tensor/aio_config.py
deepspeed/runtime/swap_tensor/async_swapper.py
deepspeed/runtime/swap_tensor/constants.py
deepspeed/runtime/swap_tensor/optimizer_utils.py
deepspeed/runtime/swap_tensor/partitioned_optimizer_swapper.py
deepspeed/runtime/swap_tensor/partitioned_param_swapper.py
deepspeed/runtime/swap_tensor/pipelined_optimizer_swapper.py
deepspeed/runtime/swap_tensor/utils.py
deepspeed/runtime/zero/__init__.py
deepspeed/runtime/zero/config.py
deepspeed/runtime/zero/contiguous_memory_allocator.py
deepspeed/runtime/zero/linear.py
deepspeed/runtime/zero/offload_config.py
deepspeed/runtime/zero/parameter_offload.py
deepspeed/runtime/zero/partition_parameters.py
deepspeed/runtime/zero/partitioned_param_coordinator.py
deepspeed/runtime/zero/stage3.py
deepspeed/runtime/zero/stage_1_and_2.py
deepspeed/runtime/zero/test.py
deepspeed/runtime/zero/tiling.py
deepspeed/runtime/zero/utils.py
deepspeed/utils/__init__.py
deepspeed/utils/comms_logging.py
deepspeed/utils/debug.py
deepspeed/utils/exceptions.py
deepspeed/utils/groups.py
deepspeed/utils/init_on_device.py
deepspeed/utils/logging.py
deepspeed/utils/mixed_precision_linkage.py
deepspeed/utils/nvtx.py
deepspeed/utils/tensor_fragment.py
deepspeed/utils/timer.py
deepspeed/utils/types.py
deepspeed/utils/zero_to_fp32.py
op_builder/__init__.py
op_builder/all_ops.py
op_builder/async_io.py
op_builder/builder.py
op_builder/cpu_adagrad.py
op_builder/cpu_adam.py
op_builder/fused_adam.py
op_builder/fused_lamb.py
op_builder/quantizer.py
op_builder/random_ltd.py
op_builder/sparse_attn.py
op_builder/spatial_inference.py
op_builder/stochastic_transformer.py
op_builder/transformer.py
op_builder/transformer_inference.py
op_builder/utils.py
requirements/requirements-1bit-mpi.txt
requirements/requirements-autotuning-ml.txt
requirements/requirements-autotuning.txt
requirements/requirements-dev.txt
requirements/requirements-inf.txt
requirements/requirements-readthedocs.txt
requirements/requirements-sd.txt
requirements/requirements-sparse_attn.txt
requirements/requirements.txt