DeepSpeed
af4bfb7d - Merge branch 'master' into remove-unused-quantize-settings

Comment changes are shownComment changes are hidden
Commit
2 years ago
Merge branch 'master' into remove-unused-quantize-settings
Author
  • .github/workflows
    • File
      amd.yml
    • File
      auto-sync.yml
    • File
      nv-torch-latest-cpu.yml
    • setup-venv
      • File
        action.yml
  • File
    .pre-commit-config.yaml
  • File
    README.md
  • accelerator
    • File
      __init__.py
    • File
      abstract_accelerator.py
    • File
      cuda_accelerator.py
    • File
      real_accelerator.py
  • benchmarks
    • File
      __init__.py
    • communication
      • File
        __init__.py
      • File
        all_gather.py
      • File
        all_reduce.py
      • File
        all_to_all.py
      • File
        broadcast.py
      • File
        constants.py
      • File
        pt2pt.py
      • File
        run_all.py
      • File
        utils.py
    • inference
      • File
        bert-bench.py
      • File
        collect_results.py
      • File
        gpt-bench.py
  • csrc
    • aio
      • common
        • File
          deepspeed_aio_utils.cpp
      • py_lib
        • File
          deepspeed_pin_tensor.cpp
        • File
          deepspeed_pin_tensor.h
        • File
          deepspeed_py_aio_handle.cpp
        • File
          deepspeed_py_aio_handle.h
        • File
          py_ds_aio.cpp
      • py_test
        • File
          ds_aio_handle.py
        • File
          perf_sweep_utils.py
        • File
          test_ds_aio.py
    • common
      • File
        custom_cuda_kernel.cu
    • includes
      • File
        StopWatch.h
      • File
        Timer.h
      • File
        context.h
      • File
        cpu_adagrad.h
      • File
        cpu_adam.h
      • File
        cublas_wrappers.h
      • File
        dropout.h
      • File
        ds_transformer_cuda.h
      • File
        feed_forward.h
      • File
        gelu.h
      • File
        gemm_test.h
      • File
        general_kernels.h
      • File
        normalize_layer.h
      • File
        quantization.h
      • File
        quantizer.h
      • File
        simd.h
      • File
        softmax.h
      • File
        strided_batch_gemm.h
      • File
        type_shim.h
    • quantization
      • File
        fake_quantizer.cu
    • transformer
      • File
        cublas_wrappers.cu
      • File
        dropout_kernels.cu
      • File
        gelu_kernels.cu
      • File
        general_kernels.cu
      • inference/csrc
        • File
          apply_rotary_pos_emb.cu
        • File
          pt_binding.cpp
      • File
        normalize_kernels.cu
      • File
        softmax_kernels.cu
      • File
        transform_kernels.cu
  • deepspeed
    • autotuning
      • File
        __init__.py
      • File
        autotuner.py
      • File
        config.py
      • File
        constants.py
      • File
        scheduler.py
      • tuner
        • File
          __init__.py
        • File
          base_tuner.py
        • File
          cost_model.py
        • File
          index_based_tuner.py
        • File
          model_based_tuner.py
        • File
          utils.py
      • File
        utils.py
    • checkpoint
      • File
        __init__.py
      • File
        constants.py
      • File
        deepspeed_checkpoint.py
      • File
        reshape_3d_utils.py
      • File
        reshape_meg_2d.py
      • File
        reshape_utils.py
      • File
        utils.py
      • File
        zero_checkpoint.py
    • comm
      • File
        __init__.py
      • File
        backend.py
      • File
        config.py
      • File
        constants.py
      • File
        utils.py
    • compression
      • File
        __init__.py
      • File
        basic_layer.py
      • File
        compress.py
      • File
        config.py
      • File
        constants.py
      • File
        helper.py
      • File
        scheduler.py
      • File
        utils.py
    • elasticity
      • File
        __init__.py
      • File
        elastic_agent.py
      • File
        utils.py
    • File
      env_report.py
    • File
      git_version_info.py
    • inference
      • File
        __init__.py
      • File
        config.py
      • File
        engine.py
    • launcher
      • File
        __init__.py
      • File
        constants.py
      • File
        multinode_runner.py
      • File
        runner.py
    • model_implementations
      • File
        __init__.py
      • diffusers
        • File
          __init__.py
      • transformers
        • File
          __init__.py
        • File
          ds_base.py
    • module_inject
      • File
        __init__.py
      • File
        auto_tp.py
      • containers
        • File
          __init__.py
        • File
          base.py
        • File
          base_moe.py
        • File
          bert.py
        • File
          bloom.py
        • File
          clip.py
        • File
          distil_bert.py
        • features
          • File
            __init__.py
          • File
            megatron.py
          • File
            meta_tensor.py
        • File
          gpt2.py
        • File
          gptj.py
        • File
          gptneo.py
        • File
          gptneox.py
        • File
          megatron_gpt.py
        • File
          megatron_gpt_moe.py
        • File
          opt.py
      • File
        inject.py
      • File
        layers.py
      • File
        load_checkpoint.py
      • File
        module_quantize.py
      • File
        policy.py
      • File
        replace_module.py
      • File
        utils.py
    • moe
      • File
        __init__.py
      • File
        utils.py
    • monitor
      • File
        __init__.py
      • File
        config.py
      • File
        csv_monitor.py
      • File
        monitor.py
      • File
        tensorboard.py
      • File
        utils.py
      • File
        wandb.py
    • nebula
      • File
        __init__.py
      • File
        config.py
      • File
        constants.py
    • ops
      • File
        __init__.py
      • adagrad
        • File
          __init__.py
      • adam
        • File
          __init__.py
        • File
          cpu_adam.py
      • lamb
        • File
          __init__.py
      • quantizer
        • File
          __init__.py
      • random_ltd
        • File
          __init__.py
      • sparse_attention
        • File
          __init__.py
        • File
          matmul.py
        • File
          softmax.py
        • trsrc
          • File
            __init__.py
      • transformer
        • File
          __init__.py
        • inference
          • File
            __init__.py
          • File
            ds_attention.py
          • op_binding
            • File
              __init__.py
            • File
              base.py
            • File
              gelu_gemm.py
            • File
              linear.py
            • File
              mlp_gemm.py
            • File
              qkv_gemm.py
            • File
              residual_add.py
            • File
              softmax.py
            • File
              softmax_context.py
            • File
              vector_matmul.py
          • File
            triton_ops.py
    • pipe
      • File
        __init__.py
    • profiling
      • File
        __init__.py
      • File
        config.py
      • File
        constants.py
      • flops_profiler
        • File
          __init__.py
        • File
          profiler.py
    • runtime
      • File
        __init__.py
      • activation_checkpointing
        • File
          __init__.py
        • File
          checkpointing.py
        • File
          config.py
      • File
        bf16_optimizer.py
      • checkpoint_engine
        • File
          __init__.py
        • File
          checkpoint_engine.py
        • File
          nebula_checkpoint_engine.py
        • File
          torch_checkpoint_engine.py
      • comm
        • File
          __init__.py
        • File
          coalesced_collectives.py
      • compression
        • File
          __init__.py
      • File
        config.py
      • File
        config_utils.py
      • File
        constants.py
      • data_pipeline
        • File
          __init__.py
        • data_routing
          • File
            __init__.py
        • data_sampling
          • File
            __init__.py
          • File
            data_analyzer.py
      • File
        dataloader.py
      • File
        eigenvalue.py
      • File
        engine.py
      • fp16
        • File
          __init__.py
        • onebit
          • File
            __init__.py
      • pipe
        • File
          __init__.py
        • File
          module.py
        • File
          schedule.py
      • File
        progressive_layer_drop.py
      • File
        quantize.py
      • File
        utils.py
      • File
        weight_quantizer.py
      • zero
        • File
          config.py
        • File
          contiguous_memory_allocator.py
        • File
          linear.py
        • File
          offload_config.py
        • File
          stage3.py
        • File
          stage_1_and_2.py
        • File
          test.py
        • File
          tiling.py
        • File
          utils.py
    • utils
      • File
        __init__.py
      • File
        comms_logging.py
      • File
        debug.py
      • File
        logging.py
      • File
        mixed_precision_linkage.py
      • File
        nvtx.py
      • File
        tensor_fragment.py
      • File
        types.py
      • File
        zero_to_fp32.py
  • docs
    • File
      _config.yml
    • _data
      • File
        navigation.yml
    • _posts
      • File
        2022-12-12-data-efficiency.md
    • _tutorials
      • File
        automatic-tensor-parallelism.md
      • File
        curriculum-learning.md
      • File
        data-efficiency.md
      • File
        inference-tutorial.md
      • File
        mixture-of-experts-inference.md
    • code-docs/source
      • File
        conf.py
      • File
        inference-init.rst
      • File
        zero3.rst
    • File
      index.md
  • op_builder
    • File
      async_io.py
    • File
      quantizer.py
    • File
      transformer_inference.py
  • release
    • File
      bump_patch_version.py
  • scripts
    • File
      check-license.py
    • File
      check-torchdist.py
  • File
    setup.py
  • tests
    • benchmarks
      • File
        flatten_bench.py
      • File
        unflatten_bench.py
    • File
      conftest.py
    • lightning
      • File
        test_simple.py
    • model/BingBertSquad
      • File
        test_e2e_squad.py
    • onebit
      • File
        test_mpi_backend.py
      • File
        test_mpi_perf.py
      • File
        test_nccl_backend.py
      • File
        test_nccl_perf.py
    • perf
      • File
        adagrad_test.py
      • File
        adam_test.py
      • File
        adam_test1.py
    • small_model_debugging
      • File
        stage3_test.py
      • File
        test.py
      • File
        test_model.py
    • unit
      • File
        __init__.py
      • File
        alexnet_model.py
      • autotuning
        • File
          test_autotuning.py
      • checkpoint
        • File
          common.py
        • File
          test_latest_checkpoint.py
        • File
          test_lr_scheduler.py
        • File
          test_moe_checkpoint.py
        • File
          test_other_optimizer.py
        • File
          test_pipeline.py
        • File
          test_reshape_checkpoint.py
        • File
          test_sparse.py
        • File
          test_tag_validation.py
        • File
          test_zero_optimizer.py
      • comm
        • File
          test_dist.py
      • File
        common.py
      • compression
        • File
          test_compression.py
      • elasticity
        • File
          test_elastic.py
      • inference
        • File
          test_checkpoint_sharding.py
        • File
          test_inference.py
        • File
          test_inference_config.py
        • File
          test_model_profiling.py
      • launcher
        • File
          test_ds_arguments.py
        • File
          test_multinode_runner.py
        • File
          test_run.py
      • File
        megatron_model.py
      • model_parallelism
        • File
          test_configurable_parallel_mp.py
        • File
          test_configurable_parallel_pp.py
      • File
        modeling.py
      • File
        modelingpreln.py
      • moe
        • File
          test_moe.py
        • File
          test_moe_tp.py
      • monitor
        • File
          test_monitor.py
      • File
        multi_output_model.py
      • ops
        • adagrad
          • File
            test_cpu_adagrad.py
        • adam
          • File
            test_adamw.py
          • File
            test_cpu_adam.py
        • aio
          • File
            test_aio.py
        • cuda
          • File
            test_cuda_backward.py
          • File
            test_cuda_forward.py
        • quantizer
          • File
            test_fake_quantization.py
        • sparse_attention
          • File
            test_sparse_attention.py
        • transformer/inference
          • File
            test_bias_add.py
      • pipe
        • File
          test_pipe_module.py
      • profiling/flops_profiler
        • File
          test_flops_profiler.py
      • runtime
        • activation_checkpointing
          • File
            test_activation_checkpointing.py
        • comm
          • File
            test_coalesced_collectives.py
        • half_precision
          • onebit
            • File
              test_onebit.py
          • File
            test_bf16.py
          • File
            test_dynamic_loss_scale.py
          • File
            test_fp16.py
        • pipe
          • File
            test_pipe.py
          • File
            test_pipe_schedule.py
          • File
            test_topology.py
        • sparse_tensor
          • File
            test_averaging_sparse_gradients.py
          • File
            test_csr.py
          • File
            test_sparse_grads.py
        • File
          test_autocast.py
        • File
          test_data.py
        • File
          test_data_efficiency.py
        • File
          test_ds_config_dict.py
        • File
          test_ds_config_model.py
        • File
          test_ds_initialize.py
        • File
          test_lr_schedulers.py
        • File
          test_multi_output_model.py
        • File
          test_pld.py
        • File
          test_runtime_utils.py
        • utils
          • File
            test_partition.py
        • zero
          • File
            test_ignore_unused_parameters.py
          • File
            test_zero.py
          • File
            test_zero_config.py
          • File
            test_zero_context.py
          • File
            test_zero_context_ancestry.py
          • File
            test_zero_context_return.py
          • File
            test_zero_tensor_fragment.py
          • File
            test_zero_tiled.py
          • File
            utils.py
      • File
        simple_model.py
      • File
        util.py
      • utils
        • File
          test_get_optim_files.py
        • File
          test_groups.py
        • File
          test_init_on_device.py
  • File
    version.txt