DeepSpeed
ae91f324 - Merge branch 'master' of github.com:microsoft/DeepSpeed

Comment changes are shown / Comment changes are hidden
Commit
2 years ago
Merge branch 'master' of github.com:microsoft/DeepSpeed
Author
Reza Yazdani
  • accelerator
    • File
      abstract_accelerator.py
    • File
      cuda_accelerator.py
  • csrc
    • aio/py_test
      • File
        aio_bench_perf_sweep.py
      • File
        ds_aio_basic.py
      • File
        ds_aio_handle.py
      • File
        validate_async_io.py
    • transformer
      • File
        softmax_kernels.cu
  • deepspeed
    • autotuning
      • File
        autotuner.py
    • inference
      • File
        engine.py
    • launcher
      • File
        multinode_runner.py
      • File
        runner.py
    • model_implementations/transformers
      • File
        clip_encoder.py
      • File
        ds_transformer.py
    • module_inject
      • File
        auto_tp.py
      • containers
        • File
          vae.py
      • File
        layers.py
      • File
        load_checkpoint.py
      • File
        replace_module.py
    • monitor
      • File
        config.py
      • File
        constants.py
      • File
        csv_monitor.py
      • File
        monitor.py
      • File
        tensorboard.py
      • File
        wandb.py
    • ops
      • adagrad
        • File
          cpu_adagrad.py
      • adam
        • File
          cpu_adam.py
        • File
          fused_adam.py
      • lamb
        • File
          fused_lamb.py
      • quantizer
        • File
          quantizer.py
      • random_ltd
        • File
          dropping_utils.py
      • transformer
        • inference
          • File
            bias_add.py
          • File
            diffusers_attention.py
          • File
            diffusers_transformer_block.py
          • File
            moe_inference.py
          • op_binding
            • File
              base.py
        • File
          transformer.py
    • profiling/flops_profiler
      • File
        profiler.py
    • runtime
      • activation_checkpointing
        • File
          checkpointing.py
      • comm
        • File
          nccl.py
      • File
        config.py
      • data_pipeline/data_sampling
        • File
          data_sampler.py
      • File
        dataloader.py
      • File
        engine.py
      • fp16
        • File
          fused_optimizer.py
        • onebit
          • File
            adam.py
          • File
            lamb.py
          • File
            zoadam.py
        • File
          unfused_optimizer.py
      • pipe
        • File
          engine.py
        • File
          module.py
        • File
          p2p.py
      • swap_tensor
        • File
          partitioned_optimizer_swapper.py
        • File
          partitioned_param_swapper.py
        • File
          pipelined_optimizer_swapper.py
        • File
          utils.py
      • File
        utils.py
      • File
        weight_quantizer.py
      • zero
        • File
          linear.py
        • File
          parameter_offload.py
        • File
          partition_parameters.py
        • File
          partitioned_param_coordinator.py
        • File
          stage3.py
        • File
          stage_1_and_2.py
        • File
          utils.py
    • utils
      • File
        nvtx.py
      • File
        timer.py
  • docs
    • _tutorials
      • File
        autotuning.md
      • File
        azure.md
    • code-docs/source
      • File
        index.rst
      • File
        monitor.rst
  • op_builder
    • File
      __init__.py
    • File
      all_ops.py
    • File
      builder.py
    • File
      builder_names.py
  • requirements
    • File
      requirements.txt
  • tests/unit
    • inference
      • File
        test_inference.py
    • monitor
      • File
        test_monitor.py
    • ops/transformer/inference
      • File
        test_bias_gelu.py
    • runtime
      • File
        test_ds_initialize.py
      • zero
        • File
          test_zero.py
        • File
          test_zero_context.py