DeepSpeed
7ae577cd - Merge branch 'master' into fix-sp-dense

Comment changes are shown / Comment changes are hidden
Commit
1 year ago
  • .github/workflows
    • File
      amd-mi200.yml
  • File
    README.md
  • accelerator
    • File
      npu_accelerator.py
  • csrc
    • includes
      • File
        conversion_utils.h
      • File
        cublas_wrappers.h
      • File
        ds_kernel_utils.h
      • File
        feed_forward.h
      • File
        gemm_test.h
      • File
        general_kernels.h
      • File
        quantizer.h
      • File
        reduction_utils.h
      • File
        strided_batch_gemm.h
    • lamb
      • File
        fused_lamb_cuda_kernel.cu
    • quantization
      • File
        fake_quantizer.cu
    • random_ltd
      • File
        token_sort.cu
    • spatial/includes
      • File
        spatial_cuda_layers.h
    • transformer
      • File
        cublas_wrappers.cu
      • File
        ds_transformer_cuda.cpp
      • inference
        • csrc
          • File
            apply_rotary_pos_emb.cu
          • File
            pt_binding.cpp
          • File
            softmax.cu
          • File
            transform.cu
        • includes
          • File
            inference_context.h
          • File
            inference_cublas_wrappers.h
          • File
            inference_cuda_layers.h
  • deepspeed
    • comm
      • File
        ccl.py
      • File
        comm.py
    • launcher
      • File
        multinode_runner.py
    • module_inject/containers
      • File
        llama.py
    • ops/transformer/inference
      • File
        config.py
      • op_binding
        • File
          linear.py
        • File
          softmax_context.py
    • runtime/zero
      • File
        stage3.py
  • docs/assets/files
    • File
      ICML-5mins.pdf
    • File
      SC21-ZeRO-Infinity.pdf
    • File
      presentation-mlops.pdf
    • File
      sc22-ds-inference.pdf
  • op_builder
    • File
      cpu_adagrad.py
    • File
      cpu_adam.py
    • npu
      • File
        __init__.py
      • File
        fused_adam.py
    • File
      random_ltd.py
    • File
      transformer.py