DeepSpeed
a2984d0a
- Merge pull request #1 from microsoft/master
Go
Login via GitHub
Home
Pricing
FAQ
Install
Login
via GitHub
Commit
View On
GitHub
Hide Minimap (CTRL+M)
Commit
4 years ago
Merge pull request #1 from microsoft/master Pulling upstream
References
#355 - Adding link to Sparse Attention in Navigation page
Author
arashashari
Parents
5590a440
1661e830
Files
191
.clang-format
.gitignore
.pre-commit-config.yaml
CODEOWNERS
DeepSpeedExamples
Dockerfile
README.md
azure-pipelines.yml
basic_install_test.py
bin
ds
csrc
fused_lamb_cuda.cpp
fused_lamb_cuda_kernel.cu
includes
StopWatch.h
Timer.h
context.h
cublas_wrappers.h
custom_cuda_layers.h
dropout.h
ds_transformer_cuda.h
feed_forward.h
gelu.h
gemm_test.h
general_kernels.h
normalize_layer.h
softmax.h
strided_batch_gemm.h
type_shim.h
lamb
fused_lamb_cuda.cpp
fused_lamb_cuda_kernel.cu
sparse_attention
utils.cpp
transformer
cublas_wrappers.cu
dropout_kernels.cu
ds_transformer_cuda.cpp
gelu_kernels.cu
general_kernels.cu
normalize_kernels.cu
softmax_kernels.cu
transform_kernels.cu
type_shim.h
deepspeed
__init__.py
launcher
__init__.py
launch.py
runner.py
ops
__init__.py
lamb
__init__.py
fused_lamb.py
sparse_attention
__init__.py
bert_sparse_self_attention.py
matmul.py
softmax.py
sparse_attention_utils.py
sparse_self_attention.py
sparsity_config.py
trsrc
__init__.py
matmul.tr
softmax_bwd.tr
softmax_fwd.tr
transformer
__init__.py
transformer.py
pt
deepspeed_zero_optimizer.py
runtime
__init__.py
activation_checkpointing
__init__.py
checkpointing.py
config.py
config.py
config_utils.py
constants.py
csr_tensor.py
dataloader.py
engine.py
fp16
__init__.py
fused_optimizer.py
loss_scaler.py
unfused_optimizer.py
lr_schedules.py
utils.py
zero
__init__.py
config.py
stage1.py
stage2.py
utils.py
utils
__init__.py
logging.py
timer.py
docs
Gemfile.lock
README.md
_config.yml
_data
navigation.yml
_layouts
news-home.html
_pages
config-json.md
features.md
_posts
2020-03-17-zero-stage2.md
2020-05-19-bert-record.md
2020-05-19-press-release.md
2020-05-19-zero-stage2.md
2020-05-28-fastest-bert-training.md
2020-07-24-deepspeed-webinar.md
2020-08-07-webinar-on-demand.md
2020-09-09-sparse-attention.md
_tutorials
azure.md
bert-finetuning.md
bert-pretraining.md
cifar-10.md
getting-started.md
megatron.md
sparse_attention.md
transformer_kernel.md
assets/images
deepspeed-speedup.png
deepspeed-throughput-seq128.png
deepspeed-throughput-seq512.png
end-to-end-bert-training.PNG
layernorm_animation.gif
layernorm_deepspeed.gif
layernorm_ds.png
layernorm_pytorch.gif
layernorm_torch.png
qkv_fusion.png
sa_backward_pass.png
sa_bert_base_time_result.png
sa_bert_large_time_result.png
sa_fixed_sparsity_structure.png
sa_forward_pass.png
sa_gpt2_time_result.png
sa_long_document_comprehension_result.png
sa_maximum_sequence_runnable_on_bert.png
sa_variable_sparsity_structure.png
softmax_animation.gif
softmax_deepspeed.gif
softmax_ds.png
softmax_pytorch.gif
softmax_torch.png
transformer_kernel_perf.png
transformer_kernel_perf_seq128.PNG
transformer_kernel_perf_seq512.PNG
transformer_preln_arch.png
variable_sparsity_pattern.png
webinar-aug2020.png
zero-full.png
code-docs
requirements.readthedocs.txt
source
activation-checkpointing.rst
conf.py
index.rst
initialize.rst
kernel.rst
model-checkpointing.rst
training.rst
contributing.md
index.md
install.sh
requirements.txt
requirements
requirements-dev.txt
requirements-sparse-attn.txt
requirements.txt
setup.py
tests
model
BingBertSquad
BingBertSquad_run_func_test.py
deepspeed_bsz24_fp16_config.json
deepspeed_bsz24_fp16_zero2_config.json
run_BingBertSquad.sh
Megatron_GPT2
ds_config_func_bs4_zero1.json
ds_config_func_bs4_zero2.json
ds_config_func_bs8_no_zero.json
ds_config_func_bs8_zero0_gas3.json
ds_config_func_bs8_zero1.json
ds_config_func_bs8_zero2.json
ds_config_func_bs8_zero2_gas3.json
ds_config_func_scheduler.json
ds_config_perf_bs16.json
ds_config_perf_bs32.json
ds_config_perf_bs8.json
ds_gpt2_test.sh
run_checkpoint_test.py
run_func_test.py
test_common.py
run_sanity_check.py
small_model_debugging
test_model.py
unit
common.py
ds_batch_config.json
modeling.py
modelingpreln.py
simple_model.py
test_checkpointing.py
test_config.py
test_csr.py
test_cuda_backward.py
test_cuda_forward.py
test_ds_config.py
test_fp16.py
test_lr_schedulers.py
test_multi_output_model.py
test_run.py
test_sparse_attention.py
Loading