未验证 提交 3347460e 编写于 作者: J Jeff Rasley 提交者: GitHub

Switch to CI to GitHub Actions (#556)

上级 c18fb0de
......@@ -2,7 +2,7 @@
name: CI
# Controls when the action will run.
# Controls when the action will run.
on:
# Triggers the workflow on push or pull request events but only for the master branch
push:
......@@ -29,22 +29,25 @@ jobs:
- name: environment
run: |
nvidia-smi
echo $GITHUB_WORKSPACE
pwd
which python
python --version
which nvcc
nvcc --version
python -c "import torch; print('torch:', torch.__version__, torch)"
python -c "import torch; print('CUDA available:', torch.cuda.is_available())"
# Runs a set of commands using the runners shell
- name: Install deepspeed
run: |
pip install .[dev]
ds_report
- name: Formatting checks
run: |
pip install pre-commit
pre-commit run --all-files
# Runs a set of commands using the runners shell
- name: Run unit tests
- name: Unit tests
run: |
if [[ -d ./torch-extensions ]]; then rm -rf ./torch-extensions; fi
TORCH_EXTENSIONS_DIR=./torch-extensions pytest --durations=0 --forked --verbose -x tests/unit/
# Docker
# Build a Docker image
# https://docs.microsoft.com/azure/devops/pipelines/languages/docker
trigger:
- master
resources:
- repo: self
variables:
tag: '$(Build.BuildId)'
stages:
- stage: Build
displayName: Build image
jobs:
- job: Build
displayName: Build
pool:
vmImage: 'ubuntu-latest'
steps:
- task: Docker@2
displayName: Login to Docker Hub
inputs:
command: login
containerRegistry: DeepSpeedDocker
- task: Docker@2
displayName: Build and Push
inputs:
command: buildAndPush
dockerfile: '$(Build.SourcesDirectory)/docker/Dockerfile'
repository: deepspeed/deepspeed
tags: |
$(tag)
latest
trigger:
paths:
exclude:
- docs
- azure
jobs:
- job: DeepSpeed_Tests
timeoutInMinutes: 360
pool:
name: 'DS_testing'
strategy:
matrix:
PyTorch12-CUDA100:
python.version: '3.6'
cuda.version: '10.0'
pytorch.version: '1.2'
torchvision.version: '0.4.0'
runmodeltests: false
#PyTorch15-CUDA101:
# python.version: '3.7'
# cuda.version: '10.1'
# pytorch.version: '1.5.0+cu101'
# torchvision.version: '0.6.0+cu101'
# runmodeltests: true
##PyTorch15-CUDA102:
# python.version: '3.7'
# cuda.version: '10.2'
# pytorch.version: '1.5'
# torchvision.version: '0.6.1'
# runmodeltests: true
variables:
conda_env: 'ds_test_py$(python.version)_cuda$(cuda.version)_pytorch$(pytorch.version)'
steps:
# Unfortunately nvidia's nvcc_linux-64=<version> seems to install 10.1 regardless?
# Most of this complexity is a workaround to get the compiler toolchain to match the
# cudatoolkit runtime
- script: |
conda create --force --yes -n $(conda_env) python=$(python.version) cudatoolkit=$(cuda.version)
source activate $(conda_env)
conda install -q --yes conda
conda install -q --yes pip
conda install -q --yes gxx_linux-64
echo "PATH=$PATH, LD_LIBRARY_PATH=$LD_LIBRARY_PATH"
displayName: 'Setup environment python=$(python.version) pytorch=$(pytorch.version) cuda=$(cuda.version)'
# Manually install torch/torchvision first to enforce versioning.
- script: |
source activate $(conda_env)
pip install --progress-bar=off torch==$(pytorch.version) torchvision==$(torchvision.version)
pip install .[dev]
ds_report
displayName: 'Install DeepSpeed'
- script: |
source activate $(conda_env)
which python
python --version
which nvcc
nvcc --version
which deepspeed
python -c "import torch; print('torch:', torch.__version__, torch)"
python -c "import torch; print('CUDA available:', torch.cuda.is_available())"
python -c "import deepspeed; print('deepspeed:', deepspeed.__version__)"
displayName: 'Show environment'
- script: |
source activate $(conda_env)
if [[ -d ./torch-extensions ]]; then rm -rf ./torch-extensions; fi
TORCH_EXTENSIONS_DIR=./torch-extensions pytest --durations=0 --forked --verbose -x tests/unit/
displayName: 'Unit tests'
# - script: |
# source activate $(conda_env)
# ln -s /data/Megatron-LM/data DeepSpeedExamples/Megatron-LM/
# pip install --progress-bar=off -r DeepSpeedExamples/Megatron-LM/requirements.txt
# cd tests/model/
# rm -rf BingBertSquad/baseline
# rm -rf Megatron_GPT2/baseline
# pytest --durations=0 -s run_sanity_check.py
# condition: and(succeeded(), eq(variables['runmodeltests'], true))
# displayName: 'Model tests'
# #BingBertSquad logs
# - task: PublishPipelineArtifact@1
# inputs:
# targetPath: '$(Build.SourcesDirectory)/tests/model/BingBertSquad/test/'
# artifactName: BingBertSquad_logs
# displayName: 'BingBertSquad log uploads'
# condition: eq(variables['runmodeltests'], true)
- job: Code_Quality_Checks
pool:
vmImage: 'ubuntu-latest'
variables:
conda_env: 'ds_codetest'
steps:
- bash: echo "##vso[task.prependpath]$CONDA/bin"
displayName: Add conda to PATH
- script: |
conda create --force --yes -n $(conda_env) python=3.7
source activate $(conda_env)
displayName: 'Create code test environment'
- script: |
source activate $(conda_env)
pip install pre-commit
pre-commit run --all-files
displayName: 'Formatting checks'
- script: |
source activate $(conda_env)
pip install pylint
pylint --exit-zero deepspeed/
displayName: 'Code linter'
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册