name: Build CUDA binary on Ubuntu

# Build on every branch and tag push, and on pull requests targeting main.
on:
  push:
    branches: ['**']
    tags: ['**']
  pull_request:
    branches: ['main']

env:
  # Customize the CMake build type here (Release, Debug, RelWithDebInfo, etc.)
  BUILD_TYPE: Release

jobs:
  build-ubuntu:
    # This job installs CUDA through apt from NVIDIA's `ubuntu2204` repository
    # (see "Install Dependencies"), so the runner image is pinned to the
    # matching Ubuntu release rather than the floating `ubuntu-latest` label.
    runs-on: ubuntu-22.04

    # Disabled CPU-variant build matrix, kept for reference.
    # strategy:
    #   matrix:
    #     include:
    #       - build: 'avx2'
    #         defines: ''
    #       - build: 'avx'
    #         defines: '-DLLAMA_AVX2=OFF'
    #       - build: 'avx512'
    #         defines: '-DLLAMA_AVX512=ON'

    steps:
      - uses: actions/checkout@v4
        with:
          # The build runs from the `ggml` directory, so submodules are
          # fetched together with the main repository.
          submodules: true

      - name: Install Dependencies
        # Register NVIDIA's apt keyring, then install Boost plus the CUDA 11.7
        # compiler (nvcc) and cuBLAS development packages.
        run: |
          wget https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.0-1_all.deb
          sudo dpkg -i cuda-keyring_1.0-1_all.deb
          sudo apt-get update && sudo apt-get install -yq libboost-dev cuda-nvcc-11-7 libcublas-dev-11-7

      - name: Build
        # Configure CMake in a 'build' subdirectory. `CMAKE_BUILD_TYPE` is only
        # required if you are using a single-configuration generator such as make.
        # See https://cmake.org/cmake/help/latest/variable/CMAKE_BUILD_TYPE.html?highlight=cmake_build_type
        run: |
          cd ${{github.workspace}}/ggml
          cmake -B ${{github.workspace}}/ggml/build -DCMAKE_BUILD_TYPE=${{env.BUILD_TYPE}} -DGGML_CUBLAS=ON -DCMAKE_CUDA_COMPILER=/usr/local/cuda/bin/nvcc
          cd ${{github.workspace}}/ggml/build
          make codegen codegen-serve codegen-quantize
          chmod +x ${{github.workspace}}/ggml/build/bin/codegen
          chmod +x ${{github.workspace}}/ggml/build/bin/codegen-serve
          chmod +x ${{github.workspace}}/ggml/build/bin/codegen-quantize

      # Exposes a 6-character commit SHA as `steps.short-sha.outputs.sha`,
      # which is used in the artifact name below.
      - uses: benjlevesque/short-sha@v2.2
        id: short-sha
        with:
          length: 6

      - name: Upload Build Artifacts
        uses: actions/upload-artifact@v4
        with:
          # Artifact name
          name: turbopilot-${{ runner.os }}-${{ runner.arch }}-${{ steps.short-sha.outputs.sha }}-cuda
          # A file, directory or wildcard pattern that describes what to upload
          path: ${{github.workspace}}/ggml/build/bin/codegen*
          # The desired behavior if no files are found using the provided path.
          # A build that produced no binaries should fail, not just warn.
          if-no-files-found: error

      - name: package artifacts for release
        if: startsWith(github.ref, 'refs/tags/')
        # The archive name must match the `files` entry of the release upload
        # step below, including the `-cuda` suffix.
        run: |
          cd ${{github.workspace}}/ggml/build/bin
          zip turbopilot-${{ runner.os }}-${{ runner.arch }}-cuda.zip ./codegen*

      - name: Upload binaries to release
        uses: softprops/action-gh-release@v1
        if: startsWith(github.ref, 'refs/tags/')
        with:
          token: ${{ secrets.PUBLISH_TOKEN }}
          files: ${{github.workspace}}/ggml/build/bin/turbopilot-${{ runner.os }}-${{ runner.arch }}-cuda.zip
          # Fail the step if the archive above is missing instead of
          # publishing a release without binaries.
          fail_on_unmatched_files: true