name: Build CUDA binary on Ubuntu on: push: branches: [ '**' ] tags: ['**'] pull_request: branches: [ "main" ] env: # Customize the CMake build type here (Release, Debug, RelWithDebInfo, etc.) BUILD_TYPE: Release jobs: build-ubuntu: # The CMake configure and build commands are platform agnostic and should work equally well on Windows or Mac. # You can convert this to a matrix build if you need cross-platform coverage. # See: https://docs.github.com/en/free-pro-team@latest/actions/learn-github-actions/managing-complex-workflows#using-a-build-matrix runs-on: ubuntu-latest # strategy: # matrix: # include: # - build: 'avx2' # defines: '' # - build: 'avx' # defines: '-DLLAMA_AVX2=OFF' # - build: 'avx512' # defines: '-DLLAMA_AVX512=ON' steps: - uses: actions/checkout@v3 with: submodules: true - name: Install Dependencies run: | wget https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2204/x86_64/cuda-keyring_1.0-1_all.deb sudo dpkg -i cuda-keyring_1.0-1_all.deb sudo apt-get update && sudo apt-get install -yq libboost-dev cuda-nvcc-11-7 libcublas-dev-11-7 - name: Build # Configure CMake in a 'build' subdirectory. `CMAKE_BUILD_TYPE` is only required if you are using a single-configuration generator such as make. # See https://cmake.org/cmake/help/latest/variable/CMAKE_BUILD_TYPE.html?highlight=cmake_build_type run: | cd ${{github.workspace}}/ggml cmake -B ${{github.workspace}}/ggml/build -DCMAKE_BUILD_TYPE=${{env.BUILD_TYPE}} -D CMAKE_EXE_LINKER_FLAGS="-static" -DGGML_CUBLAS=ON -DCMAKE_CUDA_COMPILER=/usr/local/cuda/bin/nvcc cd ${{github.workspace}}/ggml/build make codegen codegen-serve codegen-quantize chmod +x ${{github.workspace}}/ggml/build/bin/codegen chmod +x ${{github.workspace}}/ggml/build/bin/codegen-serve chmod +x ${{github.workspace}}/ggml/build/bin/codegen-quantize - uses: benjlevesque/short-sha@v2.2 id: short-sha with: length: 6 - name: Upload Build Artifacts uses: actions/upload-artifact@v3.1.2 with: # Artifact name name: turbopilot-${{ runner.os }}-${{ runner.arch }}-${{ steps.short-sha.outputs.sha }}-cuda # optional, default is artifact # A file, directory or wildcard pattern that describes what to upload path: ${{github.workspace}}/ggml/build/bin/codegen* # The desired behavior if no files are found using the provided path. - name: package artifacts for release if: startsWith(github.ref, 'refs/tags/') run: | cd ${{github.workspace}}/ggml/build/bin zip turbopilot-${{ runner.os }}-${{ runner.arch }}.zip ./codegen* - name: Upload binaries to release uses: softprops/action-gh-release@v1 if: startsWith(github.ref, 'refs/tags/') with: token: ${{ secrets.PUBLISH_TOKEN }} files: ${{github.workspace}}/ggml/build/bin/turbopilot-${{ runner.os }}-${{ runner.arch }}.zip