parent
							
								
									eae92bc7da
								
							
						
					
					
						commit
						6a902b892e
					
				
					 3 changed files with 77 additions and 0 deletions
				
			
		| 
						 | 
					@ -15,6 +15,7 @@ runs:
 | 
				
			||||||
        mv linux-avx512/* python/llm/llm-binary/
 | 
					        mv linux-avx512/* python/llm/llm-binary/
 | 
				
			||||||
        mv linux-avxvnni/* python/llm/llm-binary/
 | 
					        mv linux-avxvnni/* python/llm/llm-binary/
 | 
				
			||||||
        mv linux-avx/* python/llm/llm-binary/
 | 
					        mv linux-avx/* python/llm/llm-binary/
 | 
				
			||||||
 | 
					        mv linux-amx/* python/llm/llm-binary/
 | 
				
			||||||
        mv windows-avx2/* python/llm/llm-binary/
 | 
					        mv windows-avx2/* python/llm/llm-binary/
 | 
				
			||||||
        mv windows-avx2-vnni/* python/llm/llm-binary/
 | 
					        mv windows-avx2-vnni/* python/llm/llm-binary/
 | 
				
			||||||
        mv windows-avx/* python/llm/llm-binary/
 | 
					        mv windows-avx/* python/llm/llm-binary/
 | 
				
			||||||
| 
						 | 
					@ -22,6 +23,7 @@ runs:
 | 
				
			||||||
        rm -rf linux-avx512 || true
 | 
					        rm -rf linux-avx512 || true
 | 
				
			||||||
        rm -rf linux-avxvnni || true
 | 
					        rm -rf linux-avxvnni || true
 | 
				
			||||||
        rm -rf linux-avx || true
 | 
					        rm -rf linux-avx || true
 | 
				
			||||||
 | 
					        rm -rf linux-amx || true
 | 
				
			||||||
        rm -rf windows-avx2 || true
 | 
					        rm -rf windows-avx2 || true
 | 
				
			||||||
        rm -rf windows-avx2-vnni || true
 | 
					        rm -rf windows-avx2-vnni || true
 | 
				
			||||||
        rm -rf windows-avx || true
 | 
					        rm -rf windows-avx || true
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
							
								
								
									
										70
									
								
								.github/workflows/llm-binary-build.yml
									
									
									
									
										vendored
									
									
								
							
							
						
						
									
										70
									
								
								.github/workflows/llm-binary-build.yml
									
									
									
									
										vendored
									
									
								
							| 
						 | 
					@ -215,6 +215,76 @@ jobs:
 | 
				
			||||||
          make clean
 | 
					          make clean
 | 
				
			||||||
          conda remove -n python39 --all -y
 | 
					          conda remove -n python39 --all -y
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  check-linux-amx-artifact:
 | 
				
			||||||
 | 
					    runs-on: ubuntu-latest
 | 
				
			||||||
 | 
					    outputs:
 | 
				
			||||||
 | 
					      if-exists: ${{steps.check_artifact.outputs.exists}}
 | 
				
			||||||
 | 
					    steps:
 | 
				
			||||||
 | 
					      - name: Check if built
 | 
				
			||||||
 | 
					        id: check_artifact
 | 
				
			||||||
 | 
					        uses: xSAVIKx/artifact-exists-action@v0
 | 
				
			||||||
 | 
					        with:
 | 
				
			||||||
 | 
					          name: linux-amx
 | 
				
			||||||
 | 
					
 | 
				
			||||||
 | 
					  linux-build-amx:
 | 
				
			||||||
 | 
					    runs-on: [self-hosted, amx, almalinux8]
 | 
				
			||||||
 | 
					    needs: check-linux-amx-artifact
 | 
				
			||||||
 | 
					    if: needs.check-linux-amx-artifact.outputs.if-exists == 'false'
 | 
				
			||||||
 | 
					    steps:
 | 
				
			||||||
 | 
					      - name: Set access token
 | 
				
			||||||
 | 
					        run: |
 | 
				
			||||||
 | 
					          echo "github_access_token=${GITHUB_ACCESS_TOKEN}" >> "$GITHUB_ENV"
 | 
				
			||||||
 | 
					      - name: Install Build Environment
 | 
				
			||||||
 | 
					        shell: bash
 | 
				
			||||||
 | 
					        run: |
 | 
				
			||||||
 | 
					          export http_proxy=${HTTP_PROXY}
 | 
				
			||||||
 | 
					          export https_proxy=${HTTPS_PROXY}
 | 
				
			||||||
 | 
					          yum install -y gcc-toolset-12 cmake git
 | 
				
			||||||
 | 
					          conda remove -n python39 --all -y
 | 
				
			||||||
 | 
					          conda create -n python39 python=3.9 -y
 | 
				
			||||||
 | 
					      - uses: actions/checkout@v3
 | 
				
			||||||
 | 
					        with:
 | 
				
			||||||
 | 
					          repository: "intel-analytics/llm.cpp"
 | 
				
			||||||
 | 
					          ref: ${{ inputs.llmcpp-ref }}
 | 
				
			||||||
 | 
					          token: ${{ env.github_access_token }}
 | 
				
			||||||
 | 
					          submodules: "recursive"
 | 
				
			||||||
 | 
					      - name: Build amx binary
 | 
				
			||||||
 | 
					        shell: bash
 | 
				
			||||||
 | 
					        run: |
 | 
				
			||||||
 | 
					          scl enable gcc-toolset-12 "cmake -DONLYAVX=OFF -DONLYAVX2=OFF -B build"
 | 
				
			||||||
 | 
					          scl enable gcc-toolset-12 "cmake --build build --config Release"
 | 
				
			||||||
 | 
					          # build chatglm
 | 
				
			||||||
 | 
					          source activate python39 || conda activate python39
 | 
				
			||||||
 | 
					          cd src/chatglm
 | 
				
			||||||
 | 
					          scl enable gcc-toolset-12 "cmake -B build"
 | 
				
			||||||
 | 
					          scl enable gcc-toolset-12 "cmake --build build --config Release"
 | 
				
			||||||
 | 
					      - name: Move amx release binary
 | 
				
			||||||
 | 
					        shell: bash
 | 
				
			||||||
 | 
					        run: |
 | 
				
			||||||
 | 
					          mkdir amx_release
 | 
				
			||||||
 | 
					          mv build/quantize-bloom amx_release/quantize-bloom_amx
 | 
				
			||||||
 | 
					          mv build/libbloom.so amx_release/libbloom_amx.so
 | 
				
			||||||
 | 
					          mv build/quantize-llama amx_release/quantize-llama_amx
 | 
				
			||||||
 | 
					          mv build/libllama.so amx_release/libllama_amx.so
 | 
				
			||||||
 | 
					          mv build/quantize-gptneox amx_release/quantize-gptneox_amx
 | 
				
			||||||
 | 
					          mv build/libgptneox.so amx_release/libgptneox_amx.so
 | 
				
			||||||
 | 
					          mv build/quantize-starcoder amx_release/quantize-starcoder_amx
 | 
				
			||||||
 | 
					          mv build/libstarcoder.so amx_release/libstarcoder_amx.so
 | 
				
			||||||
 | 
					          # chatglm binary files
 | 
				
			||||||
 | 
					          mv src/chatglm/build/main amx_release/main-chatglm_amx
 | 
				
			||||||
 | 
					          # mv src/chatglm/build/_C.cpython-39-x86_64-linux-gnu.so amx_release/chatglm_C.cpython-39-x86_64-linux-gnu.so
 | 
				
			||||||
 | 
					      - name: Archive amx build files
 | 
				
			||||||
 | 
					        uses: actions/upload-artifact@v3
 | 
				
			||||||
 | 
					        with:
 | 
				
			||||||
 | 
					          name: linux-amx
 | 
				
			||||||
 | 
					          path: |
 | 
				
			||||||
 | 
					            amx_release
 | 
				
			||||||
 | 
					      - name: Clean up test environment
 | 
				
			||||||
 | 
					        shell: bash
 | 
				
			||||||
 | 
					        run: |
 | 
				
			||||||
 | 
					          make clean
 | 
				
			||||||
 | 
					          conda remove -n python39 --all -y
 | 
				
			||||||
 | 
					          
 | 
				
			||||||
  check-windows-avx2-artifact:
 | 
					  check-windows-avx2-artifact:
 | 
				
			||||||
    runs-on: ubuntu-latest
 | 
					    runs-on: ubuntu-latest
 | 
				
			||||||
    outputs:
 | 
					    outputs:
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
| 
						 | 
					@ -102,6 +102,10 @@ linux_binarys = [
 | 
				
			||||||
    "libgptneox_avx512.so",
 | 
					    "libgptneox_avx512.so",
 | 
				
			||||||
    "libbloom_avx512.so",
 | 
					    "libbloom_avx512.so",
 | 
				
			||||||
    "libstarcoder_avx512.so",
 | 
					    "libstarcoder_avx512.so",
 | 
				
			||||||
 | 
					    "libllama_amx.so",
 | 
				
			||||||
 | 
					    "libgptneox_amx.so",
 | 
				
			||||||
 | 
					    "libbloom_amx.so",
 | 
				
			||||||
 | 
					    "libstarcoder_amx.so",
 | 
				
			||||||
    "quantize-llama",
 | 
					    "quantize-llama",
 | 
				
			||||||
    "quantize-gptneox",
 | 
					    "quantize-gptneox",
 | 
				
			||||||
    "quantize-bloom",
 | 
					    "quantize-bloom",
 | 
				
			||||||
| 
						 | 
					@ -116,6 +120,7 @@ linux_binarys = [
 | 
				
			||||||
    "main-starcoder",
 | 
					    "main-starcoder",
 | 
				
			||||||
 | 
					
 | 
				
			||||||
    "main-chatglm_vnni",
 | 
					    "main-chatglm_vnni",
 | 
				
			||||||
 | 
					    "main-chatglm_amx",
 | 
				
			||||||
    "chatglm_C.cpython-39-x86_64-linux-gnu.so",
 | 
					    "chatglm_C.cpython-39-x86_64-linux-gnu.so",
 | 
				
			||||||
]
 | 
					]
 | 
				
			||||||
 | 
					
 | 
				
			||||||
| 
						 | 
					
 | 
				
			||||||
		Loading…
	
		Reference in a new issue