Add model builder for Qwen2_5_VLTextModel #5033
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
# Workflow that builds the CUDA variant on a Windows x64 runner and runs its tests.
name: "Windows CUDA x64 Build"

# Triggers: manual dispatch, pushes to main and rel-* branches, and all pull requests.
on:
  workflow_dispatch:
  push:
    branches:
      - main
      - rel-*
  pull_request:
# Runs are grouped by workflow name plus the ref (for pull_request events) or
# the commit SHA (for every other event); a new run in the same group cancels
# the one still in progress.
concurrency:
  group: ${{ github.workflow }}-${{ github.event_name == 'pull_request' && github.ref || github.sha }}
  cancel-in-progress: true
# Workflow-wide environment variables shared by every step of the job.
env:
  # Settings for the azcopy call in the "Download cuda" step.
  # NOTE(review): presumably selects managed-identity auto-login; confirm against the azcopy docs.
  AZCOPY_AUTO_LOGIN_TYPE: MSI
  AZCOPY_MSI_CLIENT_ID: 63b63039-6328-442f-954b-5a64d124e5b4
  # Directory the CUDA SDK is downloaded into, and the SDK version to fetch.
  cuda_dir: "${{ github.workspace }}\\cuda_sdk"
  cuda_version: "12.2"
  # Unquoted scalar, so the doubled backslashes are kept literally (unlike
  # cuda_dir above, where the double-quoted form unescapes them). The version
  # here is spelled out and must be kept in step with cuda_version.
  CUDA_PATH: ${{ github.workspace }}\\cuda_sdk\\v12.2
  # Build output directory, relative to the workspace; read by later steps as $env:binaryDir.
  binaryDir: 'build/cuda/win-x64'
  # Feed query used to discover the ONNX Runtime nightly version, and the package to install.
  ORT_NIGHTLY_REST_API: "https://feeds.dev.azure.com/aiinfra/PublicPackages/_apis/packaging/Feeds/ORT-Nightly/packages?packageNameQuery=Microsoft.ML.OnnxRuntime.Gpu.Windows&api-version=6.0-preview.1"
  ORT_PACKAGE_NAME: "Microsoft.ML.OnnxRuntime.Gpu.Windows"
# Single job: set up the toolchain, fetch CUDA and the ONNX Runtime nightly,
# build with CMake, then run the Python tests, the C# tests, and unit_tests.exe.
jobs:
  windows-cuda-x64-build:
    runs-on: ["self-hosted", "1ES.Pool=onnxruntime-genai-Win2022-GPU-A10"]
    steps:
      # ---- Source and toolchain setup ----
      - name: Checkout OnnxRuntime GenAI repo
        uses: actions/checkout@v5
        with:
          submodules: true

      - uses: actions/setup-python@v6
        with:
          python-version: '3.11.x'
          architecture: 'x64'

      # NOTE(review): the action reference on the `uses:` line was garbled by
      # e-mail obfuscation in the copy this file was recovered from. The action
      # name is reconstructed from the inputs below; confirm the version tag.
      - name: Setup VCPKG
        uses: microsoft/onnxruntime-github-actions/setup-build-tools@v0.0.6
        with:
          vcpkg-version: '2025.03.19'
          vcpkg-hash: '17e96169cd3f266c4716fcdc1bb728e6a64f103941ece463a2834d50694eba4fb48f30135503fd466402afa139abc847ef630733c442595d1c34979f261b0114'
          cmake-version: '3.31.6'
          cmake-hash: '0f1584e8666cf4a65ec514bd02afe281caabf1d45d2c963f3151c41484f457386aa03273ab25776a670be02725354ce0b46f3a5121857416da37366342a833a0'
          add-cmake-to-path: 'true'
          disable-terrapin: 'false'

      # Copies the CUDA SDK for env.cuda_version from blob storage into env.cuda_dir.
      - name: Download cuda
        run: |
          azcopy.exe cp --recursive "https://lotusscus.blob.core.windows.net/models/cuda_sdk/v${{ env.cuda_version }}" ${{ env.cuda_dir}}

      - uses: actions/setup-dotnet@v5
        with:
          dotnet-version: '8.0.x'

      # ---- ONNX Runtime nightly package ----
      # Queries the feed, takes the first version listed for the first package,
      # exports it to later steps as ORT_NIGHTLY_VERSION via GITHUB_ENV, and
      # installs that version with nuget. -ExcludeVersion keeps the install
      # folder named after the package only, which the following steps rely on.
      - name: Download OnnxRuntime Nightly
        shell: pwsh
        run: |
          $resp = Invoke-RestMethod "${{ env.ORT_NIGHTLY_REST_API }}"
          $ORT_NIGHTLY_VERSION = $resp.value[0].versions[0].normalizedVersion
          Write-Host "$ORT_NIGHTLY_VERSION"
          "ORT_NIGHTLY_VERSION=$ORT_NIGHTLY_VERSION" | Out-File -FilePath $env:GITHUB_ENV -Append
          nuget install ${{ env.ORT_PACKAGE_NAME }} -version $ORT_NIGHTLY_VERSION -ExcludeVersion -NonInteractive

      # Diagnostic listing of the installed package; a failure here does not fail the job.
      - run: Get-ChildItem ${{ env.ORT_PACKAGE_NAME }} -Recurse
        continue-on-error: true

      # Moves the package's headers to ort/include and its win-x64 binaries to ort/lib.
      - name: Extract OnnxRuntime library and header files
        run: |
          mkdir ort/lib
          move ${{ env.ORT_PACKAGE_NAME }}/buildTransitive/native/include ort/
          move ${{ env.ORT_PACKAGE_NAME }}/runtimes/win-x64/native/* ort/lib/

      # Downloads rustup-init.exe, installs toolchain 1.86.0, and adds the
      # cargo bin directory to PATH for later steps via GITHUB_PATH.
      - name: Install Rust Toolchain
        run: |
          $exePath = "$env:TEMP\rustup-init.exe"
          (New-Object Net.WebClient).DownloadFile('https://static.rust-lang.org/rustup/dist/x86_64-pc-windows-msvc/rustup-init.exe', $exePath)
          & $exePath -y --default-toolchain=1.86.0
          Add-Content $env:GITHUB_PATH "$env:USERPROFILE\.cargo\bin"

      # ---- Build ----
      # Configures the windows_x64_cuda_release preset, passing the downloaded
      # CUDA SDK directory through the -T toolset option.
      - name: Configure CMake
        run: |
          cmake --preset windows_x64_cuda_release -T cuda=${{ env.cuda_dir }}\\v${{ env.cuda_version }}

      # Builds the preset, then the PyPackageBuild target.
      - name: Build with CMake
        run: |
          cmake --build --preset windows_x64_cuda_release --parallel
          cmake --build --preset windows_x64_cuda_release --target PyPackageBuild

      # Appends the CUDA bin directory to GITHUB_PATH so later steps see it on PATH.
      - name: Add CUDA to PATH
        run: |
          echo "${{ env.cuda_dir }}\\v${{ env.cuda_version }}\\bin" | Out-File -FilePath $env:GITHUB_PATH -Encoding utf8 -Append

      # ---- Python tests ----
      # Installs the test requirements, then the wheel found under
      # $env:binaryDir\wheel with --no-deps.
      - name: Install the Python Wheel and Test Dependencies
        run: |
          python -m pip install -r test\python\requirements.txt
          python -m pip install -r test\python\cuda\torch\requirements.txt
          python -m pip install -r test\python\cuda\ort\requirements.txt
          python -m pip install (Get-ChildItem ("$env:binaryDir\wheel\*.whl")) --no-deps

      - name: Run the Python Tests
        run: |
          python test/python/test_onnxruntime_genai.py --cwd "test\python" --test_models "test\test_models" --e2e

      # Lists the build output even when earlier steps failed (if: always());
      # its own failure is tolerated. The explicit indentation indicator on
      # the block scalar is kept from the original.
      - name: Verify Build Artifacts
        if: always()
        continue-on-error: true
        run: |2
          Get-ChildItem -Path $env:GITHUB_WORKSPACE\$env:binaryDir -Recurse

      # ---- C# tests and unit_tests.exe ----
      # Prepends the CUDA bin directory to PATH for this step, then runs
      # dotnet test from test\csharp against the Release output and ort\lib.
      - name: Build the C# API and Run the C# Tests
        run: |
          $env:PATH = "${{ env.cuda_dir }}\\v${{ env.cuda_version }}\\bin;" + $env:PATH
          cd test\csharp
          dotnet test /p:Configuration=release /p:NativeBuildOutputDir="$env:GITHUB_WORKSPACE\$env:binaryDir\Release" /p:OrtLibDir="$env:GITHUB_WORKSPACE\ort\lib"

      # Copies the ONNX Runtime binaries into the Release directory beside
      # unit_tests.exe, then runs it.
      - name: Prepend CUDA to PATH and Run tests
        run: |-
          $env:PATH = "${{ env.cuda_dir }}\\v${{ env.cuda_version }}\\bin;" + $env:PATH
          echo "Current PATH variable is: $env:PATH"
          copy $env:GITHUB_WORKSPACE\ort\lib\* .\$env:binaryDir\Release
          & .\$env:binaryDir\Release\unit_tests.exe