# build.yml

  1. name: CI
  2. on:
  3. push:
  4. branches: [main, master]
  5. paths:
  6. - '**/*.cpp'
  7. - '**/*.h'
  8. - '**/*.hpp'
  9. - '**/CMakeLists.txt'
  10. - '.github/workflows/**'
  11. pull_request:
  12. types: [opened, synchronize, reopened]
  13. workflow_dispatch:
  14. concurrency:
  15. group: ${{ github.workflow }}-${{ github.head_ref && github.ref || github.run_id }}
  16. cancel-in-progress: true
  17. env:
  18. # HuggingFace model info
  19. HF_MODEL_REPO: GaboxR67/MelBandRoformers
  20. HF_CHECKPOINT_PATH: melbandroformers/vocals/voc_fv6.ckpt
  21. HF_CONFIG_PATH: melbandroformers/vocals/voc_gabox.yaml
  22. # Music-Source-Separation-Training repo
  23. MSST_REPO: https://github.com/ZFTurbo/Music-Source-Separation-Training.git
  24. jobs:
  # ===========================================================================
  # Prepare: Generate test data (runs once, shared via artifacts)
  #
  # Downloads the checkpoint + config from HuggingFace, synthesises a short
  # stereo test clip, produces reference test data with the MSST code, converts
  # the checkpoint to GGUF, and publishes everything as the `test-data`
  # artifact.
  # ===========================================================================
  prepare-test-data:
    runs-on: ubuntu-latest
    steps:
      - name: Checkout
        uses: actions/checkout@v4

      - name: Setup Python
        uses: actions/setup-python@v5
        with:
          python-version: '3.11'

      # Workflow-level `env` entries are exported to every step, so the values
      # are read from the environment instead of being pasted into the script
      # text through ${{ }} interpolation.
      - name: Clone MSST Repository
        run: git clone --depth 1 "$MSST_REPO" msst

      - name: Install Dependencies
        run: |
          pip install torch torchaudio --index-url https://download.pytorch.org/whl/cpu
          pip install huggingface_hub scipy soundfile gguf librosa ml_collections einops pyyaml numpy tqdm beartype rotary_embedding_torch

      - name: Download Model from HuggingFace
        # `shell: python` runs the script body directly with the interpreter
        # installed above, avoiding a Python program nested inside shell quotes.
        shell: python
        env:
          HF_TOKEN: ${{ secrets.HF_TOKEN }}
        run: |
          import os
          from huggingface_hub import hf_hub_download

          # An unset or empty secret collapses to None.
          token = os.environ.get('HF_TOKEN') or None
          repo = os.environ['HF_MODEL_REPO']
          for path_var in ('HF_CHECKPOINT_PATH', 'HF_CONFIG_PATH'):
              hf_hub_download(repo, os.environ[path_var],
                              local_dir='./model', token=token)

      - name: Generate Test Audio
        shell: python
        run: |
          import numpy as np
          import scipy.io.wavfile as wav

          sr = 44100
          duration = 5.0
          # endpoint=False keeps the sample spacing at exactly 1 / sr, so the
          # tones below land on their nominal frequencies.
          t = np.linspace(0, duration, int(sr * duration), endpoint=False)
          # Create a more complex test signal
          left = (np.sin(2 * np.pi * 440 * t) + 0.5 * np.sin(2 * np.pi * 880 * t)) * 0.3
          right = (np.sin(2 * np.pi * 660 * t) + 0.5 * np.sin(2 * np.pi * 1320 * t)) * 0.3
          stereo = np.stack([left, right], axis=1).astype(np.float32)
          wav.write('test_audio.wav', sr, stereo)
          print(f'Generated test audio: {len(t)} samples, {duration}s')

      - name: Generate Test Data
        run: |
          python scripts/generate_test_data.py \
            --model-repo msst \
            --audio test_audio.wav \
            --checkpoint "model/$HF_CHECKPOINT_PATH" \
            --config "model/$HF_CONFIG_PATH" \
            --output test_data

      - name: Convert Model to GGUF
        run: |
          python scripts/convert_to_gguf.py \
            --ckpt "model/$HF_CHECKPOINT_PATH" \
            --config "model/$HF_CONFIG_PATH" \
            --out model.gguf \
            --dtype fp16

      - name: Upload Test Data Artifact
        uses: actions/upload-artifact@v4
        with:
          name: test-data
          path: |
            test_data/
            model.gguf
            test_audio.wav
          # Fail here, in the producing job, if nothing was generated.
          if-no-files-found: error
          retention-days: 1
  # ===========================================================================
  # Build Matrix: Core Platforms + Vulkan
  #
  # For every matrix entry: fetch GGML and the shared test data, install the
  # platform toolchain, configure + build with CMake, run the ctest suite and a
  # CLI smoke test, then upload the build outputs.
  # ===========================================================================
  build:
    needs: prepare-test-data
    strategy:
      fail-fast: false
      matrix:
        include:
          # Tier 1: Core Platforms (CPU)
          - { name: linux-x64-cpu, os: ubuntu-22.04, backend: cpu, test: true }
          - { name: linux-arm64-cpu, os: ubuntu-22.04-arm, backend: cpu, test: true }
          - { name: macos-arm64, os: macos-latest, backend: cpu, test: true }
          - { name: macos-x64, os: macos-15-intel, backend: cpu, test: true }
          - { name: windows-x64-msvc, os: windows-2025, backend: cpu, test: true }
          # Tier 2: Vulkan Backend
          - { name: linux-vulkan, os: ubuntu-24.04, backend: vulkan, test: true }
          - { name: windows-vulkan, os: windows-2025, backend: vulkan, test: true }
    runs-on: ${{ matrix.os }}
    steps:
      - name: Checkout
        uses: actions/checkout@v4

      - name: Clone GGML
        run: git clone --depth 1 https://github.com/ggerganov/ggml.git ggml

      # The test steps below read model.gguf and test_data/ from the
      # workspace root, where this artifact is downloaded.
      - name: Download Test Data
        uses: actions/download-artifact@v4
        with:
          name: test-data

      - name: Setup Python
        uses: actions/setup-python@v5
        with:
          python-version: '3.11'

      - name: Install Python Dependencies
        run: pip install numpy scipy

      # ----- Linux Dependencies -----
      - name: Install Dependencies (Linux)
        if: runner.os == 'Linux'
        run: |
          sudo apt-get update
          sudo apt-get install -y build-essential cmake

      # Relies on the package index refreshed by the previous step.
      - name: Install Vulkan SDK (Linux)
        if: matrix.backend == 'vulkan' && runner.os == 'Linux'
        run: |
          sudo apt-get install -y libvulkan-dev glslc mesa-vulkan-drivers

      # ----- macOS Dependencies -----
      - name: Install Dependencies (macOS)
        if: runner.os == 'macOS'
        run: brew install cmake

      # ----- Windows Dependencies -----
      - name: Install Dependencies (Windows)
        if: runner.os == 'Windows'
        run: choco install ninja -y

      - name: Install Vulkan SDK (Windows)
        if: matrix.backend == 'vulkan' && runner.os == 'Windows'
        run: |
          $VK_VERSION = "1.4.313.2"
          $VK_ROOT = "C:\VulkanSDK\${VK_VERSION}"
          # --fail makes curl exit non-zero on an HTTP error instead of saving
          # the error page as the installer. PowerShell does not stop on a
          # native command's exit code mid-script, so check it explicitly.
          curl.exe --fail -o VulkanSDK.exe -L "https://sdk.lunarg.com/sdk/download/${VK_VERSION}/windows/vulkansdk-windows-X64-${VK_VERSION}.exe"
          if ($LASTEXITCODE -ne 0) { throw "Vulkan SDK download failed (curl exit code $LASTEXITCODE)" }
          Start-Process -FilePath .\VulkanSDK.exe -ArgumentList "--accept-licenses --default-answer --confirm-command install" -Wait
          # Surface a failed install here rather than as a CMake error later.
          if (-not (Test-Path $VK_ROOT)) { throw "Vulkan SDK was not installed to ${VK_ROOT}" }
          Add-Content $env:GITHUB_ENV "VULKAN_SDK=${VK_ROOT}"
          Add-Content $env:GITHUB_PATH "${VK_ROOT}\bin"

      # ----- Configure -----
      - name: Configure (Unix)
        if: runner.os != 'Windows'
        run: |
          cmake -B build \
            -DCMAKE_BUILD_TYPE=Release \
            -DGGML_DIR=ggml \
            -DGGML_CUDA=OFF \
            -DGGML_VULKAN=${{ matrix.backend == 'vulkan' && 'ON' || 'OFF' }} \
            -DMBR_BUILD_TESTS=ON \
            -DMBR_BUILD_CLI=ON

      - name: Configure (Windows)
        if: runner.os == 'Windows'
        run: |
          cmake -B build -G "Ninja Multi-Config" `
            -DGGML_DIR=ggml `
            -DGGML_CUDA=OFF `
            -DGGML_VULKAN=${{ matrix.backend == 'vulkan' && 'ON' || 'OFF' }} `
            -DMBR_BUILD_TESTS=ON `
            -DMBR_BUILD_CLI=ON

      # ----- Build -----
      - name: Build (Unix)
        if: runner.os != 'Windows'
        # nproc exists on Linux; macOS falls back to sysctl.
        run: cmake --build build --config Release -j $(nproc 2>/dev/null || sysctl -n hw.logicalcpu)

      - name: Build (Windows)
        if: runner.os == 'Windows'
        run: cmake --build build --config Release -j $env:NUMBER_OF_PROCESSORS

      # ----- Unit Tests -----
      - name: Run Unit Tests
        if: matrix.test
        env:
          MBR_MODEL_PATH: ${{ github.workspace }}/model.gguf
          MBR_TEST_DATA_DIR: ${{ github.workspace }}/test_data
        run: ctest --test-dir build -C Release --output-on-failure --timeout 300

      # ----- CLI Tests -----
      - name: Test CLI
        if: matrix.test
        shell: bash
        env:
          MBR_MODEL_PATH: ${{ github.workspace }}/model.gguf
        run: |
          echo "=== CLI Test Suite ==="

          # Determine CLI path based on OS
          if [[ "$RUNNER_OS" == "Windows" ]]; then
            CLI="./build/bin/Release/mel_band_roformer-cli.exe"
          else
            CLI="./build/mel_band_roformer-cli"
          fi

          # 1. Test --help
          echo "[1/4] Testing --help..."
          "$CLI" --help

          # 2. Test with missing arguments (should fail)
          echo "[2/4] Testing error handling..."
          if "$CLI" 2>/dev/null; then
            echo "ERROR: CLI should fail without arguments"
            exit 1
          fi

          # 3. Generate test audio (short 2-second clip)
          # endpoint=False keeps the sample spacing at exactly 1 / sr.
          echo "[3/4] Generating test audio..."
          python3 -c "
          import numpy as np
          import scipy.io.wavfile as wav
          sr = 44100
          t = np.linspace(0, 2.0, sr * 2, endpoint=False)
          stereo = np.stack([np.sin(2*np.pi*440*t), np.sin(2*np.pi*880*t)], axis=1).astype(np.float32) * 0.5
          wav.write('cli_test_input.wav', sr, stereo)
          "

          # 4. Run full inference
          echo "[4/4] Running inference..."
          "$CLI" "$MBR_MODEL_PATH" cli_test_input.wav cli_test_output.wav --chunk-size 88200 --overlap 2

          # Verify output exists and has reasonable size
          if [[ ! -f cli_test_output.wav ]]; then
            echo "ERROR: Output file not created"
            exit 1
          fi
          # GNU stat takes -c%s; BSD/macOS stat takes -f%z.
          OUTPUT_SIZE=$(stat -c%s cli_test_output.wav 2>/dev/null || stat -f%z cli_test_output.wav)
          if [[ $OUTPUT_SIZE -lt 1000 ]]; then
            echo "ERROR: Output file too small: $OUTPUT_SIZE bytes"
            exit 1
          fi

          echo "=== CLI Tests Passed ==="

      # ----- Upload Artifacts -----
      - name: Upload Build Artifacts
        uses: actions/upload-artifact@v4
        with:
          name: build-${{ matrix.name }}
          path: |
            build/bin/
            build/lib*/
            build/*.dll
            build/*.so
            build/*.dylib
            build/mel_band_roformer-cli*
            build/Release/
          retention-days: 7
  # ===========================================================================
  # CUDA Build: Linux (Compile Only - No GPU for testing)
  #
  # Builds inside the NVIDIA CUDA devel container, so the CUDA toolkit comes
  # from the image; tests are disabled at configure time.
  # ===========================================================================
  build-cuda-linux:
    runs-on: ubuntu-latest
    container: nvidia/cuda:12.6.2-devel-ubuntu24.04
    steps:
      # git is installed before the checkout and clone steps that follow.
      - name: Install Git
        run: |
          apt-get update
          apt-get install -y git

      - name: Checkout
        uses: actions/checkout@v4

      - name: Clone GGML
        run: git clone --depth 1 https://github.com/ggerganov/ggml.git ggml

      # Relies on the package index refreshed by "Install Git".
      - name: Install Dependencies
        run: |
          apt-get install -y cmake build-essential ninja-build

      - name: Configure
        run: |
          ls -ld ggml
          cmake -B build -G Ninja \
            -DCMAKE_BUILD_TYPE=Release \
            -DGGML_DIR=ggml \
            -DGGML_CUDA=ON \
            -DCMAKE_CUDA_ARCHITECTURES="75;80;86;89" \
            -DMBR_BUILD_TESTS=OFF \
            -DMBR_BUILD_CLI=ON

      - name: Build
        run: cmake --build build --config Release -j $(nproc)

      - name: Upload Artifacts
        uses: actions/upload-artifact@v4
        with:
          name: build-linux-cuda
          # The `build` job finds the Unix CLI at build/mel_band_roformer-cli,
          # which none of the other patterns cover, so it is listed here too.
          path: |
            build/bin/
            build/lib*/
            build/*.so
            build/mel_band_roformer-cli*
          retention-days: 7
  # ===========================================================================
  # CUDA Build: Windows (Compile Only - No GPU for testing)
  #
  # Installs a minimal CUDA toolkit with the NVIDIA network installer, then
  # configures and builds with Ninja inside the MSVC x64 developer environment.
  # ===========================================================================
  build-cuda-windows:
    runs-on: windows-2022
    env:
      # Single source of truth for the toolkit version (major.minor); the
      # install step derives the URL, component names and install path from it.
      CUDA_VERSION: '12.4'
    steps:
      - name: Checkout
        uses: actions/checkout@v4

      - name: Clone GGML
        run: git clone --depth 1 https://github.com/ggerganov/ggml.git ggml

      - name: Install CUDA Toolkit
        run: |
          # For CI, use the official CUDA installer approach
          $ver = $env:CUDA_VERSION
          $cudaRoot = "C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v${ver}"
          # The download URL uses the full release number; this assumes the
          # ".0" patch release of the configured major.minor version.
          # --fail makes curl exit non-zero on an HTTP error instead of saving
          # the error page as the installer. PowerShell does not stop on a
          # native command's exit code mid-script, so check it explicitly.
          curl.exe --fail -o cuda_installer.exe -L "https://developer.download.nvidia.com/compute/cuda/${ver}.0/network_installers/cuda_${ver}.0_windows_network.exe"
          if ($LASTEXITCODE -ne 0) { throw "CUDA installer download failed (curl exit code $LASTEXITCODE)" }
          Start-Process -FilePath .\cuda_installer.exe -ArgumentList "-s nvcc_${ver} cudart_${ver} cublas_${ver} cublas_dev_${ver} cufft_${ver} cufft_dev_${ver}" -Wait -NoNewWindow
          # Surface a failed install here rather than as a CMake error later.
          if (-not (Test-Path "${cudaRoot}\bin\nvcc.exe")) { throw "CUDA toolkit was not installed to ${cudaRoot}" }
          Add-Content $env:GITHUB_ENV "CUDA_PATH=${cudaRoot}"
          Add-Content $env:GITHUB_PATH "${cudaRoot}\bin"

      - name: Install Ninja
        run: choco install ninja -y

      - name: Configure
        shell: cmd
        run: |
          call "C:\Program Files\Microsoft Visual Studio\2022\Enterprise\VC\Auxiliary\Build\vcvarsall.bat" x64
          cmake -B build -G "Ninja Multi-Config" ^
            -DGGML_DIR=ggml ^
            -DGGML_CUDA=ON ^
            -DCMAKE_CUDA_ARCHITECTURES="75;80;86;89" ^
            -DMBR_BUILD_TESTS=OFF ^
            -DMBR_BUILD_CLI=ON

      # Each step runs in a fresh shell, so the environment set by vcvarsall
      # in Configure is gone by now. Set it up again so the compiler can find
      # its headers and libraries during the build.
      - name: Build
        shell: cmd
        run: |
          call "C:\Program Files\Microsoft Visual Studio\2022\Enterprise\VC\Auxiliary\Build\vcvarsall.bat" x64
          cmake --build build --config Release -j %NUMBER_OF_PROCESSORS%

      - name: Upload Artifacts
        uses: actions/upload-artifact@v4
        with:
          name: build-windows-cuda
          path: |
            build/bin/
            build/Release/
            build/*.dll
          retention-days: 7
  328. build/Release/
  329. build/*.dll
  330. retention-days: 7