# benchmarks.yml
  1. name: Build and Test
  2. on:
  3. push:
  4. branches: [ '*' ]
  5. tags: [ '*' ]
  6. pull_request:
  7. branches: [ '*' ]
  8. jobs:
  # Calls the reusable bench_job workflow once per model in the matrix.
  # `config` is passed through as a JSON string; presumably it maps a device
  # type to the number of nodes requested — confirm against bench_job.yml.
  single-m4-pro:
    strategy:
      matrix:
        model: ['llama-3.2-1b', 'llama-3.2-3b', 'llama-3.1-8b']
    uses: ./.github/workflows/bench_job.yml
    with:
      config: '{"M4PRO_GPU16_24GB": 1}'
      model: ${{ matrix.model }}
      calling_job_name: 'single-m4-pro'
      network_interface: 'Ethernet'
    # Forward the caller's secrets to the reusable workflow.
    secrets: inherit
  # Calls the reusable bench_job workflow once per model in the matrix,
  # with a config value of 2 for M4PRO_GPU16_24GB (presumably a two-node
  # cluster — confirm against bench_job.yml).
  two-m4-pro-cluster:
    strategy:
      matrix:
        model: ['llama-3.2-1b', 'llama-3.2-3b', 'llama-3.1-8b']
    uses: ./.github/workflows/bench_job.yml
    with:
      config: '{"M4PRO_GPU16_24GB": 2}'
      model: ${{ matrix.model }}
      calling_job_name: 'two-m4-pro-cluster'
      network_interface: 'Ethernet'
    # Forward the caller's secrets to the reusable workflow.
    secrets: inherit
  # Disabled job: same as two-m4-pro-cluster but with
  # network_interface 'Thunderbolt'. Uncomment the block to re-enable it.
  # two-m4-pro-cluster-thunderbolt:
  #   strategy:
  #     matrix:
  #       model: ['llama-3.2-1b', 'llama-3.2-3b', 'llama-3.1-8b']
  #   uses: ./.github/workflows/bench_job.yml
  #   with:
  #     config: '{"M4PRO_GPU16_24GB": 2}'
  #     model: ${{ matrix.model }}
  #     calling_job_name: 'two-m4-pro-cluster-thunderbolt'
  #     network_interface: 'Thunderbolt'
  #   secrets: inherit
  # Calls the reusable bench_job workflow once per model in the matrix,
  # with a config value of 3 for M4PRO_GPU16_24GB (presumably a three-node
  # cluster — confirm against bench_job.yml). This matrix additionally
  # includes 'llama-3.3-70b'.
  three-m4-pro-cluster:
    strategy:
      matrix:
        model: ['llama-3.2-1b', 'llama-3.2-3b', 'llama-3.1-8b', 'llama-3.3-70b']
      # Let the remaining matrix entries keep running when one model fails.
      fail-fast: false
    uses: ./.github/workflows/bench_job.yml
    with:
      config: '{"M4PRO_GPU16_24GB": 3}'
      model: ${{ matrix.model }}
      calling_job_name: 'three-m4-pro-cluster'
      network_interface: 'Ethernet'
    # Forward the caller's secrets to the reusable workflow.
    secrets: inherit
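  # Disabled job: single-model run with an M3MAX_GPU40_128GB config.
  # NOTE(review): calling_job_name ('test-m3-cluster') differs from the job
  # id ('test-m3-single-node'), unlike the active jobs — confirm before
  # re-enabling.
  # test-m3-single-node:
  #   strategy:
  #     matrix:
  #       model: ['llama-3.2-1b']
  #     fail-fast: false
  #   uses: ./.github/workflows/bench_job.yml
  #   with:
  #     config: '{"M3MAX_GPU40_128GB": 1}'
  #     model: ${{ matrix.model }}
  #     calling_job_name: 'test-m3-cluster'
  #     network_interface: 'Ethernet'
  #   secrets: inherit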