here we go ...

neuralmagic · Jun 6, 2024 · 7723eb7 · 7723eb7 · github-actions · Jun 7, 2024
1 parent cbbb67f
commit 7723eb7
Show file tree

Hide file tree

Showing 2 changed files with 83 additions and 83 deletions.
diff --git a/.github/workflows/build-test.yml b/.github/workflows/build-test.yml
@@ -81,18 +81,18 @@ jobs:
             python: ${{ inputs.python }}
         secrets: inherit
 
-    # TEST-SOLO:
-    #     needs: [BUILD]
-    #     if: success()
-    #     uses: ./.github/workflows/test.yml
-    #     with:
-    #         test_label: ${{ inputs.test_label_solo }}
-    #         timeout: ${{ inputs.test_timeout }}
-    #         gitref: ${{ github.ref }}
-    #         python: ${{ inputs.python }}
-    #         whl: ${{ needs.BUILD.outputs.whl }}
-    #         test_skip_list: ${{ inputs.test_skip_list }}
-    #     secrets: inherit
+    TEST-SOLO:
+        needs: [BUILD]
+        if: success()
+        uses: ./.github/workflows/test.yml
+        with:
+            test_label: ${{ inputs.test_label_solo }}
+            timeout: ${{ inputs.test_timeout }}
+            gitref: ${{ github.ref }}
+            python: ${{ inputs.python }}
+            whl: ${{ needs.BUILD.outputs.whl }}
+            test_skip_list: ${{ inputs.test_skip_list }}
+        secrets: inherit
 
     # TEST-MULTI:
     #     needs: [BUILD]
@@ -108,7 +108,7 @@ jobs:
     #     secrets: inherit
 
     UPLOAD:
-        needs: [BUILD]
+        needs: [TEST-SOLO]
         if: contains(fromJSON('["NIGHTLY", "WEEKLY", "RELEASE"]'), inputs.wf_category)
         uses: ./.github/workflows/nm-upload-assets-to-gcp.yml
         with:
@@ -118,45 +118,45 @@ jobs:
             python: ${{ inputs.python }}
         secrets: inherit
 
-    # BENCHMARK:
-    #     needs: [BUILD]
-    #     if: success()
-    #     uses: ./.github/workflows/nm-benchmark.yml
-    #     with:
-    #         label: ${{ inputs.test_label_solo }}
-    #         benchmark_config_list_file: ${{ inputs.benchmark_config_list_file }}
-    #         timeout: ${{ inputs.benchmark_timeout }}
-    #         gitref: ${{ github.ref }}
-    #         python: ${{ inputs.python }}
-    #         whl: ${{ needs.BUILD.outputs.whl }}
-    #         # Always push if it is a scheduled job
-    #         push_benchmark_results_to_gh_pages: "${{ github.event_name == 'schedule' || inputs.push_benchmark_results_to_gh_pages }}"
-    #     secrets: inherit
+    BENCHMARK:
+        needs: [BUILD]
+        if: success()
+        uses: ./.github/workflows/nm-benchmark.yml
+        with:
+            label: ${{ inputs.test_label_solo }}
+            benchmark_config_list_file: ${{ inputs.benchmark_config_list_file }}
+            timeout: ${{ inputs.benchmark_timeout }}
+            gitref: ${{ github.ref }}
+            python: ${{ inputs.python }}
+            whl: ${{ needs.BUILD.outputs.whl }}
+            # Always push if it is a scheduled job
+            push_benchmark_results_to_gh_pages: "${{ github.event_name == 'schedule' || inputs.push_benchmark_results_to_gh_pages }}"
+        secrets: inherit
 
-    # TEST-ACCURACY-SMOKE:
-    #   needs: [BUILD]
-    #   if: inputs.wf_category == 'NIGHTLY'
-    #   uses: ./.github/workflows/nm-test-accuracy-smoke.yml
-    #   with:
-    #     label: ${{ inputs.test_label_solo }}
-    #     timeout: ${{ inputs.benchmark_timeout }}
-    #     gitref: ${{ inputs.gitref }}
-    #     Gi_per_thread: ${{ inputs.Gi_per_thread }}
-    #     nvcc_threads: ${{ inputs.nvcc_threads }}
-    #     python: ${{ inputs.python }}
-    #     whl: ${{ needs.BUILD.outputs.whl }}
-    #   secrets: inherit
+    TEST-ACCURACY-SMOKE:
+      needs: [BUILD]
+      if: inputs.wf_category == 'NIGHTLY'
+      uses: ./.github/workflows/nm-test-accuracy-smoke.yml
+      with:
+        label: ${{ inputs.test_label_solo }}
+        timeout: ${{ inputs.benchmark_timeout }}
+        gitref: ${{ inputs.gitref }}
+        Gi_per_thread: ${{ inputs.Gi_per_thread }}
+        nvcc_threads: ${{ inputs.nvcc_threads }}
+        python: ${{ inputs.python }}
+        whl: ${{ needs.BUILD.outputs.whl }}
+      secrets: inherit
 
-    # TEST-ACCURACY-FULL:
-    #   needs: [BUILD]
-    #   if: ${{ inputs.wf_category == 'WEEKLY' || inputs.wf_category == 'RELEASE' }}
-    #   uses: ./.github/workflows/nm-test-accuracy-full.yml
-    #   with:
-    #     label: ${{ inputs.test_label_multi }}
-    #     timeout: ${{ inputs.benchmark_timeout }}
-    #     gitref: ${{ inputs.gitref }}
-    #     Gi_per_thread: ${{ inputs.Gi_per_thread }}
-    #     nvcc_threads: ${{ inputs.nvcc_threads }}
-    #     python: ${{ inputs.python }}
-    #     whl: ${{ needs.BUILD.outputs.whl }}
-    #   secrets: inherit
+    TEST-ACCURACY-FULL:
+      needs: [BUILD]
+      if: ${{ inputs.wf_category == 'WEEKLY' || inputs.wf_category == 'RELEASE' }}
+      uses: ./.github/workflows/nm-test-accuracy-full.yml
+      with:
+        label: ${{ inputs.test_label_multi }}
+        timeout: ${{ inputs.benchmark_timeout }}
+        gitref: ${{ inputs.gitref }}
+        Gi_per_thread: ${{ inputs.Gi_per_thread }}
+        nvcc_threads: ${{ inputs.nvcc_threads }}
+        python: ${{ inputs.python }}
+        whl: ${{ needs.BUILD.outputs.whl }}
+      secrets: inherit
diff --git a/.github/workflows/nightly.yml b/.github/workflows/nightly.yml
@@ -17,41 +17,41 @@ on:
 
 jobs:
 
-    # PYTHON-3-8:
-    #     uses: ./.github/workflows/build-test.yml
-    #     with:
-    #         wf_category: NIGHTLY
-    #         python: 3.8.17
-    #         gitref: ${{ github.ref }}
+    PYTHON-3-8:
+        uses: ./.github/workflows/build-test.yml
+        with:
+            wf_category: NIGHTLY
+            python: 3.8.17
+            gitref: ${{ github.ref }}
 
-    #         test_label_solo: aws-test-a10g-24G
-    #         test_label_multi: ignore
-    #         test_timeout: 480
-    #         test_skip_list: neuralmagic/tests/skip-for-remote-push-tmp.txt
+            test_label_solo: aws-test-a10g-24G
+            test_label_multi: ignore
+            test_timeout: 480
+            test_skip_list: neuralmagic/tests/skip-for-remote-push-tmp.txt
 
-    #         benchmark_label: aws-test-a10g-24G
-    #         benchmark_config_list_file: ./.github/data/nm_benchmark_nightly_configs_list.txt
-    #         benchmark_timeout: 720
-    #         push_benchmark_results_to_gh_pages: "${{ github.event_name == 'schedule' || inputs.push_benchmark_results_to_gh_pages }}"
-    #     secrets: inherit
+            benchmark_label: aws-test-a10g-24G
+            benchmark_config_list_file: ./.github/data/nm_benchmark_nightly_configs_list.txt
+            benchmark_timeout: 720
+            push_benchmark_results_to_gh_pages: "${{ github.event_name == 'schedule' || inputs.push_benchmark_results_to_gh_pages }}"
+        secrets: inherit
 
-    # PYTHON-3-9:
-    #     uses: ./.github/workflows/build-test.yml
-    #     with:
-    #         wf_category: NIGHTLY
-    #         python: 3.9.17
-    #         gitref: ${{ github.ref }}
+    PYTHON-3-9:
+        uses: ./.github/workflows/build-test.yml
+        with:
+            wf_category: NIGHTLY
+            python: 3.9.17
+            gitref: ${{ github.ref }}
 
-    #         test_label_solo: aws-test-a10g-24G
-    #         test_label_multi: ignore
-    #         test_timeout: 480
-    #         test_skip_list: neuralmagic/tests/skip-for-remote-push-tmp.txt
+            test_label_solo: aws-test-a10g-24G
+            test_label_multi: ignore
+            test_timeout: 480
+            test_skip_list: neuralmagic/tests/skip-for-remote-push-tmp.txt
 
-    #         benchmark_label: aws-test-a10g-24G
-    #         benchmark_config_list_file: ./.github/data/nm_benchmark_nightly_configs_list.txt
-    #         benchmark_timeout: 720
-    #         push_benchmark_results_to_gh_pages: "${{ github.event_name == 'schedule' || inputs.push_benchmark_results_to_gh_pages }}"
-    #     secrets: inherit
+            benchmark_label: aws-test-a10g-24G
+            benchmark_config_list_file: ./.github/data/nm_benchmark_nightly_configs_list.txt
+            benchmark_timeout: 720
+            push_benchmark_results_to_gh_pages: "${{ github.event_name == 'schedule' || inputs.push_benchmark_results_to_gh_pages }}"
+        secrets: inherit
 
     PYTHON-3-10:
         uses: ./.github/workflows/build-test.yml
Benchmark suite	Current: `7723eb7`	Previous: `367c5ee`	Ratio
{"name": "request_throughput", "description": "VLLM Engine prefill throughput - 2:4 Sparse (synthetic)\nmodel - neuralmagic/OpenHermes-2.5-Mistral-7B-pruned2.4\nmax_model_len - 4096\nbenchmark_throughput {\n \"use-all-available-gpus_\": \"\",\n \"input-len\": 128,\n \"output-len\": 1,\n \"num-prompts\": 1,\n \"sparsity\": \"semi_structured_sparse_w16a16\"\n}", "gpu_description": "NVIDIA A10G x 1", "vllm_version": "0.5.0", "python_version": "3.9.17 (main, Jun 7 2023, 12:29:40) \n[GCC 9.4.0]", "torch_version": "2.3.0+cu121"}	`21.433299156481482` prompts/s	`24.347844802232547` prompts/s	`1.14`
{"name": "token_throughput", "description": "VLLM Engine prefill throughput - 2:4 Sparse (synthetic)\nmodel - neuralmagic/OpenHermes-2.5-Mistral-7B-pruned2.4\nmax_model_len - 4096\nbenchmark_throughput {\n \"use-all-available-gpus_\": \"\",\n \"input-len\": 128,\n \"output-len\": 1,\n \"num-prompts\": 1,\n \"sparsity\": \"semi_structured_sparse_w16a16\"\n}", "gpu_description": "NVIDIA A10G x 1", "vllm_version": "0.5.0", "python_version": "3.9.17 (main, Jun 7 2023, 12:29:40) \n[GCC 9.4.0]", "torch_version": "2.3.0+cu121"}	`2764.895591186111` tokens/s	`3140.8719794879985` tokens/s	`1.14`