Skip to content

Commit 8751cec

Browse files
committed
Test manual workflow to send pytest JSON results to DB
1 parent 2f888f8 commit 8751cec

File tree

2 files changed

+126
-128
lines changed

2 files changed

+126
-128
lines changed

.github/workflows/nightly.yml

Lines changed: 80 additions & 83 deletions
Original file line numberDiff line numberDiff line change
name: Nightly

on:
  workflow_dispatch:
    inputs:
      source-repo:
        description: "ORG/REPO"
        required: true
        type: string
      source-github-run-id:
        description: "Repo GitHub Run ID"
        required: true #TODO
        type: string
      source-artifact-name:
        description: "Run Artifact Name"
        required: true #TODO
        type: string
      rocm-version:
        required: true
        type: string
      ubuntu-version:
        required: true
        type: string
      rocm-build-num:
        required: false
        type: string
        default: "0"
      github-sha:
        required: false
        type: string
        default: ToT
      runner-label:
        required: false
        type: string
        default: "MI300"
    # NOTE(review): `secrets:` is not valid under `on.workflow_dispatch` —
    # GitHub Actions only accepts a secrets block under `on.workflow_call`.
    # For a manually-dispatched workflow the repo/environment secrets are
    # available via ${{ secrets.* }} without declaring them. Confirm whether
    # this workflow is also meant to be reusable (workflow_call); if not,
    # this block should be removed.
    secrets:
      ROCM_JAX_DB_HOSTNAME:
        required: true
      ROCM_JAX_DB_USERNAME:
        required: true
      ROCM_JAX_DB_PASSWORD:
        required: true
      ROCM_JAX_DB_NAME:
        required: true

jobs:
  # Downloads the pytest JSON report artifact produced by a run in another
  # repo/workflow and pushes its contents into the MySQL results DB.
  upload-to-db:
    runs-on: mysqldb
    steps:
      - name: Checkout source
        uses: actions/checkout@v4
      - name: Download logs artifact from source run
        env:
          GH_TOKEN: ${{ secrets.SECRET_TOKEN }}
        run: |
          gh run download "${{ inputs.source-github-run-id }}" \
            -R "${{ inputs.source-repo }}" \
            -n "${{ inputs.source-artifact-name }}" \
            -D "logs-${{ inputs.source-github-run-id }}"
      - name: Upload logs to MySQL database
        env:
          ROCM_JAX_DB_HOSTNAME: ${{ secrets.ROCM_JAX_DB_HOSTNAME }}
          ROCM_JAX_DB_USERNAME: ${{ secrets.ROCM_JAX_DB_USERNAME }}
          ROCM_JAX_DB_PASSWORD: ${{ secrets.ROCM_JAX_DB_PASSWORD }}
          ROCM_JAX_DB_NAME: ${{ secrets.ROCM_JAX_DB_NAME }}
          ROCM_VERSION: ${{ inputs.rocm-version }}
          UBUNTU_VERSION: ${{ inputs.ubuntu-version }}
          LOGS_DIR: logs-${{ inputs.source-github-run-id }}
          GITHUB_SHA: ${{ inputs.github-sha }}
          # FIX: was `inputs.github-run-id`, which is never declared above and
          # therefore always expanded to the empty string. The run id of the
          # source run is what the DB row should record.
          GITHUB_RUN_ID: ${{ inputs.source-github-run-id }}
          ROCM_BUILD_NUM: ${{ inputs.rocm-build-num }}
          # FIX: plumb the declared runner-label input through instead of
          # hard-coding "MI300" in the script invocation (default is "MI300",
          # so behavior is unchanged for callers that omit it).
          RUNNER_LABEL: ${{ inputs.runner-label }}
        run: |
          python3 -m venv venv
          source venv/bin/activate
          pip install --upgrade pip
          pip install mysql-connector-python

          # NOTE(review): --logs_dir uses an underscore while every other flag
          # is hyphenated — confirm against the argparse spec in
          # ci/upload_test_to_db.py (argparse treats them as distinct).
          # ${ROCM_VERSION//.} strips the dots, e.g. "7.1.1" -> "711".
          python ci/upload_test_to_db.py \
            --logs_dir "$LOGS_DIR" \
            --run-tag "ci-run" \
            --runner-label "$RUNNER_LABEL" \
            --ubuntu-version "${UBUNTU_VERSION}" \
            --rocm-version "${ROCM_VERSION//.}" \
            --commit-sha "$GITHUB_SHA" \
            --build-num "$ROCM_BUILD_NUM" \
            --github-run-id "$GITHUB_RUN_ID"

ci/upload_test_to_db.py

Lines changed: 46 additions & 45 deletions
Original file line numberDiff line numberDiff line change
@@ -2,9 +2,9 @@
22
"""
33
Upload pytest results to MySQL.
44
Tables:
5-
- ci_runs: one row per run
6-
- ci_tests: one row per unique test
7-
- ci_results: one row per test per run
5+
- ci_runs_dup: one row per run
6+
- ci_tests_dup: one row per unique test
7+
- ci_results_dup: one row per test per run
88
"""
99

1010
from __future__ import annotations
@@ -72,37 +72,41 @@ def nodeid_parts(nodeid: str) -> Tuple[str, str, str]:
7272
return f, c, t
7373

7474

75-
def list_test_jsons(logs_dir: Path) -> List[Path]:
76-
"""Return per-test JSON files under logs_dir; skip aux files."""
77-
return sorted(
75+
def find_single_report_json(logs_dir: Path) -> Path:
    """Return the single pytest JSON report file found in *logs_dir*.

    A candidate is any regular file with a ``.json`` suffix (case-insensitive)
    whose name does not end in ``last_running.json`` (an auxiliary progress
    file, not a report). Prints a diagnostic and exits with status 2 — the
    script's "input error" code — when zero or more than one candidate exists.
    """

    def _is_report(candidate: Path) -> bool:
        # Regular .json files only; skip the transient last_running marker.
        return (
            candidate.is_file()
            and candidate.suffix.lower() == ".json"
            and not candidate.name.endswith("last_running.json")
        )

    candidates = [entry for entry in logs_dir.iterdir() if _is_report(entry)]

    if not candidates:
        print(f"No JSON report found in {logs_dir}")
        raise SystemExit(2)

    if len(candidates) != 1:
        names = ", ".join(entry.name for entry in candidates)
        print(f"Expected exactly ONE JSON report, found {len(candidates)}: " + names)
        raise SystemExit(2)

    return candidates[0]
93+
94+
95+
def load_from_single_json(path: Path) -> Tuple[datetime, List[dict]]:
    """Parse one pytest JSON report and return ``(created_at, tests)``.

    Two layouts are accepted:
      * a dict (pytest-json-report style): tests come from the ``tests`` key,
        and ``created_at`` from the report's ``created`` epoch timestamp when
        present, otherwise from the file's mtime;
      * a bare list of test records: the file's mtime is used as created_at.

    Raises ``ValueError`` for any other top-level JSON structure.
    """
    data = json.loads(path.read_text(encoding="utf-8"))

    # Fallback run timestamp when the report carries no 'created' field.
    mtime_stamp = datetime.fromtimestamp(path.stat().st_mtime)

    if isinstance(data, list):
        return mtime_stamp, data

    if not isinstance(data, dict):
        raise ValueError(f"Unexpected JSON structure in {path.name}")

    created = data.get("created")
    if created is None:
        created_at = mtime_stamp
    else:
        created_at = datetime.fromtimestamp(float(created))
    return created_at, data.get("tests", [])
106110

107111

108112
def extract_result_fields(
@@ -263,10 +267,10 @@ def connect():
263267

264268

265269
def insert_run(cur, created_at: datetime, meta: dict) -> int:
266-
"""Insert one row into ci_runs and return run_id. Idempotence is not enforced here."""
270+
"""Insert one row into ci_runs_dup and return run_id. Idempotence is not enforced here."""
267271
cur.execute(
268272
"""
269-
INSERT INTO ci_runs (
273+
INSERT INTO ci_runs_dup (
270274
created_at, commit_sha, runner_label, ubuntu_version,
271275
rocm_version, build_num, github_run_id, run_tag, logs_path
272276
) VALUES (%s,%s,%s,%s,%s,%s,%s,%s,%s)
@@ -287,11 +291,11 @@ def insert_run(cur, created_at: datetime, meta: dict) -> int:
287291

288292

289293
def sync_tests_and_get_ids(cur, tests: List[dict]) -> Dict[Tuple[str, str, str], int]:
290-
"""Ensure all tests exist in ci_tests and return an ID mapping.
294+
"""Ensure all tests exist in ci_tests_dup and return an ID mapping.
291295
292296
Uses a TEMPORARY TABLE for efficiency with large runs:
293297
1) Bulk insert unique (filename, classname, test_name) into a temp table.
294-
2) INSERT any missing rows into ci_tests in one set operation.
298+
2) INSERT any missing rows into ci_tests_dup in one set operation.
295299
3) SELECT back (file, class, test) -> id mapping in one query.
296300
"""
297301
uniq = {nodeid_parts(t["nodeid"]) for t in tests}
@@ -315,10 +319,10 @@ def sync_tests_and_get_ids(cur, tests: List[dict]) -> Dict[Tuple[str, str, str],
315319

316320
cur.execute(
317321
"""
318-
INSERT INTO ci_tests (filename, classname, test_name)
322+
INSERT INTO ci_tests_dup (filename, classname, test_name)
319323
SELECT s.filename, s.classname, s.test_name
320324
FROM tmp_tests s
321-
LEFT JOIN ci_tests t
325+
LEFT JOIN ci_tests_dup t
322326
ON t.filename = s.filename
323327
AND t.classname = s.classname
324328
AND t.test_name = s.test_name
@@ -330,7 +334,7 @@ def sync_tests_and_get_ids(cur, tests: List[dict]) -> Dict[Tuple[str, str, str],
330334
"""
331335
SELECT t.id, s.filename, s.classname, s.test_name
332336
FROM tmp_tests s
333-
JOIN ci_tests t
337+
JOIN ci_tests_dup t
334338
ON t.filename = s.filename
335339
AND t.classname = s.classname
336340
AND t.test_name = s.test_name
@@ -356,7 +360,7 @@ def batch_insert_results(
356360
return
357361

358362
sql = """
359-
INSERT INTO ci_results
363+
INSERT INTO ci_results_dup
360364
(run_id, test_id, outcome, duration, longrepr, message, skip_label)
361365
VALUES (%s,%s,%s,%s,%s,%s,%s)
362366
ON DUPLICATE KEY UPDATE
@@ -388,16 +392,13 @@ def upload_pytest_results( # pylint: disable=too-many-arguments, too-many-local
388392
389393
Flow:
390394
1) Parse JSONs and gather tests.
391-
2) Insert a ci_runs row and get run_id.
395+
2) Insert a ci_runs_dup row and get run_id.
392396
3) Ensure all tests exist; get (file,class,test) -> test_id map.
393-
4) Bulk insert/update ci_results for this run.
397+
4) Bulk insert/update ci_results_dup for this run.
394398
"""
395-
files = list_test_jsons(logs_dir)
396-
if not files:
397-
print(f"No JSON files under {logs_dir}")
398-
raise SystemExit(2) # input error
399-
400-
created_at, tests = load_from_per_test_jsons(files)
399+
report = find_single_report_json(logs_dir)
400+
created_at, tests = load_from_single_json(report)
401+
401402
if not tests:
402403
print("No tests found in JSONs")
403404
raise SystemExit(2) # input error

0 commit comments

Comments
 (0)