RianKoja · google-labs-jules · Jan 14, 2026 · coderabbitai · Jan 14, 2026 · gemini-code-assist
diff --git a/.github/workflows/benchmark.yml b/.github/workflows/benchmark.yml
@@ -24,90 +24,6 @@ jobs:
         enable-cache: true
         cache-dependency-glob: "requirements.in"
 
-    - name: Set up Python
-      run: |
-        # Automatically detect compatible Python version by testing dependency installation
-        # Try default latest Python first, then downgrade up to 2 times if needed
-
-        echo "Attempting to find compatible Python version..."
-
-        # Try installing default/latest Python
-        uv python install
-
-        # Get the initial version that was installed
-        test_version=$(uv python list | grep -E 'cpython-[0-9]+\.[0-9]+' | grep -v 'pypy' | head -n1 | awk '{print $1}' | sed 's/cpython-//' | cut -d'-' -f1)
-
-        for attempt in 1 2 3; do
-          echo ""
-          echo "Attempt $attempt:"
-          echo "Testing Python $test_version..."
-
-          # Create a temporary virtual environment with the specific Python version
-          # Use attempt number to avoid path collisions
-          test_venv="/tmp/test-venv-attempt-$attempt-$$"
-          uv venv --python "$test_version" "$test_venv" 2>&1
-          source "$test_venv/bin/activate"
-
-          # Try to compile requirements (capture output separately for error reporting)
-          compile_output=$(mktemp)
-          success=false
-          if uv pip compile requirements.in > /tmp/requirements-$attempt.txt 2>"$compile_output"; then
-            # Compile succeeded, now try to sync
-            if uv pip sync /tmp/requirements-$attempt.txt 2>&1; then
-              echo "✓ Python $test_version is compatible with all frameworks"
-              echo "PYTHON_VERSION=$test_version" >> $GITHUB_ENV
-              success=true
-            else
-              echo "✗ Python $test_version: pip sync failed"
-            fi
-          else
-            echo "✗ Python $test_version: dependency compilation failed"
-          fi
-
-          # Show the error for debugging if failed
-          if [ "$success" = false ]; then
-            echo "Error output:"
-            cat "$compile_output" 2>/dev/null || true
-          fi
-
-          # Clean up test venv
-          deactivate 2>/dev/null || true
-          rm -rf "$test_venv"
-          rm -f "$compile_output"
-
-          # If successful, we're done
-          if [ "$success" = true ]; then
-            break
-          fi
-
-          # If not the last attempt, try downgrading
-          if [ $attempt -lt 3 ]; then
-            # Parse version and downgrade
-            major=$(echo "$test_version" | cut -d. -f1)
-            minor=$(echo "$test_version" | cut -d. -f2)
-
-            # Downgrade minor version
-            new_minor=$((minor - 1))
-
-            if [ $new_minor -ge 10 ]; then
-              test_version="$major.$new_minor"
-              echo "Downgrading to Python $test_version..."
-
-              # Install downgraded version
-              uv python install "$test_version"
-            else
-              echo "Cannot downgrade further (reached Python 3.10)"
-              exit 1
-            fi
-          else
-            echo "Error: No compatible Python version found after 3 attempts"
-            exit 1
-          fi
-        done
-
-        echo ""
-        echo "Using Python $PYTHON_VERSION"
-
     - name: Install system dependencies
       run: |
         sudo apt-get update
@@ -118,14 +34,8 @@ jobs:
         # Make run.sh executable
         chmod +x run.sh
 
-        # Set Python version for run.sh to use
-        # If PYTHON_VERSION was set by the setup step, pin it
-        if [ -n "$PYTHON_VERSION" ]; then
-          export UV_PYTHON="$PYTHON_VERSION"
-          echo "Using Python $PYTHON_VERSION for benchmark suite"
-        fi
-
         # Run the benchmark suite
+        # run.sh will install the latest compatible Python and dependencies
         bash run.sh
       env:
         # Set environment variable to indicate GitHub Actions
@@ -219,4 +129,4 @@ jobs:
           echo "::endgroup::"
         else
           echo "Summary statistics file not found"
-        fi
+        fi
diff --git a/00_tools.py b/00_tools.py
@@ -5,6 +5,49 @@
 from typing import Any, Callable, Dict
 
 
+def normalize_result(result: Any) -> Any:
+    """
+    Bring a pandas-style result into a flat, framework-neutral layout.
+
+    A non-range index is moved into regular columns via ``reset_index()``
+    and MultiIndex column tuples are collapsed into single string names.
+    Objects that do not look like a pandas/fireducks DataFrame (missing
+    ``index``, ``columns`` or ``reset_index``) are returned untouched.
+
+    Args:
+        result: Operation output; detected by duck typing, not by type.
+
+    Returns:
+        The normalized object. Column renaming is applied in place, so the
+        input itself may be modified when no index reset was needed.
+    """
+    frame_attrs = ("index", "columns", "reset_index")
+    if not all(hasattr(result, attr) for attr in frame_attrs):
+        # Not DataFrame-like (e.g. no ``index`` attribute): nothing to do
+        return result
+
+    # Step 1: a RangeIndex is recognised by duck typing on start/stop/step;
+    # any other index is moved into columns (e.g. grouping keys)
+    range_attrs = ("start", "stop", "step")
+    if not all(hasattr(result.index, attr) for attr in range_attrs):
+        result = result.reset_index()
+
+    # Step 2: only multi-level column labels need flattening
+    if getattr(result.columns, "nlevels", 1) <= 1:
+        return result
+
+    def _flat_name(label: Any) -> str:
+        """Collapse one column label into a plain string."""
+        if not isinstance(label, tuple):
+            return str(label)
+        # Skip empty levels, e.g. ('total_amount', 'sum') -> 'total_amount_sum'
+        pieces = [str(part) for part in label if str(part) != ""]
+        return "_".join(pieces).strip("_")
+
+    result.columns = [_flat_name(label) for label in result.columns.values]
+    return result
+
+
 def time_operation(
     operation_name: str,
     df_lib: Any,
@@ -49,6 +92,14 @@ def time_operation(
     if hasattr(result, "to_frame"):
         result = result.to_frame(name=operation_name)
 
+    # Normalize result (reset index, flatten columns) before saving
+    # This ensures consistency between Pandas (which uses Index/MultiIndex)
+    # and Polars (which uses flat DataFrames)
+    try:
+        result = normalize_result(result)
+    except Exception as e:
+        print(f"Warning: Failed to normalize result for {operation_name}: {e}")
+
     if hasattr(result, "to_parquet"):
         result.to_parquet(output_filename, index=False)
     elif hasattr(result, "write_parquet"):