mirror of
https://github.com/esphome/esphome.git
synced 2025-10-24 04:33:49 +01:00
381 lines
14 KiB
Python
Executable File
381 lines
14 KiB
Python
Executable File
#!/usr/bin/env python3
|
|
"""Split components into batches with intelligent grouping.
|
|
|
|
This script analyzes components to identify which ones share common bus configurations
|
|
and intelligently groups them into batches to maximize the efficiency of the
|
|
component grouping system in CI.
|
|
|
|
Components with the same bus signature are placed in the same batch whenever possible,
|
|
allowing the test_build_components.py script to merge them into single builds.
|
|
"""
|
|
|
|
from __future__ import annotations
|
|
|
|
import argparse
|
|
from collections import defaultdict
|
|
import json
|
|
from pathlib import Path
|
|
import sys
|
|
|
|
# Add esphome to path
|
|
sys.path.insert(0, str(Path(__file__).parent.parent))
|
|
|
|
from script.analyze_component_buses import (
|
|
ISOLATED_COMPONENTS,
|
|
ISOLATED_SIGNATURE_PREFIX,
|
|
NO_BUSES_SIGNATURE,
|
|
analyze_all_components,
|
|
create_grouping_signature,
|
|
merge_compatible_bus_groups,
|
|
)
|
|
from script.helpers import get_component_test_files
|
|
|
|
# Weighting for batch creation
|
|
# Isolated components can't be grouped/merged, so they count as 10x
|
|
# Groupable components can be merged into single builds, so they count as 1x
|
|
ISOLATED_WEIGHT = 10
|
|
GROUPABLE_WEIGHT = 1
|
|
|
|
# Platform used for batching (platform-agnostic batching)
|
|
# Batches are split across CI runners and each runner tests all platforms
|
|
ALL_PLATFORMS = "all"
|
|
|
|
|
|
def has_test_files(component_name: str, tests_dir: Path) -> bool:
|
|
"""Check if a component has test files.
|
|
|
|
Args:
|
|
component_name: Name of the component
|
|
tests_dir: Path to tests/components directory (unused, kept for compatibility)
|
|
|
|
Returns:
|
|
True if the component has test.*.yaml files
|
|
"""
|
|
return bool(get_component_test_files(component_name))
|
|
|
|
|
|
def create_intelligent_batches(
|
|
components: list[str],
|
|
tests_dir: Path,
|
|
batch_size: int = 40,
|
|
directly_changed: set[str] | None = None,
|
|
) -> tuple[list[list[str]], dict[tuple[str, str], list[str]]]:
|
|
"""Create batches optimized for component grouping.
|
|
|
|
Args:
|
|
components: List of component names to batch
|
|
tests_dir: Path to tests/components directory
|
|
batch_size: Target size for each batch
|
|
directly_changed: Set of directly changed components (for logging only)
|
|
|
|
Returns:
|
|
Tuple of (batches, signature_groups) where:
|
|
- batches: List of component batches (lists of component names)
|
|
- signature_groups: Dict mapping (platform, signature) to component lists
|
|
"""
|
|
# Filter out components without test files
|
|
# Platform components like 'climate' and 'climate_ir' don't have test files
|
|
components_with_tests = [
|
|
comp for comp in components if has_test_files(comp, tests_dir)
|
|
]
|
|
|
|
# Log filtered components to stderr for debugging
|
|
if len(components_with_tests) < len(components):
|
|
filtered_out = set(components) - set(components_with_tests)
|
|
print(
|
|
f"Note: Filtered {len(filtered_out)} components without test files: "
|
|
f"{', '.join(sorted(filtered_out))}",
|
|
file=sys.stderr,
|
|
)
|
|
|
|
# Analyze all components to get their bus signatures
|
|
component_buses, non_groupable, _direct_bus_components = analyze_all_components(
|
|
tests_dir
|
|
)
|
|
|
|
# Group components by their bus signature ONLY (ignore platform)
|
|
# All platforms will be tested by test_build_components.py for each batch
|
|
# Key: (platform, signature), Value: list of components
|
|
# We use ALL_PLATFORMS since batching is platform-agnostic
|
|
signature_groups: dict[tuple[str, str], list[str]] = defaultdict(list)
|
|
|
|
for component in components_with_tests:
|
|
# Components that can't be grouped get unique signatures
|
|
# This includes:
|
|
# - Manually curated ISOLATED_COMPONENTS
|
|
# - Automatically detected non_groupable components
|
|
# - Directly changed components (passed via --isolate in CI)
|
|
# These can share a batch/runner but won't be grouped/merged
|
|
is_isolated = (
|
|
component in ISOLATED_COMPONENTS
|
|
or component in non_groupable
|
|
or (directly_changed and component in directly_changed)
|
|
)
|
|
if is_isolated:
|
|
signature_groups[
|
|
(ALL_PLATFORMS, f"{ISOLATED_SIGNATURE_PREFIX}{component}")
|
|
].append(component)
|
|
continue
|
|
|
|
# Get signature from any platform (they should all have the same buses)
|
|
# Components not in component_buses were filtered out by has_test_files check
|
|
comp_platforms = component_buses[component]
|
|
for platform, buses in comp_platforms.items():
|
|
if buses:
|
|
signature = create_grouping_signature({platform: buses}, platform)
|
|
# Group by signature only - platform doesn't matter for batching
|
|
# Use ALL_PLATFORMS since we're batching across all platforms
|
|
signature_groups[(ALL_PLATFORMS, signature)].append(component)
|
|
break # Only use first platform for grouping
|
|
else:
|
|
# No buses found for any platform - can be grouped together
|
|
signature_groups[(ALL_PLATFORMS, NO_BUSES_SIGNATURE)].append(component)
|
|
|
|
# Merge compatible bus groups (cross-bus optimization)
|
|
# This allows components with different buses (ble + uart) to be batched together
|
|
# improving the efficiency of test_build_components.py grouping
|
|
signature_groups = merge_compatible_bus_groups(signature_groups)
|
|
|
|
# Create batches by keeping signature groups together
|
|
# Components with the same signature stay in the same batches
|
|
batches = []
|
|
|
|
# Sort signature groups to prioritize groupable components
|
|
# 1. Put "isolated_*" signatures last (can't be grouped with others)
|
|
# 2. Sort groupable signatures by size (largest first)
|
|
# 3. "no_buses" components CAN be grouped together
|
|
def sort_key(item):
|
|
(_platform, signature), components = item
|
|
is_isolated = signature.startswith(ISOLATED_SIGNATURE_PREFIX)
|
|
# Put "isolated_*" last (1), groupable first (0)
|
|
# Within each category, sort by size (largest first)
|
|
return (is_isolated, -len(components))
|
|
|
|
sorted_groups = sorted(signature_groups.items(), key=sort_key)
|
|
|
|
# Strategy: Create batches using weighted sizes
|
|
# - Isolated components count as 10x (since they can't be grouped/merged)
|
|
# - Groupable components count as 1x (can be merged into single builds)
|
|
# - This distributes isolated components across more runners
|
|
# - Ensures each runner has a good mix of groupable vs isolated components
|
|
|
|
current_batch = []
|
|
current_weight = 0
|
|
|
|
for (_platform, signature), group_components in sorted_groups:
|
|
is_isolated = signature.startswith(ISOLATED_SIGNATURE_PREFIX)
|
|
weight_per_component = ISOLATED_WEIGHT if is_isolated else GROUPABLE_WEIGHT
|
|
|
|
for component in group_components:
|
|
# Check if adding this component would exceed the batch size
|
|
if current_weight + weight_per_component > batch_size and current_batch:
|
|
# Start a new batch
|
|
batches.append(current_batch)
|
|
current_batch = []
|
|
current_weight = 0
|
|
|
|
# Add component to current batch
|
|
current_batch.append(component)
|
|
current_weight += weight_per_component
|
|
|
|
# Don't forget the last batch
|
|
if current_batch:
|
|
batches.append(current_batch)
|
|
|
|
return batches, signature_groups
|
|
|
|
|
|
def main() -> int:
|
|
"""Main entry point."""
|
|
parser = argparse.ArgumentParser(
|
|
description="Split components into intelligent batches for CI testing"
|
|
)
|
|
parser.add_argument(
|
|
"--components",
|
|
"-c",
|
|
required=True,
|
|
help="JSON array of component names",
|
|
)
|
|
parser.add_argument(
|
|
"--batch-size",
|
|
"-b",
|
|
type=int,
|
|
default=40,
|
|
help="Target batch size (default: 40, weighted)",
|
|
)
|
|
parser.add_argument(
|
|
"--tests-dir",
|
|
type=Path,
|
|
default=Path("tests/components"),
|
|
help="Path to tests/components directory",
|
|
)
|
|
parser.add_argument(
|
|
"--directly-changed",
|
|
help="JSON array of directly changed component names (for logging only)",
|
|
)
|
|
parser.add_argument(
|
|
"--output",
|
|
"-o",
|
|
choices=["json", "github"],
|
|
default="github",
|
|
help="Output format (json or github for GitHub Actions)",
|
|
)
|
|
|
|
args = parser.parse_args()
|
|
|
|
# Parse component list from JSON
|
|
try:
|
|
components = json.loads(args.components)
|
|
except json.JSONDecodeError as e:
|
|
print(f"Error parsing components JSON: {e}", file=sys.stderr)
|
|
return 1
|
|
|
|
if not isinstance(components, list):
|
|
print("Components must be a JSON array", file=sys.stderr)
|
|
return 1
|
|
|
|
# Parse directly changed components list from JSON (if provided)
|
|
directly_changed = None
|
|
if args.directly_changed:
|
|
try:
|
|
directly_changed = set(json.loads(args.directly_changed))
|
|
except json.JSONDecodeError as e:
|
|
print(f"Error parsing directly-changed JSON: {e}", file=sys.stderr)
|
|
return 1
|
|
|
|
# Create intelligent batches
|
|
batches, signature_groups = create_intelligent_batches(
|
|
components=components,
|
|
tests_dir=args.tests_dir,
|
|
batch_size=args.batch_size,
|
|
directly_changed=directly_changed,
|
|
)
|
|
|
|
# Convert batches to space-separated strings for CI
|
|
batch_strings = [" ".join(batch) for batch in batches]
|
|
|
|
if args.output == "json":
|
|
# Output as JSON array
|
|
print(json.dumps(batch_strings))
|
|
else:
|
|
# Output for GitHub Actions (set output)
|
|
output_json = json.dumps(batch_strings)
|
|
print(f"components={output_json}")
|
|
|
|
# Print summary to stderr so it shows in CI logs
|
|
# Count actual components being batched
|
|
actual_components = sum(len(batch.split()) for batch in batch_strings)
|
|
|
|
# Re-analyze to get isolated component counts for summary
|
|
_, non_groupable, _ = analyze_all_components(args.tests_dir)
|
|
|
|
# Show grouping details
|
|
print("\n=== Component Grouping Details ===", file=sys.stderr)
|
|
# Sort groups by signature for readability
|
|
groupable_groups = []
|
|
isolated_groups = []
|
|
for (platform, signature), group_comps in sorted(signature_groups.items()):
|
|
if signature.startswith(ISOLATED_SIGNATURE_PREFIX):
|
|
isolated_groups.append((signature, group_comps))
|
|
else:
|
|
groupable_groups.append((signature, group_comps))
|
|
|
|
if groupable_groups:
|
|
print(
|
|
f"\nGroupable signatures ({len(groupable_groups)} merged groups after cross-bus optimization):",
|
|
file=sys.stderr,
|
|
)
|
|
for signature, group_comps in sorted(
|
|
groupable_groups, key=lambda x: (-len(x[1]), x[0])
|
|
):
|
|
# Check if this is a merged signature (contains +)
|
|
is_merged = "+" in signature and signature != NO_BUSES_SIGNATURE
|
|
# Special handling for no_buses components
|
|
if signature == NO_BUSES_SIGNATURE:
|
|
print(
|
|
f" [{signature}]: {len(group_comps)} components (used as fillers across batches)",
|
|
file=sys.stderr,
|
|
)
|
|
else:
|
|
merge_indicator = " [MERGED]" if is_merged else ""
|
|
print(
|
|
f" [{signature}]{merge_indicator}: {len(group_comps)} components",
|
|
file=sys.stderr,
|
|
)
|
|
# Show first few components as examples
|
|
examples = ", ".join(sorted(group_comps)[:8])
|
|
if len(group_comps) > 8:
|
|
examples += f", ... (+{len(group_comps) - 8} more)"
|
|
print(f" → {examples}", file=sys.stderr)
|
|
|
|
if isolated_groups:
|
|
print(
|
|
f"\nIsolated components ({len(isolated_groups)} components - tested individually):",
|
|
file=sys.stderr,
|
|
)
|
|
isolated_names = sorted(
|
|
[comp for _, comps in isolated_groups for comp in comps]
|
|
)
|
|
# Group isolated components for compact display
|
|
for i in range(0, len(isolated_names), 10):
|
|
chunk = isolated_names[i : i + 10]
|
|
print(f" {', '.join(chunk)}", file=sys.stderr)
|
|
|
|
# Count isolated vs groupable components
|
|
all_batched_components = [comp for batch in batches for comp in batch]
|
|
isolated_count = sum(
|
|
1
|
|
for comp in all_batched_components
|
|
if comp in ISOLATED_COMPONENTS
|
|
or comp in non_groupable
|
|
or (directly_changed and comp in directly_changed)
|
|
)
|
|
groupable_count = actual_components - isolated_count
|
|
|
|
print("\n=== Intelligent Batch Summary ===", file=sys.stderr)
|
|
print(f"Total components requested: {len(components)}", file=sys.stderr)
|
|
print(f"Components with test files: {actual_components}", file=sys.stderr)
|
|
|
|
# Show breakdown of directly changed vs dependencies
|
|
if directly_changed:
|
|
direct_count = sum(
|
|
1 for comp in all_batched_components if comp in directly_changed
|
|
)
|
|
dep_count = actual_components - direct_count
|
|
direct_comps = [
|
|
comp for comp in all_batched_components if comp in directly_changed
|
|
]
|
|
dep_comps = [
|
|
comp for comp in all_batched_components if comp not in directly_changed
|
|
]
|
|
print(
|
|
f" - Direct changes: {direct_count} ({', '.join(sorted(direct_comps))})",
|
|
file=sys.stderr,
|
|
)
|
|
print(
|
|
f" - Dependencies: {dep_count} ({', '.join(sorted(dep_comps))})",
|
|
file=sys.stderr,
|
|
)
|
|
|
|
print(f" - Groupable (weight=1): {groupable_count}", file=sys.stderr)
|
|
print(f" - Isolated (weight=10): {isolated_count}", file=sys.stderr)
|
|
if actual_components < len(components):
|
|
print(
|
|
f"Components skipped (no test files): {len(components) - actual_components}",
|
|
file=sys.stderr,
|
|
)
|
|
print(f"Number of batches: {len(batches)}", file=sys.stderr)
|
|
print(f"Batch size target (weighted): {args.batch_size}", file=sys.stderr)
|
|
if len(batches) > 0:
|
|
print(
|
|
f"Average components per batch: {actual_components / len(batches):.1f}",
|
|
file=sys.stderr,
|
|
)
|
|
print(file=sys.stderr)
|
|
|
|
return 0
|
|
|
|
|
|
if __name__ == "__main__":
|
|
sys.exit(main())
|