mirror of
https://github.com/home-assistant/supervisor.git
synced 2026-02-15 07:27:13 +00:00
* Use count-based progress for Docker image pulls Refactor Docker image pull progress to use a simpler count-based approach where each layer contributes equally (100% / total_layers) regardless of size. This replaces the previous size-weighted calculation that was susceptible to progress regression. The core issue was that Docker rate-limits concurrent downloads (~3 at a time) and reports layer sizes only when downloading starts. With size- weighted progress, large layers appearing late would cause progress to drop dramatically (e.g., 59% -> 29%) as the total size increased. The new approach: - Each layer contributes equally to overall progress - Per-layer progress: 70% download weight, 30% extraction weight - Progress only starts after first "Downloading" event (when layer count is known) - Always caps at 99% - job completion handles final 100% This simplifies the code by moving progress tracking to a dedicated module (pull_progress.py) and removing complex size-based scaling logic that tried to account for unknown layer sizes. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> * Exclude already-existing layers from pull progress calculation Layers that already exist locally should not count towards download progress since there's nothing to download for them. Only layers that need pulling are included in the progress calculation. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> * Add registry manifest fetcher for size-based pull progress Fetch image manifests directly from container registries before pulling to get accurate layer sizes upfront. This enables size-weighted progress tracking where each layer contributes proportionally to its byte size, rather than equal weight per layer. Key changes: - Add RegistryManifestFetcher that handles auth discovery via WWW-Authenticate headers, token fetching with optional credentials, and multi-arch manifest list resolution - Update ImagePullProgress to accept manifest layer sizes via set_manifest() and calculate size-weighted progress - Fall back to count-based progress when manifest fetch fails - Pre-populate layer sizes from manifest when creating layer trackers The manifest fetcher supports ghcr.io, Docker Hub, and private registries by using credentials from Docker config when available. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> * Clamp progress to 100 to prevent floating point precision issues Floating point arithmetic in weighted progress calculations can produce values slightly above 100 (e.g., 100.00000000000001). This causes validation errors when the progress value is checked. Add min(100, ...) clamping to both size-weighted and count-based progress calculations to ensure the result never exceeds 100. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> * Use sys_websession for manifest fetcher instead of creating new session Reuse the existing CoreSys websession for registry manifest requests instead of creating a new aiohttp session. This improves performance and follows the established pattern used throughout the codebase. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> * Make platform parameter required and warn on missing platform - Make platform a required parameter in get_manifest() and _fetch_manifest() since it's always provided by the calling code - Return None and log warning when requested platform is not found in multi-arch manifest list, instead of falling back to first manifest which could be the wrong architecture 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> * Log manifest fetch failures at warning level Users will notice degraded progress tracking when manifest fetch fails, so log at warning level to help diagnose issues. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> * Add pylint disable comments for protected access in manifest tests 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> * Separate download_current and total_size updates in pull progress Update download_current and total_size independently in the DOWNLOADING handler. This ensures download_current is updated even when total is not yet available. 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> * Reject invalid platform format in manifest selection --------- Co-authored-by: Claude <noreply@anthropic.com>
1003 lines
32 KiB
Python
1003 lines
32 KiB
Python
"""Tests for image pull progress tracking."""
|
|
|
|
import pytest
|
|
|
|
from supervisor.docker.manager import PullLogEntry, PullProgressDetail
|
|
from supervisor.docker.manifest import ImageManifest
|
|
from supervisor.docker.pull_progress import (
|
|
DOWNLOAD_WEIGHT,
|
|
EXTRACT_WEIGHT,
|
|
ImagePullProgress,
|
|
LayerProgress,
|
|
)
|
|
|
|
|
|
class TestLayerProgress:
|
|
"""Tests for LayerProgress class."""
|
|
|
|
def test_already_exists_layer(self):
|
|
"""Test that already existing layer returns 100%."""
|
|
layer = LayerProgress(layer_id="abc123", already_exists=True)
|
|
assert layer.calculate_progress() == 100.0
|
|
|
|
def test_extract_complete_layer(self):
|
|
"""Test that extracted layer returns 100%."""
|
|
layer = LayerProgress(
|
|
layer_id="abc123",
|
|
total_size=1000,
|
|
download_current=1000,
|
|
download_complete=True,
|
|
extract_complete=True,
|
|
)
|
|
assert layer.calculate_progress() == 100.0
|
|
|
|
def test_download_complete_not_extracted(self):
|
|
"""Test layer that finished downloading but not extracting."""
|
|
layer = LayerProgress(
|
|
layer_id="abc123",
|
|
total_size=1000,
|
|
download_current=1000,
|
|
download_complete=True,
|
|
extract_complete=False,
|
|
)
|
|
assert layer.calculate_progress() == DOWNLOAD_WEIGHT # 70%
|
|
|
|
def test_extraction_progress_overlay2(self):
|
|
"""Test layer with byte-based extraction progress (overlay2)."""
|
|
layer = LayerProgress(
|
|
layer_id="abc123",
|
|
total_size=1000,
|
|
download_current=1000,
|
|
extract_current=500, # 50% extracted
|
|
download_complete=True,
|
|
extract_complete=False,
|
|
)
|
|
# 70% + (50% of 30%) = 70% + 15% = 85%
|
|
assert layer.calculate_progress() == DOWNLOAD_WEIGHT + (0.5 * EXTRACT_WEIGHT)
|
|
|
|
def test_downloading_progress(self):
|
|
"""Test layer during download phase."""
|
|
layer = LayerProgress(
|
|
layer_id="abc123",
|
|
total_size=1000,
|
|
download_current=500, # 50% downloaded
|
|
download_complete=False,
|
|
)
|
|
# 50% of 70% = 35%
|
|
assert layer.calculate_progress() == 35.0
|
|
|
|
def test_no_size_info_yet(self):
|
|
"""Test layer with no size information."""
|
|
layer = LayerProgress(layer_id="abc123")
|
|
assert layer.calculate_progress() == 0.0
|
|
|
|
|
|
class TestImagePullProgress:
|
|
"""Tests for ImagePullProgress class."""
|
|
|
|
def test_empty_progress(self):
|
|
"""Test progress with no layers."""
|
|
progress = ImagePullProgress()
|
|
assert progress.calculate_progress() == 0.0
|
|
|
|
def test_all_layers_already_exist(self):
|
|
"""Test when all layers already exist locally.
|
|
|
|
When an image is fully cached, there are no "Downloading" events.
|
|
Progress stays at 0 until the job completes and sets 100%.
|
|
"""
|
|
progress = ImagePullProgress()
|
|
|
|
# Simulate "Already exists" events
|
|
entry1 = PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Already exists",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
entry2 = PullLogEntry(
|
|
job_id="test",
|
|
id="layer2",
|
|
status="Already exists",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
progress.process_event(entry1)
|
|
progress.process_event(entry2)
|
|
|
|
# No downloading events = no progress reported (job completion sets 100%)
|
|
assert progress.calculate_progress() == 0.0
|
|
|
|
def test_single_layer_download(self):
|
|
"""Test progress tracking for single layer download."""
|
|
progress = ImagePullProgress()
|
|
|
|
# Pull fs layer
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Start downloading
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=500, total=1000),
|
|
)
|
|
)
|
|
# 50% of download phase = 35%
|
|
assert progress.calculate_progress() == pytest.approx(35.0)
|
|
|
|
# Download complete
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Download complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
assert progress.calculate_progress() == 70.0
|
|
|
|
# Pull complete
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
assert progress.calculate_progress() == 100.0
|
|
|
|
def test_multiple_layers_equal_weight_progress(self):
|
|
"""Test count-based progress where each layer contributes equally."""
|
|
progress = ImagePullProgress()
|
|
|
|
# Two layers: sizes don't matter for weight, each layer = 50%
|
|
|
|
# Pulling fs layer for both
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="large",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Large layer: 50% downloaded = 35% layer progress (50% of 70%)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="large",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=500, total=1000),
|
|
)
|
|
)
|
|
|
|
# Small layer: 100% downloaded, waiting for extraction = 70% layer progress
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small",
|
|
status="Download complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=100, total=100),
|
|
)
|
|
)
|
|
|
|
# Progress calculation (count-based, equal weight per layer):
|
|
# Large layer: 35% (50% of 70% download weight)
|
|
# Small layer: 70% (download complete)
|
|
# Each layer = 50% weight
|
|
# Total: (35 + 70) / 2 = 52.5%
|
|
assert progress.calculate_progress() == pytest.approx(52.5)
|
|
|
|
def test_download_retry(self):
|
|
"""Test that download retry resets progress."""
|
|
progress = ImagePullProgress()
|
|
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Download 50%
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=500, total=1000),
|
|
)
|
|
)
|
|
assert progress.calculate_progress() == pytest.approx(35.0)
|
|
|
|
# Retry
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Retrying in 5 seconds",
|
|
)
|
|
)
|
|
assert progress.calculate_progress() == 0.0
|
|
|
|
def test_layer_skips_download(self):
|
|
"""Test small layer that goes straight to Download complete."""
|
|
progress = ImagePullProgress()
|
|
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Goes directly to Download complete (skipping Downloading events)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small",
|
|
status="Download complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Should still work - sets minimal size
|
|
layer = progress.layers["small"]
|
|
assert layer.total_size == 1
|
|
assert layer.download_complete is True
|
|
|
|
def test_containerd_extract_progress(self):
|
|
"""Test extraction progress with containerd snapshotter (time-based)."""
|
|
progress = ImagePullProgress()
|
|
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Download complete
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000, total=1000),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Download complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Containerd extraction progress (time-based, not byte-based)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Extracting",
|
|
progress_detail=PullProgressDetail(current=5, units="s"),
|
|
)
|
|
)
|
|
|
|
# Should be at 70% (download complete, time-based extraction not tracked)
|
|
assert progress.calculate_progress() == 70.0
|
|
|
|
# Pull complete
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
assert progress.calculate_progress() == 100.0
|
|
|
|
def test_overlay2_extract_progress(self):
|
|
"""Test extraction progress with overlay2 (byte-based)."""
|
|
progress = ImagePullProgress()
|
|
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Download complete
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000, total=1000),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Download complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# At download complete, progress should be 70%
|
|
assert progress.calculate_progress() == 70.0
|
|
|
|
# Overlay2 extraction progress (byte-based, 50% extracted)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Extracting",
|
|
progress_detail=PullProgressDetail(current=500, total=1000),
|
|
)
|
|
)
|
|
|
|
# Should be at 70% + (50% of 30%) = 85%
|
|
assert progress.calculate_progress() == pytest.approx(85.0)
|
|
|
|
# Extraction continues to 80%
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Extracting",
|
|
progress_detail=PullProgressDetail(current=800, total=1000),
|
|
)
|
|
)
|
|
|
|
# Should be at 70% + (80% of 30%) = 94%
|
|
assert progress.calculate_progress() == pytest.approx(94.0)
|
|
|
|
# Pull complete
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
assert progress.calculate_progress() == 100.0
|
|
|
|
def test_get_stage(self):
|
|
"""Test stage detection."""
|
|
progress = ImagePullProgress()
|
|
|
|
assert progress.get_stage() is None
|
|
|
|
# Add a layer that needs downloading
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=500, total=1000),
|
|
)
|
|
)
|
|
assert progress.get_stage() == "Downloading"
|
|
|
|
# Download complete
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Download complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
assert progress.get_stage() == "Extracting"
|
|
|
|
# Pull complete
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
assert progress.get_stage() == "Pull complete"
|
|
|
|
def test_should_update_job(self):
|
|
"""Test update threshold logic."""
|
|
progress = ImagePullProgress()
|
|
|
|
# Initial state - no updates
|
|
should_update, _ = progress.should_update_job()
|
|
assert not should_update
|
|
|
|
# Add a layer and start downloading
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Small progress - 1%
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=20, total=1000),
|
|
)
|
|
)
|
|
# 2% of download = 1.4% total
|
|
should_update, current = progress.should_update_job()
|
|
assert should_update
|
|
assert current == pytest.approx(1.4)
|
|
|
|
# Tiny increment - shouldn't trigger update
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=25, total=1000),
|
|
)
|
|
)
|
|
should_update, _ = progress.should_update_job()
|
|
assert not should_update
|
|
|
|
# Larger increment - should trigger
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=100, total=1000),
|
|
)
|
|
)
|
|
should_update, _ = progress.should_update_job()
|
|
assert should_update
|
|
|
|
def test_verifying_checksum(self):
|
|
"""Test that Verifying Checksum marks download as nearly complete."""
|
|
progress = ImagePullProgress()
|
|
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=800, total=1000),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Verifying Checksum",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
layer = progress.layers["layer1"]
|
|
assert layer.download_current == 1000 # Should be set to total
|
|
|
|
def test_events_without_status_ignored(self):
|
|
"""Test that events without status are ignored."""
|
|
progress = ImagePullProgress()
|
|
|
|
# Event without status (just id field)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="abc123",
|
|
)
|
|
)
|
|
|
|
# Event without id
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
status="Digest: sha256:abc123",
|
|
)
|
|
)
|
|
|
|
# They shouldn't create layers or cause errors
|
|
assert len(progress.layers) == 0
|
|
|
|
def test_mixed_already_exists_and_pull(self):
|
|
"""Test combination of cached and pulled layers."""
|
|
progress = ImagePullProgress()
|
|
|
|
# Layer 1 already exists
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="cached",
|
|
status="Already exists",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Layer 2 needs to be pulled
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="pulled",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="pulled",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=500, total=1000),
|
|
)
|
|
)
|
|
|
|
# Only 1 layer needs pulling (cached layer excluded)
|
|
# pulled: 35% (50% of 70% download weight)
|
|
assert progress.calculate_progress() == pytest.approx(35.0)
|
|
|
|
# Complete the pulled layer
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="pulled",
|
|
status="Download complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="pulled",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
assert progress.calculate_progress() == 100.0
|
|
|
|
def test_pending_layers_prevent_premature_100(self):
|
|
"""Test that layers without size info scale down progress."""
|
|
progress = ImagePullProgress()
|
|
|
|
# First batch of layers - they complete
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer2",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Layer1 downloads and completes
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000, total=1000),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Layer2 is still pending (no size info yet) - simulating Docker rate limiting
|
|
# Progress should NOT be 100% because layer2 hasn't started
|
|
|
|
# Layer1 is 100% complete, layer2 is 0%
|
|
# With scaling: 1 known layer at 100%, 1 pending layer
|
|
# Scale factor = 1/(1+1) = 0.5, so progress = 100 * 0.5 = 50%
|
|
assert progress.calculate_progress() == pytest.approx(50.0)
|
|
|
|
# Now layer2 starts downloading
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer2",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=500, total=1000),
|
|
)
|
|
)
|
|
|
|
# Now both layers have size info, no scaling needed
|
|
# Layer1: 100%, Layer2: 35% (50% of 70%)
|
|
# Weighted by equal size: (100 + 35) / 2 = 67.5%
|
|
assert progress.calculate_progress() == pytest.approx(67.5)
|
|
|
|
# Complete layer2
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer2",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
assert progress.calculate_progress() == 100.0
|
|
|
|
def test_large_layers_appearing_late_dont_cause_regression(self):
|
|
"""Test that large layers discovered late don't cause progress to drop.
|
|
|
|
This simulates Docker's rate-limiting behavior where small layers complete
|
|
first, then large layers start downloading later.
|
|
"""
|
|
progress = ImagePullProgress()
|
|
|
|
# All layers announced upfront (Docker does this)
|
|
for layer_id in ["small1", "small2", "big1", "big2"]:
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id=layer_id,
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Big layers are "Waiting" (rate limited)
|
|
for layer_id in ["big1", "big2"]:
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id=layer_id,
|
|
status="Waiting",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Small layers download quickly (1KB each)
|
|
for layer_id in ["small1", "small2"]:
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id=layer_id,
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000, total=1000),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id=layer_id,
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# At this point, 2 small layers are complete, 2 big layers are unknown size
|
|
progress_before_big = progress.calculate_progress()
|
|
|
|
# Now big layers start downloading - they're 100MB each!
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="big1",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000000, total=100000000),
|
|
)
|
|
)
|
|
|
|
progress_after_big1 = progress.calculate_progress()
|
|
|
|
# Progress should NOT drop significantly when big layer appears
|
|
# The monotonic tracking in should_update_job will help, but the
|
|
# raw calculation should also not regress too badly
|
|
assert progress_after_big1 >= progress_before_big * 0.5, (
|
|
f"Progress dropped too much: {progress_before_big} -> {progress_after_big1}"
|
|
)
|
|
|
|
# Second big layer appears
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="big2",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000000, total=100000000),
|
|
)
|
|
)
|
|
|
|
# Should still make forward progress overall
|
|
# Complete all layers
|
|
for layer_id in ["big1", "big2"]:
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id=layer_id,
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
assert progress.calculate_progress() == 100.0
|
|
|
|
def test_size_weighted_progress_with_manifest(self):
|
|
"""Test size-weighted progress when manifest layer sizes are known."""
|
|
# Create manifest with known layer sizes
|
|
# Small layer: 1KB, Large layer: 100KB
|
|
manifest = ImageManifest(
|
|
digest="sha256:test",
|
|
total_size=101000,
|
|
layers={
|
|
"small123456": 1000, # 1KB - ~1% of total
|
|
"large123456": 100000, # 100KB - ~99% of total
|
|
},
|
|
)
|
|
|
|
progress = ImagePullProgress()
|
|
progress.set_manifest(manifest)
|
|
|
|
# Layer events - small layer first
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small123456",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="large123456",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Small layer downloads completely
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small123456",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000, total=1000),
|
|
)
|
|
)
|
|
|
|
# Size-weighted: small layer is ~1% of total size
|
|
# Small layer at 70% (download done) = contributes ~0.7% to overall
|
|
assert progress.calculate_progress() == pytest.approx(0.69, rel=0.1)
|
|
|
|
# Large layer starts downloading (1% of its size)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="large123456",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000, total=100000),
|
|
)
|
|
)
|
|
|
|
# Large layer at 1% download = contributes ~0.7% (1% * 70% * 99% weight)
|
|
# Total: ~0.7% + ~0.7% = ~1.4%
|
|
current = progress.calculate_progress()
|
|
assert current > 0.7 # More than just small layer
|
|
assert current < 5.0 # But not much more
|
|
|
|
# Complete both layers
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small123456",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="large123456",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
assert progress.calculate_progress() == 100.0
|
|
|
|
def test_size_weighted_excludes_already_exists(self):
|
|
"""Test that already existing layers are excluded from size-weighted progress."""
|
|
# Manifest has 3 layers, but one will already exist locally
|
|
manifest = ImageManifest(
|
|
digest="sha256:test",
|
|
total_size=200000,
|
|
layers={
|
|
"cached12345": 100000, # Will be cached - shouldn't count
|
|
"layer1_1234": 50000, # Needs pulling
|
|
"layer2_1234": 50000, # Needs pulling
|
|
},
|
|
)
|
|
|
|
progress = ImagePullProgress()
|
|
progress.set_manifest(manifest)
|
|
|
|
# Cached layer already exists
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="cached12345",
|
|
status="Already exists",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Other layers need pulling
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1_1234",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer2_1234",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Start downloading layer1 (50% of its size)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1_1234",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=25000, total=50000),
|
|
)
|
|
)
|
|
|
|
# layer1 is 50% of total that needs pulling (50KB out of 100KB)
|
|
# At 50% download = 35% layer progress (70% * 50%)
|
|
# Size-weighted: 50% * 35% = 17.5%
|
|
assert progress.calculate_progress() == pytest.approx(17.5)
|
|
|
|
# Complete layer1
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="layer1_1234",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# layer1 at 100%, layer2 at 0%
|
|
# Size-weighted: 50% * 100% + 50% * 0% = 50%
|
|
assert progress.calculate_progress() == pytest.approx(50.0)
|
|
|
|
def test_fallback_to_count_based_without_manifest(self):
|
|
"""Test that without manifest, count-based progress is used."""
|
|
progress = ImagePullProgress()
|
|
|
|
# No manifest set - should use count-based progress
|
|
|
|
# Two layers of different sizes
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="large",
|
|
status="Pulling fs layer",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Small layer (1KB) completes
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000, total=1000),
|
|
)
|
|
)
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="small",
|
|
status="Pull complete",
|
|
progress_detail=PullProgressDetail(),
|
|
)
|
|
)
|
|
|
|
# Large layer (100MB) at 1%
|
|
progress.process_event(
|
|
PullLogEntry(
|
|
job_id="test",
|
|
id="large",
|
|
status="Downloading",
|
|
progress_detail=PullProgressDetail(current=1000000, total=100000000),
|
|
)
|
|
)
|
|
|
|
# Count-based: each layer is 50% weight
|
|
# small: 100% * 50% = 50%
|
|
# large: 0.7% (1% * 70%) * 50% = 0.35%
|
|
# Total: ~50.35%
|
|
assert progress.calculate_progress() == pytest.approx(50.35, rel=0.01)
|