diff --git a/phone_agent/video_learning.py b/phone_agent/video_learning.py index 0bfa636..18891f2 100644 --- a/phone_agent/video_learning.py +++ b/phone_agent/video_learning.py @@ -242,6 +242,10 @@ class VideoLearningAgent: # Video detection: track screenshot changes (simplified) self._last_screenshot_hash: Optional[str] = None + # Skip app startup screens + self._in_app_steps: int = 0 + self._warmup_steps: int = 3 # Skip first 3 steps after entering app + # Screenshot analyzer for content extraction self._analyzer: Optional[ScreenshotAnalyzer] = None try: @@ -405,7 +409,15 @@ class VideoLearningAgent: is_in_target = any(pkg.lower() in current_app.lower() for pkg in packages) if not is_in_target: - print(f"[VideoLearning] Not in target app: {current_app} (step {result.step_count})") + # Reset warmup counter when leaving app + self._in_app_steps = 0 + print(f"[VideoLearning] Not in target app: {current_app}") + return None + + # Warmup: skip first few steps to avoid startup screens + self._in_app_steps += 1 + if self._in_app_steps <= self._warmup_steps: + print(f"[VideoLearning] Warmup step {self._in_app_steps}/{self._warmup_steps}, skipping...") return None # Get screenshot