N.E.K.O/main_logic/activity/tracker.py at 81eba641f08b023b9dba201e476b9f6f4cfe26b0 · Project-N-E-K-O/N.E.K.O · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
"""Per-character user-activity tracker.

Combines the process-wide ``SystemSignalCollector`` with session-scoped
hooks (user/AI message timestamps, voice mode + RMS) and asks the
``ActivityStateMachine`` to emit a snapshot.

One ``UserActivityTracker`` exists per ``LLMSessionManager`` (so per
character). The collector singleton is shared. Tracker instances are
cheap — ~a few KB of buffers — so spinning one up for every active
character is fine.

Hook contract
-------------

Callers (mostly ``main_logic/core.py``) invoke these short, synchronous
methods at the points where signals occur:

  * ``on_user_message()``  — when the user submits text or finalises voice
  * ``on_ai_message()``    — when the AI's reply turn ends
  * ``on_voice_mode(active=True/False)``  — when entering / leaving voice
  * ``on_voice_rms()``     — when RMS / VAD detects user is speaking
  * ``on_screenshot()``    — placeholder for v2 (vision-described frames)

System signals (window, idle, CPU) are pulled at snapshot time from the
collector — there's no separate update path for those.

Snapshot consumer
-----------------

The proactive-chat code path calls ``get_snapshot()`` with enrichment
enabled. Rule-only consumers can call ``get_snapshot(include_enrichment=False)``
to reuse the same classifier without starting the activity-guess LLM loop.
Both paths run on the order of seconds (not milliseconds), so the small
per-call cost of running the state-machine classifier is irrelevant.
"""

from __future__ import annotations

import asyncio
import logging
import time
from collections import deque
from collections.abc import Awaitable, Callable
from dataclasses import replace as dc_replace

from main_logic.activity.snapshot import (
    ActivitySnapshot, ActivityState, AntiSlackPending, WorkBreakPending,
)
from main_logic.activity.state_machine import (
    ActivityStateMachine, observation_from_system,
)
from main_logic.activity.system_signals import (
    SystemSignalCollector, SystemSnapshot, get_system_signal_collector,
)
from utils.activity_config import get_activity_preferences

logger = logging.getLogger(__name__)

# Conversation buffers: small enough to keep prompt sizes tight, large
# enough to give the emotion-tier LLM real recent context. Used as the
# ``maxlen`` of the per-tracker user / AI message deques.
_CONV_BUFFER_MAXLEN: int = 12

# How often (in seconds) the activity_guess background loop wakes up.
# The user specifically asked for 20s polling. The loop itself
# short-circuits when the state signature hasn't changed, so the LLM
# cost only adds up when activity is actually shifting.
_ACTIVITY_GUESS_TICK_SECONDS: float = 20.0

# After computing activity_guess, suppress recompute for at least this
# many seconds even if the signature changes — protects against
# thrashing during rapid window flicker (a 30s minimum interval between
# LLM calls).
_ACTIVITY_GUESS_MIN_REFRESH_SECONDS: float = 30.0

# Frontend-pushed external signals are considered fresh for this many
# seconds. After that the tracker falls back to the local collector
# (which on remote deployments will be in degraded mode) — better to
# advertise "no signal" than to keep using stale window data.
#
# 15s = 3× the 5s heartbeat. The push pipeline stacks two unsynchronised
# 5s timers — the NEKO-PC bridge sampler (reads OS signals) and the
# renderer heartbeat (reads the bridge's cached snapshot + POSTs) — so
# worst-case data age can already approach ~10-12s before any loss. 15s
# therefore tolerates ~2 consecutive dropped pushes before falling back.
# Shorter (e.g. 10s) would thrash between fresh/degraded on a single
# drop over a lossy remote link; 30s keeps trusting a stale "user
# active" snapshot for too long after the heartbeat dies. 15s balances
# faster stale-detection against fallback thrash.
_EXTERNAL_SIGNAL_TTL_SECONDS: float = 15.0

# Minimum interval (in seconds) between accepted external-signal pushes
# for a given lanlan_name. Tuned together with the frontend heartbeat:
# the Electron preload pushes every ~5s, so anything more frequent is
# either a buggy client (re-entering the heartbeat) or spam. Enforced by
# the ``/api/activity_signal`` endpoint, not the tracker itself — the
# tracker is happily idempotent and just overwrites the last push.
#
# Pairs with TTL above: TTL is the "data freshness" window, this is the
# "request frequency" cap. TTL is 3× this interval, so the tracker
# tolerates ~2 consecutive rate-limited/dropped pushes and still has
# data within the freshness window.
_EXTERNAL_SIGNAL_MIN_INTERVAL: float = 5.0


# ── Break-reminder defaults ─────────────────────────────────────────
# Override per-character via ``user_preferences.json::__global_conversation__::activity::thresholds``.
# All values are minutes / seconds (the unit is spelled out in each
# constant's name); the probability has its own dedicated field on
# ``ActivityPreferences`` because 0 is meaningful (disabled) and the
# threshold parser rejects ≤0.

# Cumulative focused_work minutes that arms the water-break reminder.
# Once armed, the next proactive_chat round in focused_work fires the
# minimal-Phase-2 nudge and resets the accumulator.
_WORK_BREAK_MINUTES: int = 30

# How long (seconds) a queued ``WorkBreakPending`` stays valid if
# proactive_chat never fires. After this window the pending is dropped
# (the user has clearly stopped focusing or the moment passed); the
# accumulator stays at its current value so the next focused_work
# stretch can re-arm.
_WORK_BREAK_PENDING_WINDOW_SECONDS: int = 5 * 60

# Minimum focused_work session length (minutes) before exiting it can
# fire an anti-slack reminder. Below this, the user probably opened the
# wrong window by accident — don't lecture them.
_ANTI_SLACK_MIN_FOCUS_MINUTES: int = 5

# Per-character cooldown (minutes) after a successful anti-slack
# delivery. Decoupled from the water-break / mini-game cooldowns so the
# two reminder types don't accidentally throttle each other.
_ANTI_SLACK_COOLDOWN_MINUTES: int = 15

# How long (seconds) a queued ``AntiSlackPending`` stays valid. The
# transition is the trigger; if proactive doesn't fire within this
# window the moment is gone (user has already settled into the new
# activity for a while).
_ANTI_SLACK_PENDING_WINDOW_SECONDS: int = 5 * 60

# Probability that a fired water-break reminder pivots into a "rest +
# mini-game invite" branch instead of the regular drink/stretch nudge.
# Falls through to ActivityPreferences override (0 disables).
_WORK_BREAK_GAME_INVITE_PROBABILITY: float = 0.5

# Cap (seconds) on per-tick accumulator advance. Filters clock jumps /
# process suspends / first-call jitter so a long gap between ticks
# doesn't silently credit minutes the user didn't actually spend
# focused.
_BREAK_REMINDER_TICK_MAX_DELTA_SECONDS: float = 30.0

# States that count as "leisure" for anti-slack transition detection.
# Idle is intentionally excluded — sitting at the desk staring is often
# thinking, not slacking — as are voice_engaged / chatting (they are
# producing). transitioning is excluded because it's not an end state.
_ANTI_SLACK_LEISURE_STATES: frozenset[str] = frozenset({
    'casual_browsing', 'gaming',
})


def _privacy_mode_active() -> bool:
    """Report whether the user currently has privacy mode switched on.

    While this returns True the tracker is expected to short-circuit.
    Per the original notes, the setting is stored as the inverse of the
    frontend's ``proactiveVisionEnabled`` flag (see ``utils.preferences``).

    Fail-closed: any exception raised while importing or calling the
    preference reader is treated as "privacy mode on". A briefly
    unavailable tracker is preferable to letting "could not read the
    setting" mean "the user has not enabled privacy". The ordinary
    "privacy is off" case is simply ``is_privacy_mode_enabled`` returning
    False and never reaches the ``except`` branch.
    """
    try:
        # Imported lazily inside the guard so an import failure is also
        # handled by the fail-closed branch below.
        from utils.preferences import is_privacy_mode_enabled
        enabled = is_privacy_mode_enabled()
    except Exception as exc:
        logger.warning(
            'privacy mode check failed, defaulting to enabled (fail-closed): %s', exc,
        )
        enabled = True
    return enabled


def _proactive_chat_enabled() -> bool:
    """Report whether the proactive-chat master switch is on.

    Per the original notes, the emotion-tier LLM narrative behind
    ``activity_guess`` only feeds the proactive Phase 2 ``state_section``
    and has no other consumer, so computing it while proactive chat is
    off is wasted work. The background loop uses this check to skip the
    LLM part: when the loop was started only for the experiment-group
    context prompt and the user has not enabled proactive chat, what
    remains is cheap rule polling plus context-prompt detection.

    Fail-open: a missing ``proactiveChatEnabled`` key *or* any read error
    yields True. Wrongly answering "off" would swallow the activity
    narrative a proactive-on user should get (a user-visible loss),
    whereas wrongly answering "on" only costs one extra narrative
    computation. Users who explicitly disabled proactive chat have the
    key stored as false and still take the skip path.
    """
    try:
        # Lazy import inside the guard: an import failure is handled the
        # same way as a read failure.
        from utils.preferences import load_global_conversation_settings
        settings = load_global_conversation_settings()
        flag = settings.get('proactiveChatEnabled', True)
        return bool(flag)
    except Exception as exc:
        logger.debug('proactive_chat_enabled check failed, defaulting to True: %s', exc)
        return True


class UserActivityTracker:
    """Per-character activity inference engine.

    Lifecycle: created when ``LLMSessionManager`` is constructed; lives
    as long as that manager does. The shared system collector is
    started lazily on first ``get_snapshot()`` call so unit tests that
    only construct a tracker don't spin up a poller.
    """

    def __init__(
        self,
        lanlan_name: str,
        *,
        collector: SystemSignalCollector | None = None,
    ) -> None:
        """Create a tracker bound to one character.

        Only initialises in-memory state; no tasks are started and no
        I/O is performed here beyond whatever ``ActivityStateMachine()``
        and ``get_system_signal_collector()`` do themselves.

        Parameters
        ----------
        lanlan_name:
            Character handle this tracker is bound to. Used for log
            attribution; the tracker itself doesn't reach into character
            state.
        collector:
            Optional collector injection — defaults to the process
            singleton. Kept overridable so tests can pass a fake. Only
            ``None`` selects the singleton; any other object (even one
            that evaluates falsy) is used as given.
        """
        self.lanlan_name = lanlan_name
        self._sm = ActivityStateMachine()
        # Explicit ``is not None``: a truthiness test (``collector or …``)
        # would silently discard an injected fake that happens to be
        # falsy (e.g. defines ``__len__`` / ``__bool__``).
        self._collector = (
            collector if collector is not None else get_system_signal_collector()
        )
        self._collector_started = False

        # Conversation buffers for emotion-tier LLM enrichment input.
        # Tuples of (timestamp, text). User-side captures whatever the
        # voice transcript / text message handler passes through;
        # AI-side mirrors the per-turn buffer at turn-end time.
        self._user_msg_buffer: deque[tuple[float, str]] = deque(maxlen=_CONV_BUFFER_MAXLEN)
        self._ai_msg_buffer: deque[tuple[float, str]] = deque(maxlen=_CONV_BUFFER_MAXLEN)

        # open_threads cache. ``_conv_seq`` increments on EITHER side of
        # the conversation moving (``on_user_message`` OR ``on_ai_message``)
        # — open threads can be opened by AI promises and abandoned
        # mid-sentences from either party, not just user replies.
        # ``_open_threads_computed_at_seq`` records the seq at the
        # moment of the last successful compute. When seqs match, the
        # cache is fresh; mismatch → kickoff is allowed to spawn a new
        # compute.
        self._conv_seq: int = 0
        self._open_threads_cache: list[str] = []
        self._open_threads_computed_at_seq: int = -1
        self._open_threads_task: asyncio.Task | None = None

        # activity_guess cache. Stale check uses a state-signature tuple
        # (state, active app, idle bucket) — when unchanged for a tick
        # AND we recently computed, the loop short-circuits before
        # paying the LLM cost.
        self._activity_scores_cache: dict[str, float] = {}
        self._activity_guess_cache: str = ''
        self._activity_guess_state_sig: tuple | None = None
        self._activity_guess_at: float = 0.0
        self._activity_guess_loop_task: asyncio.Task | None = None

        # Frontend-pushed system signal (for remote deployments where the
        # backend's local OS APIs see only the server, not the user).
        # When fresh (<= _EXTERNAL_SIGNAL_TTL_SECONDS), this overrides
        # the local collector entirely. Stale → fall back to collector
        # (which on a remote backend reports os_signals_available=False
        # and the state machine's snapshot makes that explicit).
        self._external_system_snap: SystemSnapshot | None = None

        # ── Break-reminder accumulator + transition tracking ────────
        # Single timestamp drives both: each tick computes
        # ``now - _break_tick_last_at`` and credits the delta (capped) to
        # the appropriate timer based on the current state. 0.0 = "first
        # tick, no delta to credit yet".
        self._break_tick_last_at: float = 0.0

        # Cumulative focused_work seconds. Accumulates while state ==
        # focused_work, OR state == transitioning AND accumulator > 0
        # (transitioning extends an in-progress focus session — quick
        # window flicks don't break the timer). Any other state resets
        # to 0 immediately. See ``_tick_break_reminders``.
        self._work_acc_seconds: float = 0.0

        # State + session bookkeeping. ``_last_known_state`` lets us
        # detect transitions across ticks; ``_focused_work_session_*``
        # let us report how long the just-ended focused_work session
        # was when an anti-slack transition fires.
        self._last_known_state: ActivityState | None = None
        self._focused_work_session_started_at: float | None = None
        self._focused_work_session_app: str | None = None

        # Anti-slack cooldown: epoch time of the last successful
        # delivery. Until ``now - this >= cooldown_seconds`` no new
        # AntiSlackPending is emitted (the cooldown gate runs at
        # transition-detection time, not at delivery — symmetrical with
        # the mini-game invite cooldown shape).
        self._anti_slack_last_fired_at: float = 0.0

        # Pending payloads. Lifecycle:
        #   * Set when conditions trigger (water: focused_work +
        #     accumulator past threshold; anti-slack: focused_work →
        #     leisure transition past min focus + cooldown OK).
        #   * Cleared by ``mark_work_break_used`` /
        #     ``mark_anti_slack_used`` after successful delivery.
        #   * Auto-cleared at tick time when the validity window
        #     (``_WORK_BREAK_PENDING_WINDOW_SECONDS`` / ``_ANTI_SLACK_*``)
        #     expires or the state changes to one that invalidates the
        #     pending (e.g. anti-slack pending dies if user returns
        #     to focused_work).
        # Stored as dicts (not frozen dataclasses) so we can stamp a
        # ``set_at`` timestamp for window-expiry checks; the snapshot
        # builds the frozen WorkBreakPending / AntiSlackPending from
        # these.
        self._work_break_pending: dict | None = None
        self._anti_slack_pending: dict | None = None

        # ── Context prompt (used by the A/B experiment-group frontend) ──
        # When the user *enters* gaming/entertainment or *enters* focused
        # work, a one-shot signal is pushed to the frontend so that it
        # (experiment group only, once per session per kind) can show a
        # popup asking whether to turn the screen-share source on/off.
        # The backend only detects the moment of entry and pushes; group
        # assignment and de-duplication both live in the frontend.
        #   * ``_context_prompt_pending``: one-shot slot, set by
        #     ``_tick_break_reminders`` when entry into a target state is
        #     detected (sync-safe — it only assigns a dict), then drained
        #     by the async ``_activity_guess_loop`` heartbeat, which
        #     awaits the push callback. Last write wins (several switches
        #     between two drains push only the latest one, which is
        #     sufficient).
        #   * ``_on_context_prompt``: async callback injected by core.py,
        #     signature ``(context: str)`` — context is 'play'
        #     (gaming/entertainment) or 'work' (focused work). Nothing is
        #     pushed when no callback has been injected.
        self._context_prompt_pending: dict | None = None
        self._on_context_prompt: Callable[[str], Awaitable[None]] | None = None
        # "Previous state" baseline dedicated to the context prompt,
        # independent of the break-reminder's ``_last_known_state``. This
        # lets it be cleared on its own at the start of each session
        # (``reset_context_prompt_baseline``) so that "still in the same
        # state across sessions" counts as a fresh entry and prompts again
        # (the frontend de-duplicates per app session), without disturbing
        # the break / anti-slack state tracking.
        self._context_prompt_last_state: ActivityState | None = None

    # ── hooks (called from core.py and friends) ─────────────────

    def on_user_message(self, *, text: str | None = None, now: float | None = None) -> None:
        """Stamp a "user said something" event.

        Drives the focused_work `recent_input` heuristic, the
        ``seconds_since_user_msg`` field, and (when ``text`` is given)
        the conversation buffer the emotion-tier LLM enrichment reads
        from. Also bumps ``_conv_seq`` so the next
        ``kickoff_open_threads_compute`` call knows the cache is stale.
        """
        ts = now if now is not None else time.time()
        self._sm.update_user_message(now=ts)
        self._conv_seq += 1
        # 隐私模式：让用户消息文本直接不进 buffer，避免在切回非隐私模式时
        # 旧数据被 enrichment LLM 二次曝光。state machine 的时间戳还要更新
        # （下游 idle / focused_work 判定依赖），文本扔了即可。
        if text and not _privacy_mode_active():
            self._user_msg_buffer.append((ts, text.strip()[:1000]))

    def on_ai_message(self, *, text: str | None = None, now: float | None = None) -> None:
        """Stamp an "AI just spoke" event.

        ``text`` is optional. When provided, the state machine runs the
        question heuristic over it: if the AI's reply trips the heuristic
        (ends with ``?`` / ``？`` / a CN sentence-final question particle),
        an unfinished-thread record opens — Phase 2 will be allowed up to
        ``UNFINISHED_THREAD_MAX_FOLLOWUPS`` (default 2) follow-ups within
        the 5-minute window even in restricted_screen_only states.

        Text is also appended to the AI conversation buffer so the
        emotion-tier LLM enrichment has recent context to reason over.
        """
        ts = now if now is not None else time.time()
        self._sm.update_ai_message(text=text, now=ts)
        if text and not _privacy_mode_active():
            self._ai_msg_buffer.append((ts, text.strip()[:1000]))
            # AI also opens threads (promises, abandoned mid-sentences) →
            # bump _conv_seq so kickoff_open_threads_compute will recompute.
            # Empty / no-text turns (errors / silenced) skip the bump,
            # since nothing in the buffer changed.
            self._conv_seq += 1

    def mark_unfinished_thread_used(self) -> None:
        """Record that a proactive emission just used the override slot.

        Called by ``main_routers/system_router.py`` after a successful
        proactive turn whenever the snapshot's ``unfinished_thread`` was
        active going in. Increments the per-thread follow-up counter;
        once the cap is hit, the state machine drops the thread record
        and the override is no longer offered to the prompt.
        """
        self._sm.mark_unfinished_thread_used()

    def on_voice_mode(self, active: bool) -> None:
        """Toggle voice-mode flag.

        Called when ``LLMSessionManager`` starts/stops a voice session.
        Without this, ``voice_engaged`` cannot fire — the state machine
        treats voice mode as a hard prerequisite.
        """
        self._sm.update_voice_mode(active)

    def on_voice_rms(self, *, now: float | None = None) -> None:
        """Mark user voice activity (RMS / VAD over threshold).

        Called whenever the audio capture path detects the user is
        speaking. Tracker only stores the most recent timestamp;
        ``VOICE_ACTIVE_WINDOW_SECONDS`` decides what counts as "current".
        """
        self._sm.update_voice_rms(now=now)

    def on_screenshot(self, *, now: float | None = None) -> None:
        """Hook for vision-described screenshots.

        v1: no-op. v2 will feed a brief description into a side buffer
        so the state-machine reasons can quote what's on screen. Left
        as a method so the integration sites in core.py can be wired
        now and start emitting events.
        """
        # Intentionally empty — v1 keeps this rules-only.
        return None

    def push_external_system_signal(
        self,
        *,
        window_title: str | None = None,
        process_name: str | None = None,
        idle_seconds: float | None = None,
        cpu_avg_30s: float | None = None,
        gpu_utilization: float | None = None,
        now: float | None = None,
    ) -> None:
        """Store OS signals supplied from outside the backend (frontend push).

        Meant for remote deployments where the Python backend does not
        run on the user's machine, so local OS queries would describe the
        *server* rather than the user. Expected flow:

          1. The frontend (Electron / browser / mobile shell) reads its
             local-OS signals — active window title + owning process,
             system idle seconds, GPU utilisation.
          2. It POSTs them to the backend on a heartbeat (~5-10s).
          3. The endpoint calls this method.

        Every call replaces the previously stored snapshot and stamps it
        with ``now`` (default ``time.time()``). Once that timestamp is
        older than ``_EXTERNAL_SIGNAL_TTL_SECONDS`` the tracker is
        expected to fall back to the local collector.

        All fields are optional. A missing ``idle_seconds`` or
        ``cpu_avg_30s`` becomes ``0.0``; ``cpu_instant`` mirrors
        ``cpu_avg_30s`` because no separate instant reading is pushed.
        ``window_title`` / ``process_name`` of ``None`` are stored as-is
        and mean "no foreground window right now" (e.g. desktop visible).
        The snapshot is always marked ``os_signals_available=True``.
        """
        stamped_at = time.time() if now is None else now
        idle = 0.0 if idle_seconds is None else idle_seconds
        cpu = 0.0 if cpu_avg_30s is None else cpu_avg_30s
        pushed = SystemSnapshot(
            timestamp=stamped_at,
            idle_seconds=idle,
            cpu_avg_30s=cpu,
            cpu_instant=cpu,
            window_title=window_title,
            process_name=process_name,
            gpu_utilization=gpu_utilization,
            os_signals_available=True,
        )
        self._external_system_snap = pushed

    # ── snapshot ────────────────────────────────────────────────

    async def get_snapshot(
        self,
        *,
        now: float | None = None,
        include_enrichment: bool = True,
        tick_followups: bool = True,
    ) -> ActivitySnapshot:
        """Pull system signals, classify, and return a fresh snapshot.

        Async because the first call awaits the collector start-up;
        later calls do no further awaiting in this method.

        Parameters
        ----------
        now:
            Timestamp to evaluate at; defaults to ``time.time()``.
        include_enrichment:
            When True (default) the cached emotion-tier fields
            (``activity_scores``, ``activity_guess``, ``open_threads``)
            are merged in and the activity-guess loop is requested at
            collector start. Pass False for rule-only consumers that
            need state / window / idle signals only; those fields are
            then returned empty.
        tick_followups:
            When True (default) the break-reminder / anti-slack logic is
            advanced and the pending fields are populated. Pass False
            for read-only pollers; both pending fields are then ``None``.

        Returns
        -------
        ActivitySnapshot
            A new frozen snapshot. When the resolved state is
            ``private`` every enrichment and pending field is blanked,
            regardless of the flags above.
        """
        await self._ensure_collector_started(
            start_activity_guess_loop=include_enrichment
        )
        self._refresh_prefs()

        ts = time.time() if now is None else now

        sys_snap = self._select_system_snapshot(ts)
        self._sm.update_system(sys_snap)
        observation = observation_from_system(sys_snap, self._sm._prefs)
        self._sm.update_window(observation, now=ts)

        snap = self._sm.get_snapshot(now=ts)
        # The tick needs the resolved state (focused_work / leisure / …),
        # so it runs after the state machine has classified and before
        # the pending fields are built.
        if tick_followups:
            self._tick_break_reminders(snap, now=ts)

        if snap.state == 'private':
            # Privacy lockdown: never splice in caches built from an
            # earlier non-private state — a cached narrative could still
            # describe what the user was doing moments ago. Pending
            # reminders are dropped too, so nothing interrupts while a
            # sensitive app is in the foreground.
            return dc_replace(
                snap,
                activity_scores={},
                activity_guess='',
                open_threads=[],
                work_break_pending=None,
                anti_slack_pending=None,
            )

        if include_enrichment:
            # Copies, so callers cannot mutate the tracker's caches.
            enrichment = {
                'activity_scores': dict(self._activity_scores_cache),
                'activity_guess': self._activity_guess_cache,
                'open_threads': list(self._open_threads_cache),
            }
        else:
            enrichment = {
                'activity_scores': {},
                'activity_guess': '',
                'open_threads': [],
            }

        if tick_followups:
            work_break = self._build_work_break_pending()
            anti_slack = self._build_anti_slack_pending()
        else:
            work_break = None
            anti_slack = None

        # ``snap`` is frozen; ``replace`` hands back a new instance and
        # leaves the original untouched.
        return dc_replace(
            snap,
            **enrichment,
            work_break_pending=work_break,
            anti_slack_pending=anti_slack,
        )

    def get_snapshot_sync(self, *, now: float | None = None) -> ActivitySnapshot:
        """Build a snapshot without touching the event loop.

        Synchronous counterpart of ``get_snapshot`` for unit tests and
        sync-context debug logging. It does NOT start the collector —
        callers must make sure collection is already running, or accept
        ``SystemSnapshot`` defaults. Break reminders are always ticked
        and enrichment caches are always merged, except in the
        ``private`` state where enrichment and pending fields are
        blanked.

        Parameters
        ----------
        now:
            Timestamp to evaluate at; defaults to ``time.time()``.
        """
        self._refresh_prefs()
        ts = time.time() if now is None else now
        # Go through _select_system_snapshot so frontend-pushed signals
        # are honoured exactly as in the async path; otherwise sync
        # callers on remote deployments would silently read the local
        # (server-side) collector.
        sys_snap = self._select_system_snapshot(ts)
        self._sm.update_system(sys_snap)
        observation = observation_from_system(sys_snap, self._sm._prefs)
        self._sm.update_window(observation, now=ts)
        snap = self._sm.get_snapshot(now=ts)
        self._tick_break_reminders(snap, now=ts)

        if snap.state == 'private':
            overrides = {
                'activity_scores': {},
                'activity_guess': '',
                'open_threads': [],
                'work_break_pending': None,
                'anti_slack_pending': None,
            }
        else:
            overrides = {
                'activity_scores': dict(self._activity_scores_cache),
                'activity_guess': self._activity_guess_cache,
                'open_threads': list(self._open_threads_cache),
                'work_break_pending': self._build_work_break_pending(),
                'anti_slack_pending': self._build_anti_slack_pending(),
            }
        return dc_replace(snap, **overrides)

    # ── break-reminder accumulator + transition detection ──────────

    def _tick_break_reminders(self, snap: ActivitySnapshot, *, now: float) -> None:
        """Advance the focused_work accumulator and detect leisure transitions.

        Idempotent and tolerant of arbitrary call frequency: per-call
        delta is bounded by ``_BREAK_REMINDER_TICK_MAX_DELTA_SECONDS``,
        so a long gap between calls (process suspend, idle deployment,
        first-call bootstrap) doesn't silently credit minutes the user
        didn't actually spend focused.

        Called from ``get_snapshot``, ``get_snapshot_sync``, and the 20s
        ``_activity_guess_loop`` — the latter ensures state transitions
        are caught even when no proactive_chat round queries the tracker.

        Reads thresholds via ``self._sm._prefs.thresholds`` so user
        edits to ``user_preferences.json`` take effect on the next
        cache reload tick (mirrors how the state machine handles
        live-edit user overrides).

        The method runs five phases in a fixed order, and the order
        matters because later phases read state written by earlier ones:

          1. advance (or reset) ``_work_acc_seconds``;
          2. focused_work session bookkeeping + anti-slack arming;
          3. anti-slack pending invalidation / expiry;
          4. context-prompt one-shot detection;
          5. water-break pending arming / dropping / expiry.

        Args:
            snap: Snapshot for this tick; only ``snap.state`` and
                ``snap.active_window`` (its ``canonical`` / ``title``)
                are read here.
            now: Timestamp of this tick, in the same clock as the values
                stored in ``_break_tick_last_at`` and the ``set_at``
                fields of the pending dicts.

        Returns:
            None. All results are written to instance attributes
            (``_work_acc_seconds``, ``_work_break_pending``,
            ``_anti_slack_pending``, ``_context_prompt_pending``, ...).
        """
        thresholds = self._sm._prefs.thresholds

        # Resolve thresholds with code-default fallbacks. Live-edit safe:
        # _refresh_prefs runs on every get_snapshot path; threshold
        # constants reload via the activity_config 30s cache.
        # Minute-denominated settings are converted to seconds here so
        # everything below compares seconds against seconds.
        work_break_seconds = float(
            thresholds.get('work_break_minutes', _WORK_BREAK_MINUTES)
        ) * 60.0
        work_break_window = float(
            thresholds.get('work_break_pending_window_seconds', _WORK_BREAK_PENDING_WINDOW_SECONDS)
        )
        anti_slack_min_focus_seconds = float(
            thresholds.get('anti_slack_min_focus_minutes', _ANTI_SLACK_MIN_FOCUS_MINUTES)
        ) * 60.0
        anti_slack_cooldown_seconds = float(
            thresholds.get('anti_slack_cooldown_minutes', _ANTI_SLACK_COOLDOWN_MINUTES)
        ) * 60.0
        anti_slack_window = float(
            thresholds.get('anti_slack_pending_window_seconds', _ANTI_SLACK_PENDING_WINDOW_SECONDS)
        )

        state = snap.state

        # Capture accumulator BEFORE advance/reset. Used as the
        # authoritative session length when the anti-slack branch fires
        # below — wall-clock ``now - session_started_at`` would inflate
        # after a long process suspend / sleep / stall (the gap discard
        # in the advance block prevents the accumulator from ticking
        # through the dead window, but ``session_started_at`` still
        # points at pre-suspend time). Codex P1 review: PR #1226.
        session_acc_at_start = self._work_acc_seconds

        # ── Accumulator advance ─────────────────────────────────
        # First tick has no delta to credit — record now and exit. The
        # next call computes a real delta against this point.
        # (``0.0`` is the "never ticked" sentinel for _break_tick_last_at.)
        if self._break_tick_last_at == 0.0:
            self._break_tick_last_at = now
        else:
            raw_delta = now - self._break_tick_last_at
            self._break_tick_last_at = now
            # Ignore zero / negative (clock jump) and overlong (suspended
            # process / forgot-to-tick) gaps. Either bucket means the
            # accumulator can't safely advance: we don't actually know
            # what state the user was in during that gap.
            if 0 < raw_delta <= _BREAK_REMINDER_TICK_MAX_DELTA_SECONDS:
                if state == 'focused_work':
                    self._work_acc_seconds += raw_delta
                elif state == 'transitioning' and self._work_acc_seconds > 0:
                    # Transitioning during a real focus session = quick
                    # IDE↔terminal↔browser-docs flick. Don't break the
                    # streak. (When acc=0 we never started a session, so
                    # transitioning by itself can't kick one off.)
                    self._work_acc_seconds += raw_delta
                else:
                    # Any other state immediately resets — per user spec.
                    self._work_acc_seconds = 0.0
            else:
                # Unsafe delta — two buckets, same conservative cleanup:
                #   * ``raw_delta > cap`` — long gap (process suspend /
                #     sleep / forgot-to-tick). Don't know what state
                #     the user was in during the gap.
                #   * ``raw_delta <= 0`` — non-monotonic clock (NTP
                #     rollback, manual time change, duplicate ts). Can't
                #     credit; pre-rollback focus also can't be trusted
                #     to extend through the inverted segment.
                # In both cases the in-range branch above does not run,
                # so without this cleanup the "any other state
                # immediately resets" rule would never fire for
                # non-focus ticks — pre-gap focus seconds would leak
                # forward into post-gap focused_work and arm the
                # work-break pending before ``work_break_minutes`` of
                # genuine post-gap focus had elapsed. Codex P2 reviews:
                # PR #1226 (long-gap and non-positive-delta findings).
                #
                # Conservative reset of everything that could carry
                # stale pre-event context:
                #   * accumulator → 0
                #   * _last_known_state → None forces the bookkeeping
                #     below to treat any post-event focused_work as a
                #     fresh session entry, AND prevents anti-slack from
                #     firing on a focused_work → leisure transition
                #     observed across the unsafe-delta tick.
                #   * _context_prompt_last_state → None so the current
                #     state counts as a fresh "entry" for the context
                #     prompt detection further down.
                #   * Pending dicts cleared since the snapshot they
                #     reference is now ancient.
                # NOTE(review): _focused_work_session_started_at / _app
                # are NOT cleared here. A later transitioning → leisure
                # tick can therefore still enter the "just left
                # focused_work" branch with a stale start marker; it
                # only fails to arm anti-slack because the accumulator
                # is 0 by then. Confirm this is intended.
                self._work_acc_seconds = 0.0
                self._last_known_state = None
                self._context_prompt_last_state = None
                self._work_break_pending = None
                self._anti_slack_pending = None

        # ── Focused_work session bookkeeping (for anti-slack transition) ─
        # Track entry/exit so we can report the just-ended session length
        # and app name when the user pivots to leisure.
        prev_known = self._last_known_state
        active_window = snap.active_window
        # Best available label for the foreground window: canonical name
        # first, raw title as fallback, None when neither is available.
        active_canonical = (
            active_window.canonical if active_window and active_window.canonical
            else (active_window.title if active_window and active_window.title else None)
        )
        if state == 'focused_work':
            if prev_known != 'focused_work':
                # Entering focused_work. Clear any anti-slack pending —
                # user is back at it, no need to nag.
                self._focused_work_session_started_at = now
                self._focused_work_session_app = active_canonical
                self._anti_slack_pending = None
            elif self._focused_work_session_app is None and active_canonical:
                # Late-arriving canonical (the state already became
                # focused_work but the active_window was None at entry).
                self._focused_work_session_app = active_canonical
        elif state == 'transitioning' and prev_known == 'focused_work':
            # Mid-flick to a sibling work window — keep session timer
            # running, don't reset (mirrors the accumulator rule).
            pass
        elif prev_known == 'focused_work' or (
            prev_known == 'transitioning' and self._focused_work_session_started_at is not None
        ):
            # Just left focused_work (possibly via transitioning). Capture
            # the session length and app, then evaluate anti-slack.
            # The session markers are cleared unconditionally, even when
            # the new state is not a leisure state and nothing is armed.
            session_started = self._focused_work_session_started_at
            session_app = self._focused_work_session_app
            self._focused_work_session_started_at = None
            self._focused_work_session_app = None
            if (
                session_started is not None
                and state in _ANTI_SLACK_LEISURE_STATES
            ):
                # Use the accumulator value captured at tick start
                # (before reset) — it honors the long-gap discard rule,
                # while ``now - session_started`` would credit the user
                # with sleep/suspend time as if they'd been working.
                session_seconds = session_acc_at_start
                # ``_anti_slack_last_fired_at == 0.0`` means "never
                # fired", so the cooldown is trivially satisfied.
                cooldown_ok = (
                    self._anti_slack_last_fired_at == 0.0
                    or (now - self._anti_slack_last_fired_at) >= anti_slack_cooldown_seconds
                )
                if (
                    session_seconds >= anti_slack_min_focus_seconds
                    and cooldown_ok
                ):
                    new_canonical = active_canonical or ''
                    self._anti_slack_pending = {
                        'set_at': now,
                        'minutes': max(1, int(session_seconds / 60)),
                        'prev_app': session_app or '',
                        'new_app': new_canonical,
                    }

        # Anti-slack pending invalidation: state moved out of leisure
        # before we got to deliver — the moment is gone.
        if (
            self._anti_slack_pending is not None
            and state not in _ANTI_SLACK_LEISURE_STATES
        ):
            self._anti_slack_pending = None
        # Anti-slack pending window expiry.
        if (
            self._anti_slack_pending is not None
            and (now - self._anti_slack_pending['set_at']) > anti_slack_window
        ):
            self._anti_slack_pending = None

        # ── Context-prompt one-shot detection (for the A/B experiment-group frontend) ──
        # Pending is armed only at the moment a target state is *entered*
        # (state != previous state); it is not re-armed while the state
        # holds, so the 20s heartbeat doesn't spam. Group assignment and
        # per-session dedup both live in the frontend.
        #   gaming / casual_browsing (= leisure: games / anime / video) → 'play'
        #   focused_work (entering focused work)                        → 'work'
        # Uses _context_prompt_last_state (a baseline dedicated to the
        # context prompt) rather than _last_known_state: the latter lives
        # across sessions, so "previous session ended in a game, new
        # session is still in a game" would not register as an entry and
        # the prompt would be missed. The dedicated baseline is cleared to
        # None by reset_context_prompt_baseline at the start of each
        # session, so the current state counts as an entry again. A None
        # baseline (first start / unsafe-delta reset / new session) always
        # counts as an entry; the frontend's per-app-session dedup absorbs
        # any duplicates.
        ctx_prev = self._context_prompt_last_state
        _CONTEXT_PROMPT_TARGET_STATES = ('gaming', 'casual_browsing', 'focused_work')
        if state != ctx_prev:
            if state in ('gaming', 'casual_browsing'):
                self._context_prompt_pending = {'context': 'play', 'set_at': now}
            elif state == 'focused_work':
                self._context_prompt_pending = {'context': 'work', 'set_at': now}
        # On leaving the target states (idle / away / chatting /
        # transitioning / private and any other non-target state), drop a
        # stale pending that has not been drained yet: it may have been
        # armed on the get_snapshot path (experiment-group kick) and the
        # user left the game / work before the loop drained it. Left in
        # place, the loop would push a stale prompt for a scene the user
        # already left, or even flip the wrong setting based on it.
        # Switches between target states (gaming ↔ casual_browsing ↔
        # focused_work) are handled by the overwrite above and are
        # unaffected.
        if state not in _CONTEXT_PROMPT_TARGET_STATES:
            self._context_prompt_pending = None
        self._context_prompt_last_state = state

        # Written only now: the session bookkeeping above needed the
        # previous tick's value (read into ``prev_known``).
        self._last_known_state = state

        # ── Water-break pending ─────────────────────────────────
        # Armed when accumulator crosses threshold AND state is currently
        # focused_work. Stays armed across ticks (no time pin) — the next
        # proactive_chat round in focused_work fires it. If the user
        # leaves focused_work, accumulator resets to 0 (above) which
        # naturally clears the arming condition; we also drop the pending
        # explicitly here for cleanliness.
        if (
            state == 'focused_work'
            and self._work_acc_seconds >= work_break_seconds
        ):
            if self._work_break_pending is None:
                self._work_break_pending = {
                    'set_at': now,
                    'minutes': max(1, int(self._work_acc_seconds / 60)),
                    'app': active_canonical or '',
                }
            else:
                # Refresh minutes (accumulator keeps growing) and app
                # (window may have shifted to a different work app).
                self._work_break_pending['minutes'] = max(
                    1, int(self._work_acc_seconds / 60),
                )
                if active_canonical:
                    self._work_break_pending['app'] = active_canonical
        elif state != 'focused_work' and state != 'transitioning':
            # User left focused work entirely (and isn't mid-flick).
            # Drop pending — accumulator was already reset above.
            self._work_break_pending = None
        # Window expiry as a defense-in-depth: if proactive doesn't fire
        # and the user keeps grinding, the pending stays valid (intent
        # of must-fire) — but if the snapshot pipeline is wedged for
        # >window_seconds and the moment is conceptually gone, reset.
        # ``set_at`` is captured once on first arming and NOT refreshed
        # by the minutes-update branch above, so this expiry check
        # actually bites for any state that holds the pending — most
        # commonly ``transitioning`` lingering past the window. The
        # ``state != 'focused_work'`` gate keeps focused_work itself
        # exempt: as long as the user is actively focused, the pending
        # is canonical and shouldn't time out. CodeRabbit nitpick: PR #1226.
        if (
            self._work_break_pending is not None
            and state != 'focused_work'
            and (now - self._work_break_pending['set_at']) > work_break_window
        ):
            self._work_break_pending = None

    def _build_work_break_pending(self) -> WorkBreakPending | None:
        """Convert the internal water-break pending dict into a ``WorkBreakPending``.

        Returns:
            ``None`` when no water-break reminder is armed; otherwise a
            ``WorkBreakPending`` carrying the dict's ``minutes`` and
            ``app`` values. The internal ``set_at`` timestamp is not
            exposed.
        """
        armed = self._work_break_pending
        if armed is not None:
            return WorkBreakPending(minutes=armed['minutes'], app=armed['app'])
        return None

    def _build_anti_slack_pending(self) -> AntiSlackPending | None:
        """Convert the internal anti-slack pending dict into an ``AntiSlackPending``.

        Returns:
            ``None`` when no anti-slack reminder is armed; otherwise an
            ``AntiSlackPending`` carrying the dict's ``minutes``,
            ``prev_app`` and ``new_app`` values. The internal ``set_at``
            timestamp is not exposed.
        """
        armed = self._anti_slack_pending
        if armed is not None:
            return AntiSlackPending(
                minutes=armed['minutes'],
                prev_app=armed['prev_app'],
                new_app=armed['new_app'],
            )
        return None

    def mark_work_break_used(self, *, now: float | None = None) -> None:
        """Reset the water-break accumulator + clear pending after delivery.

        Called from ``main_routers/system_router.py`` once the minimal
        Phase 2 delivery (regular drink/stretch nudge OR the 50% rest+
        game-invite branch) commits successfully. Resets the accumulator
        so the next break is at least ``work_break_minutes`` of
        focused_work away, mirroring the unfinished-thread "used"
        contract.
        """
        # ``now`` accepted for symmetry with other tracker hooks; not
        # actually needed (we just zero out — no timestamp recorded).
        del now
        self._work_acc_seconds = 0.0
        self._work_break_pending = None

    def mark_anti_slack_used(self, *, now: float | None = None) -> None:
        """Stamp anti-slack delivery and start its cooldown.

        Independent of the water-break + mini-game cooldowns so the
        three reminder paths don't accidentally throttle each other.
        """
        ts = now if now is not None else time.time()
        self._anti_slack_last_fired_at = ts
        self._anti_slack_pending = None

    # ── Context prompt (for the A/B experiment-group frontend) ─────

    def reset_context_prompt_baseline(self) -> None:
        """Forget the context prompt's "previous state" baseline and any undrained pending.

        Intended to be called at the start of every session (from the
        experiment-group kick in core.py). The tracker outlives
        individual sessions, so without this reset a user who ended the
        previous session in a game and is still in a game when the next
        one starts would never register as "entering" it, and the prompt
        would be missed. With the baseline back at ``None`` the next
        tick treats the current state as a fresh entry.

        Only the context-prompt baseline is touched; ``_last_known_state``
        used by the break / anti-slack logic is left alone.

        A leftover pending is dropped as well: if the previous session
        armed one but ended before the loop drained it, the first tick
        of the new session would otherwise push it as a stale prompt.
        The snapshot taken right after this reset re-arms a pending
        based on the new session's current state.
        """
        self._context_prompt_pending = None
        self._context_prompt_last_state = None

    def set_context_prompt_callback(
        self, callback: Callable[[str], Awaitable[None]] | None
    ) -> None:
        """注入「进入游戏/娱乐 或 进入专注工作」时往前端推送的 async 回调。

        由 core.py 在建好 tracker 后调用，回调内部把信号经 WebSocket 发给前端。
        ``callback(context)`` 的 context 取 'play'（游戏/娱乐）或 'work'（专注工作）。
        传 None 解除注入（如会话结束）。
        """
        self._on_context_prompt = callback

    async def _drain_context_prompt(self) -> None:
        """Deliver the one-shot context signal queued by ``_tick_break_reminders``.

        Meant to run from the async heartbeat only, since the callback
        has to be awaited. At most one queued slot is consumed per call,
        and the slot is cleared before the push is attempted — so a
        missing callback or a failed push still discards the signal.
        Push failures are logged at debug level and swallowed: this is
        a telemetry-style hint, and losing one must not take the
        heartbeat down.
        """
        queued = self._context_prompt_pending
        if queued is not None:
            # Consume the slot first so a failing push is never retried.
            self._context_prompt_pending = None
            push = self._on_context_prompt
            if push is not None:
                try:
                    await push(queued['context'])
                except Exception as exc:  # noqa: BLE001 — a failed push must not kill the heartbeat
                    logger.debug(
                        '[%s] context prompt push failed (%s): %s',
                        self.lanlan_name, queued.get('context'), exc,
                    )

    # ── enrichment kickoff ──────────────────────────────────────

    def kickoff_open_threads_compute(self, lang: str = 'zh') -> None:
        """Start a background ``open_threads`` compute unless one is pointless right now.

        Fire-and-forget: the call returns immediately and, when a
        compute is warranted, leaves an ``asyncio`` task in
        ``_open_threads_task``. Because it uses ``asyncio.create_task``
        it must be invoked while an event loop is running. The intended
        call site is the top of ``proactive_chat`` Phase 1, alongside
        the source-fetch tasks, so the cache is populated by the time
        Phase 2 reads the snapshot.

        Nothing is spawned when any of these holds (checked in order):
          * privacy mode is active, or the state machine's current
            state is ``'private'`` — no LLM calls while anything
            sensitive may be in play;
          * the cache was computed at the current conversation seq —
            nothing new has been said since;
          * a previous compute task is still running — never queue a
            second one;
          * both conversation buffers are empty — nothing to score.

        Args:
            lang: Language code forwarded to the compute coroutine.
        """
        # Privacy gates first; both are cheap O(1) checks.
        if _privacy_mode_active():
            return
        if self._sm._current_state == 'private':
            return

        # Cache already reflects the latest conversation revision.
        if self._open_threads_computed_at_seq == self._conv_seq:
            return

        # An earlier compute is still in flight.
        in_flight = self._open_threads_task
        if in_flight is not None and not in_flight.done():
            return

        # No conversation material at all.
        if not (self._user_msg_buffer or self._ai_msg_buffer):
            return

        compute = self._do_open_threads_compute(lang)
        self._open_threads_task = asyncio.create_task(
            compute,
            name=f'open_threads_{self.lanlan_name}',
        )

    async def _do_open_threads_compute(self, lang: str) -> None:
        """One-shot LLM call. Updates cache only on parse success.

        In-flight guard: capture ``_conv_seq`` before the LLM call;
        re-check on completion. If new conversation events arrived
        while we were waiting (rev advanced), the result was computed
        from a stale buffer view — discard it. ``_open_threads_computed_at_seq``
        stays at its previous value, so the next ``kickoff`` will see
        the seq mismatch and trigger a fresh compute against the
        current buffer.
        """
        from main_logic.activity.llm_enrichment import call_open_threads
        seen_seq = self._conv_seq
        try:
            result = await call_open_threads(
                user_msgs=list(self._user_msg_buffer),
                ai_msgs=list(self._ai_msg_buffer),
                lang=lang,
            )
        except Exception as e:
            logger.debug('[%s] open_threads compute failed: %s', self.lanlan_name, e)