import ClawdisKit
import Network
import Observation
import SwiftUI

/// Main-actor, observable application model for the node.
///
/// Owns the screen and camera controllers, the voice wake manager, and the
/// bridge session, and publishes the bridge connection status that views read.
@MainActor
@Observable
final class NodeAppModel {
    /// `true` while the scene phase is `.background`; screen/camera invokes are rejected then.
    var isBackgrounded: Bool = false
    let screen = ScreenController()
    let camera = CameraController()
    var bridgeStatusText: String = "Not connected"
    var bridgeServerName: String?
    var bridgeRemoteAddress: String?
    var connectedBridgeID: String?

    private let bridge = BridgeSession()
    private var bridgeTask: Task<Void, Never>?
    private var voiceWakeSyncTask: Task<Void, Never>?

    /// Incremented by every `connectToBridge` call. A connection task compares its own
    /// value against this one before publishing its final "Disconnected" state, so a task
    /// that was superseded by a newer connection cannot overwrite the newer state.
    @ObservationIgnored private var bridgeConnectGeneration: Int = 0

    let voiceWake = VoiceWakeManager()

    /// Read-only access to the underlying bridge session.
    var bridgeSession: BridgeSession { self.bridge }

    /// Configures the voice wake command handler, applies the persisted
    /// `voiceWake.enabled` preference, and wires screen deep links to `handleDeepLink`.
    init() {
        self.voiceWake.configure { [weak self] cmd in
            guard let self else { return }
            let nodeId = UserDefaults.standard.string(forKey: "node.instanceId") ?? "ios-node"
            let sessionKey = "node-\(nodeId)"
            do {
                try await self.sendVoiceTranscript(text: cmd, sessionKey: sessionKey)
            } catch {
                // Best-effort only.
            }
        }

        let enabled = UserDefaults.standard.bool(forKey: "voiceWake.enabled")
        self.voiceWake.setEnabled(enabled)

        // Wire up deep links from canvas taps
        self.screen.onDeepLink = { [weak self] url in
            guard let self else { return }
            Task { @MainActor in
                await self.handleDeepLink(url: url)
            }
        }
    }

    /// Records whether the app is backgrounded; every phase other than `.background`
    /// (including unknown future phases) counts as foreground.
    func setScenePhase(_ phase: ScenePhase) {
        switch phase {
        case .background:
            self.isBackgrounded = true
        case .active, .inactive:
            self.isBackgrounded = false
        @unknown default:
            self.isBackgrounded = false
        }
    }

    /// Forwards the enabled flag to the voice wake manager.
    func setVoiceWakeEnabled(_ enabled: Bool) {
        self.voiceWake.setEnabled(enabled)
    }

    /// Starts (or restarts) the bridge connection loop for `endpoint`.
    ///
    /// Any previous connection task and voice wake sync task are cancelled first.
    /// The new task keeps calling `bridge.connect` until it is cancelled, sleeping with
    /// an exponential backoff between attempts (capped at 6 s after a connect call
    /// returns and 8 s after it throws).
    ///
    /// - Parameters:
    ///   - endpoint: Network endpoint of the bridge to connect to.
    ///   - hello: Hello payload passed through to `BridgeSession.connect`.
    func connectToBridge(
        endpoint: NWEndpoint,
        hello: BridgeHello)
    {
        self.bridgeTask?.cancel()
        self.bridgeServerName = nil
        self.bridgeRemoteAddress = nil
        self.connectedBridgeID = BridgeEndpointID.stableID(endpoint)
        self.voiceWakeSyncTask?.cancel()
        self.voiceWakeSyncTask = nil

        // Tag this connection so the cancelled predecessor can tell it was superseded.
        self.bridgeConnectGeneration += 1
        let generation = self.bridgeConnectGeneration

        self.bridgeTask = Task {
            var attempt = 0
            while !Task.isCancelled {
                // Resolve the text up front so the closure below captures an immutable value.
                let statusText = attempt == 0 ? "Connecting…" : "Reconnecting…"
                await MainActor.run {
                    self.bridgeStatusText = statusText
                    self.bridgeServerName = nil
                    self.bridgeRemoteAddress = nil
                }

                do {
                    try await self.bridge.connect(
                        endpoint: endpoint,
                        hello: hello,
                        onConnected: { [weak self] serverName in
                            guard let self else { return }
                            await MainActor.run {
                                self.bridgeStatusText = "Connected"
                                self.bridgeServerName = serverName
                            }
                            if let addr = await self.bridge.currentRemoteAddress() {
                                await MainActor.run {
                                    self.bridgeRemoteAddress = addr
                                }
                            }
                            await self.startVoiceWakeSync()
                        },
                        onInvoke: { [weak self] req in
                            guard let self else {
                                return BridgeInvokeResponse(
                                    id: req.id,
                                    ok: false,
                                    error: ClawdisNodeError(
                                        code: .unavailable,
                                        message: "UNAVAILABLE: node not ready"))
                            }
                            return await self.handleInvoke(req)
                        })

                    if Task.isCancelled { break }
                    attempt += 1
                    let sleepSeconds = min(6.0, 0.35 * pow(1.7, Double(attempt)))
                    try? await Task.sleep(nanoseconds: UInt64(sleepSeconds * 1_000_000_000))
                } catch {
                    if Task.isCancelled { break }
                    attempt += 1
                    await MainActor.run {
                        self.bridgeStatusText = "Bridge error: \(error.localizedDescription)"
                        self.bridgeServerName = nil
                        self.bridgeRemoteAddress = nil
                    }
                    let sleepSeconds = min(8.0, 0.5 * pow(1.7, Double(attempt)))
                    try? await Task.sleep(nanoseconds: UInt64(sleepSeconds * 1_000_000_000))
                }
            }

            await MainActor.run {
                // The loop only exits through cancellation. If a newer connectToBridge call
                // caused it, that call has already published its own status and bridge ID;
                // resetting here would wipe them.
                guard self.bridgeConnectGeneration == generation else { return }
                self.bridgeStatusText = "Disconnected"
                self.bridgeServerName = nil
                self.bridgeRemoteAddress = nil
                self.connectedBridgeID = nil
            }
        }
    }

    /// Cancels the connection and voice wake sync tasks, asks the bridge session to
    /// disconnect, and resets the published connection state to "Disconnected".
    func disconnectBridge() {
        self.bridgeTask?.cancel()
        self.bridgeTask = nil
        self.voiceWakeSyncTask?.cancel()
        self.voiceWakeSyncTask = nil
        Task { await self.bridge.disconnect() }
        self.bridgeStatusText = "Disconnected"
        self.bridgeServerName = nil
        self.bridgeRemoteAddress = nil
        self.connectedBridgeID = nil
    }

    /// Sanitizes `words` and sends them to the bridge via the `voicewake.set` request.
    /// Encoding and request failures are ignored (best-effort).
    func setGlobalWakeWords(_ words: [String]) async {
        let sanitized = VoiceWakePreferences.sanitizeTriggerWords(words)

        struct Payload: Codable {
            var triggers: [String]
        }
        let payload = Payload(triggers: sanitized)
        guard let data = try? JSONEncoder().encode(payload),
              let json = String(data: data, encoding: .utf8)
        else { return }

        do {
            _ = try await self.bridge.request(method: "voicewake.set", paramsJSON: json, timeoutSeconds: 12)
        } catch {
            // Best-effort only.
        }
    }

    /// Replaces the voice wake sync task: refreshes the trigger words once, then saves
    /// the triggers from every `voicewake.changed` server event that decodes successfully.
    private func startVoiceWakeSync() async {
        self.voiceWakeSyncTask?.cancel()
        self.voiceWakeSyncTask = Task { [weak self] in
            guard let self else { return }

            await self.refreshWakeWordsFromGateway()

            let stream = await self.bridge.subscribeServerEvents(bufferingNewest: 200)
            for await evt in stream {
                if Task.isCancelled { return }
                guard evt.event == "voicewake.changed" else { continue }
                guard let payloadJSON = evt.payloadJSON else { continue }
                guard let triggers = VoiceWakePreferences.decodeGatewayTriggers(from: payloadJSON) else { continue }
                VoiceWakePreferences.saveTriggerWords(triggers)
            }
        }
    }

    /// Issues a `voicewake.get` request and saves the decoded trigger words.
    /// Request and decode failures are ignored (best-effort).
    private func refreshWakeWordsFromGateway() async {
        do {
            let data = try await self.bridge.request(method: "voicewake.get", paramsJSON: "{}", timeoutSeconds: 8)
            guard let triggers = VoiceWakePreferences.decodeGatewayTriggers(from: data) else { return }
            VoiceWakePreferences.saveTriggerWords(triggers)
        } catch {
            // Best-effort only.
        }
    }

    /// Sends a `voice.transcript` event carrying `text` and the optional `sessionKey`.
    ///
    /// - Throws: Encoding errors, an `NSError` (domain `NodeAppModel`, code 1) when the
    ///   payload is not valid UTF-8, or whatever `BridgeSession.sendEvent` throws.
    func sendVoiceTranscript(text: String, sessionKey: String?) async throws {
        struct Payload: Codable {
            var text: String
            var sessionKey: String?
        }
        let payload = Payload(text: text, sessionKey: sessionKey)
        let data = try JSONEncoder().encode(payload)
        guard let json = String(bytes: data, encoding: .utf8) else {
            throw NSError(domain: "NodeAppModel", code: 1, userInfo: [
                NSLocalizedDescriptionKey: "Failed to encode voice transcript payload as UTF-8",
            ])
        }
        try await self.bridge.sendEvent(event: "voice.transcript", payloadJSON: json)
    }

    /// Parses `url` and dispatches the resulting route; URLs that do not parse are ignored.
    func handleDeepLink(url: URL) async {
        guard let route = DeepLinkParser.parse(url) else { return }

        switch route {
        case let .agent(link):
            await self.handleAgentDeepLink(link, originalURL: url)
        }
    }

    /// Validates an agent deep link and forwards it over the bridge, reporting
    /// failures through `screen.errorText` (cleared again on success).
    private func handleAgentDeepLink(_ link: AgentDeepLink, originalURL: URL) async {
        let message = link.message.trimmingCharacters(in: .whitespacesAndNewlines)
        guard !message.isEmpty else { return }

        if message.count > 20000 {
            self.screen.errorText = "Deep link too large (message exceeds 20,000 characters)."
            return
        }

        guard await self.isBridgeConnected() else {
            self.screen.errorText = "Bridge not connected (cannot forward deep link)."
            return
        }

        do {
            try await self.sendAgentRequest(link: link)
            self.screen.errorText = nil
        } catch {
            self.screen.errorText = "Agent request failed: \(error.localizedDescription)"
        }
    }

    /// Encodes `link` as JSON and sends it as an `agent.request` event.
    ///
    /// - Throws: An `NSError` (domain `DeepLink`, code 1) for a blank message, encoding
    ///   errors, an `NSError` (domain `NodeAppModel`, code 2) when the payload is not
    ///   valid UTF-8, or whatever `BridgeSession.sendEvent` throws.
    private func sendAgentRequest(link: AgentDeepLink) async throws {
        if link.message.trimmingCharacters(in: .whitespacesAndNewlines).isEmpty {
            throw NSError(domain: "DeepLink", code: 1, userInfo: [
                NSLocalizedDescriptionKey: "invalid agent message",
            ])
        }

        // iOS bridge forwards to the gateway; no local auth prompts here.
        // (Key-based unattended auth is handled on macOS for clawdis:// links.)
        let data = try JSONEncoder().encode(link)
        guard let json = String(bytes: data, encoding: .utf8) else {
            throw NSError(domain: "NodeAppModel", code: 2, userInfo: [
                NSLocalizedDescriptionKey: "Failed to encode agent request payload as UTF-8",
            ])
        }
        try await self.bridge.sendEvent(event: "agent.request", payloadJSON: json)
    }

    /// Returns `true` when the bridge session currently reports the `.connected` state.
    private func isBridgeConnected() async -> Bool {
        if case .connected = await self.bridge.state { return true }
        return false
    }

    /// Executes a bridge invoke request and returns its response.
    ///
    /// `screen.*` and `camera.*` commands are rejected while backgrounded, and `camera.*`
    /// commands are rejected when the camera preference is off. Unknown commands yield
    /// `.invalidRequest`; any error thrown while handling a command yields `.unavailable`
    /// with the error's localized description.
    private func handleInvoke(_ req: BridgeInvokeRequest) async -> BridgeInvokeResponse {
        if req.command.hasPrefix("screen.") || req.command.hasPrefix("camera."), self.isBackgrounded {
            return BridgeInvokeResponse(
                id: req.id,
                ok: false,
                error: ClawdisNodeError(
                    code: .backgroundUnavailable,
                    message: "NODE_BACKGROUND_UNAVAILABLE: screen/camera commands require foreground"))
        }

        if req.command.hasPrefix("camera."), !self.isCameraEnabled() {
            return BridgeInvokeResponse(
                id: req.id,
                ok: false,
                error: ClawdisNodeError(
                    code: .unavailable,
                    message: "CAMERA_DISABLED: enable Camera in iOS Settings → Camera → Allow Camera"))
        }

        do {
            switch req.command {
            case ClawdisScreenCommand.show.rawValue:
                return BridgeInvokeResponse(id: req.id, ok: true)

            case ClawdisScreenCommand.hide.rawValue:
                return BridgeInvokeResponse(id: req.id, ok: true)

            case ClawdisScreenCommand.setMode.rawValue:
                let params = try Self.decodeParams(ClawdisScreenSetModeParams.self, from: req.paramsJSON)
                self.screen.setMode(params.mode)
                return BridgeInvokeResponse(id: req.id, ok: true)

            case ClawdisScreenCommand.navigate.rawValue:
                let params = try Self.decodeParams(ClawdisScreenNavigateParams.self, from: req.paramsJSON)
                self.screen.navigate(to: params.url)
                return BridgeInvokeResponse(id: req.id, ok: true)

            case ClawdisScreenCommand.evalJS.rawValue:
                let params = try Self.decodeParams(ClawdisScreenEvalParams.self, from: req.paramsJSON)
                let result = try await self.screen.eval(javaScript: params.javaScript)
                let payload = try Self.encodePayload(["result": result])
                return BridgeInvokeResponse(id: req.id, ok: true, payloadJSON: payload)

            case ClawdisScreenCommand.snapshot.rawValue:
                // Params are optional here: a missing or undecodable payload means "no max width".
                let params = try? Self.decodeParams(ClawdisScreenSnapshotParams.self, from: req.paramsJSON)
                let maxWidth = params?.maxWidth.map { CGFloat($0) }
                let base64 = try await self.screen.snapshotPNGBase64(maxWidth: maxWidth)
                let payload = try Self.encodePayload(["format": "png", "base64": base64])
                return BridgeInvokeResponse(id: req.id, ok: true, payloadJSON: payload)

            case ClawdisCameraCommand.snap.rawValue:
                // Fall back to default params when none were supplied or they fail to decode.
                let params = (try? Self.decodeParams(ClawdisCameraSnapParams.self, from: req.paramsJSON)) ??
                    ClawdisCameraSnapParams()
                let res = try await self.camera.snap(params: params)

                struct Payload: Codable {
                    var format: String
                    var base64: String
                    var width: Int
                    var height: Int
                }
                let payload = try Self.encodePayload(Payload(
                    format: res.format,
                    base64: res.base64,
                    width: res.width,
                    height: res.height))
                return BridgeInvokeResponse(id: req.id, ok: true, payloadJSON: payload)

            case ClawdisCameraCommand.clip.rawValue:
                // Fall back to default params when none were supplied or they fail to decode.
                let params = (try? Self.decodeParams(ClawdisCameraClipParams.self, from: req.paramsJSON)) ??
                    ClawdisCameraClipParams()

                // Audio is included unless explicitly disabled; voice wake is suspended for
                // the duration of the clip and resumed on every exit path from this case.
                let suspended = (params.includeAudio ?? true) ? self.voiceWake.suspendForExternalAudioCapture() : false
                defer { self.voiceWake.resumeAfterExternalAudioCapture(wasSuspended: suspended) }

                let res = try await self.camera.clip(params: params)

                struct Payload: Codable {
                    var format: String
                    var base64: String
                    var durationMs: Int
                    var hasAudio: Bool
                }
                let payload = try Self.encodePayload(Payload(
                    format: res.format,
                    base64: res.base64,
                    durationMs: res.durationMs,
                    hasAudio: res.hasAudio))
                return BridgeInvokeResponse(id: req.id, ok: true, payloadJSON: payload)

            default:
                return BridgeInvokeResponse(
                    id: req.id,
                    ok: false,
                    error: ClawdisNodeError(code: .invalidRequest, message: "INVALID_REQUEST: unknown command"))
            }
        } catch {
            return BridgeInvokeResponse(
                id: req.id,
                ok: false,
                error: ClawdisNodeError(code: .unavailable, message: error.localizedDescription))
        }
    }

    /// Decodes `json` into `type`.
    ///
    /// - Throws: An `NSError` (domain `Bridge`, code 20) when `json` is `nil` or cannot be
    ///   converted to UTF-8 data, or the `JSONDecoder` error when decoding fails.
    private static func decodeParams<T: Decodable>(_ type: T.Type, from json: String?) throws -> T {
        guard let json, let data = json.data(using: .utf8) else {
            throw NSError(domain: "Bridge", code: 20, userInfo: [
                NSLocalizedDescriptionKey: "INVALID_REQUEST: paramsJSON required",
            ])
        }
        return try JSONDecoder().decode(type, from: data)
    }

    /// Encodes `obj` as a JSON string.
    ///
    /// - Throws: The `JSONEncoder` error, or an `NSError` (domain `NodeAppModel`, code 21)
    ///   when the encoded bytes are not valid UTF-8.
    private static func encodePayload(_ obj: some Encodable) throws -> String {
        let data = try JSONEncoder().encode(obj)
        guard let json = String(bytes: data, encoding: .utf8) else {
            throw NSError(domain: "NodeAppModel", code: 21, userInfo: [
                NSLocalizedDescriptionKey: "Failed to encode payload as UTF-8",
            ])
        }
        return json
    }

    /// Reads the `camera.enabled` preference.
    private func isCameraEnabled() -> Bool {
        // Default-on: if the key doesn't exist yet, treat it as enabled.
        if UserDefaults.standard.object(forKey: "camera.enabled") == nil { return true }
        return UserDefaults.standard.bool(forKey: "camera.enabled")
    }
}