314 lines
12 KiB
Swift
314 lines
12 KiB
Swift
import ClawdisKit
|
|
import Network
|
|
import SwiftUI
|
|
|
|
@MainActor
|
|
final class NodeAppModel: ObservableObject {
|
|
// MARK: - Observable state and collaborators

/// `true` while the scene phase last reported to `setScenePhase(_:)` was `.background`.
@Published var isBackgrounded: Bool = false

/// Controller used for `screen.*` invoke commands and for surfacing deep-link errors.
let screen = ScreenController()

/// Controller used for `camera.*` invoke commands.
let camera = CameraController()

/// Human-readable bridge connection status.
@Published var bridgeStatusText: String = "Not connected"

/// Server name reported by the bridge once connected; `nil` otherwise.
@Published var bridgeServerName: String?

/// Remote address of the current bridge connection, when the session reports one.
@Published var bridgeRemoteAddress: String?

/// Stable identifier of the endpoint being connected to (or connected); `nil` when idle.
@Published var connectedBridgeID: String?

/// Session that owns the actual bridge connection.
private let bridge = BridgeSession()

/// Task running the current connection; cancelled when reconnecting or disconnecting.
private var bridgeTask: Task<Void, Never>?

/// Voice-wake manager; its command callback is installed in `init()`.
let voiceWake = VoiceWakeManager()

/// Read-only access to the underlying bridge session.
var bridgeSession: BridgeSession { bridge }
|
|
|
|
/// Installs the voice-wake command handler and applies the persisted
/// `voiceWake.enabled` preference.
init() {
    // Each wake command is forwarded to the bridge as a voice transcript.
    voiceWake.configure { [weak self] cmd in
        guard let self else { return }
        let storedInstanceID = UserDefaults.standard.string(forKey: "node.instanceId")
        let nodeId = storedInstanceID ?? "ios-node"
        // Best-effort only: a failed send is deliberately ignored.
        try? await self.sendVoiceTranscript(text: cmd, sessionKey: "node-\(nodeId)")
    }

    voiceWake.setEnabled(UserDefaults.standard.bool(forKey: "voiceWake.enabled"))
}
|
|
|
|
/// Records whether the app is currently backgrounded.
///
/// Only `.background` counts as backgrounded; `.active`, `.inactive`, and any
/// phase added in the future are treated as foreground.
///
/// - Parameter phase: The scene phase reported by SwiftUI.
func setScenePhase(_ phase: ScenePhase) {
    isBackgrounded = (phase == .background)
}
|
|
|
|
/// Forwards the enabled flag to the voice-wake manager.
///
/// - Parameter enabled: Value passed through to `voiceWake.setEnabled(_:)`.
func setVoiceWakeEnabled(_ enabled: Bool) {
    voiceWake.setEnabled(enabled)
}
|
|
|
|
/// Starts a bridge connection to `endpoint`, replacing any connection task
/// that is already running.
///
/// The published status fields are reset to a "Connecting…" state right away.
/// The connection itself runs in `bridgeTask`; when `connect` returns or throws,
/// the status fields are moved to a terminal "Disconnected" / "Bridge error: …"
/// state.
///
/// A task that was cancelled (by a newer `connectToBridge` call or by
/// `disconnectBridge()`) does NOT write its terminal state: whoever cancelled it
/// has already published the state that should be visible, and a late write
/// from the stale task would overwrite it.
///
/// - Parameters:
///   - endpoint: Network endpoint of the bridge to connect to.
///   - hello: Hello payload handed to the bridge session.
func connectToBridge(
    endpoint: NWEndpoint,
    hello: BridgeHello)
{
    self.bridgeTask?.cancel()
    self.bridgeStatusText = "Connecting…"
    self.bridgeServerName = nil
    self.bridgeRemoteAddress = nil
    self.connectedBridgeID = BridgeEndpointID.stableID(endpoint)

    self.bridgeTask = Task {
        let finalStatus: String
        do {
            try await self.bridge.connect(
                endpoint: endpoint,
                hello: hello,
                onConnected: { [weak self] serverName in
                    guard let self else { return }
                    await MainActor.run {
                        self.bridgeStatusText = "Connected"
                        self.bridgeServerName = serverName
                    }
                    if let addr = await self.bridge.currentRemoteAddress() {
                        await MainActor.run {
                            self.bridgeRemoteAddress = addr
                        }
                    }
                },
                onInvoke: { [weak self] req in
                    // The model is gone: answer with an explicit failure.
                    guard let self else {
                        return BridgeInvokeResponse(
                            id: req.id,
                            ok: false,
                            error: ClawdisNodeError(code: .unavailable, message: "UNAVAILABLE: node not ready"))
                    }
                    return await self.handleInvoke(req)
                })
            finalStatus = "Disconnected"
        } catch {
            finalStatus = "Bridge error: \(error.localizedDescription)"
        }

        await MainActor.run {
            // A cancelled task has been superseded; its terminal state must not
            // overwrite what the canceller already published.
            guard !Task.isCancelled else { return }
            self.bridgeStatusText = finalStatus
            self.bridgeServerName = nil
            self.bridgeRemoteAddress = nil
            self.connectedBridgeID = nil
        }
    }
}
|
|
|
|
/// Cancels the running connection task, asks the bridge session to disconnect,
/// and resets the published connection state to "Disconnected".
func disconnectBridge() {
    bridgeTask?.cancel()
    bridgeTask = nil

    bridgeStatusText = "Disconnected"
    bridgeServerName = nil
    bridgeRemoteAddress = nil
    connectedBridgeID = nil

    // The session disconnect is asynchronous and is not awaited here.
    Task { await self.bridge.disconnect() }
}
|
|
|
|
/// Sends a `voice.transcript` event over the bridge.
///
/// - Parameters:
///   - text: Transcript text.
///   - sessionKey: Optional session key included in the JSON payload.
/// - Throws: Encoding errors, an `NSError` (domain `NodeAppModel`, code 1) when the
///   encoded payload is not valid UTF-8, or whatever `sendEvent` throws.
func sendVoiceTranscript(text: String, sessionKey: String?) async throws {
    struct TranscriptPayload: Codable {
        var text: String
        var sessionKey: String?
    }

    let encoded = try JSONEncoder().encode(TranscriptPayload(text: text, sessionKey: sessionKey))
    guard let json = String(data: encoded, encoding: .utf8) else {
        let info = [NSLocalizedDescriptionKey: "Failed to encode voice transcript payload as UTF-8"]
        throw NSError(domain: "NodeAppModel", code: 1, userInfo: info)
    }

    try await bridge.sendEvent(event: "voice.transcript", payloadJSON: json)
}
|
|
|
|
/// Parses `url` as a deep link and dispatches the resulting route.
/// URLs the parser does not recognize are ignored.
///
/// - Parameter url: The incoming deep-link URL.
func handleDeepLink(url: URL) async {
    if let route = DeepLinkParser.parse(url) {
        // Kept as a `switch` so a new route case must be handled explicitly.
        switch route {
        case .agent(let agentLink):
            await handleAgentDeepLink(agentLink, originalURL: url)
        }
    }
}
|
|
|
|
/// Validates an agent deep link and forwards it over the bridge, reporting
/// problems through `screen.errorText`.
///
/// An empty (after trimming) message is ignored. A message longer than 20,000
/// characters, a missing bridge connection, or a failed send each set an error
/// text. A successful send clears it.
///
/// - Parameters:
///   - link: The parsed agent deep link.
///   - originalURL: The URL the link was parsed from (not used by this method).
private func handleAgentDeepLink(_ link: AgentDeepLink, originalURL: URL) async {
    let trimmed = link.message.trimmingCharacters(in: .whitespacesAndNewlines)
    if trimmed.isEmpty { return }

    guard trimmed.count <= 20000 else {
        screen.errorText = "Deep link too large (message exceeds 20,000 characters)."
        return
    }

    let connected = await isBridgeConnected()
    if !connected {
        screen.errorText = "Bridge not connected (cannot forward deep link)."
        return
    }

    do {
        try await sendAgentRequest(link: link)
        screen.errorText = nil
    } catch {
        screen.errorText = "Agent request failed: \(error.localizedDescription)"
    }
}
|
|
|
|
/// Encodes `link` as JSON and sends it as an `agent.request` bridge event.
///
/// - Parameter link: The agent deep link to forward.
/// - Throws: An `NSError` (domain `DeepLink`, code 1) when the message is blank,
///   encoding errors, an `NSError` (domain `NodeAppModel`, code 2) when the
///   encoded payload is not valid UTF-8, or whatever `sendEvent` throws.
private func sendAgentRequest(link: AgentDeepLink) async throws {
    let trimmedMessage = link.message.trimmingCharacters(in: .whitespacesAndNewlines)
    guard !trimmedMessage.isEmpty else {
        let info = [NSLocalizedDescriptionKey: "invalid agent message"]
        throw NSError(domain: "DeepLink", code: 1, userInfo: info)
    }

    // iOS bridge forwards to the gateway; no local auth prompts here.
    // (Key-based unattended auth is handled on macOS for clawdis:// links.)
    let encoded = try JSONEncoder().encode(link)
    guard let json = String(data: encoded, encoding: .utf8) else {
        let info = [NSLocalizedDescriptionKey: "Failed to encode agent request payload as UTF-8"]
        throw NSError(domain: "NodeAppModel", code: 2, userInfo: info)
    }

    try await bridge.sendEvent(event: "agent.request", payloadJSON: json)
}
|
|
|
|
/// Reports whether the bridge session's state is currently `.connected`.
private func isBridgeConnected() async -> Bool {
    let currentState = await bridge.state
    guard case .connected = currentState else { return false }
    return true
}
|
|
|
|
/// Executes one bridge invoke request and builds its response.
///
/// Two gates run before dispatch:
/// 1. `screen.*` and `camera.*` commands are rejected while the app is backgrounded.
/// 2. `camera.*` commands are rejected while the camera preference is off.
///
/// The command is then dispatched by its raw name. Any error thrown while
/// handling a command becomes a failed response with code `.unavailable`
/// carrying the error's localized description.
///
/// - Parameter req: The invoke request received from the bridge.
/// - Returns: The response to send back, always carrying `req.id`.
private func handleInvoke(_ req: BridgeInvokeRequest) async -> BridgeInvokeResponse {
    let command = req.command
    let isCameraCommand = command.hasPrefix("camera.")
    let requiresForeground = command.hasPrefix("screen.") || isCameraCommand

    if requiresForeground, isBackgrounded {
        return BridgeInvokeResponse(
            id: req.id,
            ok: false,
            error: ClawdisNodeError(
                code: .backgroundUnavailable,
                message: "NODE_BACKGROUND_UNAVAILABLE: screen/camera commands require foreground"))
    }

    if isCameraCommand, !isCameraEnabled() {
        return BridgeInvokeResponse(
            id: req.id,
            ok: false,
            error: ClawdisNodeError(
                code: .unavailable,
                message: "CAMERA_DISABLED: enable Camera in iOS Settings → Camera → Allow Camera"))
    }

    do {
        switch command {
        // show/hide are acknowledged without any further action.
        case ClawdisScreenCommand.show.rawValue,
             ClawdisScreenCommand.hide.rawValue:
            return BridgeInvokeResponse(id: req.id, ok: true)

        case ClawdisScreenCommand.setMode.rawValue:
            let modeParams = try Self.decodeParams(ClawdisScreenSetModeParams.self, from: req.paramsJSON)
            screen.setMode(modeParams.mode)
            return BridgeInvokeResponse(id: req.id, ok: true)

        case ClawdisScreenCommand.navigate.rawValue:
            let navParams = try Self.decodeParams(ClawdisScreenNavigateParams.self, from: req.paramsJSON)
            screen.navigate(to: navParams.url)
            return BridgeInvokeResponse(id: req.id, ok: true)

        case ClawdisScreenCommand.evalJS.rawValue:
            let evalParams = try Self.decodeParams(ClawdisScreenEvalParams.self, from: req.paramsJSON)
            let evalResult = try await screen.eval(javaScript: evalParams.javaScript)
            let json = try Self.encodePayload(["result": evalResult])
            return BridgeInvokeResponse(id: req.id, ok: true, payloadJSON: json)

        case ClawdisScreenCommand.snapshot.rawValue:
            // Params are optional here: a missing or undecodable payload means "no max width".
            let snapshotParams = try? Self.decodeParams(ClawdisScreenSnapshotParams.self, from: req.paramsJSON)
            let widthLimit = snapshotParams?.maxWidth.map { CGFloat($0) }
            let pngBase64 = try await screen.snapshotPNGBase64(maxWidth: widthLimit)
            let json = try Self.encodePayload(["format": "png", "base64": pngBase64])
            return BridgeInvokeResponse(id: req.id, ok: true, payloadJSON: json)

        case ClawdisCameraCommand.snap.rawValue:
            struct SnapPayload: Codable {
                var format: String
                var base64: String
                var width: Int
                var height: Int
            }

            // Missing or undecodable params fall back to the defaults.
            let decodedParams = try? Self.decodeParams(ClawdisCameraSnapParams.self, from: req.paramsJSON)
            let photo = try await camera.snap(params: decodedParams ?? ClawdisCameraSnapParams())
            let body = SnapPayload(
                format: photo.format,
                base64: photo.base64,
                width: photo.width,
                height: photo.height)
            let json = try Self.encodePayload(body)
            return BridgeInvokeResponse(id: req.id, ok: true, payloadJSON: json)

        case ClawdisCameraCommand.clip.rawValue:
            struct ClipPayload: Codable {
                var format: String
                var base64: String
                var durationMs: Int
                var hasAudio: Bool
            }

            // Missing or undecodable params fall back to the defaults.
            let decodedParams = try? Self.decodeParams(ClawdisCameraClipParams.self, from: req.paramsJSON)
            let clipParams = decodedParams ?? ClawdisCameraClipParams()

            // Voice wake is suspended only when the clip records audio (the default),
            // and resumed on every exit path from this case.
            let recordsAudio = clipParams.includeAudio ?? true
            let voiceWakeSuspended = recordsAudio ? voiceWake.suspendForExternalAudioCapture() : false
            defer { voiceWake.resumeAfterExternalAudioCapture(wasSuspended: voiceWakeSuspended) }

            let clip = try await camera.clip(params: clipParams)
            let body = ClipPayload(
                format: clip.format,
                base64: clip.base64,
                durationMs: clip.durationMs,
                hasAudio: clip.hasAudio)
            let json = try Self.encodePayload(body)
            return BridgeInvokeResponse(id: req.id, ok: true, payloadJSON: json)

        default:
            return BridgeInvokeResponse(
                id: req.id,
                ok: false,
                error: ClawdisNodeError(code: .invalidRequest, message: "INVALID_REQUEST: unknown command"))
        }
    } catch {
        return BridgeInvokeResponse(
            id: req.id,
            ok: false,
            error: ClawdisNodeError(code: .unavailable, message: error.localizedDescription))
    }
}
|
|
|
|
/// Decodes a JSON parameter string into `type`.
///
/// - Parameters:
///   - type: The `Decodable` type to produce.
///   - json: The raw JSON text; `nil` is treated as missing parameters.
/// - Returns: The decoded value.
/// - Throws: An `NSError` (domain `Bridge`, code 20) when `json` is `nil` or cannot
///   be converted to UTF-8 data, or the `JSONDecoder` error when decoding fails.
private static func decodeParams<T: Decodable>(_ type: T.Type, from json: String?) throws -> T {
    guard let rawData = json?.data(using: .utf8) else {
        let info = [NSLocalizedDescriptionKey: "INVALID_REQUEST: paramsJSON required"]
        throw NSError(domain: "Bridge", code: 20, userInfo: info)
    }
    let decoder = JSONDecoder()
    return try decoder.decode(type, from: rawData)
}
|
|
|
|
/// Encodes `obj` as a JSON string.
///
/// - Parameter obj: The value to encode.
/// - Returns: The JSON text.
/// - Throws: The `JSONEncoder` error when encoding fails, or an `NSError`
///   (domain `NodeAppModel`, code 21) when the encoded bytes are not valid UTF-8.
private static func encodePayload(_ obj: some Encodable) throws -> String {
    let encoded = try JSONEncoder().encode(obj)
    if let text = String(data: encoded, encoding: .utf8) {
        return text
    }
    let info = [NSLocalizedDescriptionKey: "Failed to encode payload as UTF-8"]
    throw NSError(domain: "NodeAppModel", code: 21, userInfo: info)
}
|
|
|
|
/// Reads the `camera.enabled` preference from the standard user defaults.
///
/// - Returns: `true` when the key has never been written (default-on),
///   otherwise the stored Boolean value.
private func isCameraEnabled() -> Bool {
    let defaults = UserDefaults.standard
    let key = "camera.enabled"
    // `bool(forKey:)` alone cannot tell "unset" from `false`, so check for presence first.
    guard defaults.object(forKey: key) != nil else { return true }
    return defaults.bool(forKey: key)
}
|
|
}
|