Files
clawdbot/apps/macos/Sources/Clawdis/VoiceWakeForwarder.swift
2025-12-09 02:50:58 +00:00

166 lines
5.9 KiB
Swift

import Foundation
import OSLog
/// Settings that control how a voice-wake transcript is forwarded.
struct VoiceWakeForwardConfig: Sendable {
/// Master switch. When `false`, `VoiceWakeForwarder.forward` and
/// `VoiceWakeForwarder.checkConnection` return `.failure(.disabled)` immediately.
let enabled: Bool
/// Forwarding target string. `checkConnection` rejects the config with
/// `.invalidTarget` when this is empty after sanitizing.
let target: String
/// Not read by the code in this file.
/// NOTE(review): presumably the path to an SSH identity file — confirm against callers.
let identityPath: String
/// Whitespace-separated command template. `forward` scans it for the
/// `--session`/`--session-id`, `--thinking`, `--deliver`/`--no-deliver` and `--to` options.
let commandTemplate: String
/// Not read by the code in this file.
/// NOTE(review): presumably a timeout in seconds — confirm against callers.
let timeout: TimeInterval
}
enum VoiceWakeForwarder {
private static let logger = Logger(subsystem: "com.steipete.clawdis", category: "voicewake.forward")
/// Prepends a fixed instruction header, naming the originating machine, to a transcript.
///
/// - Parameters:
///   - transcript: The recognized text; appended verbatim after a blank line.
///   - machineName: Optional machine name override. Ignored when it is `nil` or
///     contains only whitespace, in which case the host's localized name and
///     then the process host name are tried.
/// - Returns: The header line, a blank line, and then `transcript`.
static func prefixedTranscript(_ transcript: String, machineName: String? = nil) -> String {
    let override = machineName?.trimmingCharacters(in: .whitespacesAndNewlines)

    // Only consult the system for a name when no usable override was supplied.
    let machine: String
    if let override = override, !override.isEmpty {
        machine = override
    } else if let localized = Host.current().localizedName {
        machine = localized
    } else {
        machine = ProcessInfo.processInfo.hostName
    }

    // A system-provided name may still be empty; fall back to a generic label.
    let label = machine.isEmpty ? "this Mac" : machine
    return "User talked via voice recognition on \(label) - repeat prompt first + remember some words might be incorrectly transcribed.\n\n\(transcript)"
}
/// Intentionally empty: calling this function has no effect.
/// NOTE(review): presumably retained so existing call sites keep compiling — confirm before removing.
static func clearCliCache() {
// Legacy no-op; CLI caching removed now that we rely on AgentRPC.
}
/// Failures reported by the voice-wake forwarding entry points.
enum VoiceWakeForwardError: LocalizedError, Equatable {
    /// The configured target is missing or unusable.
    case invalidTarget
    /// The agent RPC call failed; the associated value is the failure message.
    case rpcFailed(String)
    /// Forwarding is switched off in the configuration.
    case disabled

    /// Human-readable description; for `.rpcFailed` this is the message itself.
    var errorDescription: String? {
        let description: String
        switch self {
        case .invalidTarget:
            description = "Missing or invalid target"
        case .rpcFailed(let detail):
            description = detail
        case .disabled:
            description = "Voice wake forwarding disabled"
        }
        return description
    }
}
/// Sends a voice-wake transcript to the agent through `AgentRPC.shared`.
///
/// The transcript is wrapped with `prefixedTranscript`, and the session,
/// thinking level, delivery flag and recipient are taken from
/// `config.commandTemplate`.
///
/// - Parameters:
///   - transcript: The recognized text to forward.
///   - config: Forwarding configuration; `enabled` must be `true`.
/// - Returns: `.success` when the RPC reports `ok`; `.failure(.disabled)` when
///   forwarding is turned off; otherwise `.failure(.rpcFailed)` carrying the RPC
///   error message (or "agent rpc unavailable" when none is provided).
@discardableResult
static func forward(
    transcript: String,
    config: VoiceWakeForwardConfig) async -> Result<Void, VoiceWakeForwardError>
{
    guard config.enabled else { return .failure(.disabled) }

    let message = Self.prefixedTranscript(transcript)
    let parsed = self.parseCommandTemplate(config.commandTemplate)

    let response = await AgentRPC.shared.send(
        text: message,
        thinking: parsed.thinking ?? "default",
        session: parsed.session,
        deliver: parsed.deliver,
        to: parsed.to)

    guard response.ok else {
        let reason = response.error ?? "agent rpc unavailable"
        self.logger.error("voice wake forward failed: \(reason, privacy: .public)")
        return .failure(.rpcFailed(reason))
    }

    self.logger.info("voice wake forward ok")
    return .success(())
}
/// Verifies that forwarding is configured and that the agent RPC responds.
///
/// - Parameter config: Forwarding configuration to validate.
/// - Returns: `.failure(.disabled)` when forwarding is off, `.failure(.invalidTarget)`
///   when the sanitized target is empty, `.failure(.rpcFailed)` when the status
///   call is not `ok` (message defaults to "agent rpc unreachable"), else `.success`.
static func checkConnection(config: VoiceWakeForwardConfig) async -> Result<Void, VoiceWakeForwardError> {
    guard config.enabled else { return .failure(.disabled) }

    let target = self.sanitizedTarget(config.target)
    guard !target.isEmpty else { return .failure(.invalidTarget) }

    let probe = await AgentRPC.shared.status()
    guard probe.ok else {
        return .failure(.rpcFailed(probe.error ?? "agent rpc unreachable"))
    }
    return .success(())
}
/// Quotes `text` for a POSIX shell by wrapping it in single quotes.
///
/// Each embedded single quote is rewritten as `'\''` (close the quote, emit an
/// escaped quote, reopen), so the result is always one shell word.
///
/// - Parameter text: Arbitrary text, possibly empty.
/// - Returns: The single-quoted form; `''` for an empty string.
static func shellEscape(_ text: String) -> String {
    let quote = "'"
    let escapedQuote = "'\\''"
    return quote + text.replacingOccurrences(of: quote, with: escapedQuote) + quote
}
/// Splits a target of the form `[ssh ][user@]host[:port]` into its components.
///
/// - Parameter target: Raw target text; surrounding whitespace and one leading
///   `"ssh "` prefix are ignored.
/// - Returns: The parsed components, or `nil` when the host is empty or a numeric
///   port lies outside `1...65535`. `user` is `nil` when absent or empty, and
///   `port` falls back to `defaultVoiceWakeForwardPort` when none is given.
///
/// NOTE: unbracketed IPv6 literals are not supported; whatever follows the last
/// `:` is interpreted as the port whenever it is numeric.
static func parse(target: String) -> (user: String?, host: String, port: Int)? {
    // Trim first so leading whitespace cannot hide the "ssh " prefix.
    var remainder = target.trimmingCharacters(in: .whitespacesAndNewlines)
    let sshPrefix = "ssh "
    if remainder.hasPrefix(sshPrefix) {
        // Drop only the leading prefix; later "ssh " substrings belong to the target.
        remainder = String(remainder.dropFirst(sshPrefix.count))
            .trimmingCharacters(in: .whitespacesAndNewlines)
    }
    guard !remainder.isEmpty else { return nil }

    var user: String?
    if let at = remainder.firstIndex(of: "@") {
        let candidate = remainder[..<at].trimmingCharacters(in: .whitespacesAndNewlines)
        // "@host" carries no user; report that as nil rather than an empty string.
        user = candidate.isEmpty ? nil : candidate
        remainder = String(remainder[remainder.index(after: at)...])
    }

    var host = remainder
    var port = defaultVoiceWakeForwardPort
    if let colon = remainder.lastIndex(of: ":"), colon != remainder.startIndex,
       let parsedPort = Int(remainder[remainder.index(after: colon)...])
    {
        // A numeric suffix is meant as a port; reject values that are not valid ports.
        guard (1...65535).contains(parsedPort) else { return nil }
        port = parsedPort
        host = String(remainder[..<colon])
    }

    host = host.trimmingCharacters(in: .whitespacesAndNewlines)
    guard !host.isEmpty else { return nil }
    return (user: user, host: host, port: port)
}
/// Normalizes a raw target string by trimming whitespace and removing one
/// leading `"ssh "` prefix.
///
/// Only the prefix is removed; any later `"ssh "` substring is part of the
/// target itself and is preserved.
///
/// - Parameter raw: The target as entered by the user.
/// - Returns: The cleaned target, possibly empty.
static func sanitizedTarget(_ raw: String) -> String {
    let sshPrefix = "ssh "
    let trimmed = raw.trimmingCharacters(in: .whitespacesAndNewlines)
    guard trimmed.hasPrefix(sshPrefix) else { return trimmed }
    return String(trimmed.dropFirst(sshPrefix.count))
        .trimmingCharacters(in: .whitespacesAndNewlines)
}
// MARK: - Template parsing
/// Options extracted from a command template and passed to `AgentRPC.shared.send` by `forward`.
struct ForwardOptions {
/// Session identifier (`--session` / `--session-id`); defaults to "main".
var session: String = "main"
/// Thinking level (`--thinking`); defaults to "low". `forward` substitutes "default" when this is nil.
var thinking: String? = "low"
/// Delivery flag, set by `--deliver` / `--no-deliver`; defaults to true.
var deliver: Bool = true
/// Recipient (`--to`); nil unless the template supplies one.
var to: String?
}
/// Extracts forwarding options from a whitespace-separated command template.
///
/// Recognized options: `--session`/`--session-id <v>`, `--thinking <v>`,
/// `--to <v>`, `--deliver` and `--no-deliver`. Value options may also be
/// written as `--flag=value`. Unrecognized tokens are ignored.
///
/// A value option never consumes a following token that itself starts with
/// `--`, so `--session --no-deliver` leaves the session at its default and
/// still honors `--no-deliver`.
///
/// - Parameter template: The command template text; may be empty.
/// - Returns: Options with defaults for everything the template does not set.
private static func parseCommandTemplate(_ template: String) -> ForwardOptions {
    var options = ForwardOptions()
    let tokens = template.split(whereSeparator: { $0.isWhitespace }).map(String.init)
    let valueFlags: Set<String> = ["--session", "--session-id", "--thinking", "--to"]

    var index = 0
    while index < tokens.count {
        let token = tokens[index]
        index += 1

        // Split "--flag=value" into the flag and its inline value.
        var flag = token
        var value: String?
        if token.hasPrefix("--"), let equals = token.firstIndex(of: "=") {
            flag = String(token[..<equals])
            value = String(token[token.index(after: equals)...])
        }
        let hasInlineValue = value != nil

        // Otherwise take the next token as the value, unless it is another option.
        if valueFlags.contains(flag), !hasInlineValue,
           index < tokens.count, !tokens[index].hasPrefix("--")
        {
            value = tokens[index]
            index += 1
        }

        switch flag {
        case "--session", "--session-id":
            if let value = value, !value.isEmpty { options.session = value }
        case "--thinking":
            if let value = value, !value.isEmpty { options.thinking = value }
        case "--to":
            if let value = value, !value.isEmpty { options.to = value }
        case "--deliver" where !hasInlineValue:
            options.deliver = true
        case "--no-deliver" where !hasInlineValue:
            options.deliver = false
        default:
            // Unknown tokens (e.g. the executable name or other arguments) are skipped.
            break
        }
    }
    return options
}
#if DEBUG
/// Debug-only wrapper that exposes the private `parseCommandTemplate` and returns its result unchanged.
/// NOTE(review): the `_test` prefix suggests this exists for unit tests — confirm.
static func _testParseCommandTemplate(_ template: String) -> ForwardOptions {
self.parseCommandTemplate(template)
}
#endif
}