Files
clawdbot/apps/macos/Sources/Clawdis/ScreenRecordService.swift
2025-12-19 22:09:38 +01:00

267 lines
9.4 KiB
Swift

import AVFoundation
import Foundation
import OSLog
@preconcurrency import ScreenCaptureKit
/// Records one display (optionally with system audio) to an MP4 file via ScreenCaptureKit.
///
/// The service itself is main-actor isolated; sample buffers are handled by a
/// `StreamRecorder` on that recorder's own dispatch queue.
@MainActor
final class ScreenRecordService {
    /// Failures surfaced by `record(...)`.
    enum ScreenRecordError: LocalizedError {
        /// `SCShareableContent` reported no displays.
        case noDisplays
        /// The requested index is outside the sorted display list.
        case invalidScreenIndex(Int)
        /// Capture ran but no video frame was written.
        case noFramesCaptured
        /// The asset writer (or the stream) failed; the payload is the message.
        case writeFailed(String)

        var errorDescription: String? {
            switch self {
            case .noDisplays:
                "No displays available for screen recording"
            case let .invalidScreenIndex(idx):
                "Invalid screen index \(idx)"
            case .noFramesCaptured:
                "No frames captured"
            case let .writeFailed(msg):
                msg
            }
        }
    }

    private let logger = Logger(subsystem: "com.steipete.clawdis", category: "screenRecord")

    /// Captures a display for a fixed duration and writes it to an MP4 file.
    ///
    /// - Parameters:
    ///   - screenIndex: Index into the displays sorted by `displayID`; defaults to `0`.
    ///   - durationMs: Recording length in milliseconds; defaults to 10000 and is clamped to 250...60000.
    ///   - fps: Target frame rate; defaults to 10 and is clamped to 1...60.
    ///   - includeAudio: Whether to also capture audio; defaults to `false`.
    ///   - outPath: Destination file path. When `nil` or blank, a unique file in the
    ///     temporary directory is used. Any existing file at the destination is removed first.
    /// - Returns: The output path and whether an audio track was attached to the writer.
    /// - Throws: `ScreenRecordError` for missing displays, a bad index, no frames, or writer
    ///   failures; also rethrows ScreenCaptureKit errors and `CancellationError` from the sleep.
    ///   On any failure after capture has started, the partial output file is removed.
    func record(
        screenIndex: Int?,
        durationMs: Int?,
        fps: Double?,
        includeAudio: Bool?,
        outPath: String?) async throws -> (path: String, hasAudio: Bool)
    {
        let durationMs = Self.clampDurationMs(durationMs)
        let fps = Self.clampFps(fps)
        let includeAudio = includeAudio ?? false

        let outURL: URL = {
            if let outPath, !outPath.trimmingCharacters(in: .whitespacesAndNewlines).isEmpty {
                return URL(fileURLWithPath: outPath)
            }
            return FileManager.default.temporaryDirectory
                .appendingPathComponent("clawdis-screen-record-\(UUID().uuidString).mp4")
        }()
        // Best-effort: a stale file at the destination is removed up front.
        try? FileManager.default.removeItem(at: outURL)

        let content = try await SCShareableContent.current
        // Sort by displayID so that `screenIndex` refers to a stable ordering.
        let displays = content.displays.sorted { $0.displayID < $1.displayID }
        guard !displays.isEmpty else { throw ScreenRecordError.noDisplays }

        let idx = screenIndex ?? 0
        guard idx >= 0, idx < displays.count else { throw ScreenRecordError.invalidScreenIndex(idx) }
        let display = displays[idx]

        let filter = SCContentFilter(display: display, excludingWindows: [])
        let config = SCStreamConfiguration()
        config.width = display.width
        config.height = display.height
        config.queueDepth = 8
        config.showsCursor = true
        // One frame every 1/fps seconds; fps is already clamped to 1...60.
        config.minimumFrameInterval = CMTime(value: 1, timescale: CMTimeScale(max(1, Int32(fps.rounded()))))
        if includeAudio {
            config.capturesAudio = true
        }

        let recorder = try StreamRecorder(
            outputURL: outURL,
            width: display.width,
            height: display.height,
            includeAudio: includeAudio,
            logger: self.logger)

        let stream = SCStream(filter: filter, configuration: config, delegate: recorder)
        try stream.addStreamOutput(recorder, type: .screen, sampleHandlerQueue: recorder.queue)
        if includeAudio {
            try stream.addStreamOutput(recorder, type: .audio, sampleHandlerQueue: recorder.queue)
        }

        self.logger.info(
            "screen record start idx=\(idx) durationMs=\(durationMs) fps=\(fps) out=\(outURL.path, privacy: .public)")

        // Nothing has been written yet if this throws, so no cleanup is needed.
        try await stream.startCapture()

        do {
            try await Task.sleep(nanoseconds: UInt64(durationMs) * 1_000_000)
        } catch {
            // Typically cancellation: stop the stream, then close and discard the partial file.
            try? await stream.stopCapture()
            await self.discardRecording(recorder, at: outURL)
            throw error
        }

        do {
            try await stream.stopCapture()
        } catch {
            // The stop attempt already failed; do not retry it, only clean up.
            await self.discardRecording(recorder, at: outURL)
            throw error
        }

        do {
            try await recorder.finish()
        } catch {
            // The recorder has already reported its outcome; only the unusable file remains.
            try? FileManager.default.removeItem(at: outURL)
            throw error
        }

        return (path: outURL.path, hasAudio: recorder.hasAudio)
    }

    /// Best-effort cleanup for a recording that failed after capture started:
    /// asks the recorder to close its writer, then removes whatever was written.
    private func discardRecording(_ recorder: StreamRecorder, at url: URL) async {
        try? await recorder.finish()
        try? FileManager.default.removeItem(at: url)
    }

    /// Applies the default (10000 ms) and clamps the duration to 250...60000 ms.
    private nonisolated static func clampDurationMs(_ ms: Int?) -> Int {
        let v = ms ?? 10000
        return min(60000, max(250, v))
    }

    /// Applies the default (10 fps), replaces non-finite values with 10, and clamps to 1...60.
    private nonisolated static func clampFps(_ fps: Double?) -> Double {
        let v = fps ?? 10
        if !v.isFinite { return 10 }
        return min(60, max(1, v))
    }
}
/// Receives ScreenCaptureKit sample buffers and writes them to an MP4 via `AVAssetWriter`.
///
/// All mutable state is touched only on `queue`: sample callbacks are delivered there
/// (the owner passes `queue` as the `sampleHandlerQueue`), and the delegate callback and
/// `finish()` hop onto it explicitly. That confinement is what the `@unchecked Sendable`
/// conformance relies on.
private final class StreamRecorder: NSObject, SCStreamOutput, SCStreamDelegate, @unchecked Sendable {
    /// Serial queue on which samples are handled and writer state is mutated.
    let queue = DispatchQueue(label: "com.steipete.clawdis.screenRecord.writer")

    private let logger: Logger
    private let writer: AVAssetWriter
    private let input: AVAssetWriterInput
    private let audioInput: AVAssetWriterInput?
    /// `true` when an audio input was successfully attached to the writer.
    let hasAudio: Bool

    /// The writer session has been started (on the first complete video frame).
    private var started = false
    /// At least one video frame was successfully appended.
    private var sawFrame = false
    /// The writer has been finalized or cancelled; further samples are ignored.
    private var didFinish = false
    /// First stream/writer failure; once set, samples are dropped and `finish()` throws.
    private var pendingErrorMessage: String?

    /// Creates the asset writer with an H.264 video input and, optionally, an AAC audio input.
    ///
    /// - Throws: Errors from `AVAssetWriter(outputURL:fileType:)`, or `writeFailed` when the
    ///   video input cannot be added. A rejected audio input is not an error; `hasAudio`
    ///   is simply `false`.
    init(outputURL: URL, width: Int, height: Int, includeAudio: Bool, logger: Logger) throws {
        let writer = try AVAssetWriter(outputURL: outputURL, fileType: .mp4)

        let videoSettings: [String: Any] = [
            AVVideoCodecKey: AVVideoCodecType.h264,
            AVVideoWidthKey: width,
            AVVideoHeightKey: height,
        ]
        let videoInput = AVAssetWriterInput(mediaType: .video, outputSettings: videoSettings)
        videoInput.expectsMediaDataInRealTime = true
        guard writer.canAdd(videoInput) else {
            throw ScreenRecordService.ScreenRecordError.writeFailed("Cannot add video input")
        }
        writer.add(videoInput)

        var attachedAudio: AVAssetWriterInput?
        if includeAudio {
            let audioSettings: [String: Any] = [
                AVFormatIDKey: kAudioFormatMPEG4AAC,
                AVNumberOfChannelsKey: 1,
                AVSampleRateKey: 44100,
                AVEncoderBitRateKey: 96000,
            ]
            let candidate = AVAssetWriterInput(mediaType: .audio, outputSettings: audioSettings)
            candidate.expectsMediaDataInRealTime = true
            if writer.canAdd(candidate) {
                writer.add(candidate)
                attachedAudio = candidate
            }
        }

        self.logger = logger
        self.writer = writer
        self.input = videoInput
        self.audioInput = attachedAudio
        self.hasAudio = attachedAudio != nil
        super.init()
    }

    // MARK: - SCStreamDelegate

    /// Records the stream failure so later samples are dropped and `finish()` reports it.
    func stream(_ stream: SCStream, didStopWithError error: any Error) {
        self.queue.async {
            let msg = String(describing: error)
            self.pendingErrorMessage = msg
            self.logger.error("screen record stream stopped with error: \(msg, privacy: .public)")
        }
    }

    // MARK: - SCStreamOutput

    /// Routes each ready sample buffer to the video or audio handler.
    func stream(
        _ stream: SCStream,
        didOutputSampleBuffer sampleBuffer: CMSampleBuffer,
        of type: SCStreamOutputType)
    {
        guard CMSampleBufferDataIsReady(sampleBuffer) else { return }
        // Callback runs on `sampleHandlerQueue` (`self.queue`).
        switch type {
        case .screen:
            self.handleVideo(sampleBuffer: sampleBuffer)
        case .audio:
            self.handleAudio(sampleBuffer: sampleBuffer)
        case .microphone:
            break
        @unknown default:
            break
        }
    }

    // MARK: - Sample handling (runs on `queue`)

    /// Returns `true` only for screen buffers whose frame status is `.complete` and that
    /// carry an image buffer. ScreenCaptureKit also delivers idle/blank/suspended buffers
    /// without pixel data, which must not be handed to the video input.
    private static func isCompleteFrame(_ sampleBuffer: CMSampleBuffer) -> Bool {
        guard
            let attachments = CMSampleBufferGetSampleAttachmentsArray(sampleBuffer, createIfNecessary: false)
                as? [[SCStreamFrameInfo: Any]],
            let rawStatus = attachments.first?[.status] as? Int,
            let status = SCFrameStatus(rawValue: rawStatus),
            status == .complete
        else { return false }
        return CMSampleBufferGetImageBuffer(sampleBuffer) != nil
    }

    /// Starts the writer session on the first complete frame and appends video samples.
    private func handleVideo(sampleBuffer: CMSampleBuffer) {
        if let msg = self.pendingErrorMessage {
            self.logger.error("screen record aborting due to prior error: \(msg, privacy: .public)")
            return
        }
        if self.didFinish { return }
        // Skip frames without new content so the session starts on, and only contains, real frames.
        guard Self.isCompleteFrame(sampleBuffer) else { return }

        if !self.started {
            guard self.writer.startWriting() else {
                self.pendingErrorMessage = self.writer.error?.localizedDescription ?? "Failed to start writer"
                return
            }
            // Anchor the session at the first frame's timestamp.
            let pts = CMSampleBufferGetPresentationTimeStamp(sampleBuffer)
            self.writer.startSession(atSourceTime: pts)
            self.started = true
        }

        // Real-time capture: drop the frame rather than wait for the input.
        guard self.input.isReadyForMoreMediaData else { return }
        if self.input.append(sampleBuffer) {
            self.sawFrame = true
        } else {
            let msg = self.writer.error?.localizedDescription ?? "Failed to append video frame"
            self.pendingErrorMessage = msg
            self.logger.error("screen record video append failed: \(msg, privacy: .public)")
        }
    }

    /// Appends audio samples once the video-driven session has started.
    private func handleAudio(sampleBuffer: CMSampleBuffer) {
        guard let audioInput else { return }
        if let msg = self.pendingErrorMessage {
            self.logger.error("screen record audio aborting due to prior error: \(msg, privacy: .public)")
            return
        }
        // Audio arriving before the first video frame is dropped; the session is not open yet.
        if self.didFinish || !self.started { return }
        guard audioInput.isReadyForMoreMediaData else { return }
        if !audioInput.append(sampleBuffer) {
            let msg = self.writer.error?.localizedDescription ?? "Failed to append audio sample"
            self.pendingErrorMessage = msg
            self.logger.error("screen record audio append failed: \(msg, privacy: .public)")
        }
    }

    /// Stops accepting samples and cancels the writer if it is still writing, so a failed
    /// recording does not leave an open writer behind. Per the AVAssetWriter documentation,
    /// cancelling also discards the partially written output file.
    private func abandonWriter() {
        self.didFinish = true
        if self.writer.status == .writing {
            self.writer.cancelWriting()
        }
    }

    // MARK: - Finalization

    /// Finalizes the output file.
    ///
    /// - Throws: `writeFailed` if the stream or writer reported an error (or finalization
    ///   did not complete), `noFramesCaptured` if no video frame was ever appended.
    ///   Calling this again after a successful first call returns without doing more work.
    func finish() async throws {
        try await withCheckedThrowingContinuation { (cont: CheckedContinuation<Void, Error>) in
            self.queue.async {
                if let msg = self.pendingErrorMessage {
                    self.abandonWriter()
                    cont.resume(throwing: ScreenRecordService.ScreenRecordError.writeFailed(msg))
                    return
                }
                guard self.started, self.sawFrame else {
                    self.abandonWriter()
                    cont.resume(throwing: ScreenRecordService.ScreenRecordError.noFramesCaptured)
                    return
                }
                if self.didFinish {
                    cont.resume()
                    return
                }

                self.didFinish = true
                self.input.markAsFinished()
                self.audioInput?.markAsFinished()
                self.writer.finishWriting {
                    if let err = self.writer.error {
                        cont.resume(
                            throwing: ScreenRecordService.ScreenRecordError.writeFailed(err.localizedDescription))
                    } else if self.writer.status != .completed {
                        cont.resume(
                            throwing: ScreenRecordService.ScreenRecordError.writeFailed("Failed to finalize video"))
                    } else {
                        cont.resume()
                    }
                }
            }
        }
    }
}