// Created April 9, 2021 10:00
import AVFoundation
import RxCocoa
import RxSwift
/// Receives capture events from `CameraManager` through its weak `delegate` property.
protocol CameraManagerDelegate: AnyObject {
/// NOTE(review): no call site is visible in this file; presumably signals that recording began — confirm.
func didStartRecord()
/// Delivers a captured still image (on the simulator, `captureImage()` passes a generated placeholder).
func didCapturedImage(_ image: CapturedImage)
/// Delivers the image buffer of a video frame; called from `captureOutput(_:didOutput:from:)`.
func videoCapture(didCaptureVideoFrame pixelBuffer: CVPixelBuffer)
/// Errors thrown while selecting a camera or configuring the capture session.
enum CameraManagerError: Error {
/// Thrown by `setCamera(position:)` when `cameraDevice` is still nil after discovery.
case cameraDeviceNotAvailable
/// Thrown by `configureSession()` and `configureCamera()` when `cameraDevice` is nil.
case cameraDeviceNotSet
/// Thrown by `configureSession()` when the session cannot use the `.photo` preset.
case unableToSetPhotoSession
/// Thrown by `configureSession()` when the camera input cannot be added to the session.
case unableToAddCameraInput
/// Thrown by `configureSession()` when the video data output cannot be added to the session.
case unableToAddDataOutput
/// Thrown by `configureSession()` when the photo output cannot be added to the session.
case unableToAddPhotoOutput
/// Configuration value passed to `CameraManager.init(config:)`.
struct CameraConfig {
/// NOTE(review): not read anywhere in the visible code — confirm where this zoom factor is applied.
let defaultVideoZoom: CGFloat = 3
// swiftlint:disable:next type_body_length
final class CameraManager: NSObject {
/// Flash setting that cycles auto → off → on → auto; `.unavailable` is a fixed point.
enum FlashState {
    case auto, off, on, unavailable

    /// The state that follows this one in the cycle. `.unavailable` maps to itself.
    var toggled: FlashState {
        switch self {
        case .auto: return .off
        case .off: return .on
        case .on: return .auto
        case .unavailable: return .unavailable
        }
    }

    /// The matching AVFoundation flash mode, or `nil` for `.unavailable`.
    var mode: AVCaptureDevice.FlashMode? {
        switch self {
        case .auto: return .auto
        case .off: return .off
        case .on: return .on
        case .unavailable: return nil
        }
    }
}
/// Discrete zoom presets for the camera.
enum ZoomLevel {
    case normal
    case magnify

    /// Video zoom factor for this preset: 1.0 for `.normal`, 2.0 for `.magnify`.
    var level: CGFloat {
        return self == .magnify ? 2.0 : 1.0
    }
}
/// Configuration supplied at init.
let config: CameraConfig
/// Current flash setting; advanced by `toggleFlashSetting()` and read by `captureImage()`.
var flashState: FlashState = .off
/// Current zoom preset; flipped by `toggleZoom()` and applied by `configureCamera()`.
var zoomLevel: ZoomLevel = .magnify
/// NOTE(review): presumably mirrors the session's start/stop notifications via `observeSession()` — confirm.
let isCaptureSessionRunning: BehaviorRelay<Bool> = BehaviorRelay(value: false)
/// Emits (rotated `CIImage`, source image buffer) pairs from `captureOutput(_:didOutput:from:)`.
let videoImage: PublishRelay<(CIImage, CVImageBuffer)> = PublishRelay() // hot!
/// True while the observed camera's `torchMode` is `.on` or `.auto`; bound in `observeCamera()`.
let isTorchEnabled: BehaviorRelay<Bool> = BehaviorRelay(value: false)
/// Preview layer attached to the capture session; created on first access.
private(set) lazy var previewLayer = AVCaptureVideoPreviewLayer(session: session)
/// Camera position; written by `startSession(position:)` and read by `flipCamera()`.
var cameraPosition: AVCaptureDevice.Position = .back
/// Receiver of capture callbacks; held weakly.
weak var delegate: CameraManagerDelegate?
/// Queue used by `startRecording(async:)` / `stopRecording(async:)`; labelled with a random UUID.
private let sessionQueue = DispatchQueue(label: "\(UUID().uuidString)")
/// Queue on which the video data output delivers sample buffers (set in `configureSession()`).
private let dataOutputQueue = DispatchQueue(label: "\(UUID().uuidString)")
/// The capture session that all inputs and outputs are attached to.
private let session = AVCaptureSession()
/// Minimum interval, expressed as frames per second, used for throttling in `captureOutput(_:didOutput:from:)`.
public var fps = 240
/// Frame rate requested from the camera when `configureSession()` picks a device format.
public var desiredFrameRate = 240
/// Presentation timestamp of the last frame that passed the `fps` throttle.
var lastTimestamp = CMTime()
/// The currently selected capture device, or nil when none has been chosen.
/// NOTE(review): the `didSet` body is not visible in this view; presumably it re-runs `observeCamera()`
/// when the device changes — confirm.
private var cameraDevice: AVCaptureDevice? {
didSet {
if oldValue != cameraDevice {
/// Still-photo output with high-resolution capture enabled; created on first access.
private lazy var photoOutput: AVCapturePhotoOutput = {
let output = AVCapturePhotoOutput()
output.isHighResolutionCaptureEnabled = true
return output
/// Video frame output that discards late frames and delivers 32-bit BGRA pixel buffers.
private lazy var videoDataOutput: AVCaptureVideoDataOutput = {
let output = AVCaptureVideoDataOutput()
output.alwaysDiscardsLateVideoFrames = true
output.videoSettings = [kCVPixelBufferPixelFormatTypeKey as String: kCVPixelFormatType_32BGRA]
return output
/// When false, `captureOutput(_:didOutput:from:)` returns before processing the frame.
private var videoDataOutputEnabled = true
/// Holds the subscriptions created in `observeSession()`.
private let disposeBag = DisposeBag()
/// Holds the subscriptions tied to the current camera; replaced on every `observeCamera()` call.
private var cameraDisposeBag = DisposeBag()
/// NOTE(review): the body is not visible in this view; the private override presumably hides the
/// parameterless `NSObject` initializer from callers — confirm.
override private init() {
/// Creates a manager with the given configuration.
/// - Parameter config: Camera configuration; defaults to `CameraConfig()`.
/// NOTE(review): any further setup after storing `config` is not visible in this view.
init(config: CameraConfig = CameraConfig()) {
self.config = config
/// Looks up a built-in wide-angle video camera at `position` through a discovery session
/// and stores the result in `cameraDevice`.
/// - Parameter position: The camera position to search for.
/// - Throws: `CameraManagerError.cameraDeviceNotAvailable` when `cameraDevice` is nil afterwards.
func setCamera(position: AVCaptureDevice.Position) throws {
// NOTE(review): the end of this expression (how a device is picked from the session) is missing from this view.
cameraDevice = AVCaptureDevice.DiscoverySession(
deviceTypes: [.builtInWideAngleCamera],
mediaType: .video,
position: position
guard cameraDevice != nil else {
throw CameraManagerError.cameraDeviceNotAvailable
/// Switches between the back and front cameras, resetting zoom to `.magnify` and flash to `.off`.
///
/// NOTE(review): every `try?` below discards its error, so a failed flip is silent — consider surfacing it.
/// NOTE(review): the bodies of the `.unspecified` and `@unknown default` cases are not visible in this view.
func flipCamera() {
// Clearing the device lets `startSession(position:)` select a camera for the new position.
cameraDevice = nil
zoomLevel = .magnify
flashState = .off
/// This should do the flip here
switch cameraPosition {
case .back:
try? startSession(position: .front)
case .front:
try? startSession(position: .back)
case .unspecified:
@unknown default:
/// Reconfigure everything here
try? configureSession()
try? configureCamera()
startRecording(async: true)
/// Configures and starts the capture session.
/// Does not reconfigure the session if it is already configured, nor restart it if it is already running.
/// Create an AVCaptureVideoPreviewLayer to see the preview, or observe the video data output.
/// - Parameter position: Camera position to use; defaults to `.back`.
/// - Throws: Errors from `setCamera(position:)`, `configureSession()` and `configureCamera()`.
func startSession(position: AVCaptureDevice.Position = .back) throws {
// NOTE(review): the simulator branch and its `#else`/`#endif` are not visible in this view.
#if targetEnvironment(simulator)
guard session.isRunning == false else {
// Only pick a camera when none is selected yet.
if cameraDevice == nil {
try setCamera(position: position)
// The session counts as configured once it has at least one input and one output.
let sessionConfigured = !session.inputs.isEmpty && !session.outputs.isEmpty
if !sessionConfigured {
try configureSession()
try configureCamera()
startRecording(async: true)
} else {
// it just does not look good to have the preview "replaced"
// block until session is started
startRecording(async: false)
cameraPosition = position
/// Subscribes to capture-session notifications for this manager's `session`: start/stop events
/// drive `isCaptureSessionRunning`, and runtime errors and interruptions are logged as warnings.
///
/// NOTE(review): several expressions here are truncated in this view (the simulator branch, the
/// arguments to `Observable.merge`, and the notification sources of the last two chains), so the
/// exact wiring cannot be confirmed from here.
private func observeSession() {
#if targetEnvironment(simulator)
// Keep only notifications whose object is our own session.
let currentSessionStarted = NotificationCenter.default.rx.notification(.AVCaptureSessionDidStartRunning)
.map { $0.object as? AVCaptureSession }
.filter { [weak self] in self?.session == $0 }
let currentSessionStopped = NotificationCenter.default.rx.notification(.AVCaptureSessionDidStopRunning)
.map { $0.object as? AVCaptureSession }
.filter { [weak self] in self?.session == $0 }
// presumably started → true and stopped → false — confirm against the full source.
Observable.merge( { _ in true }, { _ in false })
.bind(to: isCaptureSessionRunning)
.disposed(by: disposeBag)
// Runtime errors: extract the error from the notification's userInfo and log it.
.filter { [weak self] in self?.session == $0.object as? AVCaptureSession }
.map { $0.userInfo?[AVCaptureSessionErrorKey] as? Error }
.subscribe(onNext: { error in
env.log.warning("AV Capture runtime error: \(error)")
.disposed(by: disposeBag)
// Interruptions: extract the interruption reason from userInfo and log it.
.filter { [weak self] in self?.session == $0.object as? AVCaptureSession }
.map { $0.userInfo?[AVCaptureSessionInterruptionReasonKey] as? AVCaptureSession.InterruptionReason }
.subscribe(onNext: { reason in
env.log.warning("AV Capture interrupted because: \(reason)")
.disposed(by: disposeBag)
/// Rebinds torch observation to the current camera.
///
/// Replacing `cameraDisposeBag` releases the subscription made for any previous device.
/// When there is no camera, nothing new is subscribed.
private func observeCamera() {
    cameraDisposeBag = DisposeBag()
    guard let device = cameraDevice else { return }

    // The torch counts as enabled for both `.on` and `.auto`.
    let torchEnabled = device.rx
        .observe(AVCaptureDevice.TorchMode.self, "torchMode")
        .map { mode in mode == .on || mode == .auto }

    torchEnabled
        .bind(to: isTorchEnabled)
        .disposed(by: cameraDisposeBag)
}
/// Rebuilds the capture session for the current `cameraDevice`: selects the preset, replaces the
/// camera input and the photo/video outputs, then looks for a device format that supports
/// `desiredFrameRate` at the active dimensions.
///
/// - Throws: `CameraManagerError.cameraDeviceNotSet` when no camera is selected,
///   `.unableToSetPhotoSession`, `.unableToAddCameraInput`, `.unableToAddDataOutput`,
///   `.unableToAddPhotoOutput` when the matching `can…` check fails, and any error from
///   `AVCaptureDeviceInput(device:)`.
///
/// NOTE(review): the calls that actually add the input/outputs, begin the configuration and
/// unlock the device are not visible in this view — confirm they exist in the full source.
private func configureSession() throws {
guard let camera = cameraDevice else {
throw CameraManagerError.cameraDeviceNotSet
// NOTE(review): this preset is overwritten by `.photo` a few lines below whenever `.photo` is supported.
session.sessionPreset = AVCaptureSession.Preset.hd1280x720
defer { session.commitConfiguration() }
if session.canSetSessionPreset(.photo) {
session.sessionPreset = .photo
} else {
throw CameraManagerError.unableToSetPhotoSession
// remove old camera input and output
session.inputs.compactMap { $0 as? AVCaptureDeviceInput }.forEach { self.session.removeInput($0) }
session.outputs.compactMap { $0 as? AVCapturePhotoOutput }.forEach { self.session.removeOutput($0) }
session.outputs.compactMap { $0 as? AVCaptureVideoDataOutput }.forEach { self.session.removeOutput($0) }
let input = try AVCaptureDeviceInput(device: camera)
if session.canAddInput(input) {
} else {
throw CameraManagerError.unableToAddCameraInput
if session.canAddOutput(videoDataOutput) {
// Sample buffers are delivered to this object on `dataOutputQueue`.
videoDataOutput.setSampleBufferDelegate(self, queue: dataOutputQueue)
} else {
throw CameraManagerError.unableToAddDataOutput
if session.canAddOutput(photoOutput) {
} else {
throw CameraManagerError.unableToAddPhotoOutput
// We want the buffers to be in portrait orientation otherwise they are
// rotated by 90 degrees. Need to set this _after_ addOutput()!
// NOTE(review): the next line is truncated in this view.
videoDataOutput.connection(with: = .portrait
// Based on code from
let activeDimensions = CMVideoFormatDescriptionGetDimensions(camera.activeFormat.formatDescription)
// Look for a format with the same dimensions as the active one whose first frame-rate range
// contains `desiredFrameRate`.
for vFormat in camera.formats {
let dimensions = CMVideoFormatDescriptionGetDimensions(vFormat.formatDescription)
let ranges = vFormat.videoSupportedFrameRateRanges as [AVFrameRateRange]
if let frameRate = ranges.first,
frameRate.maxFrameRate >= Float64(desiredFrameRate),
frameRate.minFrameRate <= Float64(desiredFrameRate),
activeDimensions.width == dimensions.width,
activeDimensions.height == dimensions.height,
// 875_704_422 is 0x34323066, the four-character code '420f'.
CMFormatDescriptionGetMediaSubType(vFormat.formatDescription) == 875_704_422
{ // meant for full range 420f
do {
try camera.lockForConfiguration()
camera.activeFormat = vFormat as AVCaptureDevice.Format
// Equal min and max frame durations pin the capture rate to `desiredFrameRate`.
camera.activeVideoMinFrameDuration = CMTimeMake(value: 1, timescale: Int32(desiredFrameRate))
camera.activeVideoMaxFrameDuration = CMTimeMake(value: 1, timescale: Int32(desiredFrameRate))
} catch {
print("Camera format:", camera.activeFormat)
/// Turns processing of incoming video frames on or off.
/// - Parameter isEnabled: When `false`, `captureOutput(_:didOutput:from:)` returns before doing any work.
func setVideoOutputEnabled(_ isEnabled: Bool) {
    self.videoDataOutputEnabled = isEnabled
}
/// Flips `zoomLevel` between `.normal` and `.magnify` and ramps the camera to the new factor.
///
/// `zoomLevel` is updated even when no camera is selected, so the stored preset is still
/// applied by `configureCamera()` later. The ramp only runs while the device lock is held,
/// and a failed lock is logged instead of being silently ignored.
func toggleZoom() {
    switch zoomLevel {
    case .normal:
        zoomLevel = .magnify
    case .magnify:
        zoomLevel = .normal
    }

    guard let device = cameraDevice else { return }
    do {
        try device.lockForConfiguration()
        // Always release the lock, matching the other configuration methods in this class.
        defer { device.unlockForConfiguration() }
        device.ramp(toVideoZoomFactor: zoomLevel.level, withRate: 2)
    } catch {
        env.log.warning("unable to lock the camera to toggle zoom: \(error.localizedDescription)")
    }
}
/// Applies the initial device settings to the current camera: zoom from `zoomLevel`, continuous
/// auto-focus and auto-exposure aimed at the frame centre, and a `.near` auto-focus range restriction.
/// Unsupported features and a failed device lock are logged as warnings.
///
/// - Throws: `CameraManagerError.cameraDeviceNotSet` when no camera is selected.
///
/// NOTE(review): the body of the `defer` block is not visible in this view (presumably it unlocks
/// the device — confirm).
private func configureCamera() throws {
guard let camera = cameraDevice else {
throw CameraManagerError.cameraDeviceNotSet
do {
try camera.lockForConfiguration()
defer {
camera.videoZoomFactor = zoomLevel.level
// (0.5, 0.5) is the centre of the point-of-interest coordinate space.
let focusPoint = CGPoint(x: 0.5, y: 0.5)
if camera.isFocusModeSupported(.continuousAutoFocus), camera.isFocusPointOfInterestSupported {
camera.focusPointOfInterest = focusPoint
camera.focusMode = .continuousAutoFocus
} else {
env.log.warning("focus mode not supported")
if camera.isExposureModeSupported(.continuousAutoExposure), camera.isExposurePointOfInterestSupported {
camera.exposurePointOfInterest = focusPoint
camera.exposureMode = .continuousAutoExposure
} else {
env.log.warning("exposure mode not supported")
if camera.isAutoFocusRangeRestrictionSupported {
camera.autoFocusRangeRestriction = .near
} else {
env.log.warning("range restirction not supported")
} catch {
env.log.warning("unable to lock the camera for initial configuration: \(error.localizedDescription)")
/// Dispatches work on `sessionQueue` when the session is running; returns immediately otherwise.
/// - Parameter async: `true` dispatches asynchronously; `false` (the default) blocks the caller
///   until the queued work has finished.
/// NOTE(review): the bodies of both dispatch closures are not visible in this view; presumably they
/// stop `curSession` — confirm. No caller of this method is visible in this file.
private func stopRecording(async: Bool = false) {
let curSession = session
guard curSession.isRunning else { return }
if async {
sessionQueue.async {
} else {
sessionQueue.sync {
/// Dispatches work on `sessionQueue` when the session is not yet running; returns immediately otherwise.
/// - Parameter async: `true` (the default) dispatches asynchronously; `false` blocks the caller
///   until the queued work has finished.
/// NOTE(review): the bodies of both dispatch closures are not visible in this view; presumably they
/// start `curSession` — confirm.
private func startRecording(async: Bool = true) {
let curSession = session
guard curSession.isRunning == false else { return }
if async {
sessionQueue.async {
} else {
sessionQueue.sync {
/// Aims focus and exposure at the centre of the frame, i.e. the point (0.5, 0.5).
func focusAtCenter() {
    focus(at: CGPoint(x: 0.5, y: 0.5))
}
/// Points continuous auto-focus and continuous auto-exposure at `focusPoint`.
///
/// Does nothing when no camera is selected or the session is not running.
/// Unsupported modes and a failed device lock are logged as warnings, never thrown.
/// - Parameter focusPoint: Point of interest, handed to the device unchanged.
func focus(at focusPoint: CGPoint) {
    guard let device = cameraDevice, session.isRunning else { return }

    do {
        try device.lockForConfiguration()
    } catch {
        env.log.warning("unable to lock the camera to set focus: \(error.localizedDescription)")
        return
    }
    // From here on the lock is held; release it on every exit.
    defer { device.unlockForConfiguration() }

    let canFocus = device.isFocusModeSupported(.continuousAutoFocus)
        && device.isFocusPointOfInterestSupported
    if canFocus {
        device.focusPointOfInterest = focusPoint
        device.focusMode = .continuousAutoFocus
    } else {
        env.log.warning("focus mode not supported")
    }

    let canExpose = device.isExposureModeSupported(.continuousAutoExposure)
        && device.isExposurePointOfInterestSupported
    if canExpose {
        device.exposurePointOfInterest = focusPoint
        device.exposureMode = .continuousAutoExposure
    } else {
        env.log.warning("exposure mode not supported")
    }
}
/// Captures a still JPEG photo through `photoOutput`; the result arrives in
/// `photoOutput(_:didFinishProcessingPhoto:error:)`. On the simulator a generated placeholder image
/// is handed to the delegate instead.
///
/// NOTE(review): the `guard`/`return` lines and the `#else`/`#endif` of the simulator branch are
/// not visible in this view, nor is the end of the settings dictionary literal.
func captureImage() {
guard delegate != nil else {
env.log.warning("delegate not set")
// check if simulator
#if targetEnvironment(simulator)
delegate?.didCapturedImage(CapturedImage(image: createImage(), metadata: ImageMetadata()))
// Use the first codec the photo output reports for the JPEG file type.
let format = photoOutput.supportedPhotoCodecTypes(for: .jpg).first
else {
env.log.error("JPEG not supported")
let settings = AVCapturePhotoSettings(format: [
AVVideoCodecKey: format,
// NOTE(review): a quality of 8 looks out of range if this key expects 0.0–1.0 — confirm the intended value.
AVVideoCompressionPropertiesKey: [AVVideoQualityKey: 8],
settings.isAutoStillImageStabilizationEnabled = photoOutput.isStillImageStabilizationSupported
settings.isHighResolutionPhotoEnabled = true
// `.on` deliberately maps to flash `.off` here; `toggleFlashSetting()` turns the torch on for `.on` instead.
switch flashState {
case .off, .on, .unavailable:
settings.flashMode = .off
case .auto:
settings.flashMode = .auto
photoOutput.capturePhoto(with: settings, delegate: self)
/// Advances `flashState` to its next value and mirrors the new state onto the torch.
///
/// The torch is switched on (level 1) only for `.on`; every other state turns it off.
/// `flashState` still advances when the camera has no torch, but the hardware is left untouched.
/// Lock or torch failures are logged, in the same style as `toggleTorch()` and `setTorchActive(_:)`.
func toggleFlashSetting() {
    flashState = flashState.toggled

    guard let device = cameraDevice, device.isTorchAvailable else { return }
    do {
        // Torch changes require the configuration lock; skip them entirely if it cannot be taken.
        try device.lockForConfiguration()
        defer { device.unlockForConfiguration() }
        if case .on = flashState {
            try device.setTorchModeOn(level: 1)
        } else {
            device.torchMode = .off
        }
    } catch {
        env.log.error("unable to update torch for flash setting: \(error.localizedDescription)")
    }
}
/// Switches the torch off when it is currently active, otherwise switches it on at level 1.
/// A failed device lock or torch change is logged as an error.
///
/// NOTE(review): the `guard` keyword, any further guard conditions and the early `return` are not
/// visible in this view.
func toggleTorch() {
let device = cameraDevice,
else {
// Read the state before locking so the branch below reflects the pre-toggle state.
let isActive = device.isTorchActive
do {
try device.lockForConfiguration()
defer { device.unlockForConfiguration() }
if isActive {
device.torchMode = .off
} else {
try device.setTorchModeOn(level: 1)
} catch {
env.log.error("unable to toggle torch: \(error.localizedDescription)")
/// Sets the torch to the requested state: off for `false`, on at level 1 for `true`.
/// A failed device lock or torch change is logged as an error.
/// - Parameter isActive: The desired torch state.
///
/// NOTE(review): the `guard` keyword and the early `return` are not visible in this view; the
/// visible conditions suggest the method exits early when there is no camera or the torch is
/// already in the requested state — confirm.
func setTorchActive(_ isActive: Bool) {
let device = cameraDevice,
device.isTorchActive != isActive
else {
do {
try device.lockForConfiguration()
defer { device.unlockForConfiguration() }
if !isActive {
device.torchMode = .off
} else {
try device.setTorchModeOn(level: 1)
} catch {
env.log.error("unable to activate torch: \(error.localizedDescription)")
/// Sets the camera's video zoom factor directly (no ramp).
/// A failed device lock is logged as an error.
/// - Parameter zoomFactor: The zoom factor to apply.
///
/// NOTE(review): the `guard` keywords and early `return`s are not visible in this view; the visible
/// conditions suggest an early exit when there is no camera or the factor is unchanged, and a
/// logged rejection when the factor is outside the device's min/max available range — confirm.
func setZoom(_ zoomFactor: CGFloat) {
let device = cameraDevice,
device.videoZoomFactor != zoomFactor
else {
zoomFactor <= device.maxAvailableVideoZoomFactor,
zoomFactor >= device.minAvailableVideoZoomFactor
else {
env.log.warning("not supported zoom factor: \(zoomFactor)")
do {
try device.lockForConfiguration()
defer { device.unlockForConfiguration() }
device.videoZoomFactor = zoomFactor
} catch {
env.log.error("unable to set zoom: \(error.localizedDescription)")
private extension CapturedImage {
    /// Builds a captured image from a processed photo.
    ///
    /// Fails (returns `nil`) when the photo has no CGImage representation or the copy fails.
    /// The image is copied; the metadata is taken from the photo as-is.
    init?(photo: AVCapturePhoto) {
        guard let copiedImage = photo.cgImageRepresentation()?.takeUnretainedValue().copy() else {
            return nil
        }
        self.image = copiedImage
        self.metadata = photo.metadata
    }
}
// MARK: - AVCapturePhotoCaptureDelegate

extension CameraManager: AVCapturePhotoCaptureDelegate {
/// Handles a finished photo capture: converts the photo to a `CapturedImage`, then orients and
/// centre-squares it. Conversion and normalisation failures are logged as errors.
/// Returns immediately when no delegate is set.
///
/// NOTE(review): the second `guard` keyword, the error-logging line, the early `return` and the
/// call that hands the normalised image to `delegate` are not visible in this view.
func photoOutput(_: AVCapturePhotoOutput, didFinishProcessingPhoto photo: AVCapturePhoto, error: Error?) {
guard let delegate = delegate else { return }
error == nil,
let image = CapturedImage(photo: photo)
else {
if let error = error {
} else {
env.log.error("Unable to process captured image")
do {
let normalizedImage = try image.oriented().centerSquared()
env.log.debug("captured \(normalizedImage)")
} catch {
env.log.error("Unable to normalize captured image")
// MARK: - AVCaptureVideoDataOutputSampleBufferDelegate

extension CameraManager: AVCaptureVideoDataOutputSampleBufferDelegate {
/// Processes one video frame: wraps the image buffer in a `CIImage`, rotates it for portrait,
/// and forwards the frame once at least 1/`fps` seconds have passed since the last forwarded frame.
/// Frames are ignored entirely while `videoDataOutputEnabled` is false.
///
/// NOTE(review): the `guard` keyword and early `return` around the buffer extraction are not
/// visible in this view, and it cannot be told from here whether `videoImage.accept` sits inside
/// the throttling `if` or after it.
func captureOutput(_: AVCaptureOutput, didOutput sampleBuffer: CMSampleBuffer, from _: AVCaptureConnection) {
guard videoDataOutputEnabled else { return }
let formatDesc = CMSampleBufferGetFormatDescription(sampleBuffer),
let imageBuffer = CMSampleBufferGetImageBuffer(sampleBuffer)
else {
env.log.error("unable to get video data image buffer")
let srcImage = CIImage(cvImageBuffer: imageBuffer)
// rotate to have portrait video
let videoDimension = CMVideoFormatDescriptionGetDimensions(formatDesc)
let videoWidth = CGFloat(videoDimension.width)
// Rotate by -90° and translate by the video width.
let transform = CGAffineTransform(rotationAngle: -.pi / 2).translatedBy(x: -videoWidth, y: 0)
let transformedImage = srcImage.transformed(by: transform)
// videoImage.accept(transformedImage)
// Because lowering the capture device's FPS looks ugly in the preview,
// we capture at full speed but only call the delegate at its desired
// framerate.
let timestamp = CMSampleBufferGetPresentationTimeStamp(sampleBuffer)
let deltaTime = timestamp - lastTimestamp
if deltaTime >= CMTimeMake(value: 1, timescale: Int32(fps)) {
lastTimestamp = timestamp
delegate?.videoCapture(didCaptureVideoFrame: imageBuffer)
videoImage.accept((transformedImage, imageBuffer))
/// Logs, at verbose level, that the video data output dropped a frame.
func captureOutput(_: AVCaptureOutput, didDrop _: CMSampleBuffer, from _: AVCaptureConnection) {
env.log.verbose("didDrop video data frame")
/// Builds an 800×800 image filled with a random colour; `captureImage()` uses it as the
/// placeholder capture on the simulator.
///
/// Traps with `fatalError` if the generated image has no backing `CGImage`.
private func createImage() -> CGImage {
    let placeholder = UIImage.withColor(UIColor.random(), size: CGSize(width: 800, height: 800))
    guard let rendered = placeholder.cgImage else {
        fatalError("unable to create CGImage for simuator image")
    }
    return rendered
}
extension UIColor {
    /// Returns a fully opaque colour with a random hue in 0...1 and with saturation and
    /// brightness each drawn from 0.5...1.
    static func random() -> UIColor {
        let hue = CGFloat.random(in: 0 ... 1)
        let saturation = CGFloat.random(in: 0.5 ... 1)
        let brightness = CGFloat.random(in: 0.5 ... 1)
        return UIColor(hue: hue, saturation: saturation, brightness: brightness, alpha: 1)
    }
}
