obs-studio/plugins/mac-videotoolbox/encoder.c

#include <obs-module.h>
#include <util/darray.h>
#include <util/platform.h>
#include <obs-avc.h>

#include <CoreFoundation/CoreFoundation.h>
#include <VideoToolbox/VideoToolbox.h>
#include <VideoToolbox/VTVideoEncoderList.h>
#include <CoreMedia/CoreMedia.h>

#include <util/apple/cfstring-utils.h>

#include <assert.h>

#define VT_LOG(level, format, ...) \
	blog(level, "[VideoToolbox encoder]: " format, ##__VA_ARGS__)
#define VT_LOG_ENCODER(encoder, codec_type, level, format, ...) \
	blog(level, "[VideoToolbox %s: '%s']: " format,         \
	     obs_encoder_get_name(encoder),                     \
	     codec_type_to_print_fmt(codec_type), ##__VA_ARGS__)
#define VT_BLOG(level, format, ...)                                  \
	VT_LOG_ENCODER(enc->encoder, enc->codec_type, level, format, \
		       ##__VA_ARGS__)

struct vt_encoder_type_data {
	const char *disp_name;
	const char *id;
	CMVideoCodecType codec_type;
	bool hardware_accelerated;
};

struct vt_prores_encoder_data {
	FourCharCode codec_type;
	CFStringRef encoder_id;
};
static DARRAY(struct vt_prores_encoder_data) vt_prores_hardware_encoder_list;
static DARRAY(struct vt_prores_encoder_data) vt_prores_software_encoder_list;

#ifdef __aarch64__
bool is_apple_silicon = true;
#else
bool is_apple_silicon = false;
#endif

struct vt_encoder {
	obs_encoder_t *encoder;

	const char *vt_encoder_id;
	uint32_t width;
	uint32_t height;
	uint32_t keyint;
	uint32_t fps_num;
	uint32_t fps_den;
	const char *rate_control;
	uint32_t bitrate;
	float quality;
	bool limit_bitrate;
	uint32_t rc_max_bitrate;
	double rc_max_bitrate_window;
	const char *profile;
	CMVideoCodecType codec_type;
	bool bframes;

	int vt_pix_fmt;
	enum video_colorspace colorspace;

	VTCompressionSessionRef session;
	CMSimpleQueueRef queue;
	bool hw_enc;
	DARRAY(uint8_t) packet_data;
	DARRAY(uint8_t) extra_data;
};

static const char *codec_type_to_print_fmt(CMVideoCodecType codec_type)
{
	switch (codec_type) {
	case kCMVideoCodecType_H264:
		return "h264";
	case kCMVideoCodecType_HEVC:
		return "hevc";
	case kCMVideoCodecType_AppleProRes4444XQ:
		return "ap4x";
	case kCMVideoCodecType_AppleProRes4444:
		return "ap4h";
	case kCMVideoCodecType_AppleProRes422Proxy:
		return "apco";
	case kCMVideoCodecType_AppleProRes422LT:
		return "apcs";
	case kCMVideoCodecType_AppleProRes422:
		return "apcn";
	case kCMVideoCodecType_AppleProRes422HQ:
		return "apch";
	default:
		return "";
	}
}

static void log_osstatus(int log_level, struct vt_encoder *enc,
			 const char *context, OSStatus code)
{
	char *c_str = NULL;
	CFErrorRef err = CFErrorCreate(kCFAllocatorDefault,
				       kCFErrorDomainOSStatus, code, NULL);
	CFStringRef str = CFErrorCopyDescription(err);

	c_str = cfstr_copy_cstr(str, kCFStringEncodingUTF8);
	if (c_str) {
		if (enc)
			VT_BLOG(log_level, "Error in %s: %s", context, c_str);
		else
			VT_LOG(log_level, "Error in %s: %s", context, c_str);
	}

	bfree(c_str);
	CFRelease(str);
	CFRelease(err);
}

static CFStringRef obs_to_vt_profile(CMVideoCodecType codec_type,
				     const char *profile,
				     enum video_format format)
{
	if (codec_type == kCMVideoCodecType_H264) {
		if (strcmp(profile, "baseline") == 0)
			return kVTProfileLevel_H264_Baseline_AutoLevel;
		else if (strcmp(profile, "main") == 0)
			return kVTProfileLevel_H264_Main_AutoLevel;
		else if (strcmp(profile, "high") == 0)
			return kVTProfileLevel_H264_High_AutoLevel;
		else
			return kVTProfileLevel_H264_Main_AutoLevel;
#ifdef ENABLE_HEVC
	} else if (codec_type == kCMVideoCodecType_HEVC) {
		if (strcmp(profile, "main") == 0) {
			if (format == VIDEO_FORMAT_P010) {
				VT_LOG(LOG_WARNING, "Forcing main10 for P010");
				return kVTProfileLevel_HEVC_Main10_AutoLevel;
			} else {
				return kVTProfileLevel_HEVC_Main_AutoLevel;
			}
		}
		if (strcmp(profile, "main10") == 0)
			return kVTProfileLevel_HEVC_Main10_AutoLevel;
#if __MAC_OS_X_VERSION_MAX_ALLOWED >= 120300 // macOS 12.3
		if (__builtin_available(macOS 12.3, *)) {
			if (strcmp(profile, "main42210") == 0)
				return kVTProfileLevel_HEVC_Main42210_AutoLevel;
		}
#endif // macOS 12.3
		return kVTProfileLevel_HEVC_Main_AutoLevel;
#else
		(void)format;
#endif // ENABLE_HEVC
	} else {
		return kVTProfileLevel_H264_Baseline_AutoLevel;
	}
}

static CFStringRef obs_to_vt_colorspace(enum video_colorspace cs)
{
	switch (cs) {
	case VIDEO_CS_601:
		return kCVImageBufferYCbCrMatrix_ITU_R_601_4;
	case VIDEO_CS_2100_PQ:
	case VIDEO_CS_2100_HLG:
		return kCVImageBufferYCbCrMatrix_ITU_R_2020;
	default:
		return kCVImageBufferYCbCrMatrix_ITU_R_709_2;
	}
}

static CFStringRef obs_to_vt_primaries(enum video_colorspace cs)
{
	switch (cs) {
	case VIDEO_CS_601:
		return kCVImageBufferColorPrimaries_SMPTE_C;
	case VIDEO_CS_2100_PQ:
	case VIDEO_CS_2100_HLG:
		return kCVImageBufferColorPrimaries_ITU_R_2020;
	default:
		return kCVImageBufferColorPrimaries_ITU_R_709_2;
	}
}

static CFStringRef obs_to_vt_transfer(enum video_colorspace cs)
{
	switch (cs) {
	case VIDEO_CS_SRGB:
		return kCVImageBufferTransferFunction_sRGB;
	case VIDEO_CS_2100_PQ:
		return kCVImageBufferTransferFunction_SMPTE_ST_2084_PQ;
	case VIDEO_CS_2100_HLG:
		return kCVImageBufferTransferFunction_ITU_R_2100_HLG;
	default:
		return kCVImageBufferTransferFunction_ITU_R_709_2;
	}
}

/* Adapted from Chromium GenerateMasteringDisplayColorVolume */
static CFDataRef obs_to_vt_masteringdisplay(uint32_t hdr_nominal_peak_level)
{
	struct mastering_display_colour_volume {
		uint16_t display_primaries[3][2];
		uint16_t white_point[2];
		uint32_t max_display_mastering_luminance;
		uint32_t min_display_mastering_luminance;
	};
	static_assert(sizeof(struct mastering_display_colour_volume) == 24,
		      "May need to adjust struct packing");

	struct mastering_display_colour_volume mdcv;
	mdcv.display_primaries[0][0] = __builtin_bswap16(13250);
	mdcv.display_primaries[0][1] = __builtin_bswap16(34500);
	mdcv.display_primaries[1][0] = __builtin_bswap16(7500);
	mdcv.display_primaries[1][1] = __builtin_bswap16(3000);
	mdcv.display_primaries[2][0] = __builtin_bswap16(34000);
	mdcv.display_primaries[2][1] = __builtin_bswap16(16000);
	mdcv.white_point[0] = __builtin_bswap16(15635);
	mdcv.white_point[1] = __builtin_bswap16(16450);
	mdcv.max_display_mastering_luminance =
		__builtin_bswap32(hdr_nominal_peak_level * 10000);
	mdcv.min_display_mastering_luminance = 0;

	UInt8 bytes[sizeof(struct mastering_display_colour_volume)];
	memcpy(bytes, &mdcv, sizeof(bytes));
	return CFDataCreate(kCFAllocatorDefault, bytes, sizeof(bytes));
}

/* Adapted from Chromium GenerateContentLightLevelInfo */
static CFDataRef
obs_to_vt_contentlightlevelinfo(uint16_t hdr_nominal_peak_level)
{
	struct content_light_level_info {
		uint16_t max_content_light_level;
		uint16_t max_pic_average_light_level;
	};
	static_assert(sizeof(struct content_light_level_info) == 4,
		      "May need to adjust struct packing");

	struct content_light_level_info clli;
	clli.max_content_light_level =
		__builtin_bswap16(hdr_nominal_peak_level);
	clli.max_pic_average_light_level =
		__builtin_bswap16(hdr_nominal_peak_level);

	UInt8 bytes[sizeof(struct content_light_level_info)];
	memcpy(bytes, &clli, sizeof(bytes));
	return CFDataCreate(kCFAllocatorDefault, bytes, sizeof(bytes));
}

static OSStatus session_set_prop_float(VTCompressionSessionRef session,
				       CFStringRef key, float val)
{
	CFNumberRef n = CFNumberCreate(NULL, kCFNumberFloat32Type, &val);
	OSStatus code = VTSessionSetProperty(session, key, n);
	CFRelease(n);

	return code;
}

static OSStatus session_set_prop_int(VTCompressionSessionRef session,
				     CFStringRef key, int32_t val)
{
	CFNumberRef n = CFNumberCreate(NULL, kCFNumberSInt32Type, &val);
	OSStatus code = VTSessionSetProperty(session, key, n);
	CFRelease(n);

	return code;
}

static OSStatus session_set_prop_str(VTCompressionSessionRef session,
				     CFStringRef key, char *val)
{
	CFStringRef s = CFStringCreateWithFileSystemRepresentation(NULL, val);
	OSStatus code = VTSessionSetProperty(session, key, s);
	CFRelease(s);

	return code;
}

static OSStatus session_set_prop(VTCompressionSessionRef session,
				 CFStringRef key, CFTypeRef val)
{
	return VTSessionSetProperty(session, key, val);
}

static OSStatus session_set_bitrate(VTCompressionSessionRef session,
				    const char *rate_control, int new_bitrate,
				    float quality, bool limit_bitrate,
				    int max_bitrate, double max_bitrate_window)
{
	OSStatus code;

	bool can_limit_bitrate;
	CFStringRef compressionPropertyKey;

	if (strcmp(rate_control, "CBR") == 0) {
		compressionPropertyKey =
			kVTCompressionPropertyKey_AverageBitRate;
		can_limit_bitrate = true;

		if (__builtin_available(macOS 13.0, *)) {
#if __MAC_OS_X_VERSION_MAX_ALLOWED >= 130000
			if (is_apple_silicon) {
				compressionPropertyKey =
					kVTCompressionPropertyKey_ConstantBitRate;
				can_limit_bitrate = false;
			} else {
				VT_LOG(LOG_WARNING,
				       "CBR support for VideoToolbox encoder requires Apple Silicon. "
				       "Will use ABR instead.");
			}
#else
			VT_LOG(LOG_WARNING,
			       "CBR support for VideoToolbox not available in this build of OBS. "
			       "Will use ABR instead.");
#endif
		} else {
			VT_LOG(LOG_WARNING,
			       "CBR support for VideoToolbox encoder requires macOS 13 or newer. "
			       "Will use ABR instead.");
		}
	} else if (strcmp(rate_control, "ABR") == 0) {
		compressionPropertyKey =
			kVTCompressionPropertyKey_AverageBitRate;
		can_limit_bitrate = true;
	} else if (strcmp(rate_control, "CRF") == 0) {
		if (is_apple_silicon) {
			compressionPropertyKey =
				kVTCompressionPropertyKey_Quality;
			code = session_set_prop_float(
				session, compressionPropertyKey, quality);
			if (code != noErr) {
				return code;
			}
		} else {
			VT_LOG(LOG_WARNING,
			       "CRF support for VideoToolbox encoder requires Apple Silicon. "
			       "Will use ABR instead.");
			compressionPropertyKey =
				kVTCompressionPropertyKey_AverageBitRate;
		}
		can_limit_bitrate = true;
	} else {
		VT_LOG(LOG_ERROR,
		       "Selected rate control method is not supported: %s",
		       rate_control);
		return kVTParameterErr;
	}

	if (compressionPropertyKey != kVTCompressionPropertyKey_Quality) {
		code = session_set_prop_int(session, compressionPropertyKey,
					    new_bitrate * 1000);
		if (code != noErr) {
			return code;
		}
	}

	if (limit_bitrate && can_limit_bitrate) {
		double cpb_size = max_bitrate * 125 * max_bitrate_window;

		CFNumberRef cf_cpb_size = CFNumberCreate(
			kCFAllocatorDefault, kCFNumberIntType, &cpb_size);
		CFNumberRef cf_cpb_window_size =
			CFNumberCreate(kCFAllocatorDefault, kCFNumberFloatType,
				       &max_bitrate_window);

		CFTypeRef values[2] = {cf_cpb_size, cf_cpb_window_size};

		CFArrayRef rate_control_data = CFArrayCreate(
			kCFAllocatorDefault, values, 2, &kCFTypeArrayCallBacks);

		code = session_set_prop(
			session, kVTCompressionPropertyKey_DataRateLimits,
			rate_control_data);

		CFRelease(cf_cpb_size);
		CFRelease(cf_cpb_window_size);
		CFRelease(rate_control_data);

		if (code == kVTPropertyNotSupportedErr) {
			log_osstatus(LOG_WARNING, NULL,
				     "setting DataRateLimits on session", code);
			return noErr;
		}
	}

	return noErr;
}

static OSStatus session_set_colorspace(VTCompressionSessionRef session,
				       enum video_colorspace cs)
{
	OSStatus code;

	CFTypeRef keys[5] = {kVTCompressionPropertyKey_ColorPrimaries,
			     kVTCompressionPropertyKey_TransferFunction,
			     kVTCompressionPropertyKey_YCbCrMatrix, NULL, NULL};

	CFTypeRef values[5] = {obs_to_vt_primaries(cs), obs_to_vt_transfer(cs),
			       obs_to_vt_colorspace(cs), NULL, NULL};

	CFDataRef masteringDisplayColorVolume = NULL;
	CFDataRef contentLightLevel = NULL;

	if (cs == VIDEO_CS_2100_PQ) {
		const uint16_t hdr_nominal_peak_level =
			(uint16_t)obs_get_video_hdr_nominal_peak_level();

		masteringDisplayColorVolume =
			obs_to_vt_masteringdisplay(hdr_nominal_peak_level);
		contentLightLevel =
			obs_to_vt_contentlightlevelinfo(hdr_nominal_peak_level);

		keys[3] = kVTCompressionPropertyKey_MasteringDisplayColorVolume;
		keys[4] = kVTCompressionPropertyKey_ContentLightLevelInfo;
		values[3] = masteringDisplayColorVolume;
		values[4] = contentLightLevel;
	} else if (cs == VIDEO_CS_2100_HLG) {
		masteringDisplayColorVolume = obs_to_vt_masteringdisplay(1000);
		contentLightLevel = obs_to_vt_contentlightlevelinfo(1000);

		keys[3] = kVTCompressionPropertyKey_MasteringDisplayColorVolume;
		keys[4] = kVTCompressionPropertyKey_ContentLightLevelInfo;
		values[3] = masteringDisplayColorVolume;
		values[4] = contentLightLevel;
	}

	CFDictionaryRef session_properties =
		CFDictionaryCreate(kCFAllocatorDefault, keys, values, 5,
				   &kCFTypeDictionaryKeyCallBacks,
				   &kCFTypeDictionaryValueCallBacks);

	code = VTSessionSetProperties(session, session_properties);

	CFRelease(session_properties);

	if (masteringDisplayColorVolume != NULL) {
		CFRelease(masteringDisplayColorVolume);
	}

	if (contentLightLevel != NULL) {
		CFRelease(contentLightLevel);
	}

	return code;
}

void sample_encoded_callback(void *data, void *source, OSStatus status,
			     VTEncodeInfoFlags info_flags,
			     CMSampleBufferRef buffer)
{

	if (status != noErr) {
		log_osstatus(LOG_ERROR, NULL, "encoder callback", status);
		return;
	}

	if (info_flags == kVTEncodeInfo_FrameDropped) {
		VT_LOG(LOG_INFO, "Frame dropped by encoder");
	}

	CMSimpleQueueRef queue = data;
	CVPixelBufferRef pixbuf = source;
	if (buffer != NULL) {
		CFRetain(buffer);
		CMSimpleQueueEnqueue(queue, buffer);
	}
	CFRelease(pixbuf);
}

static inline CFDictionaryRef create_encoder_spec(const char *vt_encoder_id)
{
	CFStringRef id =
		CFStringCreateWithFileSystemRepresentation(NULL, vt_encoder_id);

	CFTypeRef keys[1] = {kVTVideoEncoderSpecification_EncoderID};
	CFTypeRef values[1] = {id};

	CFDictionaryRef encoder_spec =
		CFDictionaryCreate(kCFAllocatorDefault, keys, values, 1,
				   &kCFTypeDictionaryKeyCallBacks,
				   &kCFTypeDictionaryValueCallBacks);

	CFRelease(id);

	return encoder_spec;
}

static inline CFDictionaryRef
create_prores_encoder_spec(CMVideoCodecType target_codec_type,
			   bool hardware_accelerated)
{
	CFStringRef encoder_id = NULL;

	size_t size = 0;
	struct vt_prores_encoder_data *encoder_list = NULL;
	if (hardware_accelerated) {
		size = vt_prores_hardware_encoder_list.num;
		encoder_list = vt_prores_hardware_encoder_list.array;
	} else {
		size = vt_prores_software_encoder_list.num;
		encoder_list = vt_prores_software_encoder_list.array;
	}

	for (size_t i = 0; i < size; ++i) {
		if (target_codec_type == encoder_list[i].codec_type) {
			encoder_id = encoder_list[i].encoder_id;
		}
	}

	CFTypeRef keys[1] = {kVTVideoEncoderSpecification_EncoderID};
	CFTypeRef values[1] = {encoder_id};

	CFDictionaryRef encoder_spec =
		CFDictionaryCreate(kCFAllocatorDefault, keys, values, 1,
				   &kCFTypeDictionaryKeyCallBacks,
				   &kCFTypeDictionaryValueCallBacks);

	return encoder_spec;
}

static inline CFDictionaryRef create_pixbuf_spec(struct vt_encoder *enc)
{
	CFNumberRef PixelFormat = CFNumberCreate(
		kCFAllocatorDefault, kCFNumberSInt32Type, &enc->vt_pix_fmt);
	CFNumberRef Width = CFNumberCreate(kCFAllocatorDefault,
					   kCFNumberSInt32Type, &enc->width);
	CFNumberRef Height = CFNumberCreate(kCFAllocatorDefault,
					    kCFNumberSInt32Type, &enc->height);

	CFTypeRef keys[3] = {kCVPixelBufferPixelFormatTypeKey,
			     kCVPixelBufferWidthKey, kCVPixelBufferHeightKey};
	CFTypeRef values[3] = {PixelFormat, Width, Height};

	CFDictionaryRef pixbuf_spec =
		CFDictionaryCreate(kCFAllocatorDefault, keys, values, 3,
				   &kCFTypeDictionaryKeyCallBacks,
				   &kCFTypeDictionaryValueCallBacks);

	CFRelease(PixelFormat);
	CFRelease(Width);
	CFRelease(Height);

	return pixbuf_spec;
}

static bool create_encoder(struct vt_encoder *enc)
{
	OSStatus code;

	VTCompressionSessionRef s;

	const char *codec_name = obs_encoder_get_codec(enc->encoder);

	CFDictionaryRef encoder_spec;
	if (strcmp(codec_name, "prores") == 0) {
		struct vt_encoder_type_data *type_data =
			(struct vt_encoder_type_data *)
				obs_encoder_get_type_data(enc->encoder);
		encoder_spec = create_prores_encoder_spec(
			enc->codec_type, type_data->hardware_accelerated);
	} else {
		encoder_spec = create_encoder_spec(enc->vt_encoder_id);
	}

	CFDictionaryRef pixbuf_spec = create_pixbuf_spec(enc);

	code = VTCompressionSessionCreate(kCFAllocatorDefault, enc->width,
					  enc->height, enc->codec_type,
					  encoder_spec, pixbuf_spec, NULL,
					  &sample_encoded_callback, enc->queue,
					  &s);

	if (code != noErr) {
		log_osstatus(LOG_ERROR, enc, "VTCompressionSessionCreate",
			     code);
	}

	CFRelease(encoder_spec);
	CFRelease(pixbuf_spec);

	CFBooleanRef b = NULL;
	code = VTSessionCopyProperty(
		s,
		kVTCompressionPropertyKey_UsingHardwareAcceleratedVideoEncoder,
		NULL, &b);

	if (code == noErr && (enc->hw_enc = CFBooleanGetValue(b)))
		VT_BLOG(LOG_INFO, "session created with hardware encoding");
	else
		enc->hw_enc = false;

	if (b != NULL)
		CFRelease(b);

	if (enc->codec_type == kCMVideoCodecType_H264 ||
	    enc->codec_type == kCMVideoCodecType_HEVC) {
		/* Apple's documentation states that a keyframe interval of 0 will result in
		 * the encoder automatically picking times to insert them; However, Apple's
		 * encoder, when in CRF mode, will never actually insert any keyframes past
		 * the very first one, rendering the files near-unusable in editors or
		 * video players. So to avoid that happening, enforce a reasonable default
		 * of 10 seconds in CRF mode. */
		if (enc->keyint == 0 && strcmp(enc->rate_control, "CRF") == 0) {
			VT_BLOG(LOG_INFO,
				"Enforcing non-zero keyframe interval in CRF mode");
			enc->keyint = 10;
		}

		// This can fail when using GPU hardware encoding
		code = session_set_prop_int(
			s,
			kVTCompressionPropertyKey_MaxKeyFrameIntervalDuration,
			enc->keyint);
		if (code != noErr)
			log_osstatus(
				LOG_WARNING, enc,
				"setting kVTCompressionPropertyKey_MaxKeyFrameIntervalDuration failed, "
				"keyframe interval might be incorrect",
				code);

		CFTypeRef session_keys[4] = {
			kVTCompressionPropertyKey_MaxKeyFrameInterval,
			kVTCompressionPropertyKey_ExpectedFrameRate,
			kVTCompressionPropertyKey_AllowFrameReordering,
			kVTCompressionPropertyKey_ProfileLevel};

		SInt32 key_frame_interval =
			(SInt32)(enc->keyint *
				 ((float)enc->fps_num / enc->fps_den));
		float expected_framerate = (float)enc->fps_num / enc->fps_den;
		CFNumberRef MaxKeyFrameInterval =
			CFNumberCreate(kCFAllocatorDefault, kCFNumberSInt32Type,
				       &key_frame_interval);
		CFNumberRef ExpectedFrameRate = CFNumberCreate(
			kCFAllocatorDefault, kCFNumberFloat32Type,
			&expected_framerate);
		CFTypeRef AllowFrameReordering = enc->bframes ? kCFBooleanTrue
							      : kCFBooleanFalse;

		video_t *video = obs_encoder_video(enc->encoder);
		const struct video_output_info *voi =
			video_output_get_info(video);
		CFTypeRef ProfileLevel = obs_to_vt_profile(
			enc->codec_type, enc->profile, voi->format);

		CFTypeRef session_values[4] = {MaxKeyFrameInterval,
					       ExpectedFrameRate,
					       AllowFrameReordering,
					       ProfileLevel};

		CFDictionaryRef session_properties = CFDictionaryCreate(
			kCFAllocatorDefault, session_keys, session_values, 4,
			&kCFTypeDictionaryKeyCallBacks,
			&kCFTypeDictionaryValueCallBacks);

		code = VTSessionSetProperties(s, session_properties);

		CFRelease(MaxKeyFrameInterval);
		CFRelease(ExpectedFrameRate);
		CFRelease(AllowFrameReordering);
		CFRelease(ProfileLevel);
		CFRelease(session_properties);

		if (code != noErr) {
			return code;
		}

		code = session_set_bitrate(s, enc->rate_control, enc->bitrate,
					   enc->quality, enc->limit_bitrate,
					   enc->rc_max_bitrate,
					   enc->rc_max_bitrate_window);
		if (code != noErr) {
			return code;
		}
	}

	// This can fail depending on hardware configuration
	code = session_set_prop(s, kVTCompressionPropertyKey_RealTime,
				kCFBooleanFalse);
	if (code != noErr)
		log_osstatus(
			LOG_WARNING, enc,
			"setting kVTCompressionPropertyKey_RealTime failed, "
			"frame delay might be increased",
			code);

	code = session_set_colorspace(s, enc->colorspace);
	if (code != noErr) {
		return code;
	}

	code = VTCompressionSessionPrepareToEncodeFrames(s);
	if (code != noErr) {
		return code;
	}

	enc->session = s;

	return true;

fail:
	if (encoder_spec != NULL)
		CFRelease(encoder_spec);
	if (pixbuf_spec != NULL)
		CFRelease(pixbuf_spec);

	return false;
}

static void vt_destroy(void *data)
{
	struct vt_encoder *enc = data;

	if (enc) {
		if (enc->session != NULL) {
			VTCompressionSessionInvalidate(enc->session);
			CFRelease(enc->session);
		}
		da_free(enc->packet_data);
		da_free(enc->extra_data);
		bfree(enc);
	}
}

static void dump_encoder_info(struct vt_encoder *enc)
{
	VT_BLOG(LOG_INFO,
		"settings:\n"
		"\tvt_encoder_id          %s\n"
		"\trate_control:          %s\n"
		"\tbitrate:               %d (kbps)\n"
		"\tquality:               %f\n"
		"\tfps_num:               %d\n"
		"\tfps_den:               %d\n"
		"\twidth:                 %d\n"
		"\theight:                %d\n"
		"\tkeyint:                %d (s)\n"
		"\tlimit_bitrate:         %s\n"
		"\trc_max_bitrate:        %d (kbps)\n"
		"\trc_max_bitrate_window: %f (s)\n"
		"\thw_enc:                %s\n"
		"\tprofile:               %s\n"
		"\tcodec_type:            %.4s\n",
		enc->vt_encoder_id, enc->rate_control, enc->bitrate,
		enc->quality, enc->fps_num, enc->fps_den, enc->width,
		enc->height, enc->keyint, enc->limit_bitrate ? "on" : "off",
		enc->rc_max_bitrate, enc->rc_max_bitrate_window,
		enc->hw_enc ? "on" : "off",
		(enc->profile != NULL && !!strlen(enc->profile)) ? enc->profile
								 : "default",
		codec_type_to_print_fmt(enc->codec_type));
}

typedef enum {
	kResultSuccess = 0,
	kResultColorFormatUnsupported = 1,
	kResultFullRangeUnsupported = 2,
} SetVideoFormatResult;

static SetVideoFormatResult set_video_format(struct vt_encoder *enc,
					     enum video_format format,
					     enum video_range_type range)
{
	bool full_range = range == VIDEO_RANGE_FULL;
	switch (format) {
	case VIDEO_FORMAT_I420:
		enc->vt_pix_fmt =
			full_range
				? kCVPixelFormatType_420YpCbCr8PlanarFullRange
				: kCVPixelFormatType_420YpCbCr8Planar;
		return kResultSuccess;
	case VIDEO_FORMAT_NV12:
		enc->vt_pix_fmt =
			full_range
				? kCVPixelFormatType_420YpCbCr8BiPlanarFullRange
				: kCVPixelFormatType_420YpCbCr8BiPlanarVideoRange;
		return kResultSuccess;
	case VIDEO_FORMAT_P010:
		if (enc->codec_type == kCMVideoCodecType_HEVC) {
			enc->vt_pix_fmt =
				full_range
					? kCVPixelFormatType_420YpCbCr10BiPlanarFullRange
					: kCVPixelFormatType_420YpCbCr10BiPlanarVideoRange;
			return kResultSuccess;
		}
		break;
	case VIDEO_FORMAT_P216:
		if (!full_range) {
			enc->vt_pix_fmt =
				kCVPixelFormatType_422YpCbCr16BiPlanarVideoRange;
			return kResultSuccess;
		} else {
			return kResultFullRangeUnsupported;
		}
		break;
	case VIDEO_FORMAT_P416:
		if (!full_range) {
			enc->vt_pix_fmt =
				kCVPixelFormatType_444YpCbCr16BiPlanarVideoRange;
			return kResultSuccess;
		} else {
			return kResultFullRangeUnsupported;
		}
		break;
	default:
		return kResultColorFormatUnsupported;
	}
	return kResultColorFormatUnsupported;
}

static bool update_params(struct vt_encoder *enc, obs_data_t *settings)
{
	video_t *video = obs_encoder_video(enc->encoder);
	const struct video_output_info *voi = video_output_get_info(video);

	const char *codec = obs_encoder_get_codec(enc->encoder);
	if (strcmp(codec, "h264") == 0) {
		enc->codec_type = kCMVideoCodecType_H264;
		obs_data_set_int(settings, "codec_type", enc->codec_type);
#ifdef ENABLE_HEVC
	} else if (strcmp(codec, "hevc") == 0) {
		enc->codec_type = kCMVideoCodecType_HEVC;
		obs_data_set_int(settings, "codec_type", enc->codec_type);
#endif
	} else {
		enc->codec_type = (CMVideoCodecType)obs_data_get_int(
			settings, "codec_type");
	}

	SetVideoFormatResult res =
		set_video_format(enc, voi->format, voi->range);
	if (res == kResultColorFormatUnsupported) {
		obs_encoder_set_last_error(
			enc->encoder,
			obs_module_text("ColorFormatUnsupported"));
		VT_BLOG(LOG_WARNING, "Unsupported color format selected");
		return false;
	} else if (res == kResultFullRangeUnsupported) {
		obs_encoder_set_last_error(
			enc->encoder, obs_module_text("FullRangeUnsupported"));
		VT_BLOG(LOG_WARNING, "Unsupported color range (full) selected");
		return false;
	}
	enc->colorspace = voi->colorspace;
	enc->width = obs_encoder_get_width(enc->encoder);
	enc->height = obs_encoder_get_height(enc->encoder);
	enc->fps_num = voi->fps_num;
	enc->fps_den = voi->fps_den;
	enc->keyint = (uint32_t)obs_data_get_int(settings, "keyint_sec");
	enc->rate_control = obs_data_get_string(settings, "rate_control");
	enc->bitrate = (uint32_t)obs_data_get_int(settings, "bitrate");
	enc->quality = ((float)obs_data_get_int(settings, "quality")) / 100;
	enc->profile = obs_data_get_string(settings, "profile");
	enc->limit_bitrate = obs_data_get_bool(settings, "limit_bitrate");
	enc->rc_max_bitrate =
		(uint32_t)obs_data_get_int(settings, "max_bitrate");
	enc->rc_max_bitrate_window =
		obs_data_get_double(settings, "max_bitrate_window");
	enc->bframes = obs_data_get_bool(settings, "bframes");

	return true;
}

static bool vt_update(void *data, obs_data_t *settings)
{
	struct vt_encoder *enc = data;

	uint32_t old_bitrate = enc->bitrate;
	bool old_limit_bitrate = enc->limit_bitrate;

	update_params(enc, settings);

	if (old_bitrate == enc->bitrate &&
	    old_limit_bitrate == enc->limit_bitrate)
		return true;

	OSStatus code = session_set_bitrate(enc->session, enc->rate_control,
					    enc->bitrate, enc->quality,
					    enc->limit_bitrate,
					    enc->rc_max_bitrate,
					    enc->rc_max_bitrate_window);
	if (code != noErr)
		VT_BLOG(LOG_WARNING, "Failed to set bitrate to session");

	dump_encoder_info(enc);
	return true;
}

static void *vt_create(obs_data_t *settings, obs_encoder_t *encoder)
{
	struct vt_encoder *enc = bzalloc(sizeof(struct vt_encoder));

	OSStatus code;

	enc->encoder = encoder;
	enc->vt_encoder_id = obs_encoder_get_id(encoder);

	if (!update_params(enc, settings))
		goto fail;

	code = CMSimpleQueueCreate(NULL, 100, &enc->queue);
	if (code != noErr) {
		goto fail;
	}

	if (!create_encoder(enc))
		goto fail;

	dump_encoder_info(enc);

	return enc;

fail:
	vt_destroy(enc);
	return NULL;
}

static const uint8_t annexb_startcode[4] = {0, 0, 0, 1};

static void packet_put(struct darray *packet, const uint8_t *buf, size_t size)
{
	darray_push_back_array(sizeof(uint8_t), packet, buf, size);
}

static void packet_put_startcode(struct darray *packet, int size)
{
	assert(size == 3 || size == 4);

	packet_put(packet, &annexb_startcode[4 - size], size);
}

static bool handle_prores_packet(struct vt_encoder *enc,
				 CMSampleBufferRef buffer)
{
	OSStatus err = 0;
	size_t block_size = 0;
	uint8_t *block_buf = NULL;

	CMBlockBufferRef block = CMSampleBufferGetDataBuffer(buffer);
	if (block == NULL) {
		VT_BLOG(LOG_ERROR,
			"Failed to get block buffer for ProRes frame.");
		return false;
	}
	err = CMBlockBufferGetDataPointer(block, 0, NULL, &block_size,
					  (char **)&block_buf);
	if (err != 0) {
		VT_BLOG(LOG_ERROR,
			"Failed to get data buffer pointer for ProRes frame.");
		return false;
	}

	packet_put(&enc->packet_data.da, block_buf, block_size);

	return true;
}

static void convert_block_nals_to_annexb(struct vt_encoder *enc,
					 struct darray *packet,
					 CMBlockBufferRef block,
					 int nal_length_bytes)
{
	size_t block_size;
	uint8_t *block_buf;

	CMBlockBufferGetDataPointer(block, 0, NULL, &block_size,
				    (char **)&block_buf);

	size_t bytes_remaining = block_size;

	while (bytes_remaining > 0) {
		uint32_t nal_size;
		if (nal_length_bytes == 1)
			nal_size = block_buf[0];
		else if (nal_length_bytes == 2)
			nal_size = CFSwapInt16BigToHost(
				((uint16_t *)block_buf)[0]);
		else if (nal_length_bytes == 4)
			nal_size = CFSwapInt32BigToHost(
				((uint32_t *)block_buf)[0]);
		else
			return;

		bytes_remaining -= nal_length_bytes;
		block_buf += nal_length_bytes;

		if (bytes_remaining < nal_size) {
			VT_BLOG(LOG_ERROR, "invalid nal block");
			return;
		}

		packet_put_startcode(packet, 3);
		packet_put(packet, block_buf, nal_size);

		bytes_remaining -= nal_size;
		block_buf += nal_size;
	}
}

static bool handle_keyframe(struct vt_encoder *enc,
			    CMFormatDescriptionRef format_desc,
			    size_t param_count, struct darray *packet,
			    struct darray *extra_data)
{
	OSStatus code;
	const uint8_t *param;
	size_t param_size;

	for (size_t i = 0; i < param_count; i++) {
		if (enc->codec_type == kCMVideoCodecType_H264) {
			code = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
				format_desc, i, &param, &param_size, NULL,
				NULL);
#ifdef ENABLE_HEVC
		} else if (enc->codec_type == kCMVideoCodecType_HEVC) {
			code = CMVideoFormatDescriptionGetHEVCParameterSetAtIndex(
				format_desc, i, &param, &param_size, NULL,
				NULL);
#endif
		}
		if (code != noErr) {
			log_osstatus(LOG_ERROR, enc,
				     "getting NAL parameter "
				     "at index",
				     code);
			return false;
		}

		packet_put_startcode(packet, 4);
		packet_put(packet, param, param_size);
	}

	// if we were passed an extra_data array, fill it with
	// SPS, PPS, etc.
	if (extra_data != NULL)
		packet_put(extra_data, packet->array, packet->num);

	return true;
}

static bool convert_sample_to_annexb(struct vt_encoder *enc,
				     struct darray *packet,
				     struct darray *extra_data,
				     CMSampleBufferRef buffer, bool keyframe)
{
	OSStatus code;
	CMFormatDescriptionRef format_desc =
		CMSampleBufferGetFormatDescription(buffer);

	size_t param_count;
	int nal_length_bytes;
	if (enc->codec_type == kCMVideoCodecType_H264) {
		code = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
			format_desc, 0, NULL, NULL, &param_count,
			&nal_length_bytes);
#ifdef ENABLE_HEVC
	} else if (enc->codec_type == kCMVideoCodecType_HEVC) {
		code = CMVideoFormatDescriptionGetHEVCParameterSetAtIndex(
			format_desc, 0, NULL, NULL, &param_count,
			&nal_length_bytes);
#endif
	}
	// it is not clear what errors this function can return
	// so we check the two most reasonable
	if (code == kCMFormatDescriptionBridgeError_InvalidParameter ||
	    code == kCMFormatDescriptionError_InvalidParameter) {
		VT_BLOG(LOG_WARNING, "assuming 2 parameter sets "
				     "and 4 byte NAL length header");
		param_count = 2;
		nal_length_bytes = 4;

	} else if (code != noErr) {
		log_osstatus(LOG_ERROR, enc,
			     "getting parameter count from sample", code);
		return false;
	}

	if (keyframe &&
	    !handle_keyframe(enc, format_desc, param_count, packet, extra_data))
		return false;

	CMBlockBufferRef block = CMSampleBufferGetDataBuffer(buffer);
	convert_block_nals_to_annexb(enc, packet, block, nal_length_bytes);

	return true;
}

static bool is_sample_keyframe(CMSampleBufferRef buffer)
{
	CFArrayRef attachments =
		CMSampleBufferGetSampleAttachmentsArray(buffer, false);
	if (attachments != NULL) {
		CFDictionaryRef attachment;
		CFBooleanRef has_dependencies;
		attachment =
			(CFDictionaryRef)CFArrayGetValueAtIndex(attachments, 0);
		has_dependencies = (CFBooleanRef)CFDictionaryGetValue(
			attachment, kCMSampleAttachmentKey_DependsOnOthers);
		return has_dependencies == kCFBooleanFalse;
	}

	return false;
}

static bool parse_sample(struct vt_encoder *enc, CMSampleBufferRef buffer,
			 struct encoder_packet *packet, CMTime off)
{
	CMTime pts = CMSampleBufferGetPresentationTimeStamp(buffer);
	CMTime dts = CMSampleBufferGetDecodeTimeStamp(buffer);

	if (CMTIME_IS_INVALID(dts))
		dts = pts;
	// imitate x264's negative dts when bframes might have pts < dts
	else if (enc->bframes)
		dts = CMTimeSubtract(dts, off);

	pts = CMTimeMultiply(pts, enc->fps_num);
	dts = CMTimeMultiply(dts, enc->fps_num);

	const bool is_avc = enc->codec_type == kCMVideoCodecType_H264;
	const bool has_annexb = is_avc ||
				(enc->codec_type == kCMVideoCodecType_HEVC);

	// All ProRes frames are "keyframes"
	const bool keyframe = !has_annexb || is_sample_keyframe(buffer);

	da_resize(enc->packet_data, 0);

	// If we are still looking for extra data
	struct darray *extra_data = NULL;
	if (enc->extra_data.num == 0)
		extra_data = &enc->extra_data.da;

	if (has_annexb) {
		if (!convert_sample_to_annexb(enc, &enc->packet_data.da,
					      extra_data, buffer, keyframe))
			goto fail;
	} else {
		if (!handle_prores_packet(enc, buffer))
			goto fail;
	}

	packet->type = OBS_ENCODER_VIDEO;
	packet->pts = (int64_t)(CMTimeGetSeconds(pts));
	packet->dts = (int64_t)(CMTimeGetSeconds(dts));
	packet->data = enc->packet_data.array;
	packet->size = enc->packet_data.num;
	packet->keyframe = keyframe;

	if (is_avc) {
		// VideoToolbox produces packets with priority lower than the RTMP code
		// expects, which causes it to be unable to recover from frame drops.
		// Fix this by manually adjusting the priority.
		uint8_t *start = enc->packet_data.array;
		uint8_t *end = start + enc->packet_data.num;

		start = (uint8_t *)obs_avc_find_startcode(start, end);
		while (true) {
			while (start < end && !*(start++))
				;

			if (start == end)
				break;

			const int type = start[0] & 0x1F;
			if (type == OBS_NAL_SLICE_IDR ||
			    type == OBS_NAL_SLICE) {
				uint8_t prev_type = (start[0] >> 5) & 0x3;
				start[0] &= ~(3 << 5);

				if (type == OBS_NAL_SLICE_IDR)
					start[0] |= OBS_NAL_PRIORITY_HIGHEST
						    << 5;
				else if (type == OBS_NAL_SLICE &&
					 prev_type !=
						 OBS_NAL_PRIORITY_DISPOSABLE)
					start[0] |= OBS_NAL_PRIORITY_HIGH << 5;
				else
					start[0] |= prev_type << 5;
			}

			start = (uint8_t *)obs_avc_find_startcode(start, end);
		}
	}

	CFRelease(buffer);
	return true;

fail:
	CFRelease(buffer);
	return false;
}

bool get_cached_pixel_buffer(struct vt_encoder *enc, CVPixelBufferRef *buf)
{
	OSStatus code;
	CVPixelBufferPoolRef pool =
		VTCompressionSessionGetPixelBufferPool(enc->session);
	if (!pool)
		return kCVReturnError;

	CVPixelBufferRef pixbuf;
	code = CVPixelBufferPoolCreatePixelBuffer(NULL, pool, &pixbuf);
	if (code != noErr) {
		goto fail;
	}

	// Why aren't these already set on the pixel buffer?
	// I would have expected pixel buffers from the session's
	// pool to have the correct color space stuff set

	const enum video_colorspace cs = enc->colorspace;
	CVBufferSetAttachment(pixbuf, kCVImageBufferYCbCrMatrixKey,
			      obs_to_vt_colorspace(cs),
			      kCVAttachmentMode_ShouldPropagate);
	CVBufferSetAttachment(pixbuf, kCVImageBufferColorPrimariesKey,
			      obs_to_vt_primaries(cs),
			      kCVAttachmentMode_ShouldPropagate);
	CVBufferSetAttachment(pixbuf, kCVImageBufferTransferFunctionKey,
			      obs_to_vt_transfer(cs),
			      kCVAttachmentMode_ShouldPropagate);
	const bool pq = cs == VIDEO_CS_2100_PQ;
	const bool hlg = cs == VIDEO_CS_2100_HLG;
	if (pq || hlg) {
		const uint16_t hdr_nominal_peak_level =
			pq ? (uint16_t)obs_get_video_hdr_nominal_peak_level()
			   : (hlg ? 1000 : 0);
		CFDataRef masteringDisplayColorVolume =
			obs_to_vt_masteringdisplay(hdr_nominal_peak_level);
		CFDataRef contentLightLevel =
			obs_to_vt_contentlightlevelinfo(hdr_nominal_peak_level);

		CVBufferSetAttachment(
			pixbuf, kCVImageBufferMasteringDisplayColorVolumeKey,
			masteringDisplayColorVolume,
			kCVAttachmentMode_ShouldPropagate);
		CVBufferSetAttachment(pixbuf,
				      kCVImageBufferContentLightLevelInfoKey,
				      contentLightLevel,
				      kCVAttachmentMode_ShouldPropagate);

		CFRelease(masteringDisplayColorVolume);
		CFRelease(contentLightLevel);
	}

	*buf = pixbuf;
	return true;

fail:
	return false;
}

static bool vt_encode(void *data, struct encoder_frame *frame,
		      struct encoder_packet *packet, bool *received_packet)
{
	struct vt_encoder *enc = data;

	OSStatus code;

	CMTime dur = CMTimeMake(enc->fps_den, enc->fps_num);
	CMTime off = CMTimeMultiply(dur, 2);
	CMTime pts = CMTimeMake(frame->pts, enc->fps_num);

	CVPixelBufferRef pixbuf = NULL;

	if (!get_cached_pixel_buffer(enc, &pixbuf)) {
		VT_BLOG(LOG_ERROR, "Unable to create pixel buffer");
		goto fail;
	}

	code = CVPixelBufferLockBaseAddress(pixbuf, 0);
	if (code != noErr) {
		goto fail;
	}

	for (int i = 0; i < MAX_AV_PLANES; i++) {
		if (frame->data[i] == NULL)
			break;
		uint8_t *p = (uint8_t *)CVPixelBufferGetBaseAddressOfPlane(
			pixbuf, i);
		uint8_t *f = frame->data[i];
		size_t plane_linesize =
			CVPixelBufferGetBytesPerRowOfPlane(pixbuf, i);
		size_t plane_height = CVPixelBufferGetHeightOfPlane(pixbuf, i);

		for (size_t j = 0; j < plane_height; j++) {
			memcpy(p, f, frame->linesize[i]);
			p += plane_linesize;
			f += frame->linesize[i];
		}
	}

	code = CVPixelBufferUnlockBaseAddress(pixbuf, 0);
	if (code != noErr) {
		goto fail;
	}

	code = VTCompressionSessionEncodeFrame(enc->session, pixbuf, pts, dur,
					       NULL, pixbuf, NULL);
	if (code != noErr) {
		goto fail;
	}

	CMSampleBufferRef buffer =
		(CMSampleBufferRef)CMSimpleQueueDequeue(enc->queue);

	// No samples waiting in the queue
	if (buffer == NULL)
		return true;

	*received_packet = true;
	return parse_sample(enc, buffer, packet, off);

fail:
	return false;
}

static bool vt_extra_data(void *data, uint8_t **extra_data, size_t *size)
{
	struct vt_encoder *enc = (struct vt_encoder *)data;
	*extra_data = enc->extra_data.array;
	*size = enc->extra_data.num;
	return true;
}

static const char *vt_getname(void *data)
{
	struct vt_encoder_type_data *type_data = data;

	if (strcmp("Apple H.264 (HW)", type_data->disp_name) == 0) {
		return obs_module_text("VTH264EncHW");
	} else if (strcmp("Apple H.264 (SW)", type_data->disp_name) == 0) {
		return obs_module_text("VTH264EncSW");
#ifdef ENABLE_HEVC
	} else if (strcmp("Apple HEVC (HW)", type_data->disp_name) == 0) {
		return obs_module_text("VTHEVCEncHW");
	} else if (strcmp("Apple HEVC (AVE)", type_data->disp_name) == 0) {
		return obs_module_text("VTHEVCEncT2");
	} else if (strcmp("Apple HEVC (SW)", type_data->disp_name) == 0) {
		return obs_module_text("VTHEVCEncSW");
#endif
	} else if (strncmp("AppleProResHW", type_data->disp_name, 13) == 0) {
		return obs_module_text("VTProResEncHW");
	} else if (strncmp("Apple ProRes", type_data->disp_name, 12) == 0) {
		return obs_module_text("VTProResEncSW");
	}
	return type_data->disp_name;
}

static bool rate_control_limit_bitrate_modified(obs_properties_t *ppts,
						obs_property_t *p,
						obs_data_t *settings)
{
	bool has_bitrate = true;
	bool can_limit_bitrate = true;
	bool use_limit_bitrate = obs_data_get_bool(settings, "limit_bitrate");
	const char *rate_control =
		obs_data_get_string(settings, "rate_control");

	if (strcmp(rate_control, "CBR") == 0) {
		can_limit_bitrate = false;
		has_bitrate = true;
	} else if (strcmp(rate_control, "CRF") == 0) {
		can_limit_bitrate = true;
		has_bitrate = false;
	} else if (strcmp(rate_control, "ABR") == 0) {
		can_limit_bitrate = true;
		has_bitrate = true;
	}

	p = obs_properties_get(ppts, "limit_bitrate");
	obs_property_set_visible(p, can_limit_bitrate);
	p = obs_properties_get(ppts, "max_bitrate");
	obs_property_set_visible(p, can_limit_bitrate && use_limit_bitrate);
	p = obs_properties_get(ppts, "max_bitrate_window");
	obs_property_set_visible(p, can_limit_bitrate && use_limit_bitrate);

	p = obs_properties_get(ppts, "bitrate");
	obs_property_set_visible(p, has_bitrate);
	p = obs_properties_get(ppts, "quality");
	obs_property_set_visible(p, !has_bitrate);
	return true;
}

static obs_properties_t *vt_properties_h26x(void *data __unused,
					    void *type_data)
{
	struct vt_encoder_type_data *encoder_type_data = type_data;

	obs_properties_t *props = obs_properties_create();
	obs_property_t *p;

	p = obs_properties_add_list(props, "rate_control",
				    obs_module_text("RateControl"),
				    OBS_COMBO_TYPE_LIST,
				    OBS_COMBO_FORMAT_STRING);

	if (__builtin_available(macOS 13.0, *)) {
		if (encoder_type_data->hardware_accelerated &&
		    is_apple_silicon) {
			obs_property_list_add_string(p, "CBR", "CBR");
		}
	}

	obs_property_list_add_string(p, "ABR", "ABR");

	if (encoder_type_data->hardware_accelerated && is_apple_silicon) {
		obs_property_list_add_string(p, "CRF", "CRF");
	}

	obs_property_set_modified_callback(p,
					   rate_control_limit_bitrate_modified);

	p = obs_properties_add_int(props, "bitrate", obs_module_text("Bitrate"),
				   50, 10000000, 50);
	obs_property_int_set_suffix(p, " Kbps");
	obs_properties_add_int_slider(props, "quality",
				      obs_module_text("Quality"), 0, 100, 1);

	p = obs_properties_add_bool(props, "limit_bitrate",
				    obs_module_text("UseMaxBitrate"));
	obs_property_set_modified_callback(p,
					   rate_control_limit_bitrate_modified);

	p = obs_properties_add_int(props, "max_bitrate",
				   obs_module_text("MaxBitrate"), 50, 10000000,
				   50);
	obs_property_int_set_suffix(p, " Kbps");

	p = obs_properties_add_float(props, "max_bitrate_window",
				     obs_module_text("MaxBitrateWindow"), 0.10f,
				     10.0f, 0.25f);
	obs_property_float_set_suffix(p, " s");

	p = obs_properties_add_int(props, "keyint_sec",
				   obs_module_text("KeyframeIntervalSec"), 0,
				   20, 1);
	obs_property_int_set_suffix(p, " s");

	p = obs_properties_add_list(props, "profile",
				    obs_module_text("Profile"),
				    OBS_COMBO_TYPE_LIST,
				    OBS_COMBO_FORMAT_STRING);

	if (encoder_type_data->codec_type == kCMVideoCodecType_H264) {
		obs_property_list_add_string(p, "baseline", "baseline");
		obs_property_list_add_string(p, "main", "main");
		obs_property_list_add_string(p, "high", "high");
#ifdef ENABLE_HEVC
	} else if (encoder_type_data->codec_type == kCMVideoCodecType_HEVC) {
		obs_property_list_add_string(p, "main", "main");
		obs_property_list_add_string(p, "main10", "main10");
		if (__builtin_available(macOS 12.3, *)) {
			obs_property_list_add_string(p, "main 4:2:2 10",
						     "main42210");
		}
#endif
	}

	obs_properties_add_bool(props, "bframes",
				obs_module_text("UseBFrames"));

	return props;
}

static obs_properties_t *vt_properties_prores(void *data __unused,
					      void *type_data)
{
	struct vt_encoder_type_data *encoder_type_data = type_data;

	obs_properties_t *props = obs_properties_create();
	obs_property_t *p;

	p = obs_properties_add_list(props, "codec_type",
				    obs_module_text("ProResCodec"),
				    OBS_COMBO_TYPE_LIST, OBS_COMBO_FORMAT_INT);

	uint32_t codec_availability_flags = 0;

	size_t size = 0;
	struct vt_prores_encoder_data *encoder_list = NULL;
	if (encoder_type_data->hardware_accelerated) {
		size = vt_prores_hardware_encoder_list.num;
		encoder_list = vt_prores_hardware_encoder_list.array;
	} else {
		size = vt_prores_software_encoder_list.num;
		encoder_list = vt_prores_software_encoder_list.array;
	}

	for (size_t i = 0; i < size; ++i) {

		switch (encoder_list[i].codec_type) {
		case kCMVideoCodecType_AppleProRes4444XQ:
			codec_availability_flags |= (1 << 0);
			break;
		case kCMVideoCodecType_AppleProRes4444:
			codec_availability_flags |= (1 << 1);
			break;
		case kCMVideoCodecType_AppleProRes422Proxy:
			codec_availability_flags |= (1 << 2);
			break;
		case kCMVideoCodecType_AppleProRes422LT:
			codec_availability_flags |= (1 << 3);
			break;
		case kCMVideoCodecType_AppleProRes422:
			codec_availability_flags |= (1 << 4);
			break;
		case kCMVideoCodecType_AppleProRes422HQ:
			codec_availability_flags |= (1 << 5);
			break;
		}
	}

	if (codec_availability_flags & (1 << 0))
		obs_property_list_add_int(p, obs_module_text("ProRes4444XQ"),
					  kCMVideoCodecType_AppleProRes4444XQ);
	if (codec_availability_flags & (1 << 1))
		obs_property_list_add_int(p, obs_module_text("ProRes4444"),
					  kCMVideoCodecType_AppleProRes4444);
	if (codec_availability_flags & (1 << 2))
		obs_property_list_add_int(
			p, obs_module_text("ProRes422Proxy"),
			kCMVideoCodecType_AppleProRes422Proxy);
	if (codec_availability_flags & (1 << 3))
		obs_property_list_add_int(p, obs_module_text("ProRes422LT"),
					  kCMVideoCodecType_AppleProRes422LT);
	if (codec_availability_flags & (1 << 4))
		obs_property_list_add_int(p, obs_module_text("ProRes422"),
					  kCMVideoCodecType_AppleProRes422);
	if (codec_availability_flags & (1 << 5))
		obs_property_list_add_int(p, obs_module_text("ProRes422HQ"),
					  kCMVideoCodecType_AppleProRes422HQ);

	return props;
}

static void vt_defaults(obs_data_t *settings, void *data)
{
	struct vt_encoder_type_data *type_data = data;

	obs_data_set_default_string(settings, "rate_control", "ABR");
	if (__builtin_available(macOS 13.0, *)) {
		if (type_data->hardware_accelerated && is_apple_silicon) {
			obs_data_set_default_string(settings, "rate_control",
						    "CBR");
		}
	}
	obs_data_set_default_int(settings, "bitrate", 2500);
	obs_data_set_default_int(settings, "quality", 60);
	obs_data_set_default_bool(settings, "limit_bitrate", false);
	obs_data_set_default_int(settings, "max_bitrate", 2500);
	obs_data_set_default_double(settings, "max_bitrate_window", 1.5f);
	obs_data_set_default_int(settings, "keyint_sec", 0);
	obs_data_set_default_string(
		settings, "profile",
		type_data->codec_type == kCMVideoCodecType_H264 ? "high"
								: "main");
	obs_data_set_default_int(settings, "codec_type",
				 kCMVideoCodecType_AppleProRes422);
	obs_data_set_default_bool(settings, "bframes", true);
}

static void vt_free_type_data(void *data)
{
	struct vt_encoder_type_data *type_data = data;

	bfree((char *)type_data->disp_name);
	bfree((char *)type_data->id);
	bfree(type_data);
}

static inline void
vt_add_prores_encoder_data_to_list(CFDictionaryRef encoder_dict,
				   FourCharCode codec_type)
{
	struct vt_prores_encoder_data *encoder_data = NULL;

	CFBooleanRef hardware_accelerated = CFDictionaryGetValue(
		encoder_dict, kVTVideoEncoderList_IsHardwareAccelerated);
	if (hardware_accelerated == kCFBooleanTrue)
		encoder_data =
			da_push_back_new(vt_prores_hardware_encoder_list);
	else
		encoder_data =
			da_push_back_new(vt_prores_software_encoder_list);

	encoder_data->encoder_id = CFDictionaryGetValue(
		encoder_dict, kVTVideoEncoderList_EncoderID);

	encoder_data->codec_type = codec_type;
}

static CFComparisonResult compare_encoder_list(const void *left_val,
					       const void *right_val,
					       void *context __unused)
{
	CFDictionaryRef left = (CFDictionaryRef)left_val;
	CFDictionaryRef right = (CFDictionaryRef)right_val;

	CFNumberRef left_codec_num =
		CFDictionaryGetValue(left, kVTVideoEncoderList_CodecType);
	CFNumberRef right_codec_num =
		CFDictionaryGetValue(right, kVTVideoEncoderList_CodecType);
	CFComparisonResult result =
		CFNumberCompare(left_codec_num, right_codec_num, NULL);

	if (result != kCFCompareEqualTo)
		return result;

	CFBooleanRef left_hardware_accel = CFDictionaryGetValue(
		left, kVTVideoEncoderList_IsHardwareAccelerated);
	CFBooleanRef right_hardware_accel = CFDictionaryGetValue(
		right, kVTVideoEncoderList_IsHardwareAccelerated);

	if (left_hardware_accel == right_hardware_accel)
		return kCFCompareEqualTo;
	else if (left_hardware_accel == kCFBooleanTrue)
		return kCFCompareGreaterThan;
	else
		return kCFCompareLessThan;
}

OBS_DECLARE_MODULE()
OBS_MODULE_USE_DEFAULT_LOCALE("mac-videotoolbox", "en-US")
dispatch_group_t encoder_list_dispatch_group;
CFArrayRef encoder_list_const;

bool obs_module_load(void)
{
	dispatch_queue_t queue =
		dispatch_queue_create("Encoder list load queue", NULL);
	encoder_list_dispatch_group = dispatch_group_create();
	dispatch_group_async(encoder_list_dispatch_group, queue, ^{
		VTCopyVideoEncoderList(NULL, &encoder_list_const);
	});
	// The group dispatch keeps a reference until it's finished
	dispatch_release(queue);

#ifndef __aarch64__
	is_apple_silicon = os_get_emulation_status();
#endif
	return true;
}

void obs_module_post_load(void)
{
	struct obs_encoder_info info = {
		.type = OBS_ENCODER_VIDEO,
		.get_name = vt_getname,
		.create = vt_create,
		.destroy = vt_destroy,
		.encode = vt_encode,
		.update = vt_update,
		.get_defaults2 = vt_defaults,
		.get_extra_data = vt_extra_data,
		.free_type_data = vt_free_type_data,
		.caps = OBS_ENCODER_CAP_DYN_BITRATE,
	};

	da_init(vt_prores_hardware_encoder_list);
	da_init(vt_prores_software_encoder_list);

	dispatch_group_wait(encoder_list_dispatch_group, DISPATCH_TIME_FOREVER);
	dispatch_release(encoder_list_dispatch_group);
	CFIndex size = CFArrayGetCount(encoder_list_const);

	CFMutableArrayRef encoder_list = CFArrayCreateMutableCopy(
		kCFAllocatorDefault, size, encoder_list_const);
	CFRelease(encoder_list_const);

	CFArraySortValues(encoder_list, CFRangeMake(0, size),
			  &compare_encoder_list, NULL);

	for (CFIndex i = 0; i < size; i++) {
		CFDictionaryRef encoder_dict =
			CFArrayGetValueAtIndex(encoder_list, i);

		CMVideoCodecType codec_type = 0;
		{
			CFNumberRef codec_type_num = CFDictionaryGetValue(
				encoder_dict, kVTVideoEncoderList_CodecType);
			CFNumberGetValue(codec_type_num, kCFNumberSInt32Type,
					 &codec_type);
		}

		switch (codec_type) {
		case kCMVideoCodecType_H264:
			info.get_properties2 = vt_properties_h26x;
			info.codec = "h264";
			break;
#ifdef ENABLE_HEVC
		case kCMVideoCodecType_HEVC:
			info.get_properties2 = vt_properties_h26x;
			info.codec = "hevc";
			break;
#endif
			// 422 is used as a marker for all ProRes types,
			// since the type is stored as a profile
		case kCMVideoCodecType_AppleProRes422:
			info.get_properties2 = vt_properties_prores;
			info.codec = "prores";
			vt_add_prores_encoder_data_to_list(encoder_dict,
							   codec_type);
			break;

		case kCMVideoCodecType_AppleProRes4444XQ:
		case kCMVideoCodecType_AppleProRes4444:
		case kCMVideoCodecType_AppleProRes422Proxy:
		case kCMVideoCodecType_AppleProRes422LT:
		case kCMVideoCodecType_AppleProRes422HQ:
			vt_add_prores_encoder_data_to_list(encoder_dict,
							   codec_type);
			continue;

		default:
			continue;
		}

		CFStringRef EncoderID = CFDictionaryGetValue(
			encoder_dict, kVTVideoEncoderList_EncoderID);
		CFIndex id_len =
			CFStringGetMaximumSizeOfFileSystemRepresentation(
				EncoderID);
		char *id = bzalloc(id_len + 1);
		CFStringGetFileSystemRepresentation(EncoderID, id, id_len);

		CFStringRef DisplayName = CFDictionaryGetValue(
			encoder_dict, kVTVideoEncoderList_DisplayName);
		CFIndex disp_name_len =
			CFStringGetMaximumSizeOfFileSystemRepresentation(
				DisplayName);
		char *disp_name = bzalloc(disp_name_len + 1);
		CFStringGetFileSystemRepresentation(DisplayName, disp_name,
						    disp_name_len);

		CFBooleanRef hardware_ref = CFDictionaryGetValue(
			encoder_dict,
			kVTVideoEncoderList_IsHardwareAccelerated);

		bool hardware_accelerated =
			(hardware_ref) ? CFBooleanGetValue(hardware_ref)
				       : false;

		info.id = id;
		struct vt_encoder_type_data *type_data =
			bzalloc(sizeof(struct vt_encoder_type_data));
		type_data->disp_name = disp_name;
		type_data->id = id;
		type_data->codec_type = codec_type;
		type_data->hardware_accelerated = hardware_accelerated;
		info.type_data = type_data;

		obs_register_encoder(&info);
	}

	CFRelease(encoder_list);

	VT_LOG(LOG_INFO, "Added VideoToolbox encoders");
}

void obs_module_unload(void)
{
	da_free(vt_prores_hardware_encoder_list);
	da_free(vt_prores_software_encoder_list);
}