Skip to content

Commit

Permalink
Merge pull request #44 from gregcotten/gc-develop
Browse files Browse the repository at this point in the history
Expose AVFrameSideData in AVFrame
  • Loading branch information
gregcotten authored Sep 30, 2020
2 parents 495b68d + 4bd08ab commit 8ebc966
Show file tree
Hide file tree
Showing 4 changed files with 273 additions and 0 deletions.
1 change: 1 addition & 0 deletions Sources/CFFmpeg/avutil_shim.h
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,7 @@
#include <libavutil/imgutils.h>
#include <libavutil/channel_layout.h>
#include <libavutil/md5.h>
#include <libavutil/mastering_display_metadata.h>

static const int64_t swift_AV_NOPTS_VALUE = AV_NOPTS_VALUE;

Expand Down
13 changes: 13 additions & 0 deletions Sources/SwiftFFmpeg/AVFrame.swift
Original file line number Diff line number Diff line change
Expand Up @@ -162,6 +162,19 @@ public final class AVFrame {
public var extendedBufferCount: Int {
Int(native.pointee.nb_extended_buf)
}

public var sideData: [AVFrameSideData] {
var list = [AVFrameSideData]()
for i in 0 ..< sideDataCount {
list.append(AVFrameSideData(native: native.pointee.side_data[i]!))
}
return list
}

/// The number of elements in `sideData`.
public var sideDataCount: Int {
Int(native.pointee.nb_side_data)
}

/// The frame timestamp estimated using various heuristics, in stream timebase.
///
Expand Down
168 changes: 168 additions & 0 deletions Sources/SwiftFFmpeg/AVFrameSideData.swift
Original file line number Diff line number Diff line change
@@ -0,0 +1,168 @@
//
// AVSideData.swift
// SwiftFFmpeg
//
// Created by Greg Cotten on 3/31/20.
//
//

import CFFmpeg

public typealias AVFrameSideDataType = CFFmpeg.AVFrameSideDataType

extension AVFrameSideDataType {

/// The data is the AVPanScan struct defined in libavcodec.
public static let panScan = AV_FRAME_DATA_PANSCAN

/// ATSC A53 Part 4 Closed Captions.
/// A53 CC bitstream is stored as uint8_t in AVFrameSideData.data.
/// The number of bytes of CC data is AVFrameSideData.size.
public static let a53CC = AV_FRAME_DATA_A53_CC

/// Stereoscopic 3d metadata.
/// The data is the AVStereo3D struct defined in libavutil/stereo3d.h.
public static let stereo3D = AV_FRAME_DATA_STEREO3D

/// The data is the AVMatrixEncoding enum defined in libavutil/channel_layout.h.
public static let matrixEncoding = AV_FRAME_DATA_MATRIXENCODING

/// Metadata relevant to a downmix procedure.
/// The data is the AVDownmixInfo struct defined in libavutil/downmix_info.h.
public static let downMixInfo = AV_FRAME_DATA_DOWNMIX_INFO

/// ReplayGain information in the form of the AVReplayGain struct.
public static let replayGain = AV_FRAME_DATA_REPLAYGAIN

/// This side data contains a 3x3 transformation matrix describing an affine
/// transformation that needs to be applied to the frame for correct
/// presentation.
/// See libavutil/display.h for a detailed description of the data.
public static let displayMatrix = AV_FRAME_DATA_DISPLAYMATRIX

/// Active Format Description data consisting of a single byte as specified
/// in ETSI TS 101 154 using AVActiveFormatDescription enum.
public static let afd = AV_FRAME_DATA_AFD

/// Motion vectors exported by some codecs (on demand through the export_mvs
/// flag set in the libavcodec AVCodecContext flags2 option).
/// The data is the AVMotionVector struct defined in
/// libavutil/motion_vector.h.
public static let motionVectors = AV_FRAME_DATA_MOTION_VECTORS

/// Recommmends skipping the specified number of samples. This is exported
/// only if the "skip_manual" AVOption is set in libavcodec.
/// This has the same format as AV_PKT_DATA_SKIP_SAMPLES.
/// @code
/// u32le number of samples to skip from start of this packet
/// u32le number of samples to skip from end of this packet
/// u8 reason for start skip
/// u8 reason for end skip (0=padding silence, 1=convergence)
/// @endcode
public static let skipSamples = AV_FRAME_DATA_SKIP_SAMPLES

/// This side data must be associated with an audio frame and corresponds to
/// enum AVAudioServiceType defined in avcodec.h.
public static let audioServiceType = AV_FRAME_DATA_AUDIO_SERVICE_TYPE

/// Mastering display metadata associated with a video frame. The payload is
/// an AVMasteringDisplayMetadata type and contains information about the
/// mastering display color volume.
public static let masteringDisplayMetadata = AV_FRAME_DATA_MASTERING_DISPLAY_METADATA

/// The GOP timecode in 25 bit timecode format. Data format is 64-bit integer.
/// This is set on the first frame of a GOP that has a temporal reference of 0.
public static let gopTimecode = AV_FRAME_DATA_GOP_TIMECODE


/// The data represents the AVSphericalMapping structure defined in
/// libavutil/spherical.h.
public static let spherical = AV_FRAME_DATA_SPHERICAL


/// Content light level (based on CTA-861.3). This payload contains data in
/// the form of the AVContentLightMetadata struct.
public static let contentLightLevel = AV_FRAME_DATA_CONTENT_LIGHT_LEVEL


/// The data contains an ICC profile as an opaque octet buffer following the
/// format described by ISO 15076-1 with an optional name defined in the
/// metadata key entry "name".
public static let iccProfile = AV_FRAME_DATA_ICC_PROFILE

#if FF_API_FRAME_QP

/// Implementation-specific description of the format of AV_FRAME_QP_TABLE_DATA.
/// The contents of this side data are undocumented and internal; use
/// av_frame_set_qp_table() and av_frame_get_qp_table() to access this in a
/// meaningful way instead.
public static let qpTableProperties = AV_FRAME_DATA_QP_TABLE_PROPERTIES

/// Raw QP table data. Its format is described by
/// AV_FRAME_DATA_QP_TABLE_PROPERTIES. Use av_frame_set_qp_table() and
/// av_frame_get_qp_table() to access this instead.
public static let qpTableData = AV_FRAME_DATA_QP_TABLE_DATA
#endif

/// Timecode which conforms to SMPTE ST 12-1. The data is an array of 4 uint32_t
/// where the first uint32_t describes how many (1-3) of the other timecodes are used.
/// The timecode format is described in the av_timecode_get_smpte_from_framenum()
/// function in libavutil/timecode.c.
public static let S12MTimecode = AV_FRAME_DATA_S12M_TIMECODE

/// HDR dynamic metadata associated with a video frame. The payload is
/// an AVDynamicHDRPlus type and contains information for color
/// volume transform - application 4 of SMPTE 2094-40:2016 standard.
public static let dynamicHDRPlus = AV_FRAME_DATA_DYNAMIC_HDR_PLUS

///Regions Of Interest, the data is an array of AVRegionOfInterest type, the number of
///array element is implied by AVFrameSideData.size / AVRegionOfInterest.self_size.
public static let regionsOfInterest = AV_FRAME_DATA_REGIONS_OF_INTEREST

/// The name of the type.
public var name: String {
String(cString: av_frame_side_data_name(self))
}
}



typealias CAVFrameSideData = CFFmpeg.AVFrameSideData

/// Structure to hold side data for an AVFrame.
///
/// sizeof(AVFrameSideData) is not a part of the public ABI, so new fields may be added
/// o the end with a minor bump.
public final class AVFrameSideData {
let native: UnsafeMutablePointer<CAVFrameSideData>

init(native: UnsafeMutablePointer<CAVFrameSideData>) {
self.native = native
}

public var type: AVFrameSideDataType {
AVFrameSideDataType(rawValue: native.pointee.type.rawValue)
}

public var data: UnsafeMutablePointer<UInt8> {
native.pointee.data
}

public var size: Int {
Int(native.pointee.size)
}

public var metadata: [String: String] {
var dict = [String: String]()
var tag: UnsafeMutablePointer<AVDictionaryEntry>?
while let next = av_dict_get(native.pointee.metadata, "", tag, AV_DICT_IGNORE_SUFFIX) {
dict[String(cString: next.pointee.key)] = String(cString: next.pointee.value)
tag = next
}
return dict
}

public var buffer: AVBuffer {
AVBuffer(native: native.pointee.buf)
}
}
91 changes: 91 additions & 0 deletions Sources/SwiftFFmpeg/HDRMetadata.swift
Original file line number Diff line number Diff line change
@@ -0,0 +1,91 @@
//
// MasteringDisplayMetadata.swift
// SwiftFFmpeg
//
// Created by Greg Cotten on 4/1/20.
//
//

import CFFmpeg

public typealias CAVMasteringDisplayMetadata = CFFmpeg.AVMasteringDisplayMetadata

public struct AVMasteringDisplayMetadata {

/// CIE 1931 xy chromaticity coords of color primaries (r, g, b order).
public var display_primaries: [[AVRational]]


/// CIE 1931 xy chromaticity coords of white point.
public var white_point: [AVRational]


/// Min luminance of mastering display (cd/m^2).
public var min_luminance: AVRational


/// Max luminance of mastering display (cd/m^2).
public var max_luminance: AVRational


/// Flag indicating whether the display primaries (and white point) are set.
public var has_primaries: Bool


/// Flag indicating whether the luminance (min_ and max_) have been set.
public var has_luminance: Bool

init(cMasteringDisplayMetadata cData: CAVMasteringDisplayMetadata) {
display_primaries = [[cData.display_primaries.0.0, cData.display_primaries.0.1], [cData.display_primaries.1.0, cData.display_primaries.1.1], [cData.display_primaries.2.0, cData.display_primaries.2.1]]
white_point = [cData.white_point.0, cData.white_point.1]

min_luminance = cData.min_luminance

max_luminance = cData.max_luminance

has_primaries = cData.has_primaries == 1

has_luminance = cData.has_luminance == 1
}
}

public extension AVFrameSideData {
var masteringDisplayMetadata: AVMasteringDisplayMetadata? {
guard type == .masteringDisplayMetadata else { return nil }

return data.withMemoryRebound(to: CAVMasteringDisplayMetadata.self, capacity: 1) { (cMasteringDisplayMetadata) -> AVMasteringDisplayMetadata in
.init(cMasteringDisplayMetadata: cMasteringDisplayMetadata.pointee)
}
}
}

public typealias CAVContentLightMetadata = CFFmpeg.AVContentLightMetadata


/// Content light level needed by to transmit HDR over HDMI (CTA-861.3).
/// To be used as payload of a AVFrameSideData or AVPacketSideData with the
/// appropriate type.
/// @note The struct should be allocated with av_content_light_metadata_alloc()
/// and its size is not a part of the public ABI.
public struct AVContentLightMetadata {
/// Max content light level (cd/m^2).
public var maxFALL: UInt32

/// Max average light level per frame (cd/m^2).
public var maxCLL: UInt32

init(cContentLightMetadata cData: CAVContentLightMetadata) {
maxFALL = cData.MaxFALL
maxCLL = cData.MaxCLL
}
}

public extension AVFrameSideData {
var contentLightMetadata: AVContentLightMetadata? {
guard type == .contentLightLevel else { return nil }

return data.withMemoryRebound(to: CAVContentLightMetadata.self, capacity: 1) { (cContentLightMetadata) -> AVContentLightMetadata in
.init(cContentLightMetadata: cContentLightMetadata.pointee)
}
}
}

0 comments on commit 8ebc966

Please sign in to comment.