Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Use IntEnums for codec flags #1656

Merged
merged 1 commit into from
Dec 1, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion av/codec/codec.pyx
Original file line number Diff line number Diff line change
Expand Up @@ -117,7 +117,7 @@ cdef class Codec:
if self.is_encoder and lib.av_codec_is_decoder(self.ptr):
raise RuntimeError("%s is both encoder and decoder.")

def create(self, str kind = None):
def create(self, kind = None):
"""Create a :class:`.CodecContext` for this codec.

:param str kind: Gives a hint to static type checkers for what exact CodecContext is used.
Expand Down
90 changes: 35 additions & 55 deletions av/codec/context.pyi
Original file line number Diff line number Diff line change
@@ -1,8 +1,7 @@
from enum import Enum, Flag
from enum import Flag, IntEnum
from fractions import Fraction
from typing import ClassVar, Literal

from av.enum import EnumFlag, EnumItem
from av.packet import Packet

from .codec import Codec
Expand All @@ -15,38 +14,39 @@ class ThreadType(Flag):
def __get__(self, i: object | None, owner: type | None = None) -> ThreadType: ...
def __set__(self, instance: object, value: int | str | ThreadType) -> None: ...

class Flags(EnumFlag):
NONE: int
UNALIGNED: int
QSCALE: int
# 4MV
OUTPUT_CORRUPT: int
QPEL: int
DROPCHANGED: int
PASS1: int
PASS2: int
LOOP_FILTER: int
GRAY: int
PSNR: int
INTERLACED_DCT: int
LOW_DELAY: int
GLOBAL_HEADER: int
BITEXACT: int
AC_PRED: int
INTERLACED_ME: int
CLOSED_GOP: int
class Flags(IntEnum):
unaligned: int
qscale: int
four_mv: int
output_corrupt: int
qpel: int
drop_changed: int
recon_frame: int
copy_opaque: int
frame_duration: int
pass1: int
pass2: int
loop_filter: int
gray: int
psnr: int
interlaced_dct: int
low_delay: int
global_header: int
bitexact: int
ac_pred: int
interlaced_me: int
closed_gop: int

class Flags2(EnumFlag):
NONE: int
FAST: int
NO_OUTPUT: int
LOCAL_HEADER: int
CHUNKS: int
IGNORE_CROP: int
SHOW_ALL: int
EXPORT_MVS: int
SKIP_MANUAL: int
RO_FLUSH_NOOP: int
class Flags2(IntEnum):
fast: int
no_output: int
local_header: int
chunks: int
ignore_crop: int
show_all: int
export_mvs: int
skip_manual: int
ro_flush_noop: int

class CodecContext:
name: str
Expand All @@ -65,30 +65,10 @@ class CodecContext:
skip_frame: Literal[
"NONE", "DEFAULT", "NONREF", "BIDIR", "NONINTRA", "NONKEY", "ALL"
]

# flags
unaligned: bool
flags: int
qscale: bool
four_mv: bool
output_corrupt: bool
qpel: bool
drop_changed: bool
recon_frame: bool
copy_opaque: bool
frame_duration: bool
pass1: bool
pass2: bool
loop_filter: bool
gray: bool
psnr: bool
interlaced_dct: bool
low_delay: bool
global_header: bool
bitexact: bool
ac_pred: bool
interlaced_me: bool
closed_gop: bool

flags2: int
@property
def is_open(self) -> bool: ...
@property
Expand Down
179 changes: 79 additions & 100 deletions av/codec/context.pyx
Original file line number Diff line number Diff line change
Expand Up @@ -6,12 +6,11 @@ from libc.string cimport memcpy
from av.bytesource cimport ByteSource, bytesource
from av.codec.codec cimport Codec, wrap_codec
from av.dictionary cimport _Dictionary
from av.enum cimport define_enum
from av.error cimport err_check
from av.packet cimport Packet
from av.utils cimport avrational_to_fraction, to_avrational

from enum import Enum, Flag
from enum import Flag, IntEnum

from av.dictionary import Dictionary

Expand Down Expand Up @@ -47,65 +46,39 @@ class ThreadType(Flag):
SLICE: "Decode more than one part of a single frame at once" = lib.FF_THREAD_SLICE
AUTO: "Decode using both FRAME and SLICE methods." = lib.FF_THREAD_SLICE | lib.FF_THREAD_FRAME


Flags = define_enum("Flags", __name__, (
("NONE", 0),
("UNALIGNED", lib.AV_CODEC_FLAG_UNALIGNED,
"Allow decoders to produce frames with data planes that are not aligned to CPU requirements (e.g. due to cropping)."
),
("QSCALE", lib.AV_CODEC_FLAG_QSCALE, "Use fixed qscale."),
("4MV", lib.AV_CODEC_FLAG_4MV, "4 MV per MB allowed / advanced prediction for H.263."),
("OUTPUT_CORRUPT", lib.AV_CODEC_FLAG_OUTPUT_CORRUPT, "Output even those frames that might be corrupted."),
("QPEL", lib.AV_CODEC_FLAG_QPEL, "Use qpel MC."),
("DROPCHANGED", 1 << 5,
"Don't output frames whose parameters differ from first decoded frame in stream."
),
("RECON_FRAME", lib.AV_CODEC_FLAG_RECON_FRAME, "Request the encoder to output reconstructed frames, i.e. frames that would be produced by decoding the encoded bistream."),
("COPY_OPAQUE", lib.AV_CODEC_FLAG_COPY_OPAQUE,
"""Request the decoder to propagate each packet's AVPacket.opaque and AVPacket.opaque_ref
to its corresponding output AVFrame. Request the encoder to propagate each frame's
AVFrame.opaque and AVFrame.opaque_ref values to its corresponding output AVPacket."""),
("FRAME_DURATION", lib.AV_CODEC_FLAG_FRAME_DURATION,
"""Signal to the encoder that the values of AVFrame.duration are valid and should be
used (typically for transferring them to output packets)."""),
("PASS1", lib.AV_CODEC_FLAG_PASS1, "Use internal 2pass ratecontrol in first pass mode."),
("PASS2", lib.AV_CODEC_FLAG_PASS2, "Use internal 2pass ratecontrol in second pass mode."),
("LOOP_FILTER", lib.AV_CODEC_FLAG_LOOP_FILTER, "loop filter."),
("GRAY", lib.AV_CODEC_FLAG_GRAY, "Only decode/encode grayscale."),
("PSNR", lib.AV_CODEC_FLAG_PSNR, "error[?] variables will be set during encoding."),
("INTERLACED_DCT", lib.AV_CODEC_FLAG_INTERLACED_DCT, "Use interlaced DCT."),
("LOW_DELAY", lib.AV_CODEC_FLAG_LOW_DELAY, "Force low delay."),
("GLOBAL_HEADER", lib.AV_CODEC_FLAG_GLOBAL_HEADER,
"Place global headers in extradata instead of every keyframe."
),
("BITEXACT", lib.AV_CODEC_FLAG_BITEXACT, "Use only bitexact stuff (except (I)DCT)."),
("AC_PRED", lib.AV_CODEC_FLAG_AC_PRED, "H.263 advanced intra coding / MPEG-4 AC prediction"),
("INTERLACED_ME", lib.AV_CODEC_FLAG_INTERLACED_ME, "Interlaced motion estimation"),
("CLOSED_GOP", lib.AV_CODEC_FLAG_CLOSED_GOP),
), is_flags=True)

Flags2 = define_enum("Flags2", __name__, (
("NONE", 0),
("FAST", lib.AV_CODEC_FLAG2_FAST,
"""Allow non spec compliant speedup tricks."""),
("NO_OUTPUT", lib.AV_CODEC_FLAG2_NO_OUTPUT,
"""Skip bitstream encoding."""),
("LOCAL_HEADER", lib.AV_CODEC_FLAG2_LOCAL_HEADER,
"""Place global headers at every keyframe instead of in extradata."""),
("CHUNKS", lib.AV_CODEC_FLAG2_CHUNKS,
"""Input bitstream might be truncated at a packet boundaries
instead of only at frame boundaries."""),
("IGNORE_CROP", lib.AV_CODEC_FLAG2_IGNORE_CROP,
"""Discard cropping information from SPS."""),
("SHOW_ALL", lib.AV_CODEC_FLAG2_SHOW_ALL,
"""Show all frames before the first keyframe"""),
("EXPORT_MVS", lib.AV_CODEC_FLAG2_EXPORT_MVS,
"""Export motion vectors through frame side data"""),
("SKIP_MANUAL", lib.AV_CODEC_FLAG2_SKIP_MANUAL,
"""Do not skip samples and export skip information as frame side data"""),
("RO_FLUSH_NOOP", lib.AV_CODEC_FLAG2_RO_FLUSH_NOOP,
"""Do not reset ASS ReadOrder field on flush (subtitles decoding)"""),
), is_flags=True)
class Flags(IntEnum):
unaligned = lib.AV_CODEC_FLAG_UNALIGNED
qscale = lib.AV_CODEC_FLAG_QSCALE
four_mv = lib.AV_CODEC_FLAG_4MV
output_corrupt = lib.AV_CODEC_FLAG_OUTPUT_CORRUPT
qpel = lib.AV_CODEC_FLAG_QPEL
drop_changed = 1 << 5
recon_frame = lib.AV_CODEC_FLAG_RECON_FRAME
copy_opaque = lib.AV_CODEC_FLAG_COPY_OPAQUE
frame_duration = lib.AV_CODEC_FLAG_FRAME_DURATION
pass1 = lib.AV_CODEC_FLAG_PASS1
pass2 = lib.AV_CODEC_FLAG_PASS2
loop_filter = lib.AV_CODEC_FLAG_LOOP_FILTER
gray = lib.AV_CODEC_FLAG_GRAY
psnr = lib.AV_CODEC_FLAG_PSNR
interlaced_dct = lib.AV_CODEC_FLAG_INTERLACED_DCT
low_delay = lib.AV_CODEC_FLAG_LOW_DELAY
global_header = lib.AV_CODEC_FLAG_GLOBAL_HEADER
bitexact = lib.AV_CODEC_FLAG_BITEXACT
ac_pred = lib.AV_CODEC_FLAG_AC_PRED
interlaced_me = lib.AV_CODEC_FLAG_INTERLACED_ME
closed_gop = lib.AV_CODEC_FLAG_CLOSED_GOP

class Flags2(IntEnum):
fast = lib.AV_CODEC_FLAG2_FAST
no_output = lib.AV_CODEC_FLAG2_NO_OUTPUT
local_header = lib.AV_CODEC_FLAG2_LOCAL_HEADER
chunks = lib.AV_CODEC_FLAG2_CHUNKS
ignore_crop = lib.AV_CODEC_FLAG2_IGNORE_CROP
show_all = lib.AV_CODEC_FLAG2_SHOW_ALL
export_mvs = lib.AV_CODEC_FLAG2_EXPORT_MVS
skip_manual = lib.AV_CODEC_FLAG2_SKIP_MANUAL
ro_flush_noop = lib.AV_CODEC_FLAG2_RO_FLUSH_NOOP


cdef class CodecContext:
Expand Down Expand Up @@ -133,53 +106,59 @@ cdef class CodecContext:
self.ptr.thread_count = 0 # use as many threads as there are CPUs.
self.ptr.thread_type = 0x02 # thread within a frame. Does not change the API.

def _get_flags(self):
@property
def flags(self):
"""
Get and set the flags bitmask of CodecContext.

:rtype: int
"""
return self.ptr.flags

def _set_flags(self, value):
@flags.setter
def flags(self, int value):
self.ptr.flags = value

flags = Flags.property(_get_flags, _set_flags, "Flag property of :class:`.Flags`.")

unaligned = flags.flag_property("UNALIGNED")
qscale = flags.flag_property("QSCALE")
four_mv = flags.flag_property("4MV")
output_corrupt = flags.flag_property("OUTPUT_CORRUPT")
qpel = flags.flag_property("QPEL")
drop_changed = flags.flag_property("DROPCHANGED")
recon_frame = flags.flag_property("RECON_FRAME")
copy_opaque = flags.flag_property("COPY_OPAQUE")
frame_duration = flags.flag_property("FRAME_DURATION")
pass1 = flags.flag_property("PASS1")
pass2 = flags.flag_property("PASS2")
loop_filter = flags.flag_property("LOOP_FILTER")
gray = flags.flag_property("GRAY")
psnr = flags.flag_property("PSNR")
interlaced_dct = flags.flag_property("INTERLACED_DCT")
low_delay = flags.flag_property("LOW_DELAY")
global_header = flags.flag_property("GLOBAL_HEADER")
bitexact = flags.flag_property("BITEXACT")
ac_pred = flags.flag_property("AC_PRED")
interlaced_me = flags.flag_property("INTERLACED_ME")
closed_gop = flags.flag_property("CLOSED_GOP")

def _get_flags2(self):
@property
def qscale(self):
"""
Use fixed qscale.

:rtype: bool
"""
return bool(self.ptr.flags & lib.AV_CODEC_FLAG_QSCALE)

@qscale.setter
def qscale(self, value):
if value:
self.ptr.flags |= lib.AV_CODEC_FLAG_QSCALE
else:
self.ptr.flags &= ~lib.AV_CODEC_FLAG_QSCALE

@property
def copy_opaque(self):
return bool(self.ptr.flags & lib.AV_CODEC_FLAG_COPY_OPAQUE)

@copy_opaque.setter
def copy_opaque(self, value):
if value:
self.ptr.flags |= lib.AV_CODEC_FLAG_COPY_OPAQUE
else:
self.ptr.flags &= ~lib.AV_CODEC_FLAG_COPY_OPAQUE

@property
def flags2(self):
"""
Get and set the flags2 bitmask of CodecContext.

:rtype: int
"""
return self.ptr.flags2

def _set_flags2(self, value):
@flags2.setter
def flags2(self, int value):
self.ptr.flags2 = value

flags2 = Flags2.property(_get_flags2, _set_flags2, "Flag property of :class:`.Flags2`.")
fast = flags2.flag_property("FAST")
no_output = flags2.flag_property("NO_OUTPUT")
local_header = flags2.flag_property("LOCAL_HEADER")
chunks = flags2.flag_property("CHUNKS")
ignore_crop = flags2.flag_property("IGNORE_CROP")
show_all = flags2.flag_property("SHOW_ALL")
export_mvs = flags2.flag_property("EXPORT_MVS")
skip_manual = flags2.flag_property("SKIP_MANUAL")
ro_flush_noop = flags2.flag_property("RO_FLUSH_NOOP")

@property
def extradata(self):
if self.ptr is NULL:
Expand Down
40 changes: 0 additions & 40 deletions av/enum.pyx
Original file line number Diff line number Diff line change
Expand Up @@ -198,46 +198,6 @@ cdef class EnumItem:


cdef class EnumFlag(EnumItem):

"""
Flags are sets of boolean attributes, which the FFmpeg API represents as individual
bits in a larger integer which you manipulate with the bitwise operators.
We associate names with each flag that are easier to operate with.

Consider :data:`CodecContextFlags`, whis is the type of the :attr:`CodecContext.flags`
attribute, and the set of boolean properties::

>>> fh = av.open(video_path)
>>> cc = fh.streams.video[0].codec_context

>>> cc.flags
<av.codec.context.Flags:NONE(0x0)>

>>> # You can set flags via bitwise operations with the objects, names, or values:
>>> cc.flags |= cc.flags.OUTPUT_CORRUPT
>>> cc.flags |= 'GLOBAL_HEADER'
>>> cc.flags
<av.codec.context.Flags:OUTPUT_CORRUPT|GLOBAL_HEADER(0x400008)>

>>> # You can test flags via bitwise operations with objects, names, or values:
>>> bool(cc.flags & cc.flags.OUTPUT_CORRUPT)
True
>>> bool(cc.flags & 'QSCALE')
False

>>> # There are boolean properties for each flag:
>>> cc.output_corrupt
True
>>> cc.qscale
False

>>> # You can set them:
>>> cc.qscale = True
>>> cc.flags
<av.codec.context.Flags:QSCALE|OUTPUT_CORRUPT|GLOBAL_HEADER(0x40000a)>

"""

cdef readonly tuple flags

def __cinit__(self, sentinel, name, value, doc=None):
Expand Down
7 changes: 6 additions & 1 deletion tests/test_videoframe.py
Original file line number Diff line number Diff line change
Expand Up @@ -31,7 +31,12 @@ def assertPixelValue16(plane, expected, byteorder: str) -> None:
def test_opaque() -> None:
with av.open(fate_suite("h264/interlaced_crop.mp4")) as container:
video_stream = container.streams.video[0]
video_stream.codec_context.copy_opaque = True

ctx = video_stream.codec_context
ctx.flags |= av.codec.context.Flags.copy_opaque

assert video_stream.codec_context.copy_opaque

for packet_idx, packet in enumerate(container.demux()):
packet.opaque = (time.time(), packet_idx)
for frame in packet.decode():
Expand Down
Loading