415 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			415 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
# People's Video Editor: high quality, GPU accelerated mp4 editor
 | 
						|
# Copyright (C) 2025 Roz K <roz@rozk.net>
 | 
						|
#
 | 
						|
# This file is part of People's Video Editor.
 | 
						|
#
 | 
						|
# People's Video Editor is free software: you can redistribute it and/or modify it under the terms of the
 | 
						|
# GNU General Public License as published by the Free Software Foundation, either version 3 of the License,
 | 
						|
# or (at your option) any later version.
 | 
						|
#
 | 
						|
# People's Video Editor is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY;
 | 
						|
# without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
 | 
						|
# See the GNU General Public License for more details.
 | 
						|
#
 | 
						|
# You should have received a copy of the GNU General Public License along with People's Video Editor.
 | 
						|
# If not, see <https://www.gnu.org/licenses/>.
 | 
						|
 | 
						|
import errno
 | 
						|
import ctypes
 | 
						|
from pathlib import PurePath
 | 
						|
 | 
						|
shared_library_path = PurePath(__file__).parent
 | 
						|
 | 
						|
def load_shared_library(name):
 | 
						|
    path = str(shared_library_path / ("lib" + name  + ".so"))
 | 
						|
    return ctypes.cdll.LoadLibrary(path)
 | 
						|
 | 
						|
_avutil = load_shared_library("avutil")
 | 
						|
_avformat = load_shared_library("avformat")
 | 
						|
_avcodec = load_shared_library("avcodec")
 | 
						|
 | 
						|
def _errtag(a, b, c, d):
 | 
						|
    return -(ord(a) | (ord(b) << 8) | (ord(c) << 16) | (ord(d) << 24))
 | 
						|
 | 
						|
if errno.EAGAIN < 0:
 | 
						|
    AVERROR_EAGAIN = errno.EAGAIN
 | 
						|
else:
 | 
						|
    AVERROR_EAGAIN = -errno.EAGAIN
 | 
						|
 | 
						|
AVERROR_EOF = _errtag('E', 'O', 'F', ' ')
 | 
						|
 | 
						|
_AV_ERROR_MAX_STRING_SIZE = 64
 | 
						|
 | 
						|
AVMEDIA_TYPE_UNKNOWN = -1
 | 
						|
AVMEDIA_TYPE_VIDEO = 0
 | 
						|
AVMEDIA_TYPE_AUDIO = 1
 | 
						|
AVMEDIA_TYPE_DATA = 2
 | 
						|
AVMEDIA_TYPE_SUBTITLE = 3
 | 
						|
AVMEDIA_TYPE_ATTACHMENT = 4
 | 
						|
 | 
						|
AV_NUM_DATA_POINTERS = 8
 | 
						|
 | 
						|
FF_THREAD_FRAME = 1
 | 
						|
FF_THREAD_SLICE = 2
 | 
						|
 | 
						|
c_uint8_p = ctypes.POINTER(ctypes.c_uint8)
 | 
						|
c_uint8_pp = ctypes.POINTER(c_uint8_p)
 | 
						|
 | 
						|
class AVRational(ctypes.Structure):
 | 
						|
    _fields_ = [
 | 
						|
        ("num", ctypes.c_int),
 | 
						|
        ("den", ctypes.c_int)]
 | 
						|
 | 
						|
class AVFrame(ctypes.Structure):
 | 
						|
    _fields_ = [
 | 
						|
        ("data", c_uint8_p * AV_NUM_DATA_POINTERS),
 | 
						|
        ("linesize", ctypes.c_int * AV_NUM_DATA_POINTERS),
 | 
						|
        ("extended_data", c_uint8_pp),
 | 
						|
        ("width", ctypes.c_int),
 | 
						|
        ("height", ctypes.c_int),
 | 
						|
        ("nb_samples", ctypes.c_int),
 | 
						|
        ("format", ctypes.c_int),
 | 
						|
        ("key_frame", ctypes.c_int),
 | 
						|
        ("pict_type", ctypes.c_int),
 | 
						|
        ("sample_aspect_ratio", AVRational),
 | 
						|
        ("pts", ctypes.c_int64),
 | 
						|
        ("pkt_dts", ctypes.c_int64),
 | 
						|
        ("time_base", AVRational)]
 | 
						|
        # ...
 | 
						|
 | 
						|
AVFrame_p = ctypes.POINTER(AVFrame)
 | 
						|
AVFrame_pp = ctypes.POINTER(AVFrame_p)
 | 
						|
 | 
						|
class AVCodecParameters(ctypes.Structure):
 | 
						|
    pass
 | 
						|
 | 
						|
AVCodecParameters_p = ctypes.POINTER(AVCodecParameters)
 | 
						|
 | 
						|
class AVStream(ctypes.Structure):
 | 
						|
    _fields_ = [
 | 
						|
        ("av_class", ctypes.c_void_p),
 | 
						|
        ("index", ctypes.c_int),
 | 
						|
        ("id", ctypes.c_int),
 | 
						|
        ("codecpar", AVCodecParameters_p),
 | 
						|
        ("priv_data", ctypes.c_void_p),
 | 
						|
        ("time_base", AVRational)]
 | 
						|
        # ...
 | 
						|
 | 
						|
AVStream_p = ctypes.POINTER(AVStream)
 | 
						|
AVStream_pp = ctypes.POINTER(AVStream_p)
 | 
						|
 | 
						|
class AVFormatContext(ctypes.Structure):
 | 
						|
    _fields_ = [
 | 
						|
        ("av_class", ctypes.c_void_p),
 | 
						|
        ("iformat", ctypes.c_void_p),
 | 
						|
        ("oformat", ctypes.c_void_p),
 | 
						|
        ("priv_data", ctypes.c_void_p),
 | 
						|
        ("pb", ctypes.c_void_p),
 | 
						|
        ("ctx_flags", ctypes.c_int),
 | 
						|
        ("nb_streams", ctypes.c_uint),
 | 
						|
        ("streams", AVStream_pp)]
 | 
						|
        # ...
 | 
						|
 | 
						|
AVFormatContext_p = ctypes.POINTER(AVFormatContext)
 | 
						|
AVFormatContext_pp = ctypes.POINTER(AVFormatContext_p)
 | 
						|
 | 
						|
class AVPacket(ctypes.Structure):
 | 
						|
    _fields_ = [
 | 
						|
        ("buf", ctypes.c_void_p),
 | 
						|
        ("pts", ctypes.c_int64),
 | 
						|
        ("dts", ctypes.c_int64),
 | 
						|
        ("data", ctypes.c_void_p),
 | 
						|
        ("size", ctypes.c_int),
 | 
						|
        ("stream_index", ctypes.c_int)]
 | 
						|
        # ...
 | 
						|
 | 
						|
AVPacket_p = ctypes.POINTER(AVPacket)
 | 
						|
AVPacket_pp = ctypes.POINTER(AVPacket_p)
 | 
						|
 | 
						|
class AVCodec(ctypes.Structure):
 | 
						|
    _fields_ = [
 | 
						|
        ("name", ctypes.c_char_p),
 | 
						|
        ("long_name", ctypes.c_char_p),
 | 
						|
        ("type", ctypes.c_int), # AVMediaType
 | 
						|
        ("id", ctypes.c_int), # AVCodecID
 | 
						|
        ("capabilities", ctypes.c_int), # AV_CODEC_CAP_*
 | 
						|
        ("max_lowres", ctypes.c_uint8),
 | 
						|
        ("deprecated_supported_framerates", ctypes.c_void_p),
 | 
						|
        ("deprecated_pix_fmts", ctypes.c_void_p),
 | 
						|
        ("deprecated_supported_samplerates", ctypes.c_void_p),
 | 
						|
        ("deprecated_sample_fmts", ctypes.c_void_p),
 | 
						|
        ("priv_class", ctypes.c_void_p),
 | 
						|
        ("profiles", ctypes.c_void_p), # AVProfile
 | 
						|
        ("wrapper_name", ctypes.c_char_p)]
 | 
						|
        # ...
 | 
						|
 | 
						|
AVCodec_p = ctypes.POINTER(AVCodec)
 | 
						|
AVCodec_pp = ctypes.POINTER(AVCodec_p)
 | 
						|
 | 
						|
class AVChannelLayout_u(ctypes.Union):
 | 
						|
    _fields_ = [
 | 
						|
        ("mask", ctypes.c_uint64),
 | 
						|
        ("map", ctypes.c_void_p)] # AVChannelCustom
 | 
						|
 | 
						|
class AVChannelLayout(ctypes.Structure):
 | 
						|
    _fields_ = [
 | 
						|
        ("order", ctypes.c_int), # AVChannelOrder
 | 
						|
        ("nb_channels", ctypes.c_int),
 | 
						|
        ("u", AVChannelLayout_u),
 | 
						|
        ("opaque", ctypes.c_void_p)]
 | 
						|
 | 
						|
class AVCodecContext(ctypes.Structure):
 | 
						|
    _fields_ = [
 | 
						|
    ("av_class", ctypes.c_void_p),
 | 
						|
    ("log_level_offset", ctypes.c_int),
 | 
						|
    ("codec_type", ctypes.c_int),
 | 
						|
    ("codec", AVCodec_p),
 | 
						|
    ("codec_id", ctypes.c_int),
 | 
						|
    ("codec_tag", ctypes.c_uint),
 | 
						|
    ("priv_data", ctypes.c_void_p),
 | 
						|
    ("internal", ctypes.c_void_p), # AVCodecInternal
 | 
						|
    ("opaque", ctypes.c_void_p),
 | 
						|
    ("bit_rate", ctypes.c_int64),
 | 
						|
    ("flags", ctypes.c_int),
 | 
						|
    ("flags2", ctypes.c_int),
 | 
						|
    ("extradata", ctypes.POINTER(ctypes.c_uint8)),
 | 
						|
    ("extradata_size", ctypes.c_int),
 | 
						|
    ("time_base", AVRational),
 | 
						|
    ("pkt_timebase", AVRational),
 | 
						|
    ("framerate", AVRational),
 | 
						|
    ("delay", ctypes.c_int),
 | 
						|
    ("width", ctypes.c_int),
 | 
						|
    ("height", ctypes.c_int),
 | 
						|
    ("coded_width", ctypes.c_int),
 | 
						|
    ("coded_height", ctypes.c_int),
 | 
						|
    ("sample_aspect_ratio", AVRational),
 | 
						|
    ("pix_fmt", ctypes.c_int), # AVPixelFormat
 | 
						|
    ("sw_pix_fmt", ctypes.c_int), # AVPixelFormat
 | 
						|
    ("color_primaries", ctypes.c_int), # AVColorPrimaries
 | 
						|
    ("color_trc", ctypes.c_int), # AVColorTransferCharacteristic
 | 
						|
    ("colorspace", ctypes.c_int), # AVColorSpace
 | 
						|
    ("color_range", ctypes.c_int), # AVColorRange
 | 
						|
    ("chroma_sample_location", ctypes.c_int), # AVChromaLocation
 | 
						|
    ("field_order", ctypes.c_int), # AVFieldOrder
 | 
						|
    ("refs", ctypes.c_int),
 | 
						|
    ("has_b_frames", ctypes.c_int),
 | 
						|
    ("slice_flags", ctypes.c_int),
 | 
						|
    ("draw_horiz_band", ctypes.c_void_p),
 | 
						|
    ("get_format", ctypes.c_void_p),
 | 
						|
    ("max_b_frames", ctypes.c_int),
 | 
						|
    ("b_quant_factor", ctypes.c_float),
 | 
						|
    ("b_quant_offset", ctypes.c_float),
 | 
						|
    ("i_quant_factor", ctypes.c_float),
 | 
						|
    ("i_quant_offset", ctypes.c_float),
 | 
						|
    ("lumi_masking", ctypes.c_float),
 | 
						|
    ("temporal_cplx_masking", ctypes.c_float),
 | 
						|
    ("spatial_cplx_masking", ctypes.c_float),
 | 
						|
    ("p_masking", ctypes.c_float),
 | 
						|
    ("dark_masking", ctypes.c_float),
 | 
						|
    ("nsse_weight", ctypes.c_int),
 | 
						|
    ("me_cmp", ctypes.c_int),
 | 
						|
    ("me_sub_cmp", ctypes.c_int),
 | 
						|
    ("mb_cmp", ctypes.c_int),
 | 
						|
    ("ildct_cmp", ctypes.c_int),
 | 
						|
    ("dia_size", ctypes.c_int),
 | 
						|
    ("last_predictor_count", ctypes.c_int),
 | 
						|
    ("me_pre_cmp", ctypes.c_int),
 | 
						|
    ("pre_dia_size", ctypes.c_int),
 | 
						|
    ("me_subpel_quality", ctypes.c_int),
 | 
						|
    ("me_range", ctypes.c_int),
 | 
						|
    ("mb_decision", ctypes.c_int),
 | 
						|
    ("intra_matrix", ctypes.POINTER(ctypes.c_uint16)),
 | 
						|
    ("inter_matrix", ctypes.POINTER(ctypes.c_uint16)),
 | 
						|
    ("chroma_intra_matrix", ctypes.POINTER(ctypes.c_uint16)),
 | 
						|
    ("intra_dc_precision", ctypes.c_int),
 | 
						|
    ("mb_lmin", ctypes.c_int),
 | 
						|
    ("mb_lmax", ctypes.c_int),
 | 
						|
    ("bidir_refine", ctypes.c_int),
 | 
						|
    ("keyint_min", ctypes.c_int),
 | 
						|
    ("gop_size", ctypes.c_int),
 | 
						|
    ("mv0_threshold", ctypes.c_int),
 | 
						|
    ("slices", ctypes.c_int),
 | 
						|
    ("sample_rate", ctypes.c_int),
 | 
						|
    ("sample_fmt", ctypes.c_int), # AVSampleFormat
 | 
						|
    ("ch_layout", AVChannelLayout),
 | 
						|
    ("frame_size", ctypes.c_int),
 | 
						|
    ("block_align", ctypes.c_int),
 | 
						|
    ("cutoff", ctypes.c_int),
 | 
						|
    ("audio_service_type", ctypes.c_int), # AVAudioServiceType
 | 
						|
    ("request_sample_fmt", ctypes.c_int), # AVSampleFormat
 | 
						|
    ("initial_padding", ctypes.c_int),
 | 
						|
    ("trailing_padding", ctypes.c_int),
 | 
						|
    ("seek_preroll", ctypes.c_int),
 | 
						|
    ("get_buffer2", ctypes.c_void_p),
 | 
						|
    ("bit_rate_tolerance", ctypes.c_int),
 | 
						|
    ("global_quality", ctypes.c_int),
 | 
						|
    ("compression_level", ctypes.c_int),
 | 
						|
    ("qcompress", ctypes.c_float),
 | 
						|
    ("qblur", ctypes.c_float),
 | 
						|
    ("qmin", ctypes.c_int),
 | 
						|
    ("qmax", ctypes.c_int),
 | 
						|
    ("max_qdiff", ctypes.c_int),
 | 
						|
    ("rc_buffer_size", ctypes.c_int),
 | 
						|
    ("rc_override_count", ctypes.c_int),
 | 
						|
    ("rc_override", ctypes.c_void_p), # RcOverride
 | 
						|
    ("rc_max_rate", ctypes.c_int64),
 | 
						|
    ("rc_min_rate", ctypes.c_int64),
 | 
						|
    ("rc_max_available_vbv_use", ctypes.c_float),
 | 
						|
    ("rc_min_vbv_overflow_use", ctypes.c_float),
 | 
						|
    ("rc_initial_buffer_occupancy", ctypes.c_int),
 | 
						|
    ("trellis", ctypes.c_int),
 | 
						|
    ("stats_out", ctypes.c_char_p),
 | 
						|
    ("stats_in", ctypes.c_char_p),
 | 
						|
    ("workaround_bugs", ctypes.c_int),
 | 
						|
    ("strict_std_compliance", ctypes.c_int),
 | 
						|
    ("error_concealment", ctypes.c_int),
 | 
						|
    ("debug", ctypes.c_int),
 | 
						|
    ("err_recognition", ctypes.c_int),
 | 
						|
    ("hwaccel", ctypes.c_void_p), # AVHWAccel
 | 
						|
    ("hwaccel_context", ctypes.c_void_p),
 | 
						|
    ("hw_frames_ctx", ctypes.c_void_p), # AVBufferRef
 | 
						|
    ("hw_device_ctx", ctypes.c_void_p), # AVBufferRef
 | 
						|
    ("hwaccel_flags", ctypes.c_int),
 | 
						|
    ("extra_hw_frames", ctypes.c_int),
 | 
						|
    ("error", ctypes.c_uint64 * AV_NUM_DATA_POINTERS),
 | 
						|
    ("dct_algo", ctypes.c_int),
 | 
						|
    ("idct_algo", ctypes.c_int),
 | 
						|
    ("bits_per_coded_sample", ctypes.c_int),
 | 
						|
    ("bits_per_raw_sample", ctypes.c_int),
 | 
						|
    ("thread_count", ctypes.c_int),
 | 
						|
    ("thread_type", ctypes.c_int)]
 | 
						|
    # ...
 | 
						|
 | 
						|
AVCodecContext_p = ctypes.POINTER(AVCodecContext)
 | 
						|
AVCodecContext_pp = ctypes.POINTER(AVCodecContext_p)
 | 
						|
 | 
						|
_avutil.av_strerror.restype = ctypes.c_int
 | 
						|
_avutil.av_strerror.argtypes = [
 | 
						|
    ctypes.c_int, # errno
 | 
						|
    ctypes.c_char_p, # errbuf
 | 
						|
    ctypes.c_size_t] # errbuff_size
 | 
						|
 | 
						|
def strerror(errno):
 | 
						|
    errbuf = ctypes.create_string_buffer(_AV_ERROR_MAX_STRING_SIZE)
 | 
						|
    _avutil.av_strerror(errno, errbuf, _AV_ERROR_MAX_STRING_SIZE)
 | 
						|
    return errbuf.value.decode("utf-8")
 | 
						|
 | 
						|
_avutil.av_frame_alloc.restype = AVFrame_p
 | 
						|
_avutil.av_frame_alloc.argtypes = None
 | 
						|
 | 
						|
def frame_alloc():
 | 
						|
    return _avutil.av_frame_alloc()
 | 
						|
 | 
						|
_avutil.av_frame_free.restype = None
 | 
						|
_avutil.av_frame_free.argtypes = [AVFrame_pp]
 | 
						|
 | 
						|
def frame_free(frame):
 | 
						|
    _avutil.av_frame_free(ctypes.byref(frame))
 | 
						|
 | 
						|
_avformat.avformat_alloc_context.restype = AVFormatContext_p
 | 
						|
_avformat.avformat_alloc_context.argtypes = None
 | 
						|
 | 
						|
def format_alloc_context():
 | 
						|
    return _avformat.avformat_alloc_context()
 | 
						|
 | 
						|
_avformat.avformat_free_context.restype = None
 | 
						|
_avformat.avformat_free_context.argtypes = [AVFormatContext_p]
 | 
						|
 | 
						|
def format_free_context(context):
 | 
						|
    _avformat.avformat_free_context(context)
 | 
						|
 | 
						|
_avformat.avformat_open_input.restype = ctypes.c_int
 | 
						|
_avformat.avformat_open_input.argtypes = [
 | 
						|
    AVFormatContext_pp,
 | 
						|
    ctypes.c_char_p, # url
 | 
						|
    ctypes.c_void_p, # format
 | 
						|
    ctypes.POINTER(ctypes.c_void_p)] # options
 | 
						|
 | 
						|
def format_open_input(context, url):
 | 
						|
    return _avformat.avformat_open_input(ctypes.byref(context), url.encode('ascii', 'ignore'), None, None)
 | 
						|
 | 
						|
_avformat.avformat_close_input.restype = None
 | 
						|
_avformat.avformat_close_input.argtypes = [AVFormatContext_pp]
 | 
						|
 | 
						|
def format_close_input(context):
 | 
						|
    _avformat.avformat_close_input(ctypes.byref(context))
 | 
						|
 | 
						|
_avformat.avformat_find_stream_info.restype = ctypes.c_int
 | 
						|
_avformat.avformat_find_stream_info.argtypes = [
 | 
						|
    AVFormatContext_p,
 | 
						|
    ctypes.POINTER(ctypes.c_void_p)] # options
 | 
						|
 | 
						|
def format_find_stream_info(context):
 | 
						|
    return _avformat.avformat_find_stream_info(context, None)
 | 
						|
 | 
						|
_avformat.av_find_best_stream.restype = ctypes.c_int
 | 
						|
_avformat.av_find_best_stream.argtypes = [
 | 
						|
    AVFormatContext_p,
 | 
						|
    ctypes.c_int, # type
 | 
						|
    ctypes.c_int, # wanted stream
 | 
						|
    ctypes.c_int, # related stream
 | 
						|
    AVCodec_pp,
 | 
						|
    ctypes.c_int] # flags
 | 
						|
 | 
						|
def format_find_best_stream(context, type):
 | 
						|
    codec = AVCodec_p()
 | 
						|
    index = _avformat.av_find_best_stream(context, type, -1, -1, ctypes.byref(codec), 0)
 | 
						|
    return index, codec
 | 
						|
 | 
						|
_avformat.av_packet_alloc.restype = AVPacket_p
 | 
						|
_avformat.av_packet_alloc.argtypes = None
 | 
						|
 | 
						|
def packet_alloc():
 | 
						|
    return _avformat.av_packet_alloc()
 | 
						|
 | 
						|
_avformat.av_packet_free.restype = None
 | 
						|
_avformat.av_packet_free.argtypes = [AVPacket_pp]
 | 
						|
 | 
						|
def packet_free(packet):
 | 
						|
    _avformat.av_packet_free(ctypes.byref(packet))
 | 
						|
 | 
						|
_avformat.av_read_frame.restype = ctypes.c_int
 | 
						|
_avformat.av_read_frame.argtypes = [AVFormatContext_p, AVPacket_p]
 | 
						|
 | 
						|
def read_frame(context, packet):
 | 
						|
    return _avformat.av_read_frame(context, packet)
 | 
						|
 | 
						|
_avcodec.avcodec_alloc_context3.restype = AVCodecContext_p
 | 
						|
_avcodec.avcodec_alloc_context3.argtypes = [AVCodec_p]
 | 
						|
 | 
						|
def codec_alloc_context(codec):
 | 
						|
    return _avcodec.avcodec_alloc_context3(codec)
 | 
						|
 | 
						|
_avcodec.avcodec_free_context.restype = None
 | 
						|
_avcodec.avcodec_free_context.argtypes = [AVCodecContext_pp]
 | 
						|
 | 
						|
def codec_free_context(context):
 | 
						|
    _avcodec.avcodec_free_context(ctypes.byref(context))
 | 
						|
 | 
						|
_avcodec.avcodec_parameters_to_context.restype = ctypes.c_int
 | 
						|
_avcodec.avcodec_parameters_to_context.argtypes = [AVCodecContext_p, AVCodecParameters_p]
 | 
						|
 | 
						|
def codec_parameters_to_context(context, parameters):
 | 
						|
    return _avcodec.avcodec_parameters_to_context(context, parameters)
 | 
						|
 | 
						|
_avcodec.avcodec_open2.restype = ctypes.c_int
 | 
						|
_avcodec.avcodec_open2.argtypes = [
 | 
						|
    AVCodecContext_p,
 | 
						|
    AVCodec_p,
 | 
						|
    ctypes.POINTER(ctypes.c_void_p)] # options
 | 
						|
 | 
						|
def codec_open(context, codec):
 | 
						|
    return _avcodec.avcodec_open2(context, codec, None)
 | 
						|
 | 
						|
_avcodec.avcodec_send_packet.restype = ctypes.c_int
 | 
						|
_avcodec.avcodec_send_packet.argtypes = [AVCodecContext_p, AVPacket_p]
 | 
						|
 | 
						|
def codec_send_packet(context, packet):
 | 
						|
    return _avcodec.avcodec_send_packet(context, packet)
 | 
						|
 | 
						|
_avcodec.avcodec_receive_frame.restype = ctypes.c_int
 | 
						|
_avcodec.avcodec_receive_frame.argtypes = [AVCodecContext_p, AVFrame_p]
 | 
						|
 | 
						|
def codec_receive_frame(context, frame):
 | 
						|
    return _avcodec.avcodec_receive_frame(context, frame)
 |