/* SPDX-License-Identifier: GPL-2.0-or-later * Partial Copyright 2006 Peter Schlaile. */ /** \file * \ingroup bke */ #ifdef WITH_FFMPEG # include # include # include # include "MEM_guardedalloc.h" # include "DNA_scene_types.h" # include "BLI_blenlib.h" # ifdef WITH_AUDASPACE # include # include # endif # include "BLI_endian_defines.h" # include "BLI_math_base.h" # include "BLI_threads.h" # include "BLI_utildefines.h" # include "BKE_global.h" # include "BKE_idprop.h" # include "BKE_image.h" # include "BKE_lib_id.h" # include "BKE_main.h" # include "BKE_report.h" # include "BKE_sound.h" # include "BKE_writeffmpeg.h" # include "IMB_imbuf.h" /* This needs to be included after BLI_math_base.h otherwise it will redefine some math defines * like M_SQRT1_2 leading to warnings with MSVC */ # include # include # include # include # include # include # include # include # include "ffmpeg_compat.h" struct StampData; typedef struct FFMpegContext { int ffmpeg_type; int ffmpeg_codec; int ffmpeg_audio_codec; int ffmpeg_video_bitrate; int ffmpeg_audio_bitrate; int ffmpeg_gop_size; int ffmpeg_max_b_frames; int ffmpeg_autosplit; int ffmpeg_autosplit_count; bool ffmpeg_preview; int ffmpeg_crf; /* set to 0 to not use CRF mode; we have another flag for lossless anyway. */ int ffmpeg_preset; /* see eFFMpegPreset */ AVFormatContext *outfile; AVCodecContext *video_codec; AVCodecContext *audio_codec; AVStream *video_stream; AVStream *audio_stream; AVFrame *current_frame; /* Image frame in output pixel format. */ int video_time; /* Image frame in Blender's own pixel format, may need conversion to the output pixel format. */ AVFrame *img_convert_frame; struct SwsContext *img_convert_ctx; uint8_t *audio_input_buffer; uint8_t *audio_deinterleave_buffer; int audio_input_samples; double audio_time; double audio_time_total; bool audio_deinterleave; int audio_sample_size; struct StampData *stamp_data; # ifdef WITH_AUDASPACE AUD_Device *audio_mixdown_device; # endif } FFMpegContext; # define FFMPEG_AUTOSPLIT_SIZE 2000000000 # define PRINT \ if (G.debug & G_DEBUG_FFMPEG) \ printf static void ffmpeg_dict_set_int(AVDictionary **dict, const char *key, int value); static void ffmpeg_filepath_get(FFMpegContext *context, char *string, const struct RenderData *rd, bool preview, const char *suffix); /* Delete a picture buffer */ static void delete_picture(AVFrame *f) { if (f) { if (f->data[0]) { MEM_freeN(f->data[0]); } av_free(f); } } static int request_float_audio_buffer(int codec_id) { /* If any of these codecs, we prefer the float sample format (if supported) */ return codec_id == AV_CODEC_ID_AAC || codec_id == AV_CODEC_ID_AC3 || codec_id == AV_CODEC_ID_VORBIS; } # ifdef WITH_AUDASPACE static int write_audio_frame(FFMpegContext *context) { AVFrame *frame = NULL; AVCodecContext *c = context->audio_codec; AUD_Device_read( context->audio_mixdown_device, context->audio_input_buffer, context->audio_input_samples); frame = av_frame_alloc(); frame->pts = context->audio_time / av_q2d(c->time_base); frame->nb_samples = context->audio_input_samples; frame->format = c->sample_fmt; av_channel_layout_copy(&frame->ch_layout, &c->ch_layout); if (context->audio_deinterleave) { int channel, i; uint8_t *temp; for (channel = 0; channel < c->ch_layout.nb_channels; channel++) { for (i = 0; i < frame->nb_samples; i++) { memcpy(context->audio_deinterleave_buffer + (i + channel * frame->nb_samples) * context->audio_sample_size, context->audio_input_buffer + (c->ch_layout.nb_channels * i + channel) * context->audio_sample_size, context->audio_sample_size); } } temp = context->audio_deinterleave_buffer; context->audio_deinterleave_buffer = context->audio_input_buffer; context->audio_input_buffer = temp; } avcodec_fill_audio_frame(frame, c->ch_layout.nb_channels, c->sample_fmt, context->audio_input_buffer, context->audio_input_samples * c->ch_layout.nb_channels * context->audio_sample_size, 1); int success = 1; int ret = avcodec_send_frame(c, frame); if (ret < 0) { /* Can't send frame to encoder. This shouldn't happen. */ fprintf(stderr, "Can't send audio frame: %s\n", av_err2str(ret)); success = -1; } AVPacket *pkt = av_packet_alloc(); while (ret >= 0) { ret = avcodec_receive_packet(c, pkt); if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) { break; } if (ret < 0) { fprintf(stderr, "Error encoding audio frame: %s\n", av_err2str(ret)); success = -1; } pkt->stream_index = context->audio_stream->index; av_packet_rescale_ts(pkt, c->time_base, context->audio_stream->time_base); # ifdef FFMPEG_USE_DURATION_WORKAROUND my_guess_pkt_duration(context->outfile, context->audio_stream, pkt); # endif pkt->flags |= AV_PKT_FLAG_KEY; int write_ret = av_interleaved_write_frame(context->outfile, pkt); if (write_ret != 0) { fprintf(stderr, "Error writing audio packet: %s\n", av_err2str(write_ret)); success = -1; break; } } av_packet_free(&pkt); av_frame_free(&frame); return success; } # endif /* #ifdef WITH_AUDASPACE */ /* Allocate a temporary frame */ static AVFrame *alloc_picture(int pix_fmt, int width, int height) { AVFrame *f; uint8_t *buf; int size; /* allocate space for the struct */ f = av_frame_alloc(); if (!f) { return NULL; } size = av_image_get_buffer_size(pix_fmt, width, height, 1); /* allocate the actual picture buffer */ buf = MEM_mallocN(size, "AVFrame buffer"); if (!buf) { free(f); return NULL; } av_image_fill_arrays(f->data, f->linesize, buf, pix_fmt, width, height, 1); f->format = pix_fmt; f->width = width; f->height = height; return f; } /* Get the correct file extensions for the requested format, * first is always desired guess_format parameter */ static const char **get_file_extensions(int format) { switch (format) { case FFMPEG_DV: { static const char *rv[] = {".dv", NULL}; return rv; } case FFMPEG_MPEG1: { static const char *rv[] = {".mpg", ".mpeg", NULL}; return rv; } case FFMPEG_MPEG2: { static const char *rv[] = {".dvd", ".vob", ".mpg", ".mpeg", NULL}; return rv; } case FFMPEG_MPEG4: { static const char *rv[] = {".mp4", ".mpg", ".mpeg", NULL}; return rv; } case FFMPEG_AVI: { static const char *rv[] = {".avi", NULL}; return rv; } case FFMPEG_MOV: { static const char *rv[] = {".mov", NULL}; return rv; } case FFMPEG_H264: { /* FIXME: avi for now... */ static const char *rv[] = {".avi", NULL}; return rv; } case FFMPEG_XVID: { /* FIXME: avi for now... */ static const char *rv[] = {".avi", NULL}; return rv; } case FFMPEG_FLV: { static const char *rv[] = {".flv", NULL}; return rv; } case FFMPEG_MKV: { static const char *rv[] = {".mkv", NULL}; return rv; } case FFMPEG_OGG: { static const char *rv[] = {".ogv", ".ogg", NULL}; return rv; } case FFMPEG_WEBM: { static const char *rv[] = {".webm", NULL}; return rv; } case FFMPEG_AV1: { static const char *rv[] = {".mp4", ".mkv", NULL}; return rv; } default: return NULL; } } /* Write a frame to the output file */ static int write_video_frame(FFMpegContext *context, AVFrame *frame, ReportList *reports) { int ret, success = 1; AVPacket *packet = av_packet_alloc(); AVCodecContext *c = context->video_codec; frame->pts = context->video_time; context->video_time++; ret = avcodec_send_frame(c, frame); if (ret < 0) { /* Can't send frame to encoder. This shouldn't happen. */ fprintf(stderr, "Can't send video frame: %s\n", av_err2str(ret)); success = -1; } while (ret >= 0) { ret = avcodec_receive_packet(c, packet); if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) { /* No more packets available. */ break; } if (ret < 0) { fprintf(stderr, "Error encoding frame: %s\n", av_err2str(ret)); break; } packet->stream_index = context->video_stream->index; av_packet_rescale_ts(packet, c->time_base, context->video_stream->time_base); # ifdef FFMPEG_USE_DURATION_WORKAROUND my_guess_pkt_duration(context->outfile, context->video_stream, packet); # endif if (av_interleaved_write_frame(context->outfile, packet) != 0) { success = -1; break; } } if (!success) { BKE_report(reports, RPT_ERROR, "Error writing frame"); PRINT("Error writing frame: %s\n", av_err2str(ret)); } av_packet_free(&packet); return success; } /* read and encode a frame of video from the buffer */ static AVFrame *generate_video_frame(FFMpegContext *context, const uint8_t *pixels) { AVCodecParameters *codec = context->video_stream->codecpar; int height = codec->height; AVFrame *rgb_frame; if (context->img_convert_frame != NULL) { /* Pixel format conversion is needed. */ rgb_frame = context->img_convert_frame; } else { /* The output pixel format is Blender's internal pixel format. */ rgb_frame = context->current_frame; } /* Copy the Blender pixels into the FFmpeg datastructure, taking care of endianness and flipping * the image vertically. */ int linesize = rgb_frame->linesize[0]; for (int y = 0; y < height; y++) { uint8_t *target = rgb_frame->data[0] + linesize * (height - y - 1); const uint8_t *src = pixels + linesize * y; # if ENDIAN_ORDER == L_ENDIAN memcpy(target, src, linesize); # elif ENDIAN_ORDER == B_ENDIAN const uint8_t *end = src + linesize; while (src != end) { target[3] = src[0]; target[2] = src[1]; target[1] = src[2]; target[0] = src[3]; target += 4; src += 4; } # else # error ENDIAN_ORDER should either be L_ENDIAN or B_ENDIAN. # endif } /* Convert to the output pixel format, if it's different that Blender's internal one. */ if (context->img_convert_frame != NULL) { BLI_assert(context->img_convert_ctx != NULL); sws_scale(context->img_convert_ctx, (const uint8_t *const *)rgb_frame->data, rgb_frame->linesize, 0, codec->height, context->current_frame->data, context->current_frame->linesize); } return context->current_frame; } static AVRational calc_time_base(uint den, double num, int codec_id) { /* Convert the input 'num' to an integer. Simply shift the decimal places until we get an integer * (within a floating point error range). * For example if we have `den = 3` and `num = 0.1` then the fps is: `den/num = 30` fps. * When converting this to a FFMPEG time base, we want num to be an integer. * So we simply move the decimal places of both numbers. i.e. `den = 30`, `num = 1`. */ float eps = FLT_EPSILON; const uint DENUM_MAX = (codec_id == AV_CODEC_ID_MPEG4) ? (1UL << 16) - 1 : (1UL << 31) - 1; /* Calculate the precision of the initial floating point number. */ if (num > 1.0) { const uint num_integer_bits = log2_floor_u((uint)num); /* Formula for calculating the epsilon value: (power of two range) / (pow mantissa bits) * For example, a float has 23 mantissa bits and the float value 3.5f as a pow2 range of * (4-2=2): * (2) / pow2(23) = floating point precision for 3.5f */ eps = (float)(1 << num_integer_bits) * FLT_EPSILON; } /* Calculate how many decimal shifts we can do until we run out of precision. */ const int max_num_shift = fabsf(log10f(eps)); /* Calculate how many times we can shift the denominator. */ const int max_den_shift = log10f(DENUM_MAX) - log10f(den); const int max_iter = min_ii(max_num_shift, max_den_shift); for (int i = 0; i < max_iter && fabs(num - round(num)) > eps; i++) { /* Increase the number and denominator until both are integers. */ num *= 10; den *= 10; eps *= 10; } AVRational time_base; time_base.den = den; time_base.num = (int)num; return time_base; } static const AVCodec *get_av1_encoder( FFMpegContext *context, RenderData *rd, AVDictionary **opts, int rectx, int recty) { /* There are three possible encoders for AV1: libaom-av1, librav1e, and libsvtav1. librav1e tends * to give the best compression quality while libsvtav1 tends to be the fastest encoder. One of * each will be picked based on the preset setting, and if a particular encoder is not available, * then use the default returned by FFMpeg. */ const AVCodec *codec = NULL; switch (context->ffmpeg_preset) { case FFM_PRESET_BEST: /* Default to libaom-av1 for BEST preset due to it performing better than rav1e in terms of * video quality (VMAF scores). Fallback to rav1e if libaom-av1 isn't available. */ codec = avcodec_find_encoder_by_name("libaom-av1"); if (!codec) { codec = avcodec_find_encoder_by_name("librav1e"); } break; case FFM_PRESET_REALTIME: codec = avcodec_find_encoder_by_name("libsvtav1"); break; case FFM_PRESET_GOOD: default: codec = avcodec_find_encoder_by_name("libaom-av1"); break; } /* Use the default AV1 encoder if the specified encoder wasn't found. */ if (!codec) { codec = avcodec_find_encoder(AV_CODEC_ID_AV1); } /* Apply AV1 encoder specific settings. */ if (codec) { if (STREQ(codec->name, "librav1e")) { /* Set "tiles" to 8 to enable multi-threaded encoding. */ if (rd->threads > 8) { ffmpeg_dict_set_int(opts, "tiles", rd->threads); } else { ffmpeg_dict_set_int(opts, "tiles", 8); } /* Use a reasonable speed setting based on preset. Speed ranges from 0-10. * Must check context->ffmpeg_preset again in case this encoder was selected due to the * absence of another. */ switch (context->ffmpeg_preset) { case FFM_PRESET_BEST: ffmpeg_dict_set_int(opts, "speed", 4); break; case FFM_PRESET_REALTIME: ffmpeg_dict_set_int(opts, "speed", 10); break; case FFM_PRESET_GOOD: default: ffmpeg_dict_set_int(opts, "speed", 6); break; } if (context->ffmpeg_crf >= 0) { /* librav1e does not use -crf, but uses -qp in the range of 0-255. Calculates the roughly * equivalent float, and truncates it to an integer. */ unsigned int qp_value = ((float)context->ffmpeg_crf) * 255.0F / 51.0F; if (qp_value > 255) { qp_value = 255; } ffmpeg_dict_set_int(opts, "qp", qp_value); } /* Set gop_size as rav1e's "--keyint". */ char buffer[64]; BLI_snprintf(buffer, sizeof(buffer), "keyint=%d", context->ffmpeg_gop_size); av_dict_set(opts, "rav1e-params", buffer, 0); } else if (STREQ(codec->name, "libsvtav1")) { /* Set preset value based on ffmpeg_preset. * Must check context->ffmpeg_preset again in case this encoder was selected due to the * absence of another. */ switch (context->ffmpeg_preset) { case FFM_PRESET_REALTIME: ffmpeg_dict_set_int(opts, "preset", 8); break; case FFM_PRESET_BEST: ffmpeg_dict_set_int(opts, "preset", 3); break; case FFM_PRESET_GOOD: default: ffmpeg_dict_set_int(opts, "preset", 5); break; } if (context->ffmpeg_crf >= 0) { /* libsvtav1 does not support crf until FFmpeg builds since 2022-02-24, use qp as fallback. */ ffmpeg_dict_set_int(opts, "qp", context->ffmpeg_crf); } } else if (STREQ(codec->name, "libaom-av1")) { /* Speed up libaom-av1 encoding by enabling multithreading and setting tiles. */ ffmpeg_dict_set_int(opts, "row-mt", 1); const char *tiles_string = NULL; bool tiles_string_is_dynamic = false; if (rd->threads > 0) { /* See if threads is a square. */ int threads_sqrt = sqrtf(rd->threads); if (threads_sqrt < 4) { /* Ensure a default minimum. */ threads_sqrt = 4; } if (is_power_of_2_i(threads_sqrt) && threads_sqrt * threads_sqrt == rd->threads) { /* Is a square num, therefore just do "sqrt x sqrt" for tiles parameter. */ int digits = 0; for (int t_sqrt_copy = threads_sqrt; t_sqrt_copy > 0; t_sqrt_copy /= 10) { ++digits; } /* A char array need only an alignment of 1. */ char *tiles_string_mut = (char *)calloc(digits * 2 + 2, 1); BLI_snprintf(tiles_string_mut, digits * 2 + 2, "%dx%d", threads_sqrt, threads_sqrt); tiles_string_is_dynamic = true; tiles_string = tiles_string_mut; } else { /* Is not a square num, set greater side based on longer side, or use a square if both sides are equal. */ int sqrt_p2 = power_of_2_min_i(threads_sqrt); if (sqrt_p2 < 2) { /* Ensure a default minimum. */ sqrt_p2 = 2; } int sqrt_p2_next = power_of_2_min_i((int)rd->threads / sqrt_p2); if (sqrt_p2_next < 1) { sqrt_p2_next = 1; } if (sqrt_p2 > sqrt_p2_next) { /* Ensure sqrt_p2_next is greater or equal to sqrt_p2. */ int temp = sqrt_p2; sqrt_p2 = sqrt_p2_next; sqrt_p2_next = temp; } int combined_digits = 0; for (int sqrt_p2_copy = sqrt_p2; sqrt_p2_copy > 0; sqrt_p2_copy /= 10) { ++combined_digits; } for (int sqrt_p2_copy = sqrt_p2_next; sqrt_p2_copy > 0; sqrt_p2_copy /= 10) { ++combined_digits; } /* A char array need only an alignment of 1. */ char *tiles_string_mut = (char *)calloc(combined_digits + 2, 1); if (rectx > recty) { BLI_snprintf(tiles_string_mut, combined_digits + 2, "%dx%d", sqrt_p2_next, sqrt_p2); } else if (rectx < recty) { BLI_snprintf(tiles_string_mut, combined_digits + 2, "%dx%d", sqrt_p2, sqrt_p2_next); } else { BLI_snprintf(tiles_string_mut, combined_digits + 2, "%dx%d", sqrt_p2, sqrt_p2); } tiles_string_is_dynamic = true; tiles_string = tiles_string_mut; } } else { /* Thread count unknown, default to 8. */ if (rectx > recty) { tiles_string = "4x2"; } else if (rectx < recty) { tiles_string = "2x4"; } else { tiles_string = "2x2"; } } av_dict_set(opts, "tiles", tiles_string, 0); if (tiles_string_is_dynamic) { free((void *)tiles_string); } /* libaom-av1 uses "cpu-used" instead of "preset" for defining compression quality. * This value is in a range from 0-8. 0 and 8 are extremes, but we will allow 8. * Must check context->ffmpeg_preset again in case this encoder was selected due to the * absence of another. */ switch (context->ffmpeg_preset) { case FFM_PRESET_REALTIME: ffmpeg_dict_set_int(opts, "cpu-used", 8); break; case FFM_PRESET_BEST: ffmpeg_dict_set_int(opts, "cpu-used", 4); break; case FFM_PRESET_GOOD: default: ffmpeg_dict_set_int(opts, "cpu-used", 6); break; } /* CRF related settings is similar to H264 for libaom-av1, so we will rely on those settings * applied later. */ } } return codec; } /* prepare a video stream for the output file */ static AVStream *alloc_video_stream(FFMpegContext *context, RenderData *rd, int codec_id, AVFormatContext *of, int rectx, int recty, char *error, int error_size) { AVStream *st; const AVCodec *codec; AVDictionary *opts = NULL; error[0] = '\0'; st = avformat_new_stream(of, NULL); if (!st) { return NULL; } st->id = 0; /* Set up the codec context */ if (codec_id == AV_CODEC_ID_AV1) { /* Use get_av1_encoder() to get the ideal (hopefully) encoder for AV1 based * on given parameters, and also set up opts. */ codec = get_av1_encoder(context, rd, &opts, rectx, recty); } else { codec = avcodec_find_encoder(codec_id); } if (!codec) { fprintf(stderr, "Couldn't find valid video codec\n"); context->video_codec = NULL; return NULL; } context->video_codec = avcodec_alloc_context3(codec); AVCodecContext *c = context->video_codec; /* Get some values from the current render settings */ c->width = rectx; c->height = recty; if (context->ffmpeg_type == FFMPEG_DV && rd->frs_sec != 25) { /* FIXME: Really bad hack (tm) for NTSC support */ c->time_base.den = 2997; c->time_base.num = 100; } else if ((float)((int)rd->frs_sec_base) == rd->frs_sec_base) { c->time_base.den = rd->frs_sec; c->time_base.num = (int)rd->frs_sec_base; } else { c->time_base = calc_time_base(rd->frs_sec, rd->frs_sec_base, codec_id); } /* As per the time-base documentation here: * https://www.ffmpeg.org/ffmpeg-codecs.html#Codec-Options * We want to set the time base to (1 / fps) for fixed frame rate video. * If it is not possible, we want to set the time-base numbers to something as * small as possible. */ if (c->time_base.num != 1) { AVRational new_time_base; if (av_reduce( &new_time_base.num, &new_time_base.den, c->time_base.num, c->time_base.den, INT_MAX)) { /* Exact reduction was possible. Use the new value. */ c->time_base = new_time_base; } } st->time_base = c->time_base; c->gop_size = context->ffmpeg_gop_size; c->max_b_frames = context->ffmpeg_max_b_frames; if (context->ffmpeg_type == FFMPEG_WEBM && context->ffmpeg_crf == 0) { ffmpeg_dict_set_int(&opts, "lossless", 1); } else if (context->ffmpeg_crf >= 0) { /* As per https://trac.ffmpeg.org/wiki/Encode/VP9 we must set the bit rate to zero when * encoding with vp9 in crf mode. * Set this to always be zero for other codecs as well. * We don't care about bit rate in crf mode. */ c->bit_rate = 0; ffmpeg_dict_set_int(&opts, "crf", context->ffmpeg_crf); } else { c->bit_rate = context->ffmpeg_video_bitrate * 1000; c->rc_max_rate = rd->ffcodecdata.rc_max_rate * 1000; c->rc_min_rate = rd->ffcodecdata.rc_min_rate * 1000; c->rc_buffer_size = rd->ffcodecdata.rc_buffer_size * 1024; } if (context->ffmpeg_preset) { /* 'preset' is used by h.264, 'deadline' is used by webm/vp9. I'm not * setting those properties conditionally based on the video codec, * as the FFmpeg encoder simply ignores unknown settings anyway. */ char const *preset_name = NULL; /* used by h.264 */ char const *deadline_name = NULL; /* used by webm/vp9 */ switch (context->ffmpeg_preset) { case FFM_PRESET_GOOD: preset_name = "medium"; deadline_name = "good"; break; case FFM_PRESET_BEST: preset_name = "slower"; deadline_name = "best"; break; case FFM_PRESET_REALTIME: preset_name = "superfast"; deadline_name = "realtime"; break; default: printf("Unknown preset number %i, ignoring.\n", context->ffmpeg_preset); } /* "codec_id != AV_CODEC_ID_AV1" is required due to "preset" already being set by an AV1 codec. */ if (preset_name != NULL && codec_id != AV_CODEC_ID_AV1) { av_dict_set(&opts, "preset", preset_name, 0); } if (deadline_name != NULL) { av_dict_set(&opts, "deadline", deadline_name, 0); } } /* Be sure to use the correct pixel format(e.g. RGB, YUV) */ if (codec->pix_fmts) { c->pix_fmt = codec->pix_fmts[0]; } else { /* makes HuffYUV happy ... */ c->pix_fmt = AV_PIX_FMT_YUV422P; } if (context->ffmpeg_type == FFMPEG_XVID) { /* arghhhh ... */ c->pix_fmt = AV_PIX_FMT_YUV420P; c->codec_tag = (('D' << 24) + ('I' << 16) + ('V' << 8) + 'X'); } /* Keep lossless encodes in the RGB domain. */ if (codec_id == AV_CODEC_ID_HUFFYUV) { if (rd->im_format.planes == R_IMF_PLANES_RGBA) { c->pix_fmt = AV_PIX_FMT_BGRA; } else { c->pix_fmt = AV_PIX_FMT_RGB32; } } if (codec_id == AV_CODEC_ID_DNXHD) { if (rd->ffcodecdata.flags & FFMPEG_LOSSLESS_OUTPUT) { /* Set the block decision algorithm to be of the highest quality ("rd" == 2). */ c->mb_decision = 2; } } if (codec_id == AV_CODEC_ID_FFV1) { c->pix_fmt = AV_PIX_FMT_RGB32; } if (codec_id == AV_CODEC_ID_QTRLE) { if (rd->im_format.planes == R_IMF_PLANES_RGBA) { c->pix_fmt = AV_PIX_FMT_ARGB; } } if (codec_id == AV_CODEC_ID_VP9 && rd->im_format.planes == R_IMF_PLANES_RGBA) { c->pix_fmt = AV_PIX_FMT_YUVA420P; } else if (ELEM(codec_id, AV_CODEC_ID_H264, AV_CODEC_ID_VP9) && (context->ffmpeg_crf == 0)) { /* Use 4:4:4 instead of 4:2:0 pixel format for lossless rendering. */ c->pix_fmt = AV_PIX_FMT_YUV444P; } if (codec_id == AV_CODEC_ID_PNG) { if (rd->im_format.planes == R_IMF_PLANES_RGBA) { c->pix_fmt = AV_PIX_FMT_RGBA; } } if (of->oformat->flags & AVFMT_GLOBALHEADER) { PRINT("Using global header\n"); c->flags |= AV_CODEC_FLAG_GLOBAL_HEADER; } /* xasp & yasp got float lately... */ st->sample_aspect_ratio = c->sample_aspect_ratio = av_d2q(((double)rd->xasp / (double)rd->yasp), 255); st->avg_frame_rate = av_inv_q(c->time_base); if (codec->capabilities & AV_CODEC_CAP_AUTO_THREADS) { c->thread_count = 0; } else { c->thread_count = BLI_system_thread_count(); } if (codec->capabilities & AV_CODEC_CAP_FRAME_THREADS) { c->thread_type = FF_THREAD_FRAME; } else if (codec->capabilities & AV_CODEC_CAP_SLICE_THREADS) { c->thread_type = FF_THREAD_SLICE; } int ret = avcodec_open2(c, codec, &opts); if (ret < 0) { fprintf(stderr, "Couldn't initialize video codec: %s\n", av_err2str(ret)); BLI_strncpy(error, IMB_ffmpeg_last_error(), error_size); av_dict_free(&opts); avcodec_free_context(&c); context->video_codec = NULL; return NULL; } av_dict_free(&opts); /* FFmpeg expects its data in the output pixel format. */ context->current_frame = alloc_picture(c->pix_fmt, c->width, c->height); if (c->pix_fmt == AV_PIX_FMT_RGBA) { /* Output pixel format is the same we use internally, no conversion necessary. */ context->img_convert_frame = NULL; context->img_convert_ctx = NULL; } else { /* Output pixel format is different, allocate frame for conversion. */ context->img_convert_frame = alloc_picture(AV_PIX_FMT_RGBA, c->width, c->height); context->img_convert_ctx = sws_getContext(c->width, c->height, AV_PIX_FMT_RGBA, c->width, c->height, c->pix_fmt, SWS_BICUBIC, NULL, NULL, NULL); } avcodec_parameters_from_context(st->codecpar, c); context->video_time = 0.0f; return st; } static AVStream *alloc_audio_stream(FFMpegContext *context, RenderData *rd, int codec_id, AVFormatContext *of, char *error, int error_size) { AVStream *st; const AVCodec *codec; error[0] = '\0'; st = avformat_new_stream(of, NULL); if (!st) { return NULL; } st->id = 1; codec = avcodec_find_encoder(codec_id); if (!codec) { fprintf(stderr, "Couldn't find valid audio codec\n"); context->audio_codec = NULL; return NULL; } context->audio_codec = avcodec_alloc_context3(codec); AVCodecContext *c = context->audio_codec; c->thread_count = BLI_system_thread_count(); c->thread_type = FF_THREAD_SLICE; c->sample_rate = rd->ffcodecdata.audio_mixrate; c->bit_rate = context->ffmpeg_audio_bitrate * 1000; c->sample_fmt = AV_SAMPLE_FMT_S16; c->ch_layout.nb_channels = rd->ffcodecdata.audio_channels; switch (rd->ffcodecdata.audio_channels) { case FFM_CHANNELS_MONO: av_channel_layout_from_mask(&c->ch_layout, AV_CH_LAYOUT_MONO); break; case FFM_CHANNELS_STEREO: av_channel_layout_from_mask(&c->ch_layout, AV_CH_LAYOUT_STEREO); break; case FFM_CHANNELS_SURROUND4: av_channel_layout_from_mask(&c->ch_layout, AV_CH_LAYOUT_QUAD); break; case FFM_CHANNELS_SURROUND51: av_channel_layout_from_mask(&c->ch_layout, AV_CH_LAYOUT_5POINT1_BACK); break; case FFM_CHANNELS_SURROUND71: av_channel_layout_from_mask(&c->ch_layout, AV_CH_LAYOUT_7POINT1); break; } if (request_float_audio_buffer(codec_id)) { /* mainly for AAC codec which is experimental */ c->strict_std_compliance = FF_COMPLIANCE_EXPERIMENTAL; c->sample_fmt = AV_SAMPLE_FMT_FLT; } if (codec->sample_fmts) { /* Check if the preferred sample format for this codec is supported. * this is because, depending on the version of libav, * and with the whole ffmpeg/libav fork situation, * you have various implementations around. * Float samples in particular are not always supported. */ const enum AVSampleFormat *p = codec->sample_fmts; for (; *p != -1; p++) { if (*p == c->sample_fmt) { break; } } if (*p == -1) { /* sample format incompatible with codec. Defaulting to a format known to work */ c->sample_fmt = codec->sample_fmts[0]; } } if (codec->supported_samplerates) { const int *p = codec->supported_samplerates; int best = 0; int best_dist = INT_MAX; for (; *p; p++) { int dist = abs(c->sample_rate - *p); if (dist < best_dist) { best_dist = dist; best = *p; } } /* best is the closest supported sample rate (same as selected if best_dist == 0) */ c->sample_rate = best; } if (of->oformat->flags & AVFMT_GLOBALHEADER) { c->flags |= AV_CODEC_FLAG_GLOBAL_HEADER; } int ret = avcodec_open2(c, codec, NULL); if (ret < 0) { fprintf(stderr, "Couldn't initialize audio codec: %s\n", av_err2str(ret)); BLI_strncpy(error, IMB_ffmpeg_last_error(), error_size); avcodec_free_context(&c); context->audio_codec = NULL; return NULL; } /* Need to prevent floating point exception when using VORBIS audio codec, * initialize this value in the same way as it's done in FFmpeg itself (sergey) */ c->time_base.num = 1; c->time_base.den = c->sample_rate; if (c->frame_size == 0) { /* Used to be if ((c->codec_id >= CODEC_ID_PCM_S16LE) && (c->codec_id <= CODEC_ID_PCM_DVD)) * not sure if that is needed anymore, so let's try out if there are any * complaints regarding some FFmpeg versions users might have. */ context->audio_input_samples = AV_INPUT_BUFFER_MIN_SIZE * 8 / c->bits_per_coded_sample / c->ch_layout.nb_channels; } else { context->audio_input_samples = c->frame_size; } context->audio_deinterleave = av_sample_fmt_is_planar(c->sample_fmt); context->audio_sample_size = av_get_bytes_per_sample(c->sample_fmt); context->audio_input_buffer = (uint8_t *)av_malloc( context->audio_input_samples * c->ch_layout.nb_channels * context->audio_sample_size); if (context->audio_deinterleave) { context->audio_deinterleave_buffer = (uint8_t *)av_malloc( context->audio_input_samples * c->ch_layout.nb_channels * context->audio_sample_size); } context->audio_time = 0.0f; avcodec_parameters_from_context(st->codecpar, c); return st; } /* essential functions -- start, append, end */ static void ffmpeg_dict_set_int(AVDictionary **dict, const char *key, int value) { char buffer[32]; BLI_snprintf(buffer, sizeof(buffer), "%d", value); av_dict_set(dict, key, buffer, 0); } static void ffmpeg_add_metadata_callback(void *data, const char *propname, char *propvalue, int UNUSED(len)) { AVDictionary **metadata = (AVDictionary **)data; av_dict_set(metadata, propname, propvalue, 0); } static int start_ffmpeg_impl(FFMpegContext *context, struct RenderData *rd, int rectx, int recty, const char *suffix, ReportList *reports) { /* Handle to the output file */ AVFormatContext *of; const AVOutputFormat *fmt; char name[FILE_MAX], error[1024]; const char **exts; context->ffmpeg_type = rd->ffcodecdata.type; context->ffmpeg_codec = rd->ffcodecdata.codec; context->ffmpeg_audio_codec = rd->ffcodecdata.audio_codec; context->ffmpeg_video_bitrate = rd->ffcodecdata.video_bitrate; context->ffmpeg_audio_bitrate = rd->ffcodecdata.audio_bitrate; context->ffmpeg_gop_size = rd->ffcodecdata.gop_size; context->ffmpeg_autosplit = rd->ffcodecdata.flags & FFMPEG_AUTOSPLIT_OUTPUT; context->ffmpeg_crf = rd->ffcodecdata.constant_rate_factor; context->ffmpeg_preset = rd->ffcodecdata.ffmpeg_preset; if ((rd->ffcodecdata.flags & FFMPEG_USE_MAX_B_FRAMES) != 0) { context->ffmpeg_max_b_frames = rd->ffcodecdata.max_b_frames; } /* Determine the correct filename */ ffmpeg_filepath_get(context, name, rd, context->ffmpeg_preview, suffix); PRINT( "Starting output to %s(ffmpeg)...\n" " Using type=%d, codec=%d, audio_codec=%d,\n" " video_bitrate=%d, audio_bitrate=%d,\n" " gop_size=%d, autosplit=%d\n" " render width=%d, render height=%d\n", name, context->ffmpeg_type, context->ffmpeg_codec, context->ffmpeg_audio_codec, context->ffmpeg_video_bitrate, context->ffmpeg_audio_bitrate, context->ffmpeg_gop_size, context->ffmpeg_autosplit, rectx, recty); /* Sanity checks for the output file extensions. */ exts = get_file_extensions(context->ffmpeg_type); if (!exts) { BKE_report(reports, RPT_ERROR, "No valid formats found"); return 0; } fmt = av_guess_format(NULL, exts[0], NULL); if (!fmt) { BKE_report(reports, RPT_ERROR, "No valid formats found"); return 0; } of = avformat_alloc_context(); if (!of) { BKE_report(reports, RPT_ERROR, "Can't allocate ffmpeg format context"); return 0; } enum AVCodecID audio_codec = context->ffmpeg_audio_codec; enum AVCodecID video_codec = context->ffmpeg_codec; of->url = av_strdup(name); /* Check if we need to force change the codec because of file type codec restrictions */ switch (context->ffmpeg_type) { case FFMPEG_OGG: video_codec = AV_CODEC_ID_THEORA; break; case FFMPEG_DV: video_codec = AV_CODEC_ID_DVVIDEO; break; case FFMPEG_MPEG1: video_codec = AV_CODEC_ID_MPEG1VIDEO; break; case FFMPEG_MPEG2: video_codec = AV_CODEC_ID_MPEG2VIDEO; break; case FFMPEG_H264: video_codec = AV_CODEC_ID_H264; break; case FFMPEG_XVID: video_codec = AV_CODEC_ID_MPEG4; break; case FFMPEG_FLV: video_codec = AV_CODEC_ID_FLV1; break; case FFMPEG_AV1: video_codec = AV_CODEC_ID_AV1; break; default: /* These containers are not restricted to any specific codec types. * Currently we expect these to be .avi, .mov, .mkv, and .mp4. */ video_codec = context->ffmpeg_codec; break; } /* Returns after this must 'goto fail;' */ # if LIBAVFORMAT_VERSION_MAJOR >= 59 of->oformat = fmt; # else /* *DEPRECATED* 2022/08/01 For FFMPEG (<5.0) remove this else branch and the `ifdef` above. */ of->oformat = (AVOutputFormat *)fmt; # endif if (video_codec == AV_CODEC_ID_DVVIDEO) { if (rectx != 720) { BKE_report(reports, RPT_ERROR, "Render width has to be 720 pixels for DV!"); goto fail; } if (rd->frs_sec != 25 && recty != 480) { BKE_report(reports, RPT_ERROR, "Render height has to be 480 pixels for DV-NTSC!"); goto fail; } if (rd->frs_sec == 25 && recty != 576) { BKE_report(reports, RPT_ERROR, "Render height has to be 576 pixels for DV-PAL!"); goto fail; } } if (context->ffmpeg_type == FFMPEG_DV) { audio_codec = AV_CODEC_ID_PCM_S16LE; if (context->ffmpeg_audio_codec != AV_CODEC_ID_NONE && rd->ffcodecdata.audio_mixrate != 48000 && rd->ffcodecdata.audio_channels != 2) { BKE_report(reports, RPT_ERROR, "FFMPEG only supports 48khz / stereo audio for DV!"); goto fail; } } if (video_codec != AV_CODEC_ID_NONE) { context->video_stream = alloc_video_stream( context, rd, video_codec, of, rectx, recty, error, sizeof(error)); PRINT("alloc video stream %p\n", context->video_stream); if (!context->video_stream) { if (error[0]) { BKE_report(reports, RPT_ERROR, error); PRINT("Video stream error: %s\n", error); } else { BKE_report(reports, RPT_ERROR, "Error initializing video stream"); PRINT("Error initializing video stream"); } goto fail; } } if (context->ffmpeg_audio_codec != AV_CODEC_ID_NONE) { context->audio_stream = alloc_audio_stream(context, rd, audio_codec, of, error, sizeof(error)); if (!context->audio_stream) { if (error[0]) { BKE_report(reports, RPT_ERROR, error); PRINT("Audio stream error: %s\n", error); } else { BKE_report(reports, RPT_ERROR, "Error initializing audio stream"); PRINT("Error initializing audio stream"); } goto fail; } } if (!(fmt->flags & AVFMT_NOFILE)) { if (avio_open(&of->pb, name, AVIO_FLAG_WRITE) < 0) { BKE_report(reports, RPT_ERROR, "Could not open file for writing"); PRINT("Could not open file for writing\n"); goto fail; } } if (context->stamp_data != NULL) { BKE_stamp_info_callback( &of->metadata, context->stamp_data, ffmpeg_add_metadata_callback, false); } int ret = avformat_write_header(of, NULL); if (ret < 0) { BKE_report(reports, RPT_ERROR, "Could not initialize streams, probably unsupported codec combination"); PRINT("Could not write media header: %s\n", av_err2str(ret)); goto fail; } context->outfile = of; av_dump_format(of, 0, name, 1); return 1; fail: if (of->pb) { avio_close(of->pb); } if (context->video_stream) { context->video_stream = NULL; } if (context->audio_stream) { context->audio_stream = NULL; } avformat_free_context(of); return 0; } /** * Writes any delayed frames in the encoder. This function is called before * closing the encoder. * *

* Since an encoder may use both past and future frames to predict * inter-frames (H.264 B-frames, for example), it can output the frames * in a different order from the one it was given. * For example, when sending frames 1, 2, 3, 4 to the encoder, it may write * them in the order 1, 4, 2, 3 - first the two frames used for prediction, * and then the bidirectionally-predicted frames. What this means in practice * is that the encoder may not immediately produce one output frame for each * input frame. These delayed frames must be flushed before we close the * stream. We do this by calling avcodec_encode_video with NULL for the last * parameter. *

*/ static void flush_ffmpeg(AVCodecContext *c, AVStream *stream, AVFormatContext *outfile) { AVPacket *packet = av_packet_alloc(); avcodec_send_frame(c, NULL); /* Get the packets frames. */ int ret = 1; while (ret >= 0) { ret = avcodec_receive_packet(c, packet); if (ret == AVERROR(EAGAIN) || ret == AVERROR_EOF) { /* No more packets to flush. */ break; } if (ret < 0) { fprintf(stderr, "Error encoding delayed frame: %s\n", av_err2str(ret)); break; } packet->stream_index = stream->index; av_packet_rescale_ts(packet, c->time_base, stream->time_base); # ifdef FFMPEG_USE_DURATION_WORKAROUND my_guess_pkt_duration(outfile, stream, packet); # endif int write_ret = av_interleaved_write_frame(outfile, packet); if (write_ret != 0) { fprintf(stderr, "Error writing delayed frame: %s\n", av_err2str(write_ret)); break; } } av_packet_free(&packet); } /* ********************************************************************** * * public interface * ********************************************************************** */ /* Get the output filename-- similar to the other output formats */ static void ffmpeg_filepath_get( FFMpegContext *context, char *string, const RenderData *rd, bool preview, const char *suffix) { char autosplit[20]; const char **exts = get_file_extensions(rd->ffcodecdata.type); const char **fe = exts; int sfra, efra; if (!string || !exts) { return; } if (preview) { sfra = rd->psfra; efra = rd->pefra; } else { sfra = rd->sfra; efra = rd->efra; } strcpy(string, rd->pic); BLI_path_abs(string, BKE_main_blendfile_path_from_global()); BLI_make_existing_file(string); autosplit[0] = '\0'; if ((rd->ffcodecdata.flags & FFMPEG_AUTOSPLIT_OUTPUT) != 0) { if (context) { sprintf(autosplit, "_%03d", context->ffmpeg_autosplit_count); } } if (rd->scemode & R_EXTENSION) { while (*fe) { if (BLI_strcasecmp(string + strlen(string) - strlen(*fe), *fe) == 0) { break; } fe++; } if (*fe == NULL) { strcat(string, autosplit); BLI_path_frame_range(string, sfra, efra, 4); strcat(string, *exts); } else { *(string + strlen(string) - strlen(*fe)) = '\0'; strcat(string, autosplit); strcat(string, *fe); } } else { if (BLI_path_frame_check_chars(string)) { BLI_path_frame_range(string, sfra, efra, 4); } strcat(string, autosplit); } BLI_path_suffix(string, FILE_MAX, suffix, ""); } void BKE_ffmpeg_filepath_get(char *string, const RenderData *rd, bool preview, const char *suffix) { ffmpeg_filepath_get(NULL, string, rd, preview, suffix); } int BKE_ffmpeg_start(void *context_v, const struct Scene *scene, RenderData *rd, int rectx, int recty, ReportList *reports, bool preview, const char *suffix) { int success; FFMpegContext *context = context_v; context->ffmpeg_autosplit_count = 0; context->ffmpeg_preview = preview; context->stamp_data = BKE_stamp_info_from_scene_static(scene); success = start_ffmpeg_impl(context, rd, rectx, recty, suffix, reports); # ifdef WITH_AUDASPACE if (context->audio_stream) { AVCodecContext *c = context->audio_codec; AUD_DeviceSpecs specs; specs.channels = c->ch_layout.nb_channels; switch (av_get_packed_sample_fmt(c->sample_fmt)) { case AV_SAMPLE_FMT_U8: specs.format = AUD_FORMAT_U8; break; case AV_SAMPLE_FMT_S16: specs.format = AUD_FORMAT_S16; break; case AV_SAMPLE_FMT_S32: specs.format = AUD_FORMAT_S32; break; case AV_SAMPLE_FMT_FLT: specs.format = AUD_FORMAT_FLOAT32; break; case AV_SAMPLE_FMT_DBL: specs.format = AUD_FORMAT_FLOAT64; break; default: return -31415; } specs.rate = rd->ffcodecdata.audio_mixrate; context->audio_mixdown_device = BKE_sound_mixdown( scene, specs, preview ? rd->psfra : rd->sfra, rd->ffcodecdata.audio_volume); } # endif return success; } static void end_ffmpeg_impl(FFMpegContext *context, int is_autosplit); # ifdef WITH_AUDASPACE static void write_audio_frames(FFMpegContext *context, double to_pts) { AVCodecContext *c = context->audio_codec; while (context->audio_stream) { if ((context->audio_time_total >= to_pts) || !write_audio_frame(context)) { break; } context->audio_time_total += (double)context->audio_input_samples / (double)c->sample_rate; context->audio_time += (double)context->audio_input_samples / (double)c->sample_rate; } } # endif int BKE_ffmpeg_append(void *context_v, RenderData *rd, int start_frame, int frame, int *pixels, int rectx, int recty, const char *suffix, ReportList *reports) { FFMpegContext *context = context_v; AVFrame *avframe; int success = 1; PRINT("Writing frame %i, render width=%d, render height=%d\n", frame, rectx, recty); if (context->video_stream) { avframe = generate_video_frame(context, (uchar *)pixels); success = (avframe && write_video_frame(context, avframe, reports)); # ifdef WITH_AUDASPACE /* Add +1 frame because we want to encode audio up until the next video frame. */ write_audio_frames( context, (frame - start_frame + 1) / (((double)rd->frs_sec) / (double)rd->frs_sec_base)); # else UNUSED_VARS(start_frame); # endif if (context->ffmpeg_autosplit) { if (avio_tell(context->outfile->pb) > FFMPEG_AUTOSPLIT_SIZE) { end_ffmpeg_impl(context, true); context->ffmpeg_autosplit_count++; success &= start_ffmpeg_impl(context, rd, rectx, recty, suffix, reports); } } } return success; } static void end_ffmpeg_impl(FFMpegContext *context, int is_autosplit) { PRINT("Closing ffmpeg...\n"); # ifdef WITH_AUDASPACE if (is_autosplit == false) { if (context->audio_mixdown_device) { AUD_Device_free(context->audio_mixdown_device); context->audio_mixdown_device = NULL; } } # else UNUSED_VARS(is_autosplit); # endif if (context->video_stream) { PRINT("Flushing delayed video frames...\n"); flush_ffmpeg(context->video_codec, context->video_stream, context->outfile); } if (context->audio_stream) { PRINT("Flushing delayed audio frames...\n"); flush_ffmpeg(context->audio_codec, context->audio_stream, context->outfile); } if (context->outfile) { av_write_trailer(context->outfile); } /* Close the video codec */ if (context->video_stream != NULL) { PRINT("zero video stream %p\n", context->video_stream); context->video_stream = NULL; } if (context->audio_stream != NULL) { context->audio_stream = NULL; } /* free the temp buffer */ if (context->current_frame != NULL) { delete_picture(context->current_frame); context->current_frame = NULL; } if (context->img_convert_frame != NULL) { delete_picture(context->img_convert_frame); context->img_convert_frame = NULL; } if (context->outfile != NULL && context->outfile->oformat) { if (!(context->outfile->oformat->flags & AVFMT_NOFILE)) { avio_close(context->outfile->pb); } } if (context->video_codec != NULL) { avcodec_free_context(&context->video_codec); context->video_codec = NULL; } if (context->audio_codec != NULL) { avcodec_free_context(&context->audio_codec); context->audio_codec = NULL; } if (context->outfile != NULL) { avformat_free_context(context->outfile); context->outfile = NULL; } if (context->audio_input_buffer != NULL) { av_free(context->audio_input_buffer); context->audio_input_buffer = NULL; } if (context->audio_deinterleave_buffer != NULL) { av_free(context->audio_deinterleave_buffer); context->audio_deinterleave_buffer = NULL; } if (context->img_convert_ctx != NULL) { sws_freeContext(context->img_convert_ctx); context->img_convert_ctx = NULL; } } void BKE_ffmpeg_end(void *context_v) { FFMpegContext *context = context_v; end_ffmpeg_impl(context, false); } void BKE_ffmpeg_preset_set(RenderData *rd, int preset) { bool is_ntsc = (rd->frs_sec != 25); switch (preset) { case FFMPEG_PRESET_VCD: rd->ffcodecdata.type = FFMPEG_MPEG1; rd->ffcodecdata.video_bitrate = 1150; rd->xsch = 352; rd->ysch = is_ntsc ? 240 : 288; rd->ffcodecdata.gop_size = is_ntsc ? 18 : 15; rd->ffcodecdata.rc_max_rate = 1150; rd->ffcodecdata.rc_min_rate = 1150; rd->ffcodecdata.rc_buffer_size = 40 * 8; rd->ffcodecdata.mux_packet_size = 2324; rd->ffcodecdata.mux_rate = 2352 * 75 * 8; break; case FFMPEG_PRESET_SVCD: rd->ffcodecdata.type = FFMPEG_MPEG2; rd->ffcodecdata.video_bitrate = 2040; rd->xsch = 480; rd->ysch = is_ntsc ? 480 : 576; rd->ffcodecdata.gop_size = is_ntsc ? 18 : 15; rd->ffcodecdata.rc_max_rate = 2516; rd->ffcodecdata.rc_min_rate = 0; rd->ffcodecdata.rc_buffer_size = 224 * 8; rd->ffcodecdata.mux_packet_size = 2324; rd->ffcodecdata.mux_rate = 0; break; case FFMPEG_PRESET_DVD: rd->ffcodecdata.type = FFMPEG_MPEG2; rd->ffcodecdata.video_bitrate = 6000; # if 0 /* Don't set resolution, see T21351. */ rd->xsch = 720; rd->ysch = isntsc ? 480 : 576; # endif rd->ffcodecdata.gop_size = is_ntsc ? 18 : 15; rd->ffcodecdata.rc_max_rate = 9000; rd->ffcodecdata.rc_min_rate = 0; rd->ffcodecdata.rc_buffer_size = 224 * 8; rd->ffcodecdata.mux_packet_size = 2048; rd->ffcodecdata.mux_rate = 10080000; break; case FFMPEG_PRESET_DV: rd->ffcodecdata.type = FFMPEG_DV; rd->xsch = 720; rd->ysch = is_ntsc ? 480 : 576; break; case FFMPEG_PRESET_H264: rd->ffcodecdata.type = FFMPEG_AVI; rd->ffcodecdata.codec = AV_CODEC_ID_H264; rd->ffcodecdata.video_bitrate = 6000; rd->ffcodecdata.gop_size = is_ntsc ? 18 : 15; rd->ffcodecdata.rc_max_rate = 9000; rd->ffcodecdata.rc_min_rate = 0; rd->ffcodecdata.rc_buffer_size = 224 * 8; rd->ffcodecdata.mux_packet_size = 2048; rd->ffcodecdata.mux_rate = 10080000; break; case FFMPEG_PRESET_THEORA: case FFMPEG_PRESET_XVID: if (preset == FFMPEG_PRESET_XVID) { rd->ffcodecdata.type = FFMPEG_AVI; rd->ffcodecdata.codec = AV_CODEC_ID_MPEG4; } else if (preset == FFMPEG_PRESET_THEORA) { rd->ffcodecdata.type = FFMPEG_OGG; /* XXX broken */ rd->ffcodecdata.codec = AV_CODEC_ID_THEORA; } rd->ffcodecdata.video_bitrate = 6000; rd->ffcodecdata.gop_size = is_ntsc ? 18 : 15; rd->ffcodecdata.rc_max_rate = 9000; rd->ffcodecdata.rc_min_rate = 0; rd->ffcodecdata.rc_buffer_size = 224 * 8; rd->ffcodecdata.mux_packet_size = 2048; rd->ffcodecdata.mux_rate = 10080000; break; case FFMPEG_PRESET_AV1: rd->ffcodecdata.type = FFMPEG_AV1; rd->ffcodecdata.codec = AV_CODEC_ID_AV1; rd->ffcodecdata.video_bitrate = 6000; rd->ffcodecdata.gop_size = is_ntsc ? 18 : 15; rd->ffcodecdata.rc_max_rate = 9000; rd->ffcodecdata.rc_min_rate = 0; rd->ffcodecdata.rc_buffer_size = 224 * 8; rd->ffcodecdata.mux_packet_size = 2048; rd->ffcodecdata.mux_rate = 10080000; break; } } void BKE_ffmpeg_image_type_verify(RenderData *rd, const ImageFormatData *imf) { int audio = 0; if (imf->imtype == R_IMF_IMTYPE_FFMPEG) { if (rd->ffcodecdata.type <= 0 || rd->ffcodecdata.codec <= 0 || rd->ffcodecdata.audio_codec <= 0 || rd->ffcodecdata.video_bitrate <= 1) { BKE_ffmpeg_preset_set(rd, FFMPEG_PRESET_H264); rd->ffcodecdata.constant_rate_factor = FFM_CRF_MEDIUM; rd->ffcodecdata.ffmpeg_preset = FFM_PRESET_GOOD; rd->ffcodecdata.type = FFMPEG_MKV; } if (rd->ffcodecdata.type == FFMPEG_OGG) { rd->ffcodecdata.type = FFMPEG_MPEG2; } audio = 1; } else if (imf->imtype == R_IMF_IMTYPE_H264) { if (rd->ffcodecdata.codec != AV_CODEC_ID_H264) { BKE_ffmpeg_preset_set(rd, FFMPEG_PRESET_H264); audio = 1; } } else if (imf->imtype == R_IMF_IMTYPE_XVID) { if (rd->ffcodecdata.codec != AV_CODEC_ID_MPEG4) { BKE_ffmpeg_preset_set(rd, FFMPEG_PRESET_XVID); audio = 1; } } else if (imf->imtype == R_IMF_IMTYPE_THEORA) { if (rd->ffcodecdata.codec != AV_CODEC_ID_THEORA) { BKE_ffmpeg_preset_set(rd, FFMPEG_PRESET_THEORA); audio = 1; } } else if (imf->imtype == R_IMF_IMTYPE_AV1) { if (rd->ffcodecdata.codec != AV_CODEC_ID_AV1) { BKE_ffmpeg_preset_set(rd, FFMPEG_PRESET_AV1); audio = 1; } } if (audio && rd->ffcodecdata.audio_codec < 0) { rd->ffcodecdata.audio_codec = AV_CODEC_ID_NONE; rd->ffcodecdata.audio_bitrate = 128; } } bool BKE_ffmpeg_alpha_channel_is_supported(const RenderData *rd) { int codec = rd->ffcodecdata.codec; return ELEM(codec, AV_CODEC_ID_FFV1, AV_CODEC_ID_QTRLE, AV_CODEC_ID_PNG, AV_CODEC_ID_VP9, AV_CODEC_ID_HUFFYUV); } void *BKE_ffmpeg_context_create(void) { FFMpegContext *context; /* new ffmpeg data struct */ context = MEM_callocN(sizeof(FFMpegContext), "new ffmpeg context"); context->ffmpeg_codec = AV_CODEC_ID_MPEG4; context->ffmpeg_audio_codec = AV_CODEC_ID_NONE; context->ffmpeg_video_bitrate = 1150; context->ffmpeg_audio_bitrate = 128; context->ffmpeg_gop_size = 12; context->ffmpeg_autosplit = 0; context->ffmpeg_autosplit_count = 0; context->ffmpeg_preview = false; context->stamp_data = NULL; context->audio_time_total = 0.0; return context; } void BKE_ffmpeg_context_free(void *context_v) { FFMpegContext *context = context_v; if (context == NULL) { return; } if (context->stamp_data) { MEM_freeN(context->stamp_data); } MEM_freeN(context); } #endif /* WITH_FFMPEG */