123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393 |
- /*
- * copyright (c) 2022 Anton Khirnov <anton@khirnov.net>
- *
- * This file is part of FFmpeg.
- *
- * FFmpeg is free software; you can redistribute it and/or
- * modify it under the terms of the GNU Lesser General Public
- * License as published by the Free Software Foundation; either
- * version 2.1 of the License, or (at your option) any later version.
- *
- * FFmpeg is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
- * Lesser General Public License for more details.
- *
- * You should have received a copy of the GNU Lesser General Public
- * License along with FFmpeg; if not, write to the Free Software
- * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
- */
- /* A test for AV_CODEC_FLAG_RECON_FRAME
- * TODO: dump reconstructed frames to disk */
- #include <stdio.h>
- #include <stdint.h>
- #include <stdlib.h>
- #include "decode_simple.h"
- #include "libavutil/adler32.h"
- #include "libavutil/common.h"
- #include "libavutil/error.h"
- #include "libavutil/frame.h"
- #include "libavutil/imgutils.h"
- #include "libavutil/opt.h"
- #include "libavformat/avformat.h"
- #include "libavcodec/avcodec.h"
- #include "libavcodec/codec.h"
- #include "libswscale/swscale.h"
/**
 * Checksum record for a single video frame.
 */
typedef struct FrameChecksum {
    // timestamp identifying the frame this record was computed from
    int64_t  ts;
    // one checksum slot per plane
    uint32_t checksum[4];
} FrameChecksum;
- typedef struct PrivData {
- AVCodecContext *enc;
- AVCodecContext *dec;
- int64_t pts_in;
- AVPacket *pkt;
- AVFrame *frame, *frame_recon;
- struct SwsContext *scaler;
- FrameChecksum *checksums_decoded;
- size_t nb_checksums_decoded;
- FrameChecksum *checksums_recon;
- size_t nb_checksums_recon;
- } PrivData;
- static int frame_hash(FrameChecksum **pc, size_t *nb_c, int64_t ts,
- const AVFrame *frame)
- {
- FrameChecksum *c;
- int shift_h[4] = { 0 }, shift_v[4] = { 0 };
- c = av_realloc_array(*pc, *nb_c + 1, sizeof(*c));
- if (!c)
- return AVERROR(ENOMEM);
- *pc = c;
- (*nb_c)++;
- c += *nb_c - 1;
- memset(c, 0, sizeof(*c));
- av_pix_fmt_get_chroma_sub_sample(frame->format, &shift_h[1], &shift_v[1]);
- shift_h[2] = shift_h[1];
- shift_v[2] = shift_v[1];
- c->ts = ts;
- for (int p = 0; frame->data[p]; p++) {
- const uint8_t *data = frame->data[p];
- int linesize = av_image_get_linesize(frame->format, frame->width, p);
- uint32_t checksum = 0;
- for (int j = 0; j < frame->height >> shift_v[p]; j++) {
- checksum = av_adler32_update(checksum, data, linesize);
- data += frame->linesize[p];
- }
- c->checksum[p] = checksum;
- }
- return 0;
- }
- static int recon_frame_process(PrivData *pd, const AVPacket *pkt)
- {
- AVFrame *f = pd->frame_recon;
- int ret;
- ret = avcodec_receive_frame(pd->enc, f);
- if (ret < 0) {
- fprintf(stderr, "Error retrieving a reconstructed frame\n");
- return ret;
- }
- // the encoder's internal format (in which the reconsturcted frames are
- // exported) may be different from the user-facing pixel format
- if (f->format != pd->enc->pix_fmt) {
- if (!pd->scaler) {
- pd->scaler = sws_getContext(f->width, f->height, f->format,
- f->width, f->height, pd->enc->pix_fmt,
- SWS_BITEXACT, NULL, NULL, NULL);
- if (!pd->scaler)
- return AVERROR(ENOMEM);
- }
- ret = sws_scale_frame(pd->scaler, pd->frame, f);
- if (ret < 0) {
- fprintf(stderr, "Error converting pixel formats\n");
- return ret;
- }
- av_frame_unref(f);
- f = pd->frame;
- }
- ret = frame_hash(&pd->checksums_recon, &pd->nb_checksums_recon,
- pkt->pts, f);
- av_frame_unref(f);
- return 0;
- }
- static int process_frame(DecodeContext *dc, AVFrame *frame)
- {
- PrivData *pd = dc->opaque;
- int ret;
- if (!avcodec_is_open(pd->enc)) {
- if (!frame) {
- fprintf(stderr, "No input frames were decoded\n");
- return AVERROR_INVALIDDATA;
- }
- pd->enc->width = frame->width;
- pd->enc->height = frame->height;
- pd->enc->pix_fmt = frame->format;
- pd->enc->thread_count = dc->decoder->thread_count;
- pd->enc->thread_type = dc->decoder->thread_type;
- // real timestamps do not matter for this test, so we just
- // pretend the input is 25fps CFR to avoid any timestamp issues
- pd->enc->time_base = (AVRational){ 1, 25 };
- ret = avcodec_open2(pd->enc, NULL, NULL);
- if (ret < 0) {
- fprintf(stderr, "Error opening the encoder\n");
- return ret;
- }
- }
- if (frame) {
- frame->pts = pd->pts_in++;
- // avoid forcing coded frame type
- frame->pict_type = AV_PICTURE_TYPE_NONE;
- }
- ret = avcodec_send_frame(pd->enc, frame);
- if (ret < 0) {
- fprintf(stderr, "Error submitting a frame for encoding\n");
- return ret;
- }
- while (1) {
- AVPacket *pkt = pd->pkt;
- ret = avcodec_receive_packet(pd->enc, pkt);
- if (ret == AVERROR(EAGAIN))
- break;
- else if (ret == AVERROR_EOF)
- pkt = NULL;
- else if (ret < 0) {
- fprintf(stderr, "Error receiving a frame from the encoder\n");
- return ret;
- }
- if (pkt) {
- ret = recon_frame_process(pd, pkt);
- if (ret < 0)
- return ret;
- }
- if (!avcodec_is_open(pd->dec)) {
- if (!pkt) {
- fprintf(stderr, "No packets were received from the encoder\n");
- return AVERROR(EINVAL);
- }
- pd->dec->width = pd->enc->width;
- pd->dec->height = pd->enc->height;
- pd->dec->pix_fmt = pd->enc->pix_fmt;
- pd->dec->thread_count = dc->decoder->thread_count;
- pd->dec->thread_type = dc->decoder->thread_type;
- if (pd->enc->extradata_size) {
- pd->dec->extradata = av_memdup(pd->enc->extradata,
- pd->enc->extradata_size + AV_INPUT_BUFFER_PADDING_SIZE);
- if (!pd->dec->extradata)
- return AVERROR(ENOMEM);
- }
- ret = avcodec_open2(pd->dec, NULL, NULL);
- if (ret < 0) {
- fprintf(stderr, "Error opening the decoder\n");
- return ret;
- }
- }
- ret = avcodec_send_packet(pd->dec, pkt);
- if (ret < 0) {
- fprintf(stderr, "Error sending a packet to decoder\n");
- return ret;
- }
- while (1) {
- ret = avcodec_receive_frame(pd->dec, pd->frame);
- if (ret == AVERROR(EAGAIN))
- break;
- else if (ret == AVERROR_EOF)
- return 0;
- else if (ret < 0) {
- fprintf(stderr, "Error receving a frame from decoder\n");
- return ret;
- }
- ret = frame_hash(&pd->checksums_decoded, &pd->nb_checksums_decoded,
- pd->frame->pts, pd->frame);
- av_frame_unref(pd->frame);
- if (ret < 0)
- return ret;
- }
- }
- return 0;
- }
- static int frame_checksum_compare(const void *a, const void *b)
- {
- const FrameChecksum *ca = a;
- const FrameChecksum *cb = b;
- if (ca->ts == cb->ts)
- return 0;
- return FFSIGN(ca->ts - cb->ts);
- }
- int main(int argc, char **argv)
- {
- PrivData pd;
- DecodeContext dc;
- const char *filename, *enc_name, *enc_opts, *thread_type = NULL, *nb_threads = NULL;
- const AVCodec *enc, *dec;
- int ret = 0, max_frames = 0;
- if (argc < 4) {
- fprintf(stderr,
- "Usage: %s <input file> <encoder> <encoder options> "
- "[<max frame count> [<thread count> <thread type>]\n",
- argv[0]);
- return 0;
- }
- filename = argv[1];
- enc_name = argv[2];
- enc_opts = argv[3];
- if (argc >= 5)
- max_frames = strtol(argv[4], NULL, 0);
- if (argc >= 6)
- nb_threads = argv[5];
- if (argc >= 7)
- thread_type = argv[6];
- memset(&dc, 0, sizeof(dc));
- memset(&pd, 0, sizeof(pd));
- enc = avcodec_find_encoder_by_name(enc_name);
- if (!enc) {
- fprintf(stderr, "No such encoder: %s\n", enc_name);
- return 1;
- }
- if (!(enc->capabilities & AV_CODEC_CAP_ENCODER_RECON_FRAME)) {
- fprintf(stderr, "Encoder '%s' cannot ouput reconstructed frames\n",
- enc->name);
- return 1;
- }
- dec = avcodec_find_decoder(enc->id);
- if (!dec) {
- fprintf(stderr, "No decoder for: %s\n", avcodec_get_name(enc->id));
- return 1;
- }
- pd.enc = avcodec_alloc_context3(enc);
- if (!pd.enc) {
- fprintf(stderr, "Error allocating encoder\n");
- return 1;
- }
- ret = av_set_options_string(pd.enc, enc_opts, "=", ",");
- if (ret < 0) {
- fprintf(stderr, "Error setting encoder options\n");
- goto fail;
- }
- pd.enc->flags |= AV_CODEC_FLAG_RECON_FRAME | AV_CODEC_FLAG_BITEXACT;
- pd.dec = avcodec_alloc_context3(dec);
- if (!pd.dec) {
- fprintf(stderr, "Error allocating decoder\n");
- goto fail;
- }
- pd.dec->flags |= AV_CODEC_FLAG_BITEXACT;
- pd.dec->err_recognition |= AV_EF_CRCCHECK;
- pd.frame = av_frame_alloc();
- pd.frame_recon = av_frame_alloc();
- pd.pkt = av_packet_alloc();
- if (!pd.frame ||!pd.frame_recon || !pd.pkt) {
- ret = 1;
- goto fail;
- }
- ret = ds_open(&dc, filename, 0);
- if (ret < 0) {
- fprintf(stderr, "Error opening the file\n");
- goto fail;
- }
- dc.process_frame = process_frame;
- dc.opaque = &pd;
- dc.max_frames = max_frames;
- ret = av_dict_set(&dc.decoder_opts, "threads", nb_threads, 0);
- ret |= av_dict_set(&dc.decoder_opts, "thread_type", thread_type, 0);
- ret = ds_run(&dc);
- if (ret < 0)
- goto fail;
- if (pd.nb_checksums_decoded != pd.nb_checksums_recon) {
- fprintf(stderr, "Mismatching frame counts: recon=%zu decoded=%zu\n",
- pd.nb_checksums_recon, pd.nb_checksums_decoded);
- ret = 1;
- goto fail;
- }
- // reconstructed frames are in coded order, sort them by pts into presentation order
- qsort(pd.checksums_recon, pd.nb_checksums_recon, sizeof(*pd.checksums_recon),
- frame_checksum_compare);
- for (size_t i = 0; i < pd.nb_checksums_decoded; i++) {
- const FrameChecksum *d = &pd.checksums_decoded[i];
- const FrameChecksum *r = &pd.checksums_recon[i];
- for (int p = 0; p < FF_ARRAY_ELEMS(d->checksum); p++)
- if (d->checksum[p] != r->checksum[p]) {
- fprintf(stderr, "Checksum mismatch in frame ts=%"PRId64", plane %d\n",
- d->ts, p);
- ret = 1;
- goto fail;
- }
- }
- fprintf(stderr, "All %zu encoded frames match\n", pd.nb_checksums_decoded);
- fail:
- avcodec_free_context(&pd.enc);
- avcodec_free_context(&pd.dec);
- av_freep(&pd.checksums_decoded);
- av_freep(&pd.checksums_recon);
- av_frame_free(&pd.frame);
- av_frame_free(&pd.frame_recon);
- av_packet_free(&pd.pkt);
- ds_free(&dc);
- return !!ret;
- }
|