/* * Copyright (c) 2017, Alliance for Open Media. All rights reserved * * This source code is subject to the terms of the BSD 2 Clause License and * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License * was not distributed with this source code in the LICENSE file, you can * obtain it at www.aomedia.org/license/software. If the Alliance for Open * Media Patent License 1.0 was not distributed with this source code in the * PATENTS file, you can obtain it at www.aomedia.org/license/patent. */ // Lightfield Decoder // ================== // // This is an example of a simple lightfield decoder. It builds upon the // simple_decoder.c example. It takes an input file containing the compressed // data (in webm format), treating it as a lightfield instead of a video and // will decode a single lightfield tile. The lf_width and lf_height arguments // are the number of lightfield images in each dimension. The tile to decode // is specified by the tile_u, tile_v, tile_s, tile_t arguments. The tile_u, // tile_v specify the image and tile_s, tile_t specify the tile in the image. // After running the lightfield encoder, run lightfield decoder to decode a // single tile: // examples/lightfield_decoder vase10x10.webm vase_tile.yuv 10 10 3 4 5 10 5 #include #include #include #include "aom/aom_decoder.h" #include "aom/aomdx.h" #include "../tools_common.h" #include "../video_reader.h" #include "./aom_config.h" static const char *exec_name; void usage_exit(void) { fprintf(stderr, "Usage: %s " " \n", exec_name); exit(EXIT_FAILURE); } aom_image_t *aom_img_copy(aom_image_t *src, aom_image_t *dst) { dst = aom_img_alloc(dst, src->fmt, src->d_w, src->d_h, 16); int plane; for (plane = 0; plane < 3; ++plane) { uint8_t *src_buf = src->planes[plane]; const int src_stride = src->stride[plane]; const int src_w = plane == 0 ? src->d_w : src->d_w >> 1; const int src_h = plane == 0 ? src->d_h : src->d_h >> 1; uint8_t *dst_buf = dst->planes[plane]; const int dst_stride = dst->stride[plane]; int y; for (y = 0; y < src_h; ++y) { memcpy(dst_buf, src_buf, src_w); src_buf += src_stride; dst_buf += dst_stride; } } return dst; } int main(int argc, char **argv) { int frame_cnt = 0; FILE *outfile = NULL; aom_codec_ctx_t codec; AvxVideoReader *reader = NULL; const AvxInterface *decoder = NULL; const AvxVideoInfo *info = NULL; const char *lf_width_arg; const char *lf_height_arg; const char *tile_u_arg; const char *tile_v_arg; const char *tile_s_arg; const char *tile_t_arg; const char *lf_blocksize_arg; int lf_width, lf_height; int tile_u, tile_v, tile_s, tile_t; int lf_blocksize; int u_blocks; int v_blocks; exec_name = argv[0]; if (argc != 10) die("Invalid number of arguments."); reader = aom_video_reader_open(argv[1]); if (!reader) die("Failed to open %s for reading.", argv[1]); if (!(outfile = fopen(argv[2], "wb"))) die("Failed to open %s for writing.", argv[2]); lf_width_arg = argv[3]; lf_height_arg = argv[4]; tile_u_arg = argv[5]; tile_v_arg = argv[6]; tile_s_arg = argv[7]; tile_t_arg = argv[8]; lf_blocksize_arg = argv[9]; lf_width = (int)strtol(lf_width_arg, NULL, 0); lf_height = (int)strtol(lf_height_arg, NULL, 0); tile_u = (int)strtol(tile_u_arg, NULL, 0); tile_v = (int)strtol(tile_v_arg, NULL, 0); tile_s = (int)strtol(tile_s_arg, NULL, 0); tile_t = (int)strtol(tile_t_arg, NULL, 0); lf_blocksize = (int)strtol(lf_blocksize_arg, NULL, 0); info = aom_video_reader_get_info(reader); decoder = get_aom_decoder_by_fourcc(info->codec_fourcc); if (!decoder) die("Unknown input codec."); printf("Using %s\n", aom_codec_iface_name(decoder->codec_interface())); if (aom_codec_dec_init(&codec, decoder->codec_interface(), NULL, 0)) die_codec(&codec, "Failed to initialize decoder."); // How many reference images we need to encode. u_blocks = (lf_width + lf_blocksize - 1) / lf_blocksize; v_blocks = (lf_height + lf_blocksize - 1) / lf_blocksize; aom_image_t *reference_images = (aom_image_t *)malloc(u_blocks * v_blocks * sizeof(aom_image_t)); for (int bv = 0; bv < v_blocks; ++bv) { for (int bu = 0; bu < u_blocks; ++bu) { aom_video_reader_read_frame(reader); aom_codec_iter_t iter = NULL; aom_image_t *img = NULL; size_t frame_size = 0; const unsigned char *frame = aom_video_reader_get_frame(reader, &frame_size); if (aom_codec_decode(&codec, frame, (unsigned int)frame_size, NULL, 0)) die_codec(&codec, "Failed to decode frame."); while ((img = aom_codec_get_frame(&codec, &iter)) != NULL) { aom_img_copy(img, &reference_images[bu + bv * u_blocks]); char name[1024]; snprintf(name, sizeof(name), "ref_%d_%d.yuv", bu, bv); printf("writing ref image to %s, %d, %d\n", name, img->d_w, img->d_h); FILE *ref_file = fopen(name, "wb"); aom_img_write(img, ref_file); fclose(ref_file); ++frame_cnt; } } } int decode_frame_index = tile_v * lf_width + tile_u; do { aom_video_reader_read_frame(reader); } while (frame_cnt++ != decode_frame_index); size_t frame_size = 0; const unsigned char *frame = aom_video_reader_get_frame(reader, &frame_size); int ref_bu = tile_u / lf_blocksize; int ref_bv = tile_v / lf_blocksize; int ref_bi = ref_bu + ref_bv * u_blocks; av1_ref_frame_t ref; ref.idx = 0; ref.img = reference_images[ref_bi]; // This is too slow for real lightfield rendering. This copies the // reference image bytes. We need a way to just set a pointer // in order to make this fast enough. if (aom_codec_control(&codec, AV1_SET_REFERENCE, &ref)) { die_codec(&codec, "Failed to set reference image."); } aom_codec_control_(&codec, AV1_SET_DECODE_TILE_ROW, tile_t); aom_codec_control_(&codec, AV1_SET_DECODE_TILE_COL, tile_s); aom_codec_err_t aom_status = aom_codec_decode(&codec, frame, frame_size, NULL, 0); if (aom_status) die_codec(&codec, "Failed to decode tile."); aom_codec_iter_t iter = NULL; aom_image_t *img = aom_codec_get_frame(&codec, &iter); aom_img_write(img, outfile); if (aom_codec_destroy(&codec)) die_codec(&codec, "Failed to destroy codec"); aom_video_reader_close(reader); fclose(outfile); return EXIT_SUCCESS; }