/* * Copyright © 2018, VideoLAN and dav1d authors * Copyright © 2018, Two Orioles, LLC * All rights reserved. * * Redistribution and use in source and binary forms, with or without * modification, are permitted provided that the following conditions are met: * * 1. Redistributions of source code must retain the above copyright notice, this * list of conditions and the following disclaimer. * * 2. Redistributions in binary form must reproduce the above copyright notice, * this list of conditions and the following disclaimer in the documentation * and/or other materials provided with the distribution. * * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE * DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR * ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. */ #include "config.h" #include "vcs_version.h" #include "cli_config.h" #include #include #include #include #include #include #include #include #ifdef HAVE_UNISTD_H # include #endif #ifdef HAVE_IO_H # include #endif #ifdef _WIN32 # include #endif #ifdef __APPLE__ #include #endif #include "dav1d/dav1d.h" #include "input/input.h" #include "output/output.h" #include "dav1d_cli_parse.h" static uint64_t get_time_nanos(void) { #ifdef _WIN32 LARGE_INTEGER frequency; QueryPerformanceFrequency(&frequency); LARGE_INTEGER t; QueryPerformanceCounter(&t); uint64_t seconds = t.QuadPart / frequency.QuadPart; uint64_t fractions = t.QuadPart % frequency.QuadPart; return 1000000000 * seconds + 1000000000 * fractions / frequency.QuadPart; #elif defined(HAVE_CLOCK_GETTIME) struct timespec ts; clock_gettime(CLOCK_MONOTONIC, &ts); return 1000000000ULL * ts.tv_sec + ts.tv_nsec; #elif defined(__APPLE__) mach_timebase_info_data_t info; mach_timebase_info(&info); return mach_absolute_time() * info.numer / info.denom; #endif } static void sleep_nanos(uint64_t d) { #ifdef _WIN32 Sleep((unsigned)(d / 1000000)); #else const struct timespec ts = { .tv_sec = (time_t)(d / 1000000000), .tv_nsec = d % 1000000000, }; nanosleep(&ts, NULL); #endif } static void synchronize(const int realtime, const unsigned cache, const unsigned n_out, const uint64_t nspf, const uint64_t tfirst, uint64_t *const elapsed, FILE *const frametimes) { const uint64_t tcurr = get_time_nanos(); const uint64_t last = *elapsed; *elapsed = tcurr - tfirst; if (realtime) { const uint64_t deadline = nspf * n_out; if (*elapsed < deadline) { const uint64_t remaining = deadline - *elapsed; if (remaining > nspf * cache) sleep_nanos(remaining - nspf * cache); *elapsed = deadline; } } if (frametimes) { const uint64_t frametime = *elapsed - last; fprintf(frametimes, "%" PRIu64 "\n", frametime); fflush(frametimes); } } static void print_stats(const int istty, const unsigned n, const unsigned num, const uint64_t elapsed, const double i_fps) { char buf[80], *b = buf, *const end = buf + 80; if (istty) *b++ = '\r'; if (num == 0xFFFFFFFF) b += snprintf(b, end - b, "Decoded %u frames", n); else b += snprintf(b, end - b, "Decoded %u/%u frames (%.1lf%%)", n, num, 100.0 * n / num); if (b < end) { const double d_fps = 1e9 * n / elapsed; if (i_fps) { const double speed = d_fps / i_fps; b += snprintf(b, end - b, " - %.2lf/%.2lf fps (%.2lfx)", d_fps, i_fps, speed); } else { b += snprintf(b, end - b, " - %.2lf fps", d_fps); } } if (!istty) strcpy(b > end - 2 ? end - 2 : b, "\n"); fputs(buf, stderr); } static int picture_alloc(Dav1dPicture *const p, void *const _) { const int hbd = p->p.bpc > 8; const int aligned_w = (p->p.w + 127) & ~127; const int aligned_h = (p->p.h + 127) & ~127; const int has_chroma = p->p.layout != DAV1D_PIXEL_LAYOUT_I400; const int ss_ver = p->p.layout == DAV1D_PIXEL_LAYOUT_I420; const int ss_hor = p->p.layout != DAV1D_PIXEL_LAYOUT_I444; ptrdiff_t y_stride = aligned_w << hbd; ptrdiff_t uv_stride = has_chroma ? y_stride >> ss_hor : 0; /* Due to how mapping of addresses to sets works in most L1 and L2 cache * implementations, strides of multiples of certain power-of-two numbers * may cause multiple rows of the same superblock to map to the same set, * causing evictions of previous rows resulting in a reduction in cache * hit rate. Avoid that by slightly padding the stride when necessary. */ if (!(y_stride & 1023)) y_stride += DAV1D_PICTURE_ALIGNMENT; if (!(uv_stride & 1023) && has_chroma) uv_stride += DAV1D_PICTURE_ALIGNMENT; p->stride[0] = -y_stride; p->stride[1] = -uv_stride; const size_t y_sz = y_stride * aligned_h; const size_t uv_sz = uv_stride * (aligned_h >> ss_ver); const size_t pic_size = y_sz + 2 * uv_sz; uint8_t *const buf = malloc(pic_size + DAV1D_PICTURE_ALIGNMENT * 2); if (!buf) return DAV1D_ERR(ENOMEM); p->allocator_data = buf; const ptrdiff_t align_m1 = DAV1D_PICTURE_ALIGNMENT - 1; uint8_t *const data = (uint8_t *)(((ptrdiff_t)buf + align_m1) & ~align_m1); p->data[0] = data + y_sz - y_stride; p->data[1] = has_chroma ? data + y_sz + uv_sz * 1 - uv_stride : NULL; p->data[2] = has_chroma ? data + y_sz + uv_sz * 2 - uv_stride : NULL; return 0; } static void picture_release(Dav1dPicture *const p, void *const _) { free(p->allocator_data); } int main(const int argc, char *const *const argv) { const int istty = isatty(fileno(stderr)); int res = 0; CLISettings cli_settings; Dav1dSettings lib_settings; DemuxerContext *in; MuxerContext *out = NULL; Dav1dPicture p; Dav1dContext *c; Dav1dData data; unsigned n_out = 0, total, fps[2], timebase[2]; uint64_t nspf, tfirst, elapsed; double i_fps; FILE *frametimes = NULL; const unsigned version = dav1d_version_api(); const int major = DAV1D_API_MAJOR(version); const int minor = DAV1D_API_MINOR(version); const int patch = DAV1D_API_PATCH(version); if (DAV1D_API_VERSION_MAJOR != major || DAV1D_API_VERSION_MINOR > minor) { fprintf(stderr, "Version mismatch (library: %d.%d.%d, executable: %d.%d.%d)\n", major, minor, patch, DAV1D_API_VERSION_MAJOR, DAV1D_API_VERSION_MINOR, DAV1D_API_VERSION_PATCH); return EXIT_FAILURE; } parse(argc, argv, &cli_settings, &lib_settings); if (cli_settings.neg_stride) { lib_settings.allocator.alloc_picture_callback = picture_alloc; lib_settings.allocator.release_picture_callback = picture_release; } if ((res = input_open(&in, cli_settings.demuxer, cli_settings.inputfile, fps, &total, timebase)) < 0) { return EXIT_FAILURE; } for (unsigned i = 0; i <= cli_settings.skip; i++) { if ((res = input_read(in, &data)) < 0) { input_close(in); return EXIT_FAILURE; } if (i < cli_settings.skip) dav1d_data_unref(&data); } if (!cli_settings.quiet) fprintf(stderr, "dav1d %s - by VideoLAN\n", dav1d_version()); // skip frames until a sequence header is found if (cli_settings.skip) { Dav1dSequenceHeader seq; unsigned seq_skip = 0; while (dav1d_parse_sequence_header(&seq, data.data, data.sz)) { if ((res = input_read(in, &data)) < 0) { input_close(in); return EXIT_FAILURE; } seq_skip++; } if (seq_skip && !cli_settings.quiet) fprintf(stderr, "skipped %u packets due to missing sequence header\n", seq_skip); } if (cli_settings.limit != 0 && cli_settings.limit < total) total = cli_settings.limit; if ((res = dav1d_open(&c, &lib_settings))) return EXIT_FAILURE; if (cli_settings.frametimes) frametimes = fopen(cli_settings.frametimes, "w"); if (cli_settings.realtime != REALTIME_CUSTOM) { if (fps[1] == 0) { i_fps = 0; nspf = 0; } else { i_fps = (double)fps[0] / fps[1]; nspf = 1000000000ULL * fps[1] / fps[0]; } } else { i_fps = cli_settings.realtime_fps; nspf = (uint64_t)(1000000000.0 / cli_settings.realtime_fps); } tfirst = get_time_nanos(); do { memset(&p, 0, sizeof(p)); if ((res = dav1d_send_data(c, &data)) < 0) { if (res != DAV1D_ERR(EAGAIN)) { dav1d_data_unref(&data); fprintf(stderr, "Error decoding frame: %s\n", strerror(DAV1D_ERR(res))); if (res != DAV1D_ERR(EINVAL)) break; } } if ((res = dav1d_get_picture(c, &p)) < 0) { if (res != DAV1D_ERR(EAGAIN)) { fprintf(stderr, "Error decoding frame: %s\n", strerror(DAV1D_ERR(res))); if (res != DAV1D_ERR(EINVAL)) break; } res = 0; } else { if (!n_out) { if ((res = output_open(&out, cli_settings.muxer, cli_settings.outputfile, &p.p, fps)) < 0) { if (frametimes) fclose(frametimes); return EXIT_FAILURE; } } if ((res = output_write(out, &p)) < 0) break; n_out++; if (nspf || !cli_settings.quiet) { synchronize(cli_settings.realtime, cli_settings.realtime_cache, n_out, nspf, tfirst, &elapsed, frametimes); } if (!cli_settings.quiet) print_stats(istty, n_out, total, elapsed, i_fps); } if (cli_settings.limit && n_out == cli_settings.limit) break; } while (data.sz > 0 || !input_read(in, &data)); if (data.sz > 0) dav1d_data_unref(&data); // flush if (res == 0) while (!cli_settings.limit || n_out < cli_settings.limit) { if ((res = dav1d_get_picture(c, &p)) < 0) { if (res != DAV1D_ERR(EAGAIN)) { fprintf(stderr, "Error decoding frame: %s\n", strerror(DAV1D_ERR(res))); if (res != DAV1D_ERR(EINVAL)) break; } else { res = 0; break; } } else { if (!n_out) { if ((res = output_open(&out, cli_settings.muxer, cli_settings.outputfile, &p.p, fps)) < 0) { if (frametimes) fclose(frametimes); return EXIT_FAILURE; } } if ((res = output_write(out, &p)) < 0) break; n_out++; if (nspf || !cli_settings.quiet) { synchronize(cli_settings.realtime, cli_settings.realtime_cache, n_out, nspf, tfirst, &elapsed, frametimes); } if (!cli_settings.quiet) print_stats(istty, n_out, total, elapsed, i_fps); } } if (frametimes) fclose(frametimes); input_close(in); if (out) { if (!cli_settings.quiet && istty) fprintf(stderr, "\n"); if (cli_settings.verify) res |= output_verify(out, cli_settings.verify); else output_close(out); } else { fprintf(stderr, "No data decoded\n"); res = 1; } dav1d_close(&c); return (res == 0) ? EXIT_SUCCESS : EXIT_FAILURE; }