Files
daedalus-v4l2/tools/test_m2m_stream.c
T
marfrit 5965805d86 Phase 8.7: media controller + multi-frame streaming verification
Two pieces — both shipped:

1. Media controller binding closes the last v4l2-compliance
   failure from 8.6 (DECODER_CMD, which requires has_media on
   stateless decoders) and unlocks the V4L2 request API for
   libva-v4l2-request.

2. Multi-frame streaming test exercises the daemon's
   AVCodecContext state preservation across many REQ_DECODE
   calls — Phase 8.6's tests pushed exactly one keyframe per
   invocation; real content has P-frame references.

Compliance now reaches **49/49 passing.**

Kernel (kernel/daedalus_v4l2_main.{c,h}):
- Added `struct media_device mdev` to daedalus_dev.
- media_device_init(&mdev) BEFORE v4l2_device_register so
  v4l2-core sees v4l2_dev.mdev = &mdev and binds the m2m
  entities into the graph during register.
- After video_register_device:
  v4l2_m2m_register_media_controller(..., MEDIA_ENT_F_PROC_VIDEO_DECODER)
  then media_device_register so userspace sees the complete
  graph in /dev/mediaN with the decoder entity tagged.
- daedalus_remove unwinds in reverse: unregister media,
  unregister mc, unregister video, release m2m, unregister
  v4l2, cleanup mdev.
- Error paths added for both new failure points.

Test harness (tools/test_m2m_stream.c, new):
- Multi-frame V4L2 m2m client: parses IVF → 4-deep buffer
  rings on both queues → per-frame QBUF/DQBUF loop →
  concatenates decoded NV12 to output file. Returns 0 only
  if every input frame decoded without error.
- Same codec vocabulary as test_m2m_decode (vp9 | av1 |
  h264 via 5th arg).

Verification on hertz (Pi 5, 6.12.75+rpt-rpi-2712):

v4l2-compliance: 49 tests, 49 passed, 0 failed, 0 warnings.

  $ v4l2-ctl --list-devices
  daedalus-fourier V3D7+NEON (platform:daedalus_v4l2):
        /dev/video0
        /dev/media3

VP9 320×240 30 frames (1 keyframe + 29 P-frames, 3.46 MB
NV12): byte-for-byte match vs `ffmpeg -i in.ivf -pix_fmt
nv12 -f rawvideo`.

VP9 1920×1080 10 frames (31 MB NV12 through the dmabuf
path): byte-for-byte match vs same reference command.

Daemon log shows cookies 1..30 all completing cleanly in
order; lazily-opened AVCodecContext maintains reference
frames across the chardev round-trips.

Clean SIGTERM + rmmod, no oops/WARN.

Roadmap update (docs/roadmap.md):
- 8.7 marked closed with closure-doc reference.
- 8.8 reshaped: perf profiling, QPU dispatch substitution
  via daedalus-fourier, multi-frame AV1/H.264, HDR (P010M).

Per correctness-before-speed:
- Order-correct media controller lifecycle (init → bind
  v4l2_dev → register video → register mc → register
  media; reverse for teardown).
- 4-deep buffer rings on both queues — the scheduler
  actually pipelines multiple in-flight cookies through
  the chardev (not just one-at-a-time as in 8.5/8.6 tests).
- Bit-exact comparison against ffmpeg, not "looks right."
- All resource paths cleaned on every error branch.

Phase 8.8 next: profile daemon hot loops, dlopen
daedalus-fourier from the daemon, swap FFmpeg per-block
calls for daedalus_dispatch_* where the kernel matches,
target 30fps@1080p from 30fps-floor-is-fine memory.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-18 16:21:58 +00:00

360 lines
9.6 KiB
C

/* SPDX-License-Identifier: BSD-2-Clause */
/*
* test_m2m_stream — multi-frame V4L2 m2m streaming verification.
*
* Drives a complete VP9 IVF file through /dev/video0:
* 1. parse IVF (per-frame size+data)
* 2. open + S_FMT both queues
* 3. REQBUFS N buffers each
* 4. Loop: QBUF OUTPUT[i % N] (mmap + copy), DQBUF OUTPUT,
* DQBUF CAPTURE → dump NV12 to file
* 5. STREAMOFF, close
*
* Concatenates all decoded frames into one big NV12 dump; the
* caller compares against a reference `ffmpeg -pix_fmt nv12 -f
* rawvideo` dump for the same input.
*
* Usage:
* test_m2m_stream <input.ivf> <out.nv12> [w] [h] [codec]
* defaults: w=320 h=240 codec=vp9
*/
#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <errno.h>
#include <fcntl.h>
#include <unistd.h>
#include <sys/ioctl.h>
#include <sys/mman.h>
#include <sys/stat.h>
#include <poll.h>
#include <linux/videodev2.h>
#define V4L2_DEV "/dev/video0"
#define POLL_TIMEOUT_MS 5000
#define NUM_OUTPUT_BUFS 4
#define NUM_CAPTURE_BUFS 4
static void die(const char *msg)
{
perror(msg);
exit(1);
}
struct ivf_frame {
uint8_t *data;
uint32_t size;
};
/* Parse an IVF file into a vector of frames (caller frees). */
static struct ivf_frame *parse_ivf(const char *path, int *out_count,
uint32_t *out_w, uint32_t *out_h)
{
uint8_t *buf;
struct stat st;
int fd;
ssize_t n;
size_t off = 32;
int count = 0, cap = 16;
struct ivf_frame *frames;
fd = open(path, O_RDONLY);
if (fd < 0)
die("open ivf");
if (fstat(fd, &st) < 0)
die("fstat");
buf = malloc(st.st_size);
if (!buf)
die("malloc ivf");
n = read(fd, buf, st.st_size);
if (n != st.st_size)
die("read ivf");
close(fd);
if (memcmp(buf, "DKIF", 4)) {
fprintf(stderr, "not IVF\n");
exit(1);
}
*out_w = buf[12] | (buf[13] << 8);
*out_h = buf[14] | (buf[15] << 8);
frames = malloc(cap * sizeof(*frames));
if (!frames)
die("malloc frames");
while (off + 12 <= (size_t) st.st_size) {
uint32_t sz = buf[off] | (buf[off + 1] << 8) |
(buf[off + 2] << 16) | (buf[off + 3] << 24);
off += 12;
if (off + sz > (size_t) st.st_size) {
fprintf(stderr, "truncated frame at %zu\n", off);
break;
}
if (count >= cap) {
cap *= 2;
frames = realloc(frames, cap * sizeof(*frames));
if (!frames)
die("realloc frames");
}
frames[count].size = sz;
frames[count].data = malloc(sz);
if (!frames[count].data)
die("malloc frame");
memcpy(frames[count].data, buf + off, sz);
off += sz;
count++;
}
free(buf);
*out_count = count;
return frames;
}
static void free_frames(struct ivf_frame *f, int n)
{
int i;
for (i = 0; i < n; i++)
free(f[i].data);
free(f);
}
int main(int argc, char **argv)
{
const char *ivf_path, *out_path;
uint32_t override_w = 0, override_h = 0;
uint32_t output_fourcc = V4L2_PIX_FMT_VP9_FRAME;
uint32_t w, h;
int fd, frame_count;
struct ivf_frame *frames;
struct v4l2_format fmt;
struct v4l2_requestbuffers reqbuf;
struct v4l2_buffer buf;
struct v4l2_plane planes[2];
enum v4l2_buf_type t;
void *out_maps[NUM_OUTPUT_BUFS];
size_t out_map_size = 0;
void *cap_y[NUM_CAPTURE_BUFS], *cap_uv[NUM_CAPTURE_BUFS];
size_t cap_y_size = 0, cap_uv_size = 0;
FILE *of;
int i, decoded = 0;
if (argc < 3) {
fprintf(stderr,
"usage: %s <input.ivf> <out.nv12> [w] [h] [codec]\n"
" codec: vp9 | av1 | h264 (default vp9)\n",
argv[0]);
return 2;
}
ivf_path = argv[1];
out_path = argv[2];
if (argc >= 5) {
override_w = (uint32_t) atoi(argv[3]);
override_h = (uint32_t) atoi(argv[4]);
}
if (argc >= 6) {
const char *cn = argv[5];
if (!strcmp(cn, "vp9")) output_fourcc = V4L2_PIX_FMT_VP9_FRAME;
else if (!strcmp(cn, "av1")) output_fourcc = V4L2_PIX_FMT_AV1_FRAME;
else if (!strcmp(cn, "h264")) output_fourcc = V4L2_PIX_FMT_H264_SLICE;
else {
fprintf(stderr, "unknown codec %s\n", cn);
return 2;
}
}
frames = parse_ivf(ivf_path, &frame_count, &w, &h);
if (override_w) w = override_w;
if (override_h) h = override_h;
printf("parsed %d frames, %ux%u\n", frame_count, w, h);
fd = open(V4L2_DEV, O_RDWR);
if (fd < 0)
die("open " V4L2_DEV);
/* S_FMT OUTPUT */
memset(&fmt, 0, sizeof(fmt));
fmt.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
fmt.fmt.pix_mp.width = w;
fmt.fmt.pix_mp.height = h;
fmt.fmt.pix_mp.pixelformat = output_fourcc;
if (ioctl(fd, VIDIOC_S_FMT, &fmt) < 0)
die("S_FMT OUTPUT");
/* S_FMT CAPTURE */
memset(&fmt, 0, sizeof(fmt));
fmt.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
fmt.fmt.pix_mp.width = w;
fmt.fmt.pix_mp.height = h;
fmt.fmt.pix_mp.pixelformat = V4L2_PIX_FMT_NV12M;
if (ioctl(fd, VIDIOC_S_FMT, &fmt) < 0)
die("S_FMT CAPTURE");
cap_y_size = fmt.fmt.pix_mp.plane_fmt[0].sizeimage;
cap_uv_size = fmt.fmt.pix_mp.plane_fmt[1].sizeimage;
/* REQBUFS OUTPUT + mmap each */
memset(&reqbuf, 0, sizeof(reqbuf));
reqbuf.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
reqbuf.memory = V4L2_MEMORY_MMAP;
reqbuf.count = NUM_OUTPUT_BUFS;
if (ioctl(fd, VIDIOC_REQBUFS, &reqbuf) < 0)
die("REQBUFS OUTPUT");
printf("OUTPUT reqbufs -> %u\n", reqbuf.count);
for (i = 0; i < NUM_OUTPUT_BUFS; i++) {
memset(&buf, 0, sizeof(buf));
memset(planes, 0, sizeof(planes));
buf.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
buf.memory = V4L2_MEMORY_MMAP;
buf.index = i;
buf.m.planes = planes;
buf.length = 1;
if (ioctl(fd, VIDIOC_QUERYBUF, &buf) < 0)
die("QUERYBUF OUTPUT");
out_map_size = planes[0].length;
out_maps[i] = mmap(NULL, planes[0].length,
PROT_READ | PROT_WRITE, MAP_SHARED, fd,
planes[0].m.mem_offset);
if (out_maps[i] == MAP_FAILED)
die("mmap OUTPUT");
}
/* REQBUFS CAPTURE + mmap each */
memset(&reqbuf, 0, sizeof(reqbuf));
reqbuf.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
reqbuf.memory = V4L2_MEMORY_MMAP;
reqbuf.count = NUM_CAPTURE_BUFS;
if (ioctl(fd, VIDIOC_REQBUFS, &reqbuf) < 0)
die("REQBUFS CAPTURE");
printf("CAPTURE reqbufs -> %u\n", reqbuf.count);
for (i = 0; i < NUM_CAPTURE_BUFS; i++) {
memset(&buf, 0, sizeof(buf));
memset(planes, 0, sizeof(planes));
buf.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
buf.memory = V4L2_MEMORY_MMAP;
buf.index = i;
buf.m.planes = planes;
buf.length = 2;
if (ioctl(fd, VIDIOC_QUERYBUF, &buf) < 0)
die("QUERYBUF CAPTURE");
cap_y[i] = mmap(NULL, planes[0].length,
PROT_READ, MAP_SHARED, fd,
planes[0].m.mem_offset);
cap_uv[i] = mmap(NULL, planes[1].length,
PROT_READ, MAP_SHARED, fd,
planes[1].m.mem_offset);
if (cap_y[i] == MAP_FAILED || cap_uv[i] == MAP_FAILED)
die("mmap CAPTURE");
/* QBUF all capture buffers up front */
memset(&buf, 0, sizeof(buf));
memset(planes, 0, sizeof(planes));
buf.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
buf.memory = V4L2_MEMORY_MMAP;
buf.index = i;
buf.m.planes = planes;
buf.length = 2;
if (ioctl(fd, VIDIOC_QBUF, &buf) < 0)
die("QBUF CAPTURE init");
}
t = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
if (ioctl(fd, VIDIOC_STREAMON, &t) < 0)
die("STREAMON OUTPUT");
t = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
if (ioctl(fd, VIDIOC_STREAMON, &t) < 0)
die("STREAMON CAPTURE");
printf("STREAMON both\n");
of = fopen(out_path, "wb");
if (!of)
die("fopen out");
/* Feed one bitstream frame at a time; serialise DQBUF after each. */
for (i = 0; i < frame_count; i++) {
int idx = i % NUM_OUTPUT_BUFS;
struct pollfd p = { .fd = fd, .events = POLLIN | POLLOUT };
size_t y_actual, uv_actual;
int cap_idx;
if (frames[i].size > out_map_size) {
fprintf(stderr, "frame %d too big: %u > %zu\n",
i, frames[i].size, out_map_size);
break;
}
memcpy(out_maps[idx], frames[i].data, frames[i].size);
memset(&buf, 0, sizeof(buf));
memset(planes, 0, sizeof(planes));
buf.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
buf.memory = V4L2_MEMORY_MMAP;
buf.index = idx;
buf.m.planes = planes;
buf.length = 1;
planes[0].bytesused = frames[i].size;
if (ioctl(fd, VIDIOC_QBUF, &buf) < 0)
die("QBUF OUTPUT");
if (poll(&p, 1, POLL_TIMEOUT_MS) <= 0)
die("poll");
/* DQBUF OUTPUT (returns the buffer to userspace pool) */
memset(&buf, 0, sizeof(buf));
memset(planes, 0, sizeof(planes));
buf.type = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
buf.memory = V4L2_MEMORY_MMAP;
buf.m.planes = planes;
buf.length = 1;
if (ioctl(fd, VIDIOC_DQBUF, &buf) < 0)
die("DQBUF OUTPUT");
/* DQBUF CAPTURE */
memset(&buf, 0, sizeof(buf));
memset(planes, 0, sizeof(planes));
buf.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
buf.memory = V4L2_MEMORY_MMAP;
buf.m.planes = planes;
buf.length = 2;
if (ioctl(fd, VIDIOC_DQBUF, &buf) < 0)
die("DQBUF CAPTURE");
cap_idx = buf.index;
if (buf.flags & V4L2_BUF_FLAG_ERROR) {
fprintf(stderr, " frame %d CAPTURE ERROR\n", i);
break;
}
y_actual = planes[0].bytesused ? planes[0].bytesused
: cap_y_size;
uv_actual = planes[1].bytesused ? planes[1].bytesused
: cap_uv_size;
fwrite(cap_y[cap_idx], 1, y_actual, of);
fwrite(cap_uv[cap_idx], 1, uv_actual, of);
decoded++;
/* Recycle the CAPTURE buffer */
memset(&buf, 0, sizeof(buf));
memset(planes, 0, sizeof(planes));
buf.type = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
buf.memory = V4L2_MEMORY_MMAP;
buf.index = cap_idx;
buf.m.planes = planes;
buf.length = 2;
if (ioctl(fd, VIDIOC_QBUF, &buf) < 0)
die("QBUF CAPTURE recycle");
}
fclose(of);
printf("decoded %d / %d frames to %s\n", decoded, frame_count, out_path);
t = V4L2_BUF_TYPE_VIDEO_OUTPUT_MPLANE;
ioctl(fd, VIDIOC_STREAMOFF, &t);
t = V4L2_BUF_TYPE_VIDEO_CAPTURE_MPLANE;
ioctl(fd, VIDIOC_STREAMOFF, &t);
close(fd);
free_frames(frames, frame_count);
return decoded == frame_count ? 0 : 1;
}