// This file is part of Moonfire NVR, a security camera digital video recorder. // Copyright (C) 2016 Scott Lamb // // This program is free software: you can redistribute it and/or modify // it under the terms of the GNU General Public License as published by // the Free Software Foundation, either version 3 of the License, or // (at your option) any later version. // // In addition, as a special exception, the copyright holders give // permission to link the code of portions of this program with the // OpenSSL library under certain conditions as described in each // individual source file, and distribute linked combinations including // the two. // // You must obey the GNU General Public License in all respects for all // of the code used other than OpenSSL. If you modify file(s) with this // exception, you may extend this exception to your version of the // file(s), but you are not obligated to do so. If you do not wish to do // so, delete this exception statement from your version. If you delete // this exception statement from all source files in the program, then // also delete it here. // // This program is distributed in the hope that it will be useful, // but WITHOUT ANY WARRANTY; without even the implied warranty of // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the // GNU General Public License for more details. // // You should have received a copy of the GNU General Public License // along with this program. If not, see . //! `.mp4` virtual file serving. //! //! The `mp4` module builds virtual files representing ISO/IEC 14496-12 (ISO base media format / //! MPEG-4 / `.mp4`) video. These can be constructed from one or more recordings and are suitable //! for HTTP range serving or download. The generated `.mp4` file has the `moov` box before the //! `mdat` box for fast start. More specifically, boxes are arranged in the order suggested by //! ISO/IEC 14496-12 section 6.2.3 (Table 1): //! //! * ftyp (file type and compatibility) //! * moov (container for all the metadata) //! ** mvhd (movie header, overall declarations) //! //! ** trak (video: container for an individual track or stream) //! *** tkhd (track header, overall information about the track) //! *** (optional) edts (edit list container) //! **** elst (an edit list) //! *** mdia (container for the media information in a track) //! **** mdhd (media header, overall information about the media) //! *** minf (media information container) //! **** vmhd (video media header, overall information (video track only)) //! **** dinf (data information box, container) //! ***** dref (data reference box, declares source(s) of media data in track) //! **** stbl (sample table box, container for the time/space map) //! ***** stsd (sample descriptions (codec types, initilization etc.) //! ***** stts ((decoding) time-to-sample) //! ***** stsc (sample-to-chunk, partial data-offset information) //! ***** stsz (samples sizes (framing)) //! ***** co64 (64-bit chunk offset) //! ***** stss (sync sample table) //! //! ** (optional) trak (subtitle: container for an individual track or stream) //! *** tkhd (track header, overall information about the track) //! *** mdia (container for the media information in a track) //! **** mdhd (media header, overall information about the media) //! *** minf (media information container) //! **** nmhd (null media header, overall information) //! **** dinf (data information box, container) //! ***** dref (data reference box, declares source(s) of media data in track) //! **** stbl (sample table box, container for the time/space map) //! ***** stsd (sample descriptions (codec types, initilization etc.) //! ***** stts ((decoding) time-to-sample) //! ***** stsc (sample-to-chunk, partial data-offset information) //! ***** stsz (samples sizes (framing)) //! ***** co64 (64-bit chunk offset) //! //! * mdat (media data container) //! ``` extern crate byteorder; extern crate time; use byteorder::{BigEndian, ByteOrder, WriteBytesExt}; use db; use dir; use error::{Error, Result}; use hyper::header; use mmapfile; use mime; use openssl::crypto::hash; use pieces; use pieces::ContextWriter; use pieces::Slices; use recording::{self, TIME_UNITS_PER_SEC}; use resource; use smallvec::SmallVec; use std::cell::RefCell; use std::cmp; use std::io; use std::ops::Range; use std::mem; use std::sync::{Arc, MutexGuard}; use time::Timespec; /// This value should be incremented any time a change is made to this file that causes different /// bytes to be output for a particular set of `Mp4Builder` options. Incrementing this value will /// cause the etag to change as well. const FORMAT_VERSION: [u8; 1] = [0x03]; /// An `ftyp` (ISO/IEC 14496-12 section 4.3 `FileType`) box. const FTYP_BOX: &'static [u8] = &[ 0x00, 0x00, 0x00, 0x20, // length = 32, sizeof(FTYP_BOX) b'f', b't', b'y', b'p', // type b'i', b's', b'o', b'm', // major_brand 0x00, 0x00, 0x02, 0x00, // minor_version b'i', b's', b'o', b'm', // compatible_brands[0] b'i', b's', b'o', b'2', // compatible_brands[1] b'a', b'v', b'c', b'1', // compatible_brands[2] b'm', b'p', b'4', b'1', // compatible_brands[3] ]; /// An `hdlr` (ISO/IEC 14496-12 section 8.4.3 `HandlerBox`) box suitable for video. const VIDEO_HDLR_BOX: &'static [u8] = &[ 0x00, 0x00, 0x00, 0x21, // length == sizeof(kHdlrBox) b'h', b'd', b'l', b'r', // type == hdlr, ISO/IEC 14496-12 section 8.4.3. 0x00, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x00, // pre_defined b'v', b'i', b'd', b'e', // handler = vide 0x00, 0x00, 0x00, 0x00, // reserved[0] 0x00, 0x00, 0x00, 0x00, // reserved[1] 0x00, 0x00, 0x00, 0x00, // reserved[2] 0x00, // name, zero-terminated (empty) ]; /// An `hdlr` (ISO/IEC 14496-12 section 8.4.3 `HandlerBox`) box suitable for subtitles. const SUBTITLE_HDLR_BOX: &'static [u8] = &[ 0x00, 0x00, 0x00, 0x21, // length == sizeof(kHdlrBox) b'h', b'd', b'l', b'r', // type == hdlr, ISO/IEC 14496-12 section 8.4.3. 0x00, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x00, // pre_defined b's', b'b', b't', b'l', // handler = sbtl 0x00, 0x00, 0x00, 0x00, // reserved[0] 0x00, 0x00, 0x00, 0x00, // reserved[1] 0x00, 0x00, 0x00, 0x00, // reserved[2] 0x00, // name, zero-terminated (empty) ]; /// Part of an `mvhd` (`MovieHeaderBox` version 0, ISO/IEC 14496-12 section 8.2.2), used from /// `append_mvhd`. const MVHD_JUNK: &'static [u8] = &[ 0x00, 0x01, 0x00, 0x00, // rate 0x01, 0x00, // volume 0x00, 0x00, // reserved 0x00, 0x00, 0x00, 0x00, // reserved 0x00, 0x00, 0x00, 0x00, // reserved 0x00, 0x01, 0x00, 0x00, // matrix[0] 0x00, 0x00, 0x00, 0x00, // matrix[1] 0x00, 0x00, 0x00, 0x00, // matrix[2] 0x00, 0x00, 0x00, 0x00, // matrix[3] 0x00, 0x01, 0x00, 0x00, // matrix[4] 0x00, 0x00, 0x00, 0x00, // matrix[5] 0x00, 0x00, 0x00, 0x00, // matrix[6] 0x00, 0x00, 0x00, 0x00, // matrix[7] 0x40, 0x00, 0x00, 0x00, // matrix[8] 0x00, 0x00, 0x00, 0x00, // pre_defined[0] 0x00, 0x00, 0x00, 0x00, // pre_defined[1] 0x00, 0x00, 0x00, 0x00, // pre_defined[2] 0x00, 0x00, 0x00, 0x00, // pre_defined[3] 0x00, 0x00, 0x00, 0x00, // pre_defined[4] 0x00, 0x00, 0x00, 0x00, // pre_defined[5] ]; /// Part of a `tkhd` (`TrackHeaderBox` version 0, ISO/IEC 14496-12 section 8.3.2), used from /// `append_video_tkhd` and `append_subtitle_tkhd`. const TKHD_JUNK: &'static [u8] = &[ 0x00, 0x00, 0x00, 0x00, // reserved 0x00, 0x00, 0x00, 0x00, // reserved 0x00, 0x00, 0x00, 0x00, // layer + alternate_group 0x00, 0x00, 0x00, 0x00, // volume + reserved 0x00, 0x01, 0x00, 0x00, // matrix[0] 0x00, 0x00, 0x00, 0x00, // matrix[1] 0x00, 0x00, 0x00, 0x00, // matrix[2] 0x00, 0x00, 0x00, 0x00, // matrix[3] 0x00, 0x01, 0x00, 0x00, // matrix[4] 0x00, 0x00, 0x00, 0x00, // matrix[5] 0x00, 0x00, 0x00, 0x00, // matrix[6] 0x00, 0x00, 0x00, 0x00, // matrix[7] 0x40, 0x00, 0x00, 0x00, // matrix[8] ]; /// Part of a `minf` (`MediaInformationBox`, ISO/IEC 14496-12 section 8.4.4), used from /// `append_video_minf`. const VIDEO_MINF_JUNK: &'static [u8] = &[ b'm', b'i', b'n', b'f', // type = minf, ISO/IEC 14496-12 section 8.4.4. // A vmhd box; the "graphicsmode" and "opcolor" values don't have any // meaningful use. 0x00, 0x00, 0x00, 0x14, // length == sizeof(kVmhdBox) b'v', b'm', b'h', b'd', // type = vmhd, ISO/IEC 14496-12 section 12.1.2. 0x00, 0x00, 0x00, 0x01, // version + flags(1) 0x00, 0x00, 0x00, 0x00, // graphicsmode (copy), opcolor[0] 0x00, 0x00, 0x00, 0x00, // opcolor[1], opcolor[2] // A dinf box suitable for a "self-contained" .mp4 file (no URL/URN // references to external data). 0x00, 0x00, 0x00, 0x24, // length == sizeof(kDinfBox) b'd', b'i', b'n', b'f', // type = dinf, ISO/IEC 14496-12 section 8.7.1. 0x00, 0x00, 0x00, 0x1c, // length b'd', b'r', b'e', b'f', // type = dref, ISO/IEC 14496-12 section 8.7.2. 0x00, 0x00, 0x00, 0x00, // version and flags 0x00, 0x00, 0x00, 0x01, // entry_count 0x00, 0x00, 0x00, 0x0c, // length b'u', b'r', b'l', b' ', // type = url, ISO/IEC 14496-12 section 8.7.2. 0x00, 0x00, 0x00, 0x01, // version=0, flags=self-contained ]; /// Part of a `minf` (`MediaInformationBox`, ISO/IEC 14496-12 section 8.4.4), used from /// `append_subtitle_minf`. const SUBTITLE_MINF_JUNK: &'static [u8] = &[ b'm', b'i', b'n', b'f', // type = minf, ISO/IEC 14496-12 section 8.4.4. // A nmhd box. 0x00, 0x00, 0x00, 0x0c, // length == sizeof(kNmhdBox) b'n', b'm', b'h', b'd', // type = nmhd, ISO/IEC 14496-12 section 12.1.2. 0x00, 0x00, 0x00, 0x01, // version + flags(1) // A dinf box suitable for a "self-contained" .mp4 file (no URL/URN // references to external data). 0x00, 0x00, 0x00, 0x24, // length == sizeof(kDinfBox) b'd', b'i', b'n', b'f', // type = dinf, ISO/IEC 14496-12 section 8.7.1. 0x00, 0x00, 0x00, 0x1c, // length b'd', b'r', b'e', b'f', // type = dref, ISO/IEC 14496-12 section 8.7.2. 0x00, 0x00, 0x00, 0x00, // version and flags 0x00, 0x00, 0x00, 0x01, // entry_count 0x00, 0x00, 0x00, 0x0c, // length b'u', b'r', b'l', b' ', // type = url, ISO/IEC 14496-12 section 8.7.2. 0x00, 0x00, 0x00, 0x01, // version=0, flags=self-contained ]; /// Part of a `stbl` (`SampleTableBox`, ISO/IEC 14496 section 8.5.1) used from /// `append_subtitle_stbl`. const SUBTITLE_STBL_JUNK: &'static [u8] = &[ b's', b't', b'b', b'l', // type = stbl, ISO/IEC 14496-12 section 8.5.1. // A stsd box. 0x00, 0x00, 0x00, 0x54, // length b's', b't', b's', b'd', // type == stsd, ISO/IEC 14496-12 section 8.5.2. 0x00, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x01, // entry_count == 1 // SampleEntry, ISO/IEC 14496-12 section 8.5.2.2. 0x00, 0x00, 0x00, 0x44, // length b't', b'x', b'3', b'g', // type == tx3g, 3GPP TS 26.245 section 5.16. 0x00, 0x00, 0x00, 0x00, // reserved 0x00, 0x00, 0x00, 0x01, // reserved, data_reference_index == 1 // TextSampleEntry 0x00, 0x00, 0x00, 0x00, // displayFlags == none 0x00, // horizontal-justification == left 0x00, // vertical-justification == top 0x00, 0x00, 0x00, 0x00, // background-color-rgba == transparent // TextSampleEntry.BoxRecord 0x00, 0x00, // top 0x00, 0x00, // left 0x00, 0x00, // bottom 0x00, 0x00, // right // TextSampleEntry.StyleRecord 0x00, 0x00, // startChar 0x00, 0x00, // endChar 0x00, 0x01, // font-ID 0x00, // face-style-flags 0x12, // font-size == 18 px 0xff, 0xff, 0xff, 0xff, // text-color-rgba == opaque white // TextSampleEntry.FontTableBox 0x00, 0x00, 0x00, 0x16, // length b'f', b't', b'a', b'b', // type == ftab, section 5.16 0x00, 0x01, // entry-count == 1 0x00, 0x01, // font-ID == 1 0x09, // font-name-length == 9 b'M', b'o', b'n', b'o', b's', b'p', b'a', b'c', b'e', ]; /// Pointers to each static bytestrings. /// The order here must match the `StaticBytestring` enum. const STATIC_BYTESTRINGS: [&'static [u8]; 8] = [ FTYP_BOX, VIDEO_HDLR_BOX, SUBTITLE_HDLR_BOX, MVHD_JUNK, TKHD_JUNK, VIDEO_MINF_JUNK, SUBTITLE_MINF_JUNK, SUBTITLE_STBL_JUNK, ]; /// Enumeration of the static bytestrings. The order here must match the `STATIC_BYTESTRINGS` /// array. The advantage of this enum over direct pointers to the relevant strings is that it /// fits into a u32 on 64-bit platforms, allowing an `Mp4FileSlice` to fit into 8 bytes. #[derive(Copy, Clone, Debug)] enum StaticBytestring { FtypBox, VideoHdlrBox, SubtitleHdlrBox, MvhdJunk, TkhdJunk, VideoMinfJunk, SubtitleMinfJunk, SubtitleStblJunk, } /// The template fed into strtime for a timestamp subtitle. This must produce fixed-length output /// (see `SUBTITLE_LENGTH`) to allow quick calculation of the total size of the subtitles for /// a given time range. const SUBTITLE_TEMPLATE: &'static str = "%Y-%m-%d %H:%M:%S %z"; /// The length of the output of `SUBTITLE_TEMPLATE`. const SUBTITLE_LENGTH: usize = 25; // "2015-07-02 17:10:00 -0700".len(); /// Holds the sample indexes for a given video segment: `stts`, `stsz`, and `stss`. struct Mp4SegmentIndex { /// Holds all three sample indexes: /// &buf[.. stsz_start] is stts. /// &buf[stsz_start .. stss_start] is stsz. /// &buf[stss_start ..] is stss. buf: Box<[u8]>, stsz_start: u32, stss_start: u32, } impl Mp4SegmentIndex { fn stts(&self) -> &[u8] { &self.buf[.. self.stsz_start as usize] } fn stsz(&self) -> &[u8] { &self.buf[self.stsz_start as usize .. self.stss_start as usize] } fn stss(&self) -> &[u8] { &self.buf[self.stss_start as usize ..] } } /// A wrapper around `recording::Segment` that keeps some additional `.mp4`-specific state. struct Mp4Segment { s: recording::Segment, /// Holds the `stts`, `stsz`, and `stss` if they've been generated. /// Access only through `with_index`. index: RefCell>, /// The 1-indexed frame number in the `Mp4File` of the first frame in this segment. first_frame_num: u32, num_subtitle_samples: u32, } impl Mp4Segment { fn with_index(&self, db: &db::Database, f: F) -> Result where F: FnOnce(&Mp4SegmentIndex) -> Result { let mut i = self.index.borrow_mut(); if let Some(ref i) = *i { return f(i); } let index = self.build_index(db)?; let r = f(&index); *i = Some(index); r } fn build_index(&self, db: &db::Database) -> Result { let s = &self.s; let stts_len = mem::size_of::() * 2 * (s.frames as usize); let stsz_len = mem::size_of::() * s.frames as usize; let stss_len = mem::size_of::() * s.key_frames as usize; let len = stts_len + stsz_len + stss_len; let mut buf = unsafe { let mut v = Vec::with_capacity(len); v.set_len(len); v.into_boxed_slice() }; { let (stts, mut rest) = buf.split_at_mut(stts_len); let (stsz, stss) = rest.split_at_mut(stsz_len); let mut frame = 0; let mut key_frame = 0; let mut last_start_and_dur = None; s.foreach(db, |it| { last_start_and_dur = Some((it.start_90k, it.duration_90k)); BigEndian::write_u32(&mut stts[8*frame .. 8*frame+4], 1); BigEndian::write_u32(&mut stts[8*frame+4 .. 8*frame+8], it.duration_90k as u32); BigEndian::write_u32(&mut stsz[4*frame .. 4*frame+4], it.bytes as u32); if it.is_key { BigEndian::write_u32(&mut stss[4*key_frame .. 4*key_frame+4], self.first_frame_num + (frame as u32)); key_frame += 1; } frame += 1; Ok(()) })?; // Fix up the final frame's duration. // Doing this after the fact is more efficient than having a condition on every // iteration. if let Some((last_start, dur)) = last_start_and_dur { BigEndian::write_u32(&mut stts[8*frame-4 ..], cmp::min(s.desired_range_90k.end - last_start, dur) as u32); } } Ok(Mp4SegmentIndex{ buf: buf, stsz_start: stts_len as u32, stss_start: (stts_len + stsz_len) as u32, }) } } pub struct Mp4FileBuilder { /// Segments of video: one per "recording" table entry as they should /// appear in the video. segments: Vec, video_sample_entries: SmallVec<[Arc; 1]>, next_frame_num: u32, duration_90k: u32, num_subtitle_samples: u32, subtitle_co64_pos: Option, body: BodyState, include_timestamp_subtitle_track: bool, } /// The portion of `Mp4FileBuilder` which is mutated while building the body of the file. /// This is separated out from the rest so that it can be borrowed in a loop over /// `Mp4FileBuilder::segments`; otherwise this would cause a double-self-borrow. struct BodyState { slices: Slices, /// `self.buf[unflushed_buf_pos .. self.buf.len()]` holds bytes that should be /// appended to `slices` before any other slice. See `flush_buf()`. unflushed_buf_pos: usize, buf: Vec, } /// A single slice of a `Mp4File`, for use with a `Slices` object. Each slice is responsible for /// some portion of the generated `.mp4` file. The box headers and such are generally in `Static` /// or `Buf` slices; the others generally represent a single segment's contribution to the /// like-named box. #[derive(Debug)] enum Mp4FileSlice { Static(StaticBytestring), // param is index into STATIC_BYTESTRINGS Buf(u32), // param is index into m.buf VideoSampleEntry(u32), // param is index into m.video_sample_entries Stts(u32), // param is index into m.segments Stsz(u32), // param is index into m.segments Co64, Stss(u32), // param is index into m.segments VideoSampleData(u32), // param is index into m.segments SubtitleSampleData(u32), // param is index into m.segments } impl ContextWriter for Mp4FileSlice { fn write_to(&self, f: &Mp4File, r: Range, l: u64, out: &mut io::Write) -> Result<()> { trace!("write {:?}, range {:?} out of len {}", self, r, l); match *self { Mp4FileSlice::Static(off) => { let s = STATIC_BYTESTRINGS[off as usize]; let part = &s[r.start as usize .. r.end as usize]; out.write_all(part)?; Ok(()) }, Mp4FileSlice::Buf(off) => { let off = off as usize; out.write_all( &f.buf[off+r.start as usize .. off+r.end as usize])?; Ok(()) }, Mp4FileSlice::VideoSampleEntry(off) => { let e = &f.video_sample_entries[off as usize]; let part = &e.data[r.start as usize .. r.end as usize]; out.write_all(part)?; Ok(()) }, Mp4FileSlice::Stts(index) => { f.write_stts(index as usize, r, l, out) }, Mp4FileSlice::Stsz(index) => { f.write_stsz(index as usize, r, l, out) }, Mp4FileSlice::Co64 => { f.write_co64(r, l, out) }, Mp4FileSlice::Stss(index) => { f.write_stss(index as usize, r, l, out) }, Mp4FileSlice::VideoSampleData(index) => { f.write_video_sample_data(index as usize, r, out) }, Mp4FileSlice::SubtitleSampleData(index) => { f.write_subtitle_sample_data(index as usize, r, l, out) } } } } /// Converts from 90kHz units since Unix epoch (1970-01-01 00:00:00 UTC) to seconds since /// ISO-14496 epoch (1904-01-01 00:00:00 UTC). fn to_iso14496_timestamp(t: recording::Time) -> u32 { (t.unix_seconds() + 24107 * 86400) as u32 } /// Writes a box length for everything appended in the supplied scope. /// Used only within Mp4FileBuilder::build (and methods it calls internally). macro_rules! write_length { ($_self:ident, $b:block) => {{ let len_pos = $_self.body.buf.len(); let len_start = $_self.body.slices.len() + $_self.body.buf.len() as u64 - $_self.body.unflushed_buf_pos as u64; $_self.body.append_u32(0); // placeholder. { $b; } let len_end = $_self.body.slices.len() + $_self.body.buf.len() as u64 - $_self.body.unflushed_buf_pos as u64; BigEndian::write_u32(&mut $_self.body.buf[len_pos .. len_pos + 4], (len_end - len_start) as u32); }} } /// Returns a hex-encoded version of the input. fn hex(raw: &[u8]) -> String { const HEX_CHARS: [u8; 16] = [b'0', b'1', b'2', b'3', b'4', b'5', b'6', b'7', b'8', b'9', b'a', b'b', b'c', b'd', b'e', b'f']; let mut hex = Vec::with_capacity(2 * raw.len()); for b in raw { hex.push(HEX_CHARS[((b & 0xf0) >> 4) as usize]); hex.push(HEX_CHARS[( b & 0x0f ) as usize]); } unsafe { String::from_utf8_unchecked(hex) } } impl Mp4FileBuilder { pub fn new() -> Self { Mp4FileBuilder{ segments: Vec::new(), video_sample_entries: SmallVec::new(), next_frame_num: 1, duration_90k: 0, num_subtitle_samples: 0, subtitle_co64_pos: None, body: BodyState{ slices: Slices::new(), buf: Vec::new(), unflushed_buf_pos: 0, }, include_timestamp_subtitle_track: false, } } /// Sets if the generated `.mp4` should include a subtitle track with second-level timestamps. /// Default is false. pub fn include_timestamp_subtitle_track(&mut self, b: bool) { self.include_timestamp_subtitle_track = b; } /// Reserves space for the given number of additional segments. pub fn reserve(&mut self, additional: usize) { self.segments.reserve(additional); } pub fn len(&self) -> usize { self.segments.len() } /// Appends a segment for (a subset of) the given recording. pub fn append(&mut self, db: &MutexGuard, row: db::ListCameraRecordingsRow, rel_range_90k: Range) -> Result<()> { self.segments.push(Mp4Segment{ s: recording::Segment::new(db, &row, rel_range_90k)?, index: RefCell::new(None), first_frame_num: self.next_frame_num, num_subtitle_samples: 0, }); self.next_frame_num += row.video_samples as u32; if !self.video_sample_entries.iter().any(|e| e.id == row.video_sample_entry.id) { self.video_sample_entries.push(row.video_sample_entry); } Ok(()) } /// Builds the `Mp4File`, consuming the builder. pub fn build(mut self, db: Arc, dir: Arc) -> Result { let mut max_end = None; let mut etag = hash::Hasher::new(hash::Type::SHA1)?; etag.update(&FORMAT_VERSION[..])?; if self.include_timestamp_subtitle_track { etag.update(b":ts:")?; } for s in &mut self.segments { let d = &s.s.desired_range_90k; self.duration_90k += (d.end - d.start) as u32; let end = s.s.start + recording::Duration(d.end as i64); max_end = match max_end { None => Some(end), Some(v) => Some(cmp::max(v, end)), }; if self.include_timestamp_subtitle_track { // Calculate the number of subtitle samples: starting to ending time (rounding up). let start_sec = (s.s.start + recording::Duration(d.start as i64)).unix_seconds(); let end_sec = (s.s.start + recording::Duration(d.end as i64 + TIME_UNITS_PER_SEC - 1)) .unix_seconds(); s.num_subtitle_samples = (end_sec - start_sec) as u32; self.num_subtitle_samples += s.num_subtitle_samples; } // Update the etag to reflect this segment. let mut data = [0_u8; 24]; let mut cursor = io::Cursor::new(&mut data[..]); cursor.write_i64::(s.s.id)?; cursor.write_i64::(s.s.start.0)?; cursor.write_i32::(d.start)?; cursor.write_i32::(d.end)?; etag.update(cursor.into_inner())?; } let max_end = match max_end { None => return Err(Error::new("no segments!".to_owned())), Some(v) => v, }; let creation_ts = to_iso14496_timestamp(max_end); let mut est_slices = 16 + self.video_sample_entries.len() + 4 * self.segments.len(); if self.include_timestamp_subtitle_track { est_slices += 16 + self.segments.len(); } self.body.slices.reserve(est_slices); const EST_BUF_LEN: usize = 2048; self.body.buf.reserve(EST_BUF_LEN); self.body.append_static(StaticBytestring::FtypBox); self.append_moov(creation_ts)?; // Write the mdat header. Use the large format to support files over 2^32-1 bytes long. // Write zeroes for the length as a placeholder; fill it in after it's known. // It'd be nice to use the until-EOF form, but QuickTime Player doesn't support it. self.body.buf.extend_from_slice(b"\x00\x00\x00\x01mdat\x00\x00\x00\x00\x00\x00\x00\x00"); let mdat_len_pos = self.body.buf.len() - 8; self.body.flush_buf(); let initial_sample_byte_pos = self.body.slices.len(); for (i, s) in self.segments.iter().enumerate() { let r = s.s.sample_file_range(); self.body.slices.append(r.end - r.start, Mp4FileSlice::VideoSampleData(i as u32)); } if let Some(p) = self.subtitle_co64_pos { BigEndian::write_u64(&mut self.body.buf[p .. p + 8], self.body.slices.len()); for (i, s) in self.segments.iter().enumerate() { self.body.slices.append( s.num_subtitle_samples as u64 * (mem::size_of::() + SUBTITLE_LENGTH) as u64, Mp4FileSlice::SubtitleSampleData(i as u32)); } } // Fill in the length left as a placeholder above. Note the 16 here is the length // of the mdat header. BigEndian::write_u64(&mut self.body.buf[mdat_len_pos .. mdat_len_pos + 8], 16 + self.body.slices.len() - initial_sample_byte_pos); if est_slices < self.body.slices.num() { warn!("Estimated {} slices; actually were {} slices", est_slices, self.body.slices.num()); } else { debug!("Estimated {} slices; actually were {} slices", est_slices, self.body.slices.num()); } if EST_BUF_LEN < self.body.buf.len() { warn!("Estimated {} buf bytes; actually were {}", EST_BUF_LEN, self.body.buf.len()); } else { debug!("Estimated {} buf bytes; actually were {}", EST_BUF_LEN, self.body.buf.len()); } debug!("slices: {:?}", self.body.slices); Ok(Mp4File{ db: db, dir: dir, segments: self.segments, slices: self.body.slices, buf: self.body.buf, video_sample_entries: self.video_sample_entries, initial_sample_byte_pos: initial_sample_byte_pos, last_modified: header::HttpDate(time::at(Timespec::new(max_end.unix_seconds(), 0))), etag: header::EntityTag::strong(hex(&etag.finish()?)), }) } /// Appends a `MovieBox` (ISO/IEC 14496-12 section 8.2.1). fn append_moov(&mut self, creation_ts: u32) -> Result<()> { write_length!(self, { self.body.buf.extend_from_slice(b"moov"); self.append_mvhd(creation_ts); self.append_video_trak(creation_ts)?; if self.include_timestamp_subtitle_track { self.append_subtitle_trak(creation_ts); } }); Ok(()) } /// Appends a `MovieHeaderBox` version 0 (ISO/IEC 14496-12 section 8.2.2). fn append_mvhd(&mut self, creation_ts: u32) { write_length!(self, { self.body.buf.extend_from_slice(b"mvhd\x00\x00\x00\x00"); self.body.append_u32(creation_ts); self.body.append_u32(creation_ts); self.body.append_u32(TIME_UNITS_PER_SEC as u32); let d = self.duration_90k; self.body.append_u32(d); self.body.append_static(StaticBytestring::MvhdJunk); let next_track_id = if self.include_timestamp_subtitle_track { 3 } else { 2 }; self.body.append_u32(next_track_id); }); } /// Appends a `TrackBox` (ISO/IEC 14496-12 section 8.3.1) suitable for video. fn append_video_trak(&mut self, creation_ts: u32) -> Result<()> { write_length!(self, { self.body.buf.extend_from_slice(b"trak"); self.append_video_tkhd(creation_ts); self.maybe_append_video_edts()?; self.append_video_mdia(creation_ts); }); Ok(()) } /// Appends a `TrackBox` (ISO/IEC 14496-12 section 8.3.1) suitable for subtitles. fn append_subtitle_trak(&mut self, creation_ts: u32) { write_length!(self, { self.body.buf.extend_from_slice(b"trak"); self.append_subtitle_tkhd(creation_ts); self.append_subtitle_mdia(creation_ts); }); } /// Appends a `TrackHeaderBox` (ISO/IEC 14496-12 section 8.3.2) suitable for video. fn append_video_tkhd(&mut self, creation_ts: u32) { write_length!(self, { // flags 7: track_enabled | track_in_movie | track_in_preview self.body.buf.extend_from_slice(b"tkhd\x00\x00\x00\x07"); self.body.append_u32(creation_ts); self.body.append_u32(creation_ts); self.body.append_u32(1); // track_id self.body.append_u32(0); // reserved self.body.append_u32(self.duration_90k); self.body.append_static(StaticBytestring::TkhdJunk); let width = self.video_sample_entries.iter().map(|e| e.width).max().unwrap(); let height = self.video_sample_entries.iter().map(|e| e.height).max().unwrap(); self.body.append_u32((width as u32) << 16); self.body.append_u32((height as u32) << 16); }); } /// Appends a `TrackHeaderBox` (ISO/IEC 14496-12 section 8.3.2) suitable for subtitles. fn append_subtitle_tkhd(&mut self, creation_ts: u32) { write_length!(self, { // flags 7: track_enabled | track_in_movie | track_in_preview self.body.buf.extend_from_slice(b"tkhd\x00\x00\x00\x07"); self.body.append_u32(creation_ts); self.body.append_u32(creation_ts); self.body.append_u32(2); // track_id self.body.append_u32(0); // reserved self.body.append_u32(self.duration_90k); self.body.append_static(StaticBytestring::TkhdJunk); self.body.append_u32(0); // width, unused. self.body.append_u32(0); // height, unused. }); } /// Appends an `EditBox` (ISO/IEC 14496-12 section 8.6.5) suitable for video, if necessary. fn maybe_append_video_edts(&mut self) -> Result<()> { #[derive(Debug, Default)] struct Entry { segment_duration: u64, media_time: u64, }; let mut flushed: Vec = Vec::new(); let mut unflushed: Entry = Default::default(); let mut cur_media_time: u64 = 0; for s in &self.segments { // The actual range may start before the desired range because it can only start on a // key frame. This relationship should hold true: // actual start <= desired start < desired end let actual = s.s.actual_time_90k(); let skip = s.s.desired_range_90k.start - actual.start; let keep = s.s.desired_range_90k.end - s.s.desired_range_90k.start; assert!(skip >= 0 && keep > 0, "desired={}..{} actual={}..{}", s.s.desired_range_90k.start, s.s.desired_range_90k.end, actual.start, actual.end); cur_media_time += skip as u64; if unflushed.segment_duration + unflushed.media_time == cur_media_time { unflushed.segment_duration += keep as u64; } else { if unflushed.segment_duration > 0 { flushed.push(unflushed); } unflushed = Entry{ segment_duration: keep as u64, media_time: cur_media_time, }; } cur_media_time += keep as u64; } if flushed.is_empty() && unflushed.media_time == 0 { return Ok(()); // use implicit one-to-one mapping. } flushed.push(unflushed); debug!("Using edit list: {:?}", flushed); write_length!(self, { self.body.buf.extend_from_slice(b"edts"); write_length!(self, { // Use version 1 for 64-bit times. self.body.buf.extend_from_slice(b"elst\x01\x00\x00\x00"); self.body.append_u32(flushed.len() as u32); for e in &flushed { self.body.append_u64(e.segment_duration); self.body.append_u64(e.media_time); // media_rate_integer + media_rate_fraction: both fixed at 1 self.body.buf.extend_from_slice(b"\x00\x01\x00\x01"); } }); }); Ok(()) } /// Appends a `MediaBox` (ISO/IEC 14496-12 section 8.4.1) suitable for video. fn append_video_mdia(&mut self, creation_ts: u32) { write_length!(self, { self.body.buf.extend_from_slice(b"mdia"); self.append_mdhd(creation_ts); self.body.append_static(StaticBytestring::VideoHdlrBox); self.append_video_minf(); }); } /// Appends a `MediaBox` (ISO/IEC 14496-12 section 8.4.1) suitable for subtitles. fn append_subtitle_mdia(&mut self, creation_ts: u32) { write_length!(self, { self.body.buf.extend_from_slice(b"mdia"); self.append_mdhd(creation_ts); self.body.append_static(StaticBytestring::SubtitleHdlrBox); self.append_subtitle_minf(); }); } /// Appends a `MediaHeaderBox` (ISO/IEC 14496-12 section 8.4.2.) suitable for either the video /// or subtitle track. fn append_mdhd(&mut self, creation_ts: u32) { write_length!(self, { self.body.buf.extend_from_slice(b"mdhd\x00\x00\x00\x00"); self.body.append_u32(creation_ts); self.body.append_u32(creation_ts); self.body.append_u32(TIME_UNITS_PER_SEC as u32); self.body.append_u32(self.duration_90k); self.body.append_u32(0x55c40000); // language=und + pre_defined }); } /// Appends a `MediaInformationBox` (ISO/IEC 14496-12 section 8.4.4) suitable for video. fn append_video_minf(&mut self) { write_length!(self, { self.body.append_static(StaticBytestring::VideoMinfJunk); self.append_video_stbl(); }); } /// Appends a `MediaInformationBox` (ISO/IEC 14496-12 section 8.4.4) suitable for subtitles. fn append_subtitle_minf(&mut self) { write_length!(self, { self.body.append_static(StaticBytestring::SubtitleMinfJunk); self.append_subtitle_stbl(); }); } /// Appends a `SampleTableBox` (ISO/IEC 14496-12 section 8.5.1) suitable for video. fn append_video_stbl(&mut self) { write_length!(self, { self.body.buf.extend_from_slice(b"stbl"); self.append_video_stsd(); self.append_video_stts(); self.append_video_stsc(); self.append_video_stsz(); self.append_video_co64(); self.append_video_stss(); }); } /// Appends a `SampleTableBox` (ISO/IEC 14496-12 section 8.5.1) suitable for subtitles. fn append_subtitle_stbl(&mut self) { write_length!(self, { self.body.append_static(StaticBytestring::SubtitleStblJunk); self.append_subtitle_stts(); self.append_subtitle_stsc(); self.append_subtitle_stsz(); self.append_subtitle_co64(); }); } /// Appends a `SampleDescriptionBox` (ISO/IEC 14496-12 section 8.5.2) suitable for video. fn append_video_stsd(&mut self) { write_length!(self, { self.body.buf.extend_from_slice(b"stsd\x00\x00\x00\x00"); let n_entries = self.video_sample_entries.len() as u32; self.body.append_u32(n_entries); self.body.flush_buf(); for (i, e) in self.video_sample_entries.iter().enumerate() { self.body.slices.append(e.data.len() as u64, Mp4FileSlice::VideoSampleEntry(i as u32)); } }); } /// Appends a `TimeToSampleBox` (ISO/IEC 14496-12 section 8.6.1) suitable for video. fn append_video_stts(&mut self) { write_length!(self, { self.body.buf.extend_from_slice(b"stts\x00\x00\x00\x00"); let mut entry_count = 0; for s in &self.segments { entry_count += s.s.frames as u32; } self.body.append_u32(entry_count); self.body.flush_buf(); for (i, s) in self.segments.iter().enumerate() { self.body.slices.append( 2 * (mem::size_of::() as u64) * (s.s.frames as u64), Mp4FileSlice::Stts(i as u32)); } }); } /// Appends a `TimeToSampleBox` (ISO/IEC 14496-12 section 8.6.1) suitable for subtitles. fn append_subtitle_stts(&mut self) { write_length!(self, { self.body.buf.extend_from_slice(b"stts\x00\x00\x00\x00"); let entry_count_pos = self.body.buf.len(); self.body.append_u32(0); // placeholder for entry_count let mut entry_count = 0; for s in &self.segments { let r = &s.s.desired_range_90k; let start = s.s.start + recording::Duration(r.start as i64); let end = s.s.start + recording::Duration(r.end as i64); let start_next_sec = recording::Time( start.0 + TIME_UNITS_PER_SEC - (start.0 % TIME_UNITS_PER_SEC)); if end <= start_next_sec { // Segment doesn't last past the next second. entry_count += 1; self.body.append_u32(1); // count self.body.append_u32((end - start).0 as u32); // duration } else { // The first subtitle just lasts until the next second. entry_count += 1; self.body.append_u32(1); // count self.body.append_u32((start_next_sec - start).0 as u32); // duration // Then there are zero or more "interior" subtitles, one second each. let end_prev_sec = recording::Time(end.0 - (end.0 % TIME_UNITS_PER_SEC)); if start_next_sec < end_prev_sec { entry_count += 1; let interior = (end_prev_sec - start_next_sec).0 / TIME_UNITS_PER_SEC; self.body.append_u32(interior as u32); // count self.body.append_u32(TIME_UNITS_PER_SEC as u32); // duration } // Then there's a final subtitle for the remaining fraction of a second. entry_count += 1; self.body.append_u32(1); // count self.body.append_u32((end - end_prev_sec).0 as u32); // duration } } BigEndian::write_u32(&mut self.body.buf[entry_count_pos .. entry_count_pos + 4], entry_count); }); } /// Appends a `SampleToChunkBox` (ISO/IEC 14496-12 section 8.7.4) suitable for video. fn append_video_stsc(&mut self) { write_length!(self, { self.body.buf.extend_from_slice(b"stsc\x00\x00\x00\x00"); self.body.append_u32(self.segments.len() as u32); for (i, s) in self.segments.iter().enumerate() { self.body.append_u32((i + 1) as u32); self.body.append_u32(s.s.frames as u32); // Write sample_description_index. let i = self.video_sample_entries.iter().position( |e| e.id == s.s.video_sample_entry_id).unwrap(); self.body.append_u32((i + 1) as u32); } }); } /// Appends a `SampleToChunkBox` (ISO/IEC 14496-12 section 8.7.4) suitable for subtitles. fn append_subtitle_stsc(&mut self) { write_length!(self, { self.body.buf.extend_from_slice( b"stsc\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x01"); self.body.append_u32(self.num_subtitle_samples); self.body.append_u32(1); }); } /// Appends a `SampleSizeBox` (ISO/IEC 14496-12 section 8.7.3) suitable for video. fn append_video_stsz(&mut self) { write_length!(self, { self.body.buf.extend_from_slice(b"stsz\x00\x00\x00\x00\x00\x00\x00\x00"); let mut entry_count = 0; for s in &self.segments { entry_count += s.s.frames as u32; } self.body.append_u32(entry_count); self.body.flush_buf(); for (i, s) in self.segments.iter().enumerate() { self.body.slices.append( (mem::size_of::()) as u64 * (s.s.frames as u64), Mp4FileSlice::Stsz(i as u32)); } }); } /// Appends a `SampleSizeBox` (ISO/IEC 14496-12 section 8.7.3) suitable for subtitles. fn append_subtitle_stsz(&mut self) { write_length!(self, { self.body.buf.extend_from_slice(b"stsz\x00\x00\x00\x00"); self.body.append_u32((mem::size_of::() + SUBTITLE_LENGTH) as u32); self.body.append_u32(self.num_subtitle_samples); }); } /// Appends a `ChunkLargeOffsetBox` (ISO/IEC 14496-12 section 8.7.5) suitable for video. fn append_video_co64(&mut self) { write_length!(self, { self.body.buf.extend_from_slice(b"co64\x00\x00\x00\x00"); self.body.append_u32(self.segments.len() as u32); self.body.flush_buf(); self.body.slices.append( (mem::size_of::()) as u64 * (self.segments.len() as u64), Mp4FileSlice::Co64); }); } /// Appends a `ChunkLargeOffsetBox` (ISO/IEC 14496-12 section 8.7.5) suitable for subtitles. fn append_subtitle_co64(&mut self) { write_length!(self, { // Write a placeholder; the actual value will be filled in later. self.body.buf.extend_from_slice( b"co64\x00\x00\x00\x00\x00\x00\x00\x01\x00\x00\x00\x00\x00\x00\x00\x00"); self.subtitle_co64_pos = Some(self.body.buf.len() - 8); }); } /// Appends a `SyncSampleBox` (ISO/IEC 14496-12 section 8.6.2) suitable for video. fn append_video_stss(&mut self) { write_length!(self, { self.body.buf.extend_from_slice(b"stss\x00\x00\x00\x00"); let mut entry_count = 0; for s in &self.segments { entry_count += s.s.key_frames as u32; } self.body.append_u32(entry_count); self.body.flush_buf(); for (i, s) in self.segments.iter().enumerate() { self.body.slices.append( (mem::size_of::() as u64) * (s.s.key_frames as u64), Mp4FileSlice::Stss(i as u32)); } }); } } impl BodyState { fn append_u32(&mut self, v: u32) { self.buf.write_u32::(v).expect("Vec write shouldn't fail"); } fn append_u64(&mut self, v: u64) { self.buf.write_u64::(v).expect("Vec write shouldn't fail"); } /// Flushes the buffer: appends a slice for everything written into the buffer so far, /// noting the position which has been flushed. Call this method prior to adding any non-buffer /// slice. fn flush_buf(&mut self) { let len = self.buf.len(); if self.unflushed_buf_pos < len { self.slices.append((len - self.unflushed_buf_pos) as u64, Mp4FileSlice::Buf(self.unflushed_buf_pos as u32)); self.unflushed_buf_pos = len; } } /// Appends a static bytestring, flushing the buffer if necessary. fn append_static(&mut self, which: StaticBytestring) { self.flush_buf(); let s = STATIC_BYTESTRINGS[which as usize]; self.slices.append(s.len() as u64, Mp4FileSlice::Static(which)); } } pub struct Mp4File { db: Arc, dir: Arc, segments: Vec, slices: Slices, buf: Vec, video_sample_entries: SmallVec<[Arc; 1]>, initial_sample_byte_pos: u64, last_modified: header::HttpDate, etag: header::EntityTag, } impl Mp4File { fn write_stts(&self, i: usize, r: Range, _l: u64, out: &mut io::Write) -> Result<()> { self.segments[i].with_index(&self.db, |i| { out.write_all(&i.stts()[r.start as usize .. r.end as usize])?; Ok(()) }) } fn write_stsz(&self, i: usize, r: Range, _l: u64, out: &mut io::Write) -> Result<()> { self.segments[i].with_index(&self.db, |i| { out.write_all(&i.stsz()[r.start as usize .. r.end as usize])?; Ok(()) }) } fn write_co64(&self, r: Range, l: u64, out: &mut io::Write) -> Result<()> { pieces::clip_to_range(r, l, out, |w| { let mut pos = self.initial_sample_byte_pos; for s in &self.segments { w.write_u64::(pos)?; let r = s.s.sample_file_range(); pos += r.end - r.start; } Ok(()) }) } fn write_stss(&self, i: usize, r: Range, _l: u64, out: &mut io::Write) -> Result<()> { self.segments[i].with_index(&self.db, |i| { out.write_all(&i.stss()[r.start as usize .. r.end as usize])?; Ok(()) }) } fn write_video_sample_data(&self, i: usize, r: Range, out: &mut io::Write) -> Result<()> { let s = &self.segments[i]; let f = self.dir.open_sample_file(self.db.lock().get_recording(s.s.id)?.sample_file_uuid)?; mmapfile::MmapFileSlice::new(f, s.s.sample_file_range()).write_to(r, out) } fn write_subtitle_sample_data(&self, i: usize, r: Range, l: u64, out: &mut io::Write) -> Result<()> { let s = &self.segments[i]; let d = &s.s.desired_range_90k; let start_sec = (s.s.start + recording::Duration(d.start as i64)).unix_seconds(); let end_sec = (s.s.start + recording::Duration(d.end as i64 + TIME_UNITS_PER_SEC - 1)) .unix_seconds(); pieces::clip_to_range(r, l, out, |w| { for ts in start_sec .. end_sec { w.write_u16::(SUBTITLE_LENGTH as u16)?; let tm = time::at(time::Timespec{sec: ts, nsec: 0}); use std::io::Write; write!(w, "{}", tm.strftime(SUBTITLE_TEMPLATE)?)?; } Ok(()) })?; Ok(()) } } impl resource::Resource for Mp4File { fn content_type(&self) -> mime::Mime { "video/mp4".parse().unwrap() } fn last_modified(&self) -> &header::HttpDate { &self.last_modified } fn etag(&self) -> Option<&header::EntityTag> { Some(&self.etag) } fn len(&self) -> u64 { self.slices.len() } fn write_to(&self, range: Range, out: &mut io::Write) -> Result<()> { self.slices.write_to(self, range, out) } } /// Tests. There are two general strategies used to validate the resulting files: /// /// * basic tests that ffmpeg can read the generated mp4s. This ensures compatibility with /// popular software, though it's hard to test specifics. ffmpeg provides an abstraction layer /// over the encapsulation format, so mp4-specific details are hard to see. Also, ffmpeg might /// paper over errors in the mp4 or have its own bugs. /// /// * tests using the `BoxCursor` type to inspect the generated mp4s more closely. These don't /// detect misunderstandings of the specification or incompatibilities, but they can be used /// to verify the output is byte-for-byte as expected. #[cfg(test)] mod tests { extern crate test; use db; use dir; use ffmpeg; use hyper::{self, header}; use openssl::crypto::hash; use recording::{self, TIME_UNITS_PER_SEC}; use resource::{self, Resource}; use self::test::Bencher; use std::fs; use std::io; use std::mem; use std::path::Path; use std::sync::Arc; use std::str; use super::*; use stream::{self, Opener, Stream}; use testutil::{self, TestDb}; use uuid::Uuid; /// A wrapper around openssl's SHA-1 hashing that implements the `Write` trait. struct Sha1(hash::Hasher); impl Sha1 { fn new() -> Sha1 { Sha1(hash::Hasher::new(hash::Type::SHA1).unwrap()) } fn finish(mut self) -> Vec { self.0.finish().unwrap() } } impl io::Write for Sha1 { fn write(&mut self, buf: &[u8]) -> io::Result { self.0.update(buf).unwrap(); Ok(buf.len()) } fn flush(&mut self) -> io::Result<()> { Ok(()) } } /// Returns the SHA-1 digest of the given `Resource`. fn digest(r: &Resource) -> Vec { let mut sha1 = Sha1::new(); r.write_to(0 .. r.len(), &mut sha1).unwrap(); sha1.finish() } const TEST_CAMERA_ID: i32 = 1; /// Information used within `BoxCursor` to describe a box on the stack. #[derive(Clone)] struct Mp4Box { interior: Range, boxtype: [u8; 4], } /// A cursor over the boxes in a `.mp4` file. Supports moving forward and up/down the box /// stack, not backward. Panics on error. #[derive(Clone)] struct BoxCursor<'a> { mp4: &'a resource::Resource, stack: Vec, } impl<'a> BoxCursor<'a> { pub fn new(mp4: &'a resource::Resource) -> BoxCursor<'a> { BoxCursor{ mp4: mp4, stack: Vec::new(), } } /// Pushes the box at the given position onto the stack (returning true), or returns /// false if pos == max. fn internal_push(&mut self, pos: u64, max: u64) -> bool { if pos == max { return false; } let mut hdr = [0u8; 16]; self.mp4.write_to(pos .. pos+8, &mut &mut hdr[..]).unwrap(); let (len, hdr_len, boxtype_slice) = match BigEndian::read_u32(&hdr[..4]) { 0 => (self.mp4.len() - pos, 8, &hdr[4..8]), 1 => { self.mp4.write_to(pos+8 .. pos+12, &mut &mut hdr[..]).unwrap(); (BigEndian::read_u64(&hdr[4..12]), 16, &hdr[12..]) }, l => (l as u64, 8, &hdr[4..8]), }; let mut boxtype = [0u8; 4]; assert!(pos + (hdr_len as u64) <= max); assert!(pos + len <= max); boxtype[..].copy_from_slice(boxtype_slice); self.stack.push(Mp4Box{ interior: pos + hdr_len as u64 .. pos + len, boxtype: boxtype, }); trace!("positioned at {}", self.path()); true } fn path(&self) -> String { let mut s = String::with_capacity(5 * self.stack.len()); for b in &self.stack { s.push('/'); s.push_str(str::from_utf8(&b.boxtype[..]).unwrap()); } s } /// Gets the specified byte range within the current box, starting after the box type. /// Must not be at EOF. pub fn get(&self, r: Range, mut buf: &mut [u8]) { let interior = &self.stack.last().expect("at root").interior; assert!(r.end < interior.end - interior.start); self.mp4.write_to(r.start+interior.start .. r.end+interior.start, &mut buf).unwrap(); } pub fn get_all(&self) -> Vec { let interior = self.stack.last().expect("at root").interior.clone(); let len = (interior.end - interior.start) as usize; let mut out = Vec::with_capacity(len); self.mp4.write_to(interior, &mut out).unwrap(); out } /// Gets the specified u32 within the current box, starting after the box type. /// Must not be at EOF. pub fn get_u32(&self, p: u64) -> u32 { let mut buf = [0u8; 4]; self.get(p .. p+4, &mut buf); BigEndian::read_u32(&buf[..]) } /// Navigates to the next box after the current one, or up if the current one is last. #[allow(should_implement_trait)] pub fn next(&mut self) -> bool { let old = self.stack.pop().expect("positioned at root; there is no next"); let max = self.stack.last().map(|b| b.interior.end).unwrap_or_else(|| self.mp4.len()); self.internal_push(old.interior.end, max) } /// Finds the next box of the given type after the current one, or navigates up if absent. pub fn find(&mut self, boxtype: &[u8]) -> bool { trace!("looking for {}", str::from_utf8(boxtype).unwrap()); loop { if &self.stack.last().unwrap().boxtype[..] == boxtype { return true; } if !self.next() { return false; } } } /// Moves up the stack. Must not be at root. pub fn up(&mut self) { self.stack.pop(); } /// Moves down the stack. Must be positioned on a box with children. pub fn down(&mut self) { let range = self.stack.last().map(|b| b.interior.clone()) .unwrap_or_else(|| 0 .. self.mp4.len()); assert!(self.internal_push(range.start, range.end), "no children in {}", self.path()); } } /// Information returned by `find_track`. struct Track<'a> { edts_cursor: Option>, stbl_cursor: BoxCursor<'a>, } /// Finds the `moov/trak` that has a `tkhd` associated with the given `track_id`, which must /// exist. fn find_track(mp4: & resource::Resource, track_id: u32) -> Track { let mut cursor = BoxCursor::new(mp4); cursor.down(); assert!(cursor.find(b"moov")); cursor.down(); loop { assert!(cursor.find(b"trak")); cursor.down(); assert!(cursor.find(b"tkhd")); let mut version = [0u8; 1]; cursor.get(0 .. 1, &mut version); // Let id_pos be the offset after the FullBox section of the track_id. let id_pos = match version[0] { 0 => 8, // track_id follows 32-bit creation_time and modification_time 1 => 16, // ...64-bit times... v => panic!("unexpected tkhd version {}", v), }; let cur_track_id = cursor.get_u32(4 + id_pos); trace!("found moov/trak/tkhd with id {}; want {}", cur_track_id, track_id); if cur_track_id == track_id { break; } cursor.up(); assert!(cursor.next()); } let edts_cursor; if cursor.find(b"edts") { edts_cursor = Some(cursor.clone()); cursor.up(); } else { edts_cursor = None; }; cursor.down(); assert!(cursor.find(b"mdia")); cursor.down(); assert!(cursor.find(b"minf")); cursor.down(); assert!(cursor.find(b"stbl")); Track{ edts_cursor: edts_cursor, stbl_cursor: cursor, } } fn copy_mp4_to_db(db: &TestDb) { let mut input = stream::FFMPEG.open(stream::Source::File("src/testdata/clip.mp4")).unwrap(); // 2015-04-26 00:00:00 UTC. const START_TIME: recording::Time = recording::Time(1430006400i64 * TIME_UNITS_PER_SEC); let extra_data = input.get_extra_data().unwrap(); let video_sample_entry_id = db.db.lock().insert_video_sample_entry( extra_data.width, extra_data.height, &extra_data.sample_entry).unwrap(); let mut output = db.dir.create_writer(&db.syncer_channel, START_TIME, START_TIME, TEST_CAMERA_ID, video_sample_entry_id).unwrap(); // end_pts is the pts of the end of the most recent frame (start + duration). // It's needed because dir::Writer calculates a packet's duration from its pts and the // next packet's pts. That's more accurate for RTSP than ffmpeg's estimate of duration. // To write the final packet of this sample .mp4 with a full duration, we need to fake a // next packet's pts from the ffmpeg-supplied duration. let mut end_pts = None; loop { let pkt = match input.get_next() { Ok(p) => p, Err(ffmpeg::Error::Eof) => { break; }, Err(e) => { panic!("unexpected input error: {}", e); }, }; output.write(pkt.data().expect("packet without data"), pkt.pts().unwrap(), pkt.is_key()).unwrap(); end_pts = Some(pkt.pts().unwrap() + pkt.duration()); } output.close(end_pts).unwrap(); db.syncer_channel.flush(); } fn add_dummy_recordings_to_db(db: &db::Database) { let mut data = Vec::new(); data.extend_from_slice(include_bytes!("testdata/video_sample_index.bin")); let mut db = db.lock(); let video_sample_entry_id = db.insert_video_sample_entry(1920, 1080, &[0u8; 100]).unwrap(); const START_TIME: recording::Time = recording::Time(1430006400i64 * TIME_UNITS_PER_SEC); const DURATION: recording::Duration = recording::Duration(5399985); let mut recording = db::RecordingToInsert{ camera_id: TEST_CAMERA_ID, sample_file_bytes: 30104460, time: START_TIME .. (START_TIME + DURATION), local_time: START_TIME, video_samples: 1800, video_sync_samples: 60, video_sample_entry_id: video_sample_entry_id, sample_file_uuid: Uuid::nil(), video_index: data, sample_file_sha1: [0; 20], }; let mut tx = db.tx().unwrap(); tx.bypass_reservation_for_testing = true; for _ in 0..60 { tx.insert_recording(&recording).unwrap(); recording.time.start += DURATION; recording.local_time += DURATION; recording.time.end += DURATION; } tx.commit().unwrap(); } fn create_mp4_from_db(db: Arc, dir: Arc, skip_90k: i32, shorten_90k: i32, include_subtitles: bool) -> Mp4File { let mut builder = Mp4FileBuilder::new(); builder.include_timestamp_subtitle_track(include_subtitles); let all_time = recording::Time(i64::min_value()) .. recording::Time(i64::max_value()); { let db = db.lock(); db.list_recordings(TEST_CAMERA_ID, &all_time, |r| { let d = r.duration_90k; assert!(skip_90k + shorten_90k < d); builder.append(&db, r, skip_90k .. d - shorten_90k).unwrap(); Ok(()) }).unwrap(); } builder.build(db, dir).unwrap() } fn write_mp4(mp4: &Mp4File, dir: &Path) -> String { let mut filename = dir.to_path_buf(); filename.push("clip.new.mp4"); let mut out = fs::OpenOptions::new().write(true).create_new(true).open(&filename).unwrap(); mp4.write_to(0 .. mp4.len(), &mut out).unwrap(); filename.to_str().unwrap().to_string() } fn compare_mp4s(new_filename: &str, pts_offset: i64, shorten: i64) { let mut orig = stream::FFMPEG.open(stream::Source::File("src/testdata/clip.mp4")).unwrap(); let mut new = stream::FFMPEG.open(stream::Source::File(new_filename)).unwrap(); assert_eq!(orig.get_extra_data().unwrap(), new.get_extra_data().unwrap()); let mut final_durations = None; loop { let orig_pkt = match orig.get_next() { Ok(p) => Some(p), Err(ffmpeg::Error::Eof) => None, Err(e) => { panic!("unexpected input error: {}", e); }, }; let new_pkt = match new.get_next() { Ok(p) => Some(p), Err(ffmpeg::Error::Eof) => { break; }, Err(e) => { panic!("unexpected input error: {}", e); }, }; let (orig_pkt, new_pkt) = match (orig_pkt, new_pkt) { (Some(o), Some(n)) => (o, n), (None, None) => break, (o, n) => panic!("orig: {} new: {}", o.is_some(), n.is_some()), }; assert_eq!(orig_pkt.pts().unwrap(), new_pkt.pts().unwrap() + pts_offset); assert_eq!(orig_pkt.dts(), new_pkt.dts() + pts_offset); assert_eq!(orig_pkt.data(), new_pkt.data()); assert_eq!(orig_pkt.is_key(), new_pkt.is_key()); final_durations = Some((orig_pkt.duration(), new_pkt.duration())); } if let Some((orig_dur, new_dur)) = final_durations { // One would normally expect the duration to be exactly the same, but when using an // edit list, ffmpeg appears to extend the last packet's duration by the amount skipped // at the beginning. I think this is a bug on their side. assert!(orig_dur - shorten + pts_offset == new_dur, "orig_dur={} new_dur={} shorten={} pts_offset={}", orig_dur, new_dur, shorten, pts_offset); } } /// Makes a `.mp4` file which is only good for exercising the `Mp4FileSlice` logic for /// producing sample tables that match the supplied encoder. fn make_mp4_from_encoder(db: &TestDb, encoder: recording::SampleIndexEncoder, desired_range_90k: Range) -> Mp4File { let row = db.create_recording_from_encoder(encoder); let mut builder = Mp4FileBuilder::new(); builder.append(&db.db.lock(), row, desired_range_90k).unwrap(); builder.build(db.db.clone(), db.dir.clone()).unwrap() } /// Tests sample table for a simple video index of all sync frames. #[test] fn test_all_sync_frames() { testutil::init(); let db = TestDb::new(); let mut encoder = recording::SampleIndexEncoder::new(); for i in 1..6 { let duration_90k = 2 * i; let bytes = 3 * i; encoder.add_sample(duration_90k, bytes, true); } // Time range [2, 2+4+6+8) means the 2nd, 3rd, and 4th samples should be included. let mp4 = make_mp4_from_encoder(&db, encoder, 2 .. 2+4+6+8); let track = find_track(&mp4, 1); assert!(track.edts_cursor.is_none()); let mut cursor = track.stbl_cursor; cursor.down(); cursor.find(b"stts"); assert_eq!(cursor.get_all(), &[ 0x00, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x03, // entry_count // entries 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 0x00, 0x04, // run length / timestamps. 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 0x00, 0x06, 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 0x00, 0x08, ]); cursor.find(b"stsz"); assert_eq!(cursor.get_all(), &[ 0x00, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x00, // sample_size 0x00, 0x00, 0x00, 0x03, // sample_count // entries 0x00, 0x00, 0x00, 0x06, // size 0x00, 0x00, 0x00, 0x09, 0x00, 0x00, 0x00, 0x0c, ]); cursor.find(b"stss"); assert_eq!(cursor.get_all(), &[ 0x00, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x03, // entry_count // entries 0x00, 0x00, 0x00, 0x01, // sample_number 0x00, 0x00, 0x00, 0x02, 0x00, 0x00, 0x00, 0x03, ]); } /// Tests sample table and edit list for a video index with half sync frames. #[test] fn test_half_sync_frames() { testutil::init(); let db = TestDb::new(); let mut encoder = recording::SampleIndexEncoder::new(); for i in 1..6 { let duration_90k = 2 * i; let bytes = 3 * i; encoder.add_sample(duration_90k, bytes, (i % 2) == 1); } // Time range [2+4+6, 2+4+6+8) means the 4th sample should be included. // The 3rd gets pulled in also because it's a sync frame and the 4th isn't. let mp4 = make_mp4_from_encoder(&db, encoder, 2+4+6 .. 2+4+6+8); let track = find_track(&mp4, 1); // Examine edts. It should skip the 3rd frame. let mut cursor = track.edts_cursor.unwrap(); cursor.down(); cursor.find(b"elst"); assert_eq!(cursor.get_all(), &[ 0x01, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x01, // length 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x08, // segment_duration 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x06, // media_time 0x00, 0x01, 0x00, 0x01, // media_rate_{integer,fraction} ]); // Examine stbl. let mut cursor = track.stbl_cursor; cursor.down(); cursor.find(b"stts"); assert_eq!(cursor.get_all(), &[ 0x00, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x02, // entry_count // entries 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 0x00, 0x06, // run length / timestamps. 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 0x00, 0x08, ]); cursor.find(b"stsz"); assert_eq!(cursor.get_all(), &[ 0x00, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x00, // sample_size 0x00, 0x00, 0x00, 0x02, // sample_count // entries 0x00, 0x00, 0x00, 0x09, // size 0x00, 0x00, 0x00, 0x0c, ]); cursor.find(b"stss"); assert_eq!(cursor.get_all(), &[ 0x00, 0x00, 0x00, 0x00, // version + flags 0x00, 0x00, 0x00, 0x01, // entry_count // entries 0x00, 0x00, 0x00, 0x01, // sample_number ]); } #[test] fn test_round_trip() { testutil::init(); let db = TestDb::new(); copy_mp4_to_db(&db); let mp4 = create_mp4_from_db(db.db.clone(), db.dir.clone(), 0, 0, false); let new_filename = write_mp4(&mp4, db.tmpdir.path()); compare_mp4s(&new_filename, 0, 0); // Test the metadata. This is brittle, which is the point. Any time the digest comparison // here fails, it can be updated, but the etag must change as well! Otherwise clients may // combine ranges from the new format with ranges from the old format. let sha1 = digest(&mp4); assert_eq!("1e5331e8371bd97ac3158b3a86494abc87cdc70e", super::hex(&sha1[..])); const EXPECTED_ETAG: &'static str = "3c48af4dbce2024db07f27a00789b6af774a8c89"; assert_eq!(Some(&header::EntityTag::strong(EXPECTED_ETAG.to_owned())), mp4.etag()); drop(db.syncer_channel); db.syncer_join.join().unwrap(); } #[test] fn test_round_trip_with_subtitles() { testutil::init(); let db = TestDb::new(); copy_mp4_to_db(&db); let mp4 = create_mp4_from_db(db.db.clone(), db.dir.clone(), 0, 0, true); let new_filename = write_mp4(&mp4, db.tmpdir.path()); compare_mp4s(&new_filename, 0, 0); // Test the metadata. This is brittle, which is the point. Any time the digest comparison // here fails, it can be updated, but the etag must change as well! Otherwise clients may // combine ranges from the new format with ranges from the old format. let sha1 = digest(&mp4); assert_eq!("de382684a471f178e4e3a163762711b0653bfd83", super::hex(&sha1[..])); const EXPECTED_ETAG: &'static str = "c24d7af372e5d8f66f4feb6e3a5cd43828392371"; assert_eq!(Some(&header::EntityTag::strong(EXPECTED_ETAG.to_owned())), mp4.etag()); drop(db.syncer_channel); db.syncer_join.join().unwrap(); } #[test] fn test_round_trip_with_edit_list() { testutil::init(); let db = TestDb::new(); copy_mp4_to_db(&db); let mp4 = create_mp4_from_db(db.db.clone(), db.dir.clone(), 1, 0, false); let new_filename = write_mp4(&mp4, db.tmpdir.path()); compare_mp4s(&new_filename, 1, 0); // Test the metadata. This is brittle, which is the point. Any time the digest comparison // here fails, it can be updated, but the etag must change as well! Otherwise clients may // combine ranges from the new format with ranges from the old format. let sha1 = digest(&mp4); assert_eq!("685e026af44204bc9cc52115c5e17058e9fb7c70", super::hex(&sha1[..])); const EXPECTED_ETAG: &'static str = "870e2b3cfef4a988951344b32e53af0d4496894d"; assert_eq!(Some(&header::EntityTag::strong(EXPECTED_ETAG.to_owned())), mp4.etag()); drop(db.syncer_channel); db.syncer_join.join().unwrap(); } #[test] fn test_round_trip_with_shorten() { testutil::init(); let db = TestDb::new(); copy_mp4_to_db(&db); let mp4 = create_mp4_from_db(db.db.clone(), db.dir.clone(), 0, 1, false); let new_filename = write_mp4(&mp4, db.tmpdir.path()); compare_mp4s(&new_filename, 0, 1); // Test the metadata. This is brittle, which is the point. Any time the digest comparison // here fails, it can be updated, but the etag must change as well! Otherwise clients may // combine ranges from the new format with ranges from the old format. let sha1 = digest(&mp4); assert_eq!("e0d28ddf08e24575a82657b1ce0b2da73f32fd88", super::hex(&sha1[..])); const EXPECTED_ETAG: &'static str = "71c329188a2cd175c8d61492a9789e242af06c05"; assert_eq!(Some(&header::EntityTag::strong(EXPECTED_ETAG.to_owned())), mp4.etag()); drop(db.syncer_channel); db.syncer_join.join().unwrap(); } #[test] fn mp4_file_slice_size() { assert_eq!(8, mem::size_of::()); } /// An HTTP server for benchmarking. /// It's used as a singleton via `lazy_static!` for two reasons: /// /// * to avoid running out of file descriptors. `#[bench]` functions apparently get called /// many times as the number of iterations is tuned, and hyper servers /// [can't be shut down](https://github.com/hyperium/hyper/issues/338), so /// otherwise the default Ubuntu 16.04.1 ulimit of 1024 files is quickly exhausted. /// * so that when getting a CPU profile of the benchmark, more of the profile focuses /// on the HTTP serving rather than the setup. /// /// Currently this only serves a single `.mp4` file but we could set up variations to benchmark /// different scenarios: with/without subtitles and edit lists, different lengths, serving /// different fractions of the file, etc. struct BenchServer { url: hyper::Url, generated_len: u64, } impl BenchServer { fn new() -> BenchServer { let mut listener = hyper::net::HttpListener::new("127.0.0.1:0").unwrap(); use hyper::net::NetworkListener; let addr = listener.local_addr().unwrap(); let server = hyper::Server::new(listener); let url = hyper::Url::parse( format!("http://{}:{}/", addr.ip(), addr.port()).as_str()).unwrap(); let db = TestDb::new(); add_dummy_recordings_to_db(&db.db); let mp4 = create_mp4_from_db(db.db.clone(), db.dir.clone(), 0, 0, false); let p = mp4.initial_sample_byte_pos; use std::thread::spawn; spawn(move || { use hyper::server::{Request, Response, Fresh}; let (db, dir) = (db.db.clone(), db.dir.clone()); let _ = server.handle(move |req: Request, res: Response| { let mp4 = create_mp4_from_db(db.clone(), dir.clone(), 0, 0, false); resource::serve(&mp4, &req, res).unwrap(); }); }); BenchServer{ url: url, generated_len: p, } } } lazy_static! { static ref SERVER: BenchServer = { BenchServer::new() }; } /// Benchmarks serving the generated part of a `.mp4` file (up to the first byte from disk). #[bench] fn serve_generated_bytes_fresh_client(b: &mut Bencher) { testutil::init(); let server = &*SERVER; let p = server.generated_len; let mut buf = Vec::with_capacity(p as usize); b.bytes = p; b.iter(|| { let client = hyper::Client::new(); let mut resp = client.get(server.url.clone()) .header(header::Range::Bytes(vec![header::ByteRangeSpec::FromTo(0, p - 1)])) .send() .unwrap(); buf.clear(); use std::io::Read; let size = resp.read_to_end(&mut buf).unwrap(); assert_eq!(p, size as u64); }); } /// Another benchmark of serving generated bytes, but reusing the `hyper::Client`. /// This should be faster than the `fresh` version, but see /// [this hyper issue](https://github.com/hyperium/hyper/issues/944) relating to Nagle's /// algorithm. #[bench] fn serve_generated_bytes_reuse_client(b: &mut Bencher) { testutil::init(); let server = &*SERVER; let p = server.generated_len; let mut buf = Vec::with_capacity(p as usize); b.bytes = p; let client = hyper::Client::new(); b.iter(|| { let mut resp = client.get(server.url.clone()) .header(header::Range::Bytes(vec![header::ByteRangeSpec::FromTo(0, p - 1)])) .send() .unwrap(); buf.clear(); use std::io::Read; let size = resp.read_to_end(&mut buf).unwrap(); assert_eq!(p, size as u64); }); } #[bench] fn mp4_construction(b: &mut Bencher) { testutil::init(); let db = TestDb::new(); add_dummy_recordings_to_db(&db.db); b.iter(|| { create_mp4_from_db(db.db.clone(), db.dir.clone(), 0, 0, false); }); } }