#include "string.h"
#include "mp4.h"
+/**
+ * The three states of the mp4 parser. The parser only loads the audio specific
+ * values and tables when it is in the second state.
+ *
+ * The stsd parser switches from ATS_INITIAL to ATS_SEEN_MP4A when it finds an
+ * mp4a entry, and a trak atom encountered while in ATS_SEEN_MP4A switches the
+ * state to ATS_TRACK_CHANGE.
+ */
+enum audio_track_state {
+ /**
+ * We haven't encountered an mp4a atom so far. The stsd atom and the
+ * time scale and duration of the track are only parsed in this state.
+ */
+ ATS_INITIAL,
+ /**
+ * We have seen an mp4a atom but no subsequent trak atom yet. The sample
+ * tables (stsz, stts, stsc, stco) are only loaded in this state.
+ */
+ ATS_SEEN_MP4A,
+ /**
+ * A trak atom was seen *after* the mp4a atom. The parsers which check
+ * the state return early without storing anything from now on.
+ */
+ ATS_TRACK_CHANGE,
+};
+
struct mp4_track {
+ /* determines which atoms we still need to parse. */
+ enum audio_track_state state;
+
/* mp4a */
uint16_t channel_count;
uint16_t sample_rate;
uint64_t duration;
};
-#define MAX_TRACKS 1024
-
struct mp4 {
const struct mp4_callback *cb;
- int64_t current_position;
uint64_t moov_offset;
uint64_t moov_size;
uint32_t udta_size;
uint8_t last_atom;
- uint64_t file_size;
-
- /* incremental track index while reading the file */
- int32_t total_tracks;
- /* track data */
- struct mp4_track *track[MAX_TRACKS];
- /* the first audio track found */
- struct mp4_track *audio_track;
-
- /* metadata */
+ struct mp4_track track;
struct mp4_metadata meta;
};
/* regard EAGAIN as an error as reads should be blocking. */
if (ret <= 0)
return ret < 0? -1 : 0;
- f->current_position += ret;
size -= ret;
}
return 1;
uint8_t data[8];
int ret = read_data(f, data, 8);
- if (ret > 0 && result)
+ if (ret > 0)
*result = read_u64_be(data);
return ret;
}
uint8_t data[4];
int ret = read_data(f, data, 4);
- if (ret > 0 && result)
+ if (ret > 0)
*result = read_u32_be(data);
return ret;
}
-static int read_int24(struct mp4 *f, uint32_t *result)
-{
- uint8_t data[3];
- int ret = read_data(f, data, 3);
-
- if (ret > 0 && result)
- *result = read_u24_be(data);
- return ret;
-}
-
static int read_int16(struct mp4 *f, uint16_t *result)
{
uint8_t data[2];
int ret = read_data(f, data, 2);
- if (ret > 0 && result)
+ if (ret > 0)
*result = read_u16_be(data);
return ret;
}
-static uint8_t read_int8(struct mp4 *f, uint8_t *result)
-{
- uint8_t data[1];
- int ret = read_data(f, data, 1);
-
- if (ret > 0 && result)
- *result = data[0];
- return ret;
-}
-
#define ATOM_ITEMS \
ATOM_ITEM(MOOV, 'm', 'o', 'o', 'v') \
ATOM_ITEM(TRAK, 't', 'r', 'a', 'k') \
return 1;
}
-static int64_t get_position(const struct mp4 *f)
+static off_t get_position(const struct mp4 *f)
{
- return f->current_position;
+ return f->cb->seek(f->cb->user_data, 0, SEEK_CUR);
}
-static int32_t set_position(struct mp4 *f, int64_t position)
+static void set_position(struct mp4 *f, off_t position)
{
- f->cb->seek(f->cb->user_data, position);
- f->current_position = position;
+ f->cb->seek(f->cb->user_data, position, SEEK_SET);
+}
- return 0;
+static void skip_bytes(struct mp4 *f, off_t num_skip)
+{
+ f->cb->seek(f->cb->user_data, num_skip, SEEK_CUR);
}
static int read_stsz(struct mp4 *f)
{
int ret;
int32_t i;
- struct mp4_track *t;
+ struct mp4_track *t = &f->track;
- if (f->total_tracks == 0)
- return -1;
- t = f->track[f->total_tracks - 1];
- ret = read_int8(f, NULL); /* version */
- if (ret <= 0)
- return ret;
- ret = read_int24(f, NULL); /* flags */
- if (ret <= 0)
- return ret;
+ if (t->state != ATS_SEEN_MP4A || t->stsz_table)
+ return 1;
+ skip_bytes(f, 4); /* version (1), flags (3) */
ret = read_int32(f, &t->stsz_sample_size);
if (ret <= 0)
return ret;
{
int ret;
int32_t i;
- struct mp4_track *t;
+ struct mp4_track *t = &f->track;
- if (f->total_tracks == 0)
- return -1;
- t = f->track[f->total_tracks - 1];
- if (t->stts_entry_count)
- return 0;
- ret = read_int8(f, NULL); /* version */
- if (ret <= 0)
- return ret;
- ret = read_int24(f, NULL); /* flags */
- if (ret <= 0)
- return ret;
+ if (t->state != ATS_SEEN_MP4A || t->stts_sample_count)
+ return 1;
+ skip_bytes(f, 4); /* version (1), flags (3) */
ret = read_int32(f, &t->stts_entry_count);
if (ret <= 0)
return ret;
ret = read_int32(f, &t->stts_sample_count[i]);
if (ret <= 0)
return ret;
- ret = read_int32(f, NULL); /* sample delta */
- if (ret <= 0)
- return ret;
+ skip_bytes(f, 4); /* sample delta */
}
return 1;
}
{
int ret;
int32_t i;
- struct mp4_track *t;
-
- if (f->total_tracks == 0)
- return -1;
- t = f->track[f->total_tracks - 1];
+ struct mp4_track *t = &f->track;
- ret = read_int8(f, NULL); /* version */
- if (ret <= 0)
- return ret;
- ret = read_int24(f, NULL); /* flags */
- if (ret <= 0)
- return ret;
+ if (t->state != ATS_SEEN_MP4A)
+ return 1;
+ if (t->stsc_first_chunk || t->stsc_samples_per_chunk)
+ return 1;
+ skip_bytes(f, 4); /* version (1), flags (3) */
ret = read_int32(f, &t->stsc_entry_count);
if (ret <= 0)
return ret;
ret = read_int32(f, &t->stsc_samples_per_chunk[i]);
if (ret <= 0)
return ret;
- ret = read_int32(f, NULL); /* sample desc index */
- if (ret <= 0)
- return ret;
+ skip_bytes(f, 4); /* sample desc index */
}
return 1;
}
{
int ret;
int32_t i;
- struct mp4_track *t;
+ struct mp4_track *t = &f->track;
- if (f->total_tracks == 0)
- return -1;
- t = f->track[f->total_tracks - 1];
-
- ret = read_int8(f, NULL); /* version */
- if (ret <= 0)
- return ret;
- ret = read_int24(f, NULL); /* flags */
- if (ret <= 0)
- return ret;
+ if (t->state != ATS_SEEN_MP4A || t->stco_chunk_offset)
+ return 1;
+ skip_bytes(f, 4); /* version (1), flags (3) */
ret = read_int32(f, &t->stco_entry_count);
if (ret <= 0)
return ret;
return 1;
}
-static int read_mp4a(struct mp4 *f)
-{
- int ret;
- int32_t i;
- struct mp4_track *t;
-
- if (f->total_tracks == 0)
- return -1;
- t = f->track[f->total_tracks - 1];
-
- for (i = 0; i < 6; i++) {
- ret = read_int8(f, NULL); /* reserved */
- if (ret <= 0)
- return ret;
- }
- ret = read_int16(f, NULL); /* data_reference_index */
- if (ret <= 0)
- return ret;
- ret = read_int32(f, NULL); /* reserved */
- if (ret <= 0)
- return ret;
- ret = read_int32(f, NULL); /* reserved */
- if (ret <= 0)
- return ret;
- ret = read_int16(f, &t->channel_count);
- if (ret <= 0)
- return ret;
- ret = read_int16(f, NULL);
- if (ret <= 0)
- return ret;
- ret = read_int16(f, NULL);
- if (ret <= 0)
- return ret;
- ret = read_int16(f, NULL);
- if (ret <= 0)
- return ret;
- return read_int16(f, &t->sample_rate);
-}
-
static int read_stsd(struct mp4 *f)
{
int ret;
uint32_t i, entry_count;
- struct mp4_track *t;
- if (f->total_tracks == 0)
- return -1;
- t = f->track[f->total_tracks - 1];
- ret = read_int8(f, NULL); /* version */
- if (ret <= 0)
- return ret;
- ret = read_int24(f, NULL); /* flags */
- if (ret <= 0)
- return ret;
+ if (f->track.state != ATS_INITIAL)
+ return 1;
+ skip_bytes(f, 4); /* version (1), flags (3) */
ret = read_int32(f, &entry_count);
if (ret <= 0)
return ret;
if (ret <= 0)
return ret;
skip += size;
- if (!f->audio_track && atom_type == ATOM_MP4A) {
- f->audio_track = t;
- read_mp4a(f);
+ if (atom_type == ATOM_MP4A) {
+ f->track.state = ATS_SEEN_MP4A;
+ /* reserved (6), data reference index (2), reserved (8) */
+ skip_bytes(f, 16);
+ ret = read_int16(f, &f->track.channel_count);
+ if (ret <= 0)
+ return ret;
+ skip_bytes(f, 6);
+ ret = read_int16(f, &f->track.sample_rate);
+ if (ret <= 0)
+ return ret;
}
set_position(f, skip);
}
destpos = get_position(f) + subsize - header_size;
if (atom_type != ATOM_DATA)
continue;
- ret = read_int8(f, NULL); /* version */
- if (ret <= 0)
- goto fail;
- ret = read_int24(f, NULL); /* flags */
- if (ret <= 0)
- goto fail;
- ret = read_int32(f, NULL); /* reserved */
- if (ret <= 0)
- goto fail;
+ skip_bytes(f, 8); /* version (1), flags (3), reserved (4) */
ret = -ERRNO_TO_PARA_ERROR(EINVAL);
if (subsize < header_size + 8 || subsize > UINT_MAX)
goto fail;
{
int ret;
uint32_t version;
- struct mp4_track *t;
-
- if (f->total_tracks == 0)
- return -1;
- t = f->track[f->total_tracks - 1];
+ struct mp4_track *t = &f->track;
+ if (t->state != ATS_INITIAL)
+ return 1;
ret = read_int32(f, &version);
if (ret <= 0)
return ret;
if (version == 1) {
- ret = read_int64(f, NULL); /* creation-time */
- if (ret <= 0)
- return ret;
- ret = read_int64(f, NULL); /* modification-time */
- if (ret <= 0)
- return ret;
+ skip_bytes(f, 16); /* creation time (8), modification time (8) */
ret = read_int32(f, &t->time_scale);
if (ret <= 0)
return ret;
} else { //version == 0
uint32_t temp;
- ret = read_int32(f, NULL); /* creation-time */
- if (ret <= 0)
- return ret;
- ret = read_int32(f, NULL); /* modification-time */
- if (ret <= 0)
- return ret;
+ skip_bytes(f, 8); /* creation time (4), modification time (4) */
ret = read_int32(f, &t->time_scale);
if (ret <= 0)
return ret;
t->duration = (temp == (uint32_t) (-1))?
(uint64_t) (-1) : (uint64_t) (temp);
}
- ret = read_int16(f, NULL);
- if (ret <= 0)
- return ret;
- ret = read_int16(f, NULL);
- if (ret <= 0)
- return ret;
+ skip_bytes(f, 4);
return 1;
}
uint8_t atom_type;
uint8_t header_size = 0;
- ret = read_int8(f, NULL); /* version */
- if (ret <= 0)
- return ret;
- ret = read_int24(f, NULL); /* flags */
- if (ret <= 0)
- return ret;
+ skip_bytes(f, 4); /* version (1), flags (3) */
while (sumsize < (size - (header_size + 4))) {
ret = atom_read_header(f, &atom_type, &header_size, &subsize);
if (ret <= 0)
if (size == 0)
return -1;
dest = get_position(f) + size - header_size;
- if (atom_type == ATOM_TRAK) {
- if (f->total_tracks >= MAX_TRACKS)
- return -1;
- f->total_tracks++;
- f->track[f->total_tracks - 1] = para_calloc(
- sizeof(struct mp4_track));
- } else if (atom_type == ATOM_UDTA) {
+ if (atom_type == ATOM_TRAK && f->track.state == ATS_SEEN_MP4A) {
+ f->track.state = ATS_TRACK_CHANGE;
+ continue;
+ }
+ if (atom_type == ATOM_UDTA) {
f->udta_offset = get_position(f) - header_size;
f->udta_size = size;
}
f->cb = cb;
while ((ret = atom_read_header(f, &atom_type, &header_size, &size)) > 0) {
- f->file_size += size;
f->last_atom = atom_type;
if (atom_type != ATOM_MOOV || size <= header_size) { /* skip */
set_position(f, get_position(f) + size - header_size);
goto fail;
}
ret = -E_MP4_TRACK;
- if (!f->audio_track)
+ if (f->track.channel_count == 0)
goto fail;
*result = f;
return 1;
{
int32_t i;
- for (i = 0; i < f->total_tracks; i++) {
- if (f->track[i]) {
- free(f->track[i]->stsz_table);
- free(f->track[i]->stts_sample_count);
- free(f->track[i]->stsc_first_chunk);
- free(f->track[i]->stsc_samples_per_chunk);
- free(f->track[i]->stco_chunk_offset);
- free(f->track[i]);
- }
- }
+ free(f->track.stsz_table);
+ free(f->track.stts_sample_count);
+ free(f->track.stsc_first_chunk);
+ free(f->track.stsc_samples_per_chunk);
+ free(f->track.stco_chunk_offset);
for (i = 0; i < f->meta.count; i++) {
free(f->meta.tags[i].item);
free(f->meta.tags[i].value);
static int32_t chunk_of_sample(const struct mp4 *f, int32_t sample,
int32_t *chunk)
{
- const struct mp4_track *t = f->audio_track;
+ const struct mp4_track *t = &f->track;
uint32_t *fc = t->stsc_first_chunk, *spc = t->stsc_samples_per_chunk;
int32_t chunk1, chunk1samples, n, total, i;
*/
uint64_t mp4_get_duration(const struct mp4 *f)
{
- const struct mp4_track *t = f->audio_track;
+ const struct mp4_track *t = &f->track;
if (t->time_scale == 0)
return 0;
int mp4_set_sample_position(struct mp4 *f, int32_t sample)
{
- const struct mp4_track *t = f->audio_track;
+ const struct mp4_track *t = &f->track;
int32_t offset, chunk, chunk_sample;
uint32_t n, srs; /* sample range size */
int32_t mp4_get_sample_size(const struct mp4 *f, int sample)
{
- const struct mp4_track *t = f->audio_track;
+ const struct mp4_track *t = &f->track;
if (t->stsz_sample_size != 0)
return t->stsz_sample_size;
uint32_t mp4_get_sample_rate(const struct mp4 *f)
{
- return f->audio_track->sample_rate;
+ return f->track.sample_rate;
}
uint32_t mp4_get_channel_count(const struct mp4 *f)
{
- return f->audio_track->channel_count;
+ return f->track.channel_count;
}
int32_t mp4_num_samples(const struct mp4 *f)
{
- const struct mp4_track *t = f->audio_track;
+ const struct mp4_track *t = &f->track;
int32_t i;
int32_t total = 0;
return out_buffer;
}
-static int32_t write_data(struct mp4 *f, void *data, uint32_t size)
+/*
+ * Write the given buffer through the write callback, calling the callback
+ * repeatedly until all bytes have been written.
+ *
+ * f: The mp4 handle whose write callback and user data are used.
+ * data: The bytes to write.
+ * size: The number of bytes to write.
+ *
+ * Calls which fail with EINTR are retried. Any other failure of the callback
+ * aborts the operation.
+ *
+ * Returns 1 on success, -ERRNO_TO_PARA_ERROR(errno) on errors.
+ */
+static int write_data(struct mp4 *f, void *data, size_t size)
{
- int32_t result = 1;
-
- result = f->cb->write(f->cb->user_data, data, size);
-
- f->current_position += size;
-
- return result;
-}
-
-static int32_t write_int32(struct mp4 *f, uint32_t data)
-{
- int8_t temp[4];
- write_u32_be(temp, data);
- return write_data(f, temp, sizeof(temp));
+	uint8_t *p = data; /* next byte which has not been written yet */
+
+	/*
+	 * NOTE(review): a callback which keeps returning zero would make this
+	 * loop spin forever. Confirm the callback contract rules this out.
+	 */
+	while (size > 0) {
+		ssize_t ret = f->cb->write(f->cb->user_data, p, size);
+		if (ret < 0) {
+			if (errno == EINTR)
+				continue;
+			return -ERRNO_TO_PARA_ERROR(errno);
+		}
+		/*
+		 * The callback may write fewer bytes than requested. Resume
+		 * after the bytes already written rather than starting over
+		 * at the beginning of the buffer.
+		 */
+		p += ret;
+		size -= ret;
+	}
+	return 1;
}
-int32_t mp4_meta_update(struct mp4 *f)
+int mp4_meta_update(struct mp4 *f)
{
void *new_moov_data;
uint32_t new_moov_size;
+ uint8_t buf[8] = "----moov";
+ int ret;
set_position(f, 0);
new_moov_data = modify_moov(f, &new_moov_size);
}
if (f->last_atom != ATOM_MOOV) {
set_position(f, f->moov_offset + 4);
- write_data(f, "free", 4); /* rename old moov to free */
- set_position(f, f->file_size); /* write new moov atom at EOF */
+ ret = write_data(f, "free", 4); /* rename old moov to free */
+ if (ret < 0)
+ goto free_moov;
+ /* write new moov atom at EOF */
+ f->cb->seek(f->cb->user_data, 0, SEEK_END);
} else /* overwrite old moov atom */
set_position(f, f->moov_offset);
- write_int32(f, new_moov_size + 8);
- write_data(f, "moov", 4);
- write_data(f, new_moov_data, new_moov_size);
- free(new_moov_data);
+ write_u32_be(buf, new_moov_size + 8);
+ ret = write_data(f, buf, sizeof(buf));
+ if (ret < 0)
+ goto free_moov;
+ ret = write_data(f, new_moov_data, new_moov_size);
+ if (ret < 0)
+ goto free_moov;
f->cb->truncate(f->cb->user_data);
- return 1;
+ ret = 1;
+free_moov:
+ free(new_moov_data);
+ return ret;
}
static char *meta_find_by_name(const struct mp4 *f, const char *item)