rewrite OggFromWebMWriter

* reduce the number of iterations over the output file (less seeking)
* fix audio samples with size of 255 do not handled correctly in the segment table (allows writing audio streams with 70kbps and 160kbps bitrate)
* add support for VORBIS codec metadata
* write packets based on the timestamp
This commit is contained in:
kapodamy 2019-09-25 16:24:52 -03:00
parent 52a21e4a24
commit 0cdfa6e377
2 changed files with 203 additions and 149 deletions

View file

@ -23,12 +23,16 @@ import javax.annotation.Nullable;
public class OggFromWebMWriter implements Closeable { public class OggFromWebMWriter implements Closeable {
private static final byte FLAG_UNSET = 0x00; private static final byte FLAG_UNSET = 0x00;
//private static final byte FLAG_CONTINUED = 0x01; private static final byte FLAG_CONTINUED = 0x01;
private static final byte FLAG_FIRST = 0x02; private static final byte FLAG_FIRST = 0x02;
private static final byte FLAG_LAST = 0x04; private static final byte FLAG_LAST = 0x04;
private final static byte SEGMENTS_PER_PACKET = 50;// used in ffmpeg, which is near 1 second at 48kHz
private final static byte HEADER_CHECKSUM_OFFSET = 22; private final static byte HEADER_CHECKSUM_OFFSET = 22;
private final static byte HEADER_SIZE = 27;
private final static short BUFFER_SIZE = 8 * 1024;// 8KiB
private final static int TIME_SCALE_NS = 1000000000;
private boolean done = false; private boolean done = false;
private boolean parsed = false; private boolean parsed = false;
@ -38,10 +42,23 @@ public class OggFromWebMWriter implements Closeable {
private int sequence_count = 0; private int sequence_count = 0;
private final int STREAM_ID; private final int STREAM_ID;
private byte packet_flag = FLAG_FIRST;
private int track_index = 0;
private WebMReader webm = null; private WebMReader webm = null;
private WebMTrack webm_track = null; private WebMTrack webm_track = null;
private int track_index = 0; private Segment webm_segment = null;
private Cluster webm_cluster = null;
private SimpleBlock webm_block = null;
private long webm_block_last_timecode = 0;
private long webm_block_near_duration = 0;
private short segment_table_size = 0;
private final byte[] segment_table = new byte[255];
private long segment_table_next_timestamp = TIME_SCALE_NS;
private final int[] crc32_table = new int[256];
public OggFromWebMWriter(@NonNull SharpStream source, @NonNull SharpStream target) { public OggFromWebMWriter(@NonNull SharpStream source, @NonNull SharpStream target) {
if (!source.canRead() || !source.canRewind()) { if (!source.canRead() || !source.canRewind()) {
@ -139,9 +156,8 @@ public class OggFromWebMWriter implements Closeable {
float resolution; float resolution;
int read; int read;
byte[] buffer; byte[] buffer;
int checksum;
byte flag = FLAG_FIRST;// obligatory
/* step 1: get the amount of frames per seconds */
switch (webm_track.kind) { switch (webm_track.kind) {
case Audio: case Audio:
resolution = getSampleFrequencyFromTrack(webm_track.bMetadata); resolution = getSampleFrequencyFromTrack(webm_track.bMetadata);
@ -160,52 +176,65 @@ public class OggFromWebMWriter implements Closeable {
throw new RuntimeException("not implemented"); throw new RuntimeException("not implemented");
} }
/* step 1.1: write codec init data, in most cases must be present */ /* step 2a: create packet with code init data */
ArrayList<byte[]> data_extra = new ArrayList<>(4);
if (webm_track.codecPrivate != null) { if (webm_track.codecPrivate != null) {
addPacketSegment(webm_track.codecPrivate.length); addPacketSegment(webm_track.codecPrivate.length);
dump_packetHeader(flag, 0x00, webm_track.codecPrivate); ByteBuffer buff = byte_buffer(HEADER_SIZE + segment_table_size + webm_track.codecPrivate.length);
flag = FLAG_UNSET;
make_packetHeader(0x00, buff, webm_track.codecPrivate);
data_extra.add(buff.array());
} }
/* step 1.2: write metadata */ /* step 2b: create packet with metadata */
buffer = make_metadata(); buffer = make_metadata();
if (buffer != null) { if (buffer != null) {
addPacketSegment(buffer.length); addPacketSegment(buffer.length);
dump_packetHeader(flag, 0x00, buffer); ByteBuffer buff = byte_buffer(HEADER_SIZE + segment_table_size + buffer.length);
flag = FLAG_UNSET;
make_packetHeader(0x00, buff, buffer);
data_extra.add(buff.array());
} }
buffer = new byte[8 * 1024];
/* step 1.3: write headers */ /* step 3: calculate amount of packets */
long approx_packets = webm_segment.info.duration / webm_segment.info.timecodeScale;
approx_packets = approx_packets / (approx_packets / SEGMENTS_PER_PACKET);
ArrayList<Long> pending_offsets = new ArrayList<>((int) approx_packets);
ArrayList<Integer> pending_checksums = new ArrayList<>((int) approx_packets);
ArrayList<Short> data_offsets = new ArrayList<>((int) approx_packets);
int page_size = 0;
SimpleBlock bloq; SimpleBlock bloq;
int reserve_header = 0;
int headers_amount = 0;
while (webm_segment != null) { while (webm_segment != null) {
bloq = getNextBlock(); bloq = getNextBlock();
if (bloq != null && addPacketSegment(bloq.dataSize)) { if (addPacketSegment(bloq)) {
page_size += bloq.dataSize; continue;
}
if (segment_table_size < SEGMENTS_PER_PACKET) { reserve_header += HEADER_SIZE + segment_table_size;// header size
clearSegmentTable();
webm_block = bloq;
headers_amount++;
}
/* step 4: create packet headers */
rewind_source();
ByteBuffer headers = byte_buffer(reserve_header);
short[] headers_size = new short[headers_amount];
int header_index = 0;
while (webm_segment != null) {
bloq = getNextBlock();
if (addPacketSegment(bloq)) {
continue; continue;
} }
// calculate the current packet duration using the next block // calculate the current packet duration using the next block
bloq = getNextBlock();
}
double elapsed_ns = webm_track.codecDelay; double elapsed_ns = webm_track.codecDelay;
if (bloq == null) { if (bloq == null) {
flag = FLAG_LAST; packet_flag = FLAG_LAST;// note: if the flag is FLAG_CONTINUED, is changed
elapsed_ns += webm_block_last_timecode; elapsed_ns += webm_block_last_timecode;
if (webm_track.defaultDuration > 0) { if (webm_track.defaultDuration > 0) {
@ -219,84 +248,83 @@ public class OggFromWebMWriter implements Closeable {
} }
// get the sample count in the page // get the sample count in the page
elapsed_ns = (elapsed_ns / 1000000000d) * resolution; elapsed_ns = elapsed_ns / TIME_SCALE_NS;
elapsed_ns = Math.ceil(elapsed_ns); elapsed_ns = Math.ceil(elapsed_ns * resolution);
long offset = output_offset + HEADER_CHECKSUM_OFFSET;
pending_offsets.add(offset);
checksum = dump_packetHeader(flag, (long) elapsed_ns, null);
pending_checksums.add(checksum);
data_offsets.add((short) (output_offset - offset));
// reserve space in the page
while (page_size > 0) {
int write = Math.min(page_size, buffer.length);
out_write(buffer, write);
page_size -= write;
}
// create header
headers_size[header_index++] = make_packetHeader((long) elapsed_ns, headers, null);
webm_block = bloq; webm_block = bloq;
} }
/* step 2.1: write stream data */
output.rewind();
output_offset = 0;
source.rewind(); /* step 5: calculate checksums */
rewind_source();
webm = new WebMReader(source); int offset = 0;
webm.parse(); buffer = new byte[BUFFER_SIZE];
webm_track = webm.selectTrack(track_index);
for (int i = 0; i < pending_offsets.size(); i++) { for (header_index = 0; header_index < headers_size.length; header_index++) {
checksum = pending_checksums.get(i); int checksum_offset = offset + HEADER_CHECKSUM_OFFSET;
segment_table_size = 0; int checksum = headers.getInt(checksum_offset);
out_seek(pending_offsets.get(i) + data_offsets.get(i)); while (webm_segment != null) {
while (segment_table_size < SEGMENTS_PER_PACKET) {
bloq = getNextBlock(); bloq = getNextBlock();
if (bloq == null || !addPacketSegment(bloq.dataSize)) { if (!addPacketSegment(bloq)) {
webm_block = bloq;// use this block later (if not null) clearSegmentTable();
webm_block = bloq;
break; break;
} }
// NOTE: calling bloq.data.close() is unnecessary // calculate page checksum
while ((read = bloq.data.read(buffer)) != -1) { while ((read = bloq.data.read(buffer)) > 0) {
out_write(buffer, read); checksum = calc_crc32(checksum, buffer, 0, read);
checksum = calc_crc32(checksum, buffer, read);
} }
} }
pending_checksums.set(i, checksum); headers.putInt(checksum_offset, checksum);
offset += headers_size[header_index];
} }
/* step 2.2: write every checksum */ /* step 6: write extra headers */
output.rewind(); rewind_source();
output_offset = 0;
buffer = new byte[4];
ByteBuffer buff = ByteBuffer.wrap(buffer); for (byte[] buff : data_extra) {
buff.order(ByteOrder.LITTLE_ENDIAN); output.write(buff);
}
for (int i = 0; i < pending_checksums.size(); i++) { /* step 7: write stream packets */
out_seek(pending_offsets.get(i)); byte[] headers_buffers = headers.array();
buff.putInt(0, pending_checksums.get(i)); offset = 0;
out_write(buffer); buffer = new byte[BUFFER_SIZE];
for (header_index = 0; header_index < headers_size.length; header_index++) {
output.write(headers_buffers, offset, headers_size[header_index]);
offset += headers_size[header_index];
while (webm_segment != null) {
bloq = getNextBlock();
if (addPacketSegment(bloq)) {
while ((read = bloq.data.read(buffer)) > 0) {
output.write(buffer, 0, read);
}
} else {
clearSegmentTable();
webm_block = bloq;
break;
}
}
} }
} }
private int dump_packetHeader(byte flag, long gran_pos, byte[] immediate_page) throws IOException { private short make_packetHeader(long gran_pos, ByteBuffer buffer, byte[] immediate_page) {
ByteBuffer buffer = ByteBuffer.allocate(27 + segment_table_size); int offset = buffer.position();
short length = HEADER_SIZE;
buffer.putInt(0x4F676753);// "OggS" binary string buffer.putInt(0x5367674f);// "OggS" binary string in little-endian
buffer.put((byte) 0x00);// version buffer.put((byte) 0x00);// version
buffer.put(flag);// type buffer.put(packet_flag);// type
buffer.order(ByteOrder.LITTLE_ENDIAN);
buffer.putLong(gran_pos);// granulate position buffer.putLong(gran_pos);// granulate position
@ -305,28 +333,24 @@ public class OggFromWebMWriter implements Closeable {
buffer.putInt(0x00);// page checksum buffer.putInt(0x00);// page checksum
buffer.order(ByteOrder.BIG_ENDIAN);
buffer.put((byte) segment_table_size);// segment table buffer.put((byte) segment_table_size);// segment table
buffer.put(segment_table, 0, segment_table_size);// segment size buffer.put(segment_table, 0, segment_table_size);// segment size
segment_table_size = 0;// clear segment table for next header length += segment_table_size;
byte[] buff = buffer.array(); clearSegmentTable();// clear segment table for next header
int checksum_crc32 = calc_crc32(0x00, buff, buff.length);
int checksum_crc32 = calc_crc32(0x00, buffer.array(), offset, length);
if (immediate_page != null) { if (immediate_page != null) {
checksum_crc32 = calc_crc32(checksum_crc32, immediate_page, immediate_page.length); checksum_crc32 = calc_crc32(checksum_crc32, immediate_page, 0, immediate_page.length);
buffer.order(ByteOrder.LITTLE_ENDIAN); System.arraycopy(immediate_page, 0, buffer.array(), length, immediate_page.length);
buffer.putInt(HEADER_CHECKSUM_OFFSET, checksum_crc32); segment_table_next_timestamp -= TIME_SCALE_NS;
out_write(buff);
out_write(immediate_page);
return 0;
} }
out_write(buff); buffer.putInt(offset + HEADER_CHECKSUM_OFFSET, checksum_crc32);
return checksum_crc32;
return length;
} }
@Nullable @Nullable
@ -334,7 +358,7 @@ public class OggFromWebMWriter implements Closeable {
if ("A_OPUS".equals(webm_track.codecId)) { if ("A_OPUS".equals(webm_track.codecId)) {
return new byte[]{ return new byte[]{
0x4F, 0x70, 0x75, 0x73, 0x54, 0x61, 0x67, 0x73,// "OpusTags" binary string 0x4F, 0x70, 0x75, 0x73, 0x54, 0x61, 0x67, 0x73,// "OpusTags" binary string
0x07, 0x00, 0x00, 0x00,// writting application string size 0x07, 0x00, 0x00, 0x00,// writing application string size
0x4E, 0x65, 0x77, 0x50, 0x69, 0x70, 0x65,// "NewPipe" binary string 0x4E, 0x65, 0x77, 0x50, 0x69, 0x70, 0x65,// "NewPipe" binary string
0x00, 0x00, 0x00, 0x00// additional tags count (zero means no tags) 0x00, 0x00, 0x00, 0x00// additional tags count (zero means no tags)
}; };
@ -342,7 +366,7 @@ public class OggFromWebMWriter implements Closeable {
return new byte[]{ return new byte[]{
0x03,// ???????? 0x03,// ????????
0x76, 0x6f, 0x72, 0x62, 0x69, 0x73,// "vorbis" binary string 0x76, 0x6f, 0x72, 0x62, 0x69, 0x73,// "vorbis" binary string
0x07, 0x00, 0x00, 0x00,// writting application string size 0x07, 0x00, 0x00, 0x00,// writing application string size
0x4E, 0x65, 0x77, 0x50, 0x69, 0x70, 0x65,// "NewPipe" binary string 0x4E, 0x65, 0x77, 0x50, 0x69, 0x70, 0x65,// "NewPipe" binary string
0x01, 0x00, 0x00, 0x00,// additional tags count (zero means no tags) 0x01, 0x00, 0x00, 0x00,// additional tags count (zero means no tags)
@ -363,13 +387,26 @@ public class OggFromWebMWriter implements Closeable {
return null; return null;
} }
//<editor-fold defaultstate="collapsed" desc="WebM track handling"> private void rewind_source() throws IOException {
private Segment webm_segment = null; source.rewind();
private Cluster webm_cluter = null;
private SimpleBlock webm_block = null;
private long webm_block_last_timecode = 0;
private long webm_block_near_duration = 0;
webm = new WebMReader(source);
webm.parse();
webm_track = webm.selectTrack(track_index);
webm_segment = webm.getNextSegment();
webm_cluster = null;
webm_block = null;
webm_block_last_timecode = 0L;
segment_table_next_timestamp = TIME_SCALE_NS;
}
private ByteBuffer byte_buffer(int size) {
return ByteBuffer.allocate(size).order(ByteOrder.LITTLE_ENDIAN);
}
//<editor-fold defaultstate="collapsed" desc="WebM track handling">
@Nullable
private SimpleBlock getNextBlock() throws IOException { private SimpleBlock getNextBlock() throws IOException {
SimpleBlock res; SimpleBlock res;
@ -386,17 +423,17 @@ public class OggFromWebMWriter implements Closeable {
} }
} }
if (webm_cluter == null) { if (webm_cluster == null) {
webm_cluter = webm_segment.getNextCluster(); webm_cluster = webm_segment.getNextCluster();
if (webm_cluter == null) { if (webm_cluster == null) {
webm_segment = null; webm_segment = null;
return getNextBlock(); return getNextBlock();
} }
} }
res = webm_cluter.getNextSimpleBlock(); res = webm_cluster.getNextSimpleBlock();
if (res == null) { if (res == null) {
webm_cluter = null; webm_cluster = null;
return getNextBlock(); return getNextBlock();
} }
@ -421,49 +458,64 @@ public class OggFromWebMWriter implements Closeable {
} }
//</editor-fold> //</editor-fold>
//<editor-fold defaultstate="collapsed" desc="Segment table store"> //<editor-fold defaultstate="collapsed" desc="Segment table writing">
private int segment_table_size = 0; private void clearSegmentTable() {
private final byte[] segment_table = new byte[255]; if (packet_flag != FLAG_CONTINUED) {
segment_table_next_timestamp += TIME_SCALE_NS;
packet_flag = FLAG_UNSET;
}
segment_table_size = 0;
}
private boolean addPacketSegment(long size) { private boolean addPacketSegment(SimpleBlock block) {
// check if possible add the segment, without overflow the table if (block == null) {
return false;
}
long timestamp = block.absoluteTimeCodeNs + webm_track.codecDelay;
if (timestamp >= segment_table_next_timestamp) {
return false;
}
boolean result = addPacketSegment((int) block.dataSize);
if (!result && segment_table_next_timestamp < timestamp) {
// WARNING: ¡¡¡¡ not implemented (lack of documentation) !!!!
packet_flag = FLAG_CONTINUED;
}
return result;
}
private boolean addPacketSegment(int size) {
int available = (segment_table.length - segment_table_size) * 255; int available = (segment_table.length - segment_table_size) * 255;
boolean extra = size == 255;
if (extra) {
// add a zero byte entry in the table
// required to indicate the sample size is exactly 255
available -= 255;
}
// check if possible add the segment, without overflow the table
if (available < size) { if (available < size) {
return false;// not enough space on the page return false;// not enough space on the page
} }
while (size > 0) { for (; size > 0; size -= 255) {
segment_table[segment_table_size++] = (byte) Math.min(size, 255); segment_table[segment_table_size++] = (byte) Math.min(size, 255);
size -= 255; }
if (extra) {
segment_table[segment_table_size++] = 0x00;
} }
return true; return true;
} }
//</editor-fold> //</editor-fold>
//<editor-fold defaultstate="collapsed" desc="Output handling">
private long output_offset = 0;
private void out_write(byte[] buffer) throws IOException {
output.write(buffer);
output_offset += buffer.length;
}
private void out_write(byte[] buffer, int size) throws IOException {
output.write(buffer, 0, size);
output_offset += size;
}
private void out_seek(long offset) throws IOException {
//if (output.canSeek()) { output.seek(offset); }
output.skip(offset - output_offset);
output_offset = offset;
}
//</editor-fold>
//<editor-fold defaultstate="collapsed" desc="Checksum CRC32"> //<editor-fold defaultstate="collapsed" desc="Checksum CRC32">
private final int[] crc32_table = new int[256];
private void populate_crc32_table() { private void populate_crc32_table() {
for (int i = 0; i < 0x100; i++) { for (int i = 0; i < 0x100; i++) {
int crc = i << 24; int crc = i << 24;
@ -476,10 +528,12 @@ public class OggFromWebMWriter implements Closeable {
} }
} }
private int calc_crc32(int initial_crc, byte[] buffer, int size) { private int calc_crc32(int initial_crc, byte[] buffer, int offset, int size) {
for (int i = 0; i < size; i++) { size += offset;
for (; offset < size; offset++) {
int reg = (initial_crc >>> 24) & 0xff; int reg = (initial_crc >>> 24) & 0xff;
initial_crc = (initial_crc << 8) ^ crc32_table[reg ^ (buffer[i] & 0xff)]; initial_crc = (initial_crc << 8) ^ crc32_table[reg ^ (buffer[offset] & 0xff)];
} }
return initial_crc; return initial_crc;

View file

@ -11,7 +11,7 @@ import java.nio.ByteBuffer;
class OggFromWebmDemuxer extends Postprocessing { class OggFromWebmDemuxer extends Postprocessing {
OggFromWebmDemuxer() { OggFromWebmDemuxer() {
super(false, true, ALGORITHM_OGG_FROM_WEBM_DEMUXER); super(true, true, ALGORITHM_OGG_FROM_WEBM_DEMUXER);
} }
@Override @Override
@ -24,7 +24,7 @@ class OggFromWebmDemuxer extends Postprocessing {
switch (buffer.getInt()) { switch (buffer.getInt()) {
case 0x1a45dfa3: case 0x1a45dfa3:
return true;// webm return true;// webm/mkv
case 0x4F676753: case 0x4F676753:
return false;// ogg return false;// ogg
} }