misc changes

* read "SeekPreRoll" from the source track (if available)
* use the longest track duration as segment duration, instead of the video track duration
* do not hardcode the "Cue" reserved space behavior
* do not hardcode the "EBML Void" element, unreported issue. The size was not properly calculated
* rewrite the key-frame picking
* remove writeInt(), writeFloat() and writeShort() methods, use inline code
* set "SeekPreRoll" and "CodecDelays" values on output tracks (if available)
* rewrite the "Cluster" maker
* rewrite the code of how "Cluster" sizes are written

Fix encode() method (the reason of this commit/pull-request):
* Use the unsigned shift operator instead of dividing the value, due precession lost
This commit is contained in:
kapodamy 2020-03-12 00:50:14 -03:00 committed by GitHub
parent f7822a448e
commit ca8f8e0ee9
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
2 changed files with 190 additions and 147 deletions

View file

@ -37,6 +37,7 @@ public class WebMReader {
private final static int ID_DefaultDuration = 0x3E383; private final static int ID_DefaultDuration = 0x3E383;
private final static int ID_FlagLacing = 0x1C; private final static int ID_FlagLacing = 0x1C;
private final static int ID_CodecDelay = 0x16AA; private final static int ID_CodecDelay = 0x16AA;
private final static int ID_SeekPreRoll = 0x16BB;
private final static int ID_Cluster = 0x0F43B675; private final static int ID_Cluster = 0x0F43B675;
private final static int ID_Timecode = 0x67; private final static int ID_Timecode = 0x67;
@ -332,6 +333,10 @@ public class WebMReader {
break; break;
case ID_CodecDelay: case ID_CodecDelay:
entry.codecDelay = readNumber(elem); entry.codecDelay = readNumber(elem);
break;
case ID_SeekPreRoll:
entry.seekPreRoll = readNumber(elem);
break;
default: default:
break; break;
} }
@ -414,8 +419,9 @@ public class WebMReader {
public byte[] codecPrivate; public byte[] codecPrivate;
public byte[] bMetadata; public byte[] bMetadata;
public TrackKind kind; public TrackKind kind;
public long defaultDuration; public long defaultDuration = -1;
public long codecDelay; public long codecDelay = -1;
public long seekPreRoll = -1;
} }
public class Segment { public class Segment {

View file

@ -23,7 +23,10 @@ public class WebMWriter implements Closeable {
private final static int BUFFER_SIZE = 8 * 1024; private final static int BUFFER_SIZE = 8 * 1024;
private final static int DEFAULT_TIMECODE_SCALE = 1000000; private final static int DEFAULT_TIMECODE_SCALE = 1000000;
private final static int INTERV = 100;// 100ms on 1000000us timecode scale private final static int INTERV = 100;// 100ms on 1000000us timecode scale
private final static int DEFAULT_CUES_EACH_MS = 5000;// 100ms on 1000000us timecode scale private final static int DEFAULT_CUES_EACH_MS = 5000;// 5000ms on 1000000us timecode scale
private final static byte CLUSTER_HEADER_SIZE = 8;
private final static int CUE_RESERVE_SIZE = 65535;
private final static byte MINIMUM_EBML_VOID_SIZE = 4;
private WebMReader.WebMTrack[] infoTracks; private WebMReader.WebMTrack[] infoTracks;
private SharpStream[] sourceTracks; private SharpStream[] sourceTracks;
@ -38,15 +41,18 @@ public class WebMWriter implements Closeable {
private Segment[] readersSegment; private Segment[] readersSegment;
private Cluster[] readersCluster; private Cluster[] readersCluster;
private int[] predefinedDurations; private ArrayList<ClusterInfo> clustersOffsetsSizes;
private byte[] outBuffer; private byte[] outBuffer;
private ByteBuffer outByteBuffer;
public WebMWriter(SharpStream... source) { public WebMWriter(SharpStream... source) {
sourceTracks = source; sourceTracks = source;
readers = new WebMReader[sourceTracks.length]; readers = new WebMReader[sourceTracks.length];
infoTracks = new WebMTrack[sourceTracks.length]; infoTracks = new WebMTrack[sourceTracks.length];
outBuffer = new byte[BUFFER_SIZE]; outBuffer = new byte[BUFFER_SIZE];
outByteBuffer = ByteBuffer.wrap(outBuffer);
clustersOffsetsSizes = new ArrayList<>(256);
} }
public WebMTrack[] getTracksFromSource(int sourceIndex) throws IllegalStateException { public WebMTrack[] getTracksFromSource(int sourceIndex) throws IllegalStateException {
@ -83,11 +89,9 @@ public class WebMWriter implements Closeable {
try { try {
readersSegment = new Segment[readers.length]; readersSegment = new Segment[readers.length];
readersCluster = new Cluster[readers.length]; readersCluster = new Cluster[readers.length];
predefinedDurations = new int[readers.length];
for (int i = 0; i < readers.length; i++) { for (int i = 0; i < readers.length; i++) {
infoTracks[i] = readers[i].selectTrack(trackIndex[i]); infoTracks[i] = readers[i].selectTrack(trackIndex[i]);
predefinedDurations[i] = -1;
readersSegment[i] = readers[i].getNextSegment(); readersSegment[i] = readers[i].getNextSegment();
} }
} finally { } finally {
@ -118,6 +122,8 @@ public class WebMWriter implements Closeable {
readersSegment = null; readersSegment = null;
readersCluster = null; readersCluster = null;
outBuffer = null; outBuffer = null;
outByteBuffer = null;
clustersOffsetsSizes = null;
} }
public void build(SharpStream out) throws IOException, RuntimeException { public void build(SharpStream out) throws IOException, RuntimeException {
@ -140,7 +146,7 @@ public class WebMWriter implements Closeable {
0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00// segment content size 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00// segment content size
}); });
long baseSegmentOffset = written + listBuffer.get(0).length; long segmentOffset = written + listBuffer.get(0).length;
/* seek head */ /* seek head */
listBuffer.add(new byte[]{ listBuffer.add(new byte[]{
@ -177,20 +183,22 @@ public class WebMWriter implements Closeable {
/* tracks */ /* tracks */
listBuffer.addAll(makeTracks()); listBuffer.addAll(makeTracks());
for (byte[] buff : listBuffer) { dump(listBuffer, out);
dump(buff, out);
}
// reserve space for Cues element, but is a waste of space (actually is 64 KiB) // reserve space for Cues element
// TODO: better Cue maker long cueOffset = written;
long cueReservedOffset = written; make_EBML_void(out, CUE_RESERVE_SIZE, true);
dump(new byte[]{(byte) 0xec, 0x20, (byte) 0xff, (byte) 0xfb}, out);
int reserved = (1024 * 63) - 4; int[] defaultSampleDuration = new int[infoTracks.length];
while (reserved > 0) { long[] duration = new long[infoTracks.length];
int write = Math.min(reserved, outBuffer.length);
out.write(outBuffer, 0, write); for (int i = 0; i < infoTracks.length; i++) {
reserved -= write; if (infoTracks[i].defaultDuration < 0) {
written += write; defaultSampleDuration[i] = -1;// not available
} else {
defaultSampleDuration[i] = (int) Math.ceil(infoTracks[i].defaultDuration / (float) DEFAULT_TIMECODE_SCALE);
}
duration[i] = -1;
} }
// Select a track for the cue // Select a track for the cue
@ -198,16 +206,8 @@ public class WebMWriter implements Closeable {
long nextCueTime = infoTracks[cuesForTrackId].trackType == 1 ? -1 : 0; long nextCueTime = infoTracks[cuesForTrackId].trackType == 1 ? -1 : 0;
ArrayList<KeyFrame> keyFrames = new ArrayList<>(32); ArrayList<KeyFrame> keyFrames = new ArrayList<>(32);
ArrayList<Long> clusterOffsets = new ArrayList<>(32);
ArrayList<Integer> clusterSizes = new ArrayList<>(32);
long duration = 0;
int durationFromTrackId = 0;
byte[] bTimecode = makeTimecode(0);
int firstClusterOffset = (int) written; int firstClusterOffset = (int) written;
long currentClusterOffset = makeCluster(out, bTimecode, 0, clusterOffsets, clusterSizes); long currentClusterOffset = makeCluster(out, 0, 0, true);
long baseTimecode = 0; long baseTimecode = 0;
long limitTimecode = -1; long limitTimecode = -1;
@ -239,8 +239,7 @@ public class WebMWriter implements Closeable {
newClusterByTrackId = -1; newClusterByTrackId = -1;
baseTimecode = bloq.absoluteTimecode; baseTimecode = bloq.absoluteTimecode;
limitTimecode = baseTimecode + INTERV; limitTimecode = baseTimecode + INTERV;
bTimecode = makeTimecode(baseTimecode); currentClusterOffset = makeCluster(out, baseTimecode, currentClusterOffset, true);
currentClusterOffset = makeCluster(out, bTimecode, currentClusterOffset, clusterOffsets, clusterSizes);
} }
if (cuesForTrackId == i) { if (cuesForTrackId == i) {
@ -248,19 +247,18 @@ public class WebMWriter implements Closeable {
if (nextCueTime > -1) { if (nextCueTime > -1) {
nextCueTime += DEFAULT_CUES_EACH_MS; nextCueTime += DEFAULT_CUES_EACH_MS;
} }
keyFrames.add( keyFrames.add(new KeyFrame(segmentOffset, currentClusterOffset, written, bloq.absoluteTimecode));
new KeyFrame(baseSegmentOffset, currentClusterOffset - 8, written, bTimecode.length, bloq.absoluteTimecode)
);
} }
} }
writeBlock(out, bloq, baseTimecode); writeBlock(out, bloq, baseTimecode);
blockWritten++; blockWritten++;
if (bloq.absoluteTimecode > duration) { if (defaultSampleDuration[i] < 0 && duration[i] >= 0) {
duration = bloq.absoluteTimecode; // if the sample duration in unknown, calculate using current_duration - previous_duration
durationFromTrackId = bloq.trackNumber; defaultSampleDuration[i] = (int) (bloq.absoluteTimecode - duration[i]);
} }
duration[i] = bloq.absoluteTimecode;
if (limitTimecode < 0) { if (limitTimecode < 0) {
limitTimecode = bloq.absoluteTimecode + INTERV; limitTimecode = bloq.absoluteTimecode + INTERV;
@ -276,55 +274,61 @@ public class WebMWriter implements Closeable {
} }
} }
makeCluster(out, null, currentClusterOffset, null, clusterSizes); makeCluster(out, -1, currentClusterOffset, false);
long segmentSize = written - offsetSegmentSizeSet - 7; long segmentSize = written - offsetSegmentSizeSet - 7;
/* ---- final step write offsets and sizes ---- */ /* Segment size */
seekTo(out, offsetSegmentSizeSet); seekTo(out, offsetSegmentSizeSet);
writeLong(out, segmentSize); outByteBuffer.putLong(0, segmentSize);
out.write(outBuffer, 1, DataReader.LONG_SIZE - 1);
if (predefinedDurations[durationFromTrackId] > -1) { /* Segment duration */
duration += predefinedDurations[durationFromTrackId];// this value is full-filled in makeTrackEntry() method long longestDuration = 0;
} for (int i = 0; i < duration.length; i++) {
seekTo(out, offsetInfoDurationSet); if (defaultSampleDuration[i] > 0) {
writeFloat(out, duration); duration[i] += defaultSampleDuration[i];
}
firstClusterOffset -= baseSegmentOffset; if (duration[i] > longestDuration) {
seekTo(out, offsetClusterSet); longestDuration = duration[i];
writeInt(out, firstClusterOffset);
seekTo(out, cueReservedOffset);
/* Cue */
dump(new byte[]{0x1c, 0x53, (byte) 0xbb, 0x6b, 0x20, 0x00, 0x00}, out);
for (KeyFrame keyFrame : keyFrames) {
for (byte[] buffer : makeCuePoint(cuesForTrackId, keyFrame)) {
dump(buffer, out);
if (written >= (cueReservedOffset + 65535 - 16)) {
throw new IOException("Too many Cues");
}
} }
} }
short cueSize = (short) (written - cueReservedOffset - 7); seekTo(out, offsetInfoDurationSet);
outByteBuffer.putFloat(0, longestDuration);
dump(outBuffer, DataReader.FLOAT_SIZE, out);
/* EBML Void */ /* first Cluster offset */
ByteBuffer voidBuffer = ByteBuffer.allocate(4); firstClusterOffset -= segmentOffset;
voidBuffer.putShort((short) 0xec20); writeInt(out, offsetClusterSet, firstClusterOffset);
voidBuffer.putShort((short) (firstClusterOffset - written - 4));
dump(voidBuffer.array(), out);
seekTo(out, offsetCuesSet); seekTo(out, cueOffset);
writeInt(out, (int) (cueReservedOffset - baseSegmentOffset));
seekTo(out, cueReservedOffset + 5); /* Cue */
writeShort(out, cueSize); short cueSize = 0;
dump(new byte[]{0x1c, 0x53, (byte) 0xbb, 0x6b, 0x20, 0x00, 0x00}, out);// header size is 7
for (int i = 0; i < clusterSizes.size(); i++) { for (KeyFrame keyFrame : keyFrames) {
seekTo(out, clusterOffsets.get(i)); int size = makeCuePoint(cuesForTrackId, keyFrame, outBuffer);
byte[] buffer = ByteBuffer.allocate(4).putInt(clusterSizes.get(i) | 0x10000000).array();
dump(buffer, out); if ((cueSize + size + 7 + MINIMUM_EBML_VOID_SIZE) > CUE_RESERVE_SIZE) {
break;// no space left
}
cueSize += size;
dump(outBuffer, size, out);
}
make_EBML_void(out, CUE_RESERVE_SIZE - cueSize - 7, false);
seekTo(out, cueOffset + 5);
outByteBuffer.putShort(0, cueSize);
dump(outBuffer, DataReader.SHORT_SIZE, out);
/* seek head, seek for cues element */
writeInt(out, offsetCuesSet, (int) (cueOffset - segmentOffset));
for (ClusterInfo cluster : clustersOffsetsSizes) {
writeInt(out, cluster.offset, cluster.size | 0x10000000);
} }
} }
@ -375,25 +379,10 @@ public class WebMWriter implements Closeable {
written = offset; written = offset;
} }
private void writeLong(SharpStream stream, long number) throws IOException { private void writeInt(SharpStream stream, long offset, int number) throws IOException {
byte[] buffer = ByteBuffer.allocate(DataReader.LONG_SIZE).putLong(number).array(); seekTo(stream, offset);
stream.write(buffer, 1, buffer.length - 1); outByteBuffer.putInt(0, number);
written += buffer.length - 1; dump(outBuffer, DataReader.INTEGER_SIZE, stream);
}
private void writeFloat(SharpStream stream, float number) throws IOException {
byte[] buffer = ByteBuffer.allocate(DataReader.FLOAT_SIZE).putFloat(number).array();
dump(buffer, stream);
}
private void writeShort(SharpStream stream, short number) throws IOException {
byte[] buffer = ByteBuffer.allocate(DataReader.SHORT_SIZE).putShort(number).array();
dump(buffer, stream);
}
private void writeInt(SharpStream stream, int number) throws IOException {
byte[] buffer = ByteBuffer.allocate(DataReader.INTEGER_SIZE).putInt(number).array();
dump(buffer, stream);
} }
private void writeBlock(SharpStream stream, Block bloq, long clusterTimecode) throws IOException { private void writeBlock(SharpStream stream, Block bloq, long clusterTimecode) throws IOException {
@ -416,47 +405,43 @@ public class WebMWriter implements Closeable {
} }
listBuffer.set(1, encode(blockSize, false)); listBuffer.set(1, encode(blockSize, false));
for (byte[] buff : listBuffer) { dump(listBuffer, stream);
dump(buff, stream);
}
int read; int read;
while ((read = bloq.data.read(outBuffer)) > 0) { while ((read = bloq.data.read(outBuffer)) > 0) {
stream.write(outBuffer, 0, read); dump(outBuffer, read, stream);
written += read;
} }
} }
private byte[] makeTimecode(long timecode) { private long makeCluster(SharpStream stream, long timecode, long offset, boolean create) throws IOException {
ByteBuffer buffer = ByteBuffer.allocate(9); ClusterInfo cluster;
buffer.put((byte) 0xe7);
buffer.put(encode(timecode, true));
byte[] res = new byte[buffer.position()]; if (offset > 0) {
System.arraycopy(buffer.array(), 0, res, 0, res.length); // save the size of the previous cluster (maximum 256 MiB)
cluster = clustersOffsetsSizes.get(clustersOffsetsSizes.size() - 1);
return res; cluster.size = (int) (written - offset - CLUSTER_HEADER_SIZE);
}
private long makeCluster(SharpStream stream, byte[] bTimecode, long startOffset, ArrayList<Long> clusterOffsets, ArrayList<Integer> clusterSizes) throws IOException {
if (startOffset > 0) {
clusterSizes.add((int) (written - startOffset));// size for last offset
} }
if (clusterOffsets != null) { offset = written;
if (create) {
/* cluster */ /* cluster */
dump(new byte[]{0x1f, 0x43, (byte) 0xb6, 0x75}, stream); dump(new byte[]{0x1f, 0x43, (byte) 0xb6, 0x75}, stream);
clusterOffsets.add(written);// warning: max cluster size is 256 MiB
dump(new byte[]{0x10, 0x00, 0x00, 0x00}, stream);
startOffset = written;// size for the this cluster cluster = new ClusterInfo();
cluster.offset = written;
clustersOffsetsSizes.add(cluster);
dump(bTimecode, stream); dump(new byte[]{
0x10, 0x00, 0x00, 0x00,
/* timestamp */
(byte) 0xe7
}, stream);
return startOffset; dump(encode(timecode, true), stream);
} }
return -1; return offset;
} }
private void makeEBML(SharpStream stream) throws IOException { private void makeEBML(SharpStream stream) throws IOException {
@ -509,13 +494,24 @@ public class WebMWriter implements Closeable {
buffer.add(new byte[]{(byte) 0x86}); buffer.add(new byte[]{(byte) 0x86});
buffer.addAll(encode(track.codecId)); buffer.addAll(encode(track.codecId));
/* codec delay*/
if (track.codecDelay >= 0) {
buffer.add(new byte[]{0x56, (byte) 0xAA});
buffer.add(encode(track.codecDelay, true));
}
/* codec seek pre-roll*/
if (track.seekPreRoll >= 0) {
buffer.add(new byte[]{0x56, (byte) 0xBB});
buffer.add(encode(track.seekPreRoll, true));
}
/* type */ /* type */
buffer.add(new byte[]{(byte) 0x83}); buffer.add(new byte[]{(byte) 0x83});
buffer.add(encode(track.trackType, true)); buffer.add(encode(track.trackType, true));
/* default duration */ /* default duration */
if (track.defaultDuration != 0) { if (track.defaultDuration >= 0) {
predefinedDurations[internalTrackId] = (int) Math.ceil(track.defaultDuration / (float) DEFAULT_TIMECODE_SCALE);
buffer.add(new byte[]{0x23, (byte) 0xe3, (byte) 0x83}); buffer.add(new byte[]{0x23, (byte) 0xe3, (byte) 0x83});
buffer.add(encode(track.defaultDuration, true)); buffer.add(encode(track.defaultDuration, true));
} }
@ -538,21 +534,29 @@ public class WebMWriter implements Closeable {
} }
private ArrayList<byte[]> makeCuePoint(int internalTrackId, KeyFrame keyFrame) { private int makeCuePoint(int internalTrackId, KeyFrame keyFrame, byte[] buffer) {
ArrayList<byte[]> buffer = new ArrayList<>(5); ArrayList<byte[]> cue = new ArrayList<>(5);
/* CuePoint */ /* CuePoint */
buffer.add(new byte[]{(byte) 0xbb}); cue.add(new byte[]{(byte) 0xbb});
buffer.add(null); cue.add(null);
/* CueTime */ /* CueTime */
buffer.add(new byte[]{(byte) 0xb3}); cue.add(new byte[]{(byte) 0xb3});
buffer.add(encode(keyFrame.atTimecode, true)); cue.add(encode(keyFrame.duration, true));
/* CueTrackPosition */ /* CueTrackPosition */
buffer.addAll(makeCueTrackPosition(internalTrackId, keyFrame)); cue.addAll(makeCueTrackPosition(internalTrackId, keyFrame));
return lengthFor(buffer); int size = 0;
lengthFor(cue);
for (byte[] buff : cue) {
System.arraycopy(buff, 0, buffer, size, buff.length);
size += buff.length;
}
return size;
} }
private ArrayList<byte[]> makeCueTrackPosition(int internalTrackId, KeyFrame keyFrame) { private ArrayList<byte[]> makeCueTrackPosition(int internalTrackId, KeyFrame keyFrame) {
@ -568,20 +572,48 @@ public class WebMWriter implements Closeable {
/* CueClusterPosition */ /* CueClusterPosition */
buffer.add(new byte[]{(byte) 0xf1}); buffer.add(new byte[]{(byte) 0xf1});
buffer.add(encode(keyFrame.atCluster, true)); buffer.add(encode(keyFrame.clusterPosition, true));
/* CueRelativePosition */ /* CueRelativePosition */
if (keyFrame.atBlock > 0) { if (keyFrame.relativePosition > 0) {
buffer.add(new byte[]{(byte) 0xf0}); buffer.add(new byte[]{(byte) 0xf0});
buffer.add(encode(keyFrame.atBlock, true)); buffer.add(encode(keyFrame.relativePosition, true));
} }
return lengthFor(buffer); return lengthFor(buffer);
} }
private void make_EBML_void(SharpStream out, int size, boolean wipe) throws IOException {
/* ebml void */
outByteBuffer.putShort(0, (short) 0xec20);
outByteBuffer.putShort(2, (short) (size - 4));
dump(outBuffer, 4, out);
if (wipe) {
size -= 4;
while (size > 0) {
int write = Math.min(size, outBuffer.length);
dump(outBuffer, write, out);
size -= write;
}
}
}
private void dump(byte[] buffer, SharpStream stream) throws IOException { private void dump(byte[] buffer, SharpStream stream) throws IOException {
stream.write(buffer); dump(buffer, buffer.length, stream);
written += buffer.length; }
private void dump(byte[] buffer, int count, SharpStream stream) throws IOException {
stream.write(buffer, 0, count);
written += count;
}
private void dump(ArrayList<byte[]> buffers, SharpStream stream) throws IOException {
for (byte[] buffer : buffers) {
stream.write(buffer);
written += buffer.length;
}
} }
private ArrayList<byte[]> lengthFor(ArrayList<byte[]> buffer) { private ArrayList<byte[]> lengthFor(ArrayList<byte[]> buffer) {
@ -614,11 +646,11 @@ public class WebMWriter implements Closeable {
byte[] buffer = new byte[offset + length]; byte[] buffer = new byte[offset + length];
long marker = (long) Math.floor((length - 1f) / 8f); long marker = (long) Math.floor((length - 1f) / 8f);
float mul = 1; int shift = 0;
for (int i = length - 1; i >= 0; i--, mul *= 0x100) { for (int i = length - 1; i >= 0; i--, shift += 8) {
long b = (long) Math.floor(number / mul); long b = number >>> shift;
if (!withLength && i == marker) { if (!withLength && i == marker) {
b = b | (0x80 >> (length - 1)); b = b | (0x80 >>> (length - 1));
} }
buffer[offset + i] = (byte) b; buffer[offset + i] = (byte) b;
} }
@ -686,17 +718,15 @@ public class WebMWriter implements Closeable {
class KeyFrame { class KeyFrame {
KeyFrame(long segment, long cluster, long block, int bTimecodeLength, long timecode) { KeyFrame(long segment, long cluster, long block, long timecode) {
atCluster = cluster - segment; clusterPosition = cluster - segment;
if ((block - bTimecodeLength) > cluster) { relativePosition = (int) (block - cluster - CLUSTER_HEADER_SIZE);
atBlock = (int) (block - cluster); duration = timecode;
}
atTimecode = timecode;
} }
long atCluster; final long clusterPosition;
int atBlock; final int relativePosition;
long atTimecode; final long duration;
} }
class Block { class Block {
@ -717,4 +747,11 @@ public class WebMWriter implements Closeable {
return String.format("trackNumber=%s isKeyFrame=%S absoluteTimecode=%s", trackNumber, isKeyframe(), absoluteTimecode); return String.format("trackNumber=%s isKeyFrame=%S absoluteTimecode=%s", trackNumber, isKeyframe(), absoluteTimecode);
} }
} }
class ClusterInfo {
long offset;
int size;
}
} }