Skip to content

Commit

Permalink
Merge pull request #5508 from Snuffleupagus/jpeg-stream-find-soi
Browse files Browse the repository at this point in the history
Refactor searching for the SOI marker of inline JPEG image streams
  • Loading branch information
yurydelendik committed Dec 15, 2014
2 parents 20bf84a + 3e1b521 commit bc27774
Show file tree
Hide file tree
Showing 2 changed files with 9 additions and 18 deletions.
16 changes: 0 additions & 16 deletions src/core/parser.js
Original file line number Diff line number Diff line change
Expand Up @@ -372,22 +372,6 @@ var Parser = (function ParserClosure() {
return new LZWStream(stream, maybeLength, earlyChange);
}
if (name === 'DCTDecode' || name === 'DCT') {
// According to the specification: for inline images, the ID operator
// shall be followed by a single whitespace character (unless it uses
// ASCII85Decode or ASCIIHexDecode filters).
// In practice this only seems to be followed for inline JPEG images,
// and generally ignoring the first byte of the stream if it is a
// whitespace char can even *cause* issues (e.g. in the CCITTFaxDecode
// filters used in issue2984.pdf).
// Hence, when the first byte of the stream of an inline JPEG image is
// a whitespace character, we simply skip over it.
if (isCmd(this.buf1, 'ID')) {
var firstByte = stream.peekByte();
if (firstByte === 0x0A /* LF */ || firstByte === 0x0D /* CR */ ||
firstByte === 0x20 /* SPACE */) {
stream.skip();
}
}
xrefStreamStats[StreamType.DCT] = true;
return new JpegStream(stream, maybeLength, stream.dict, this.xref);
}
Expand Down
11 changes: 9 additions & 2 deletions src/core/stream.js
Original file line number Diff line number Diff line change
Expand Up @@ -857,8 +857,15 @@ var PredictorStream = (function PredictorStreamClosure() {
*/
var JpegStream = (function JpegStreamClosure() {
function JpegStream(stream, maybeLength, dict, xref) {
// TODO: per poppler, some images may have 'junk' before the actual image
// data that needs to be removed
// Some images may contain 'junk' before the SOI (start-of-image) marker.
// Note: this seems to mainly affect inline images.
var ch;
while ((ch = stream.getByte()) !== -1) {
if (ch === 0xFF) { // Find the first byte of the SOI marker (0xFFD8).
stream.skip(-1); // Reset the stream position to the SOI.
break;
}
}
this.stream = stream;
this.maybeLength = maybeLength;
this.dict = dict;
Expand Down

0 comments on commit bc27774

Please sign in to comment.