image_pack 0.2.2 → 0.2.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (85) hide show
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +1 -0
  3. data/README.md +23 -4
  4. data/ext/image_pack/extconf.rb +35 -124
  5. data/ext/image_pack/image_pack.c +638 -595
  6. data/ext/image_pack/mozjpeg_sources.rb +178 -0
  7. data/ext/image_pack/vendor/mozjpeg/BUILDING.md +744 -0
  8. data/ext/image_pack/vendor/mozjpeg/CODE_OF_CONDUCT.md +15 -0
  9. data/ext/image_pack/vendor/mozjpeg/ChangeLog.md +1996 -0
  10. data/lib/image_pack/configuration.rb +54 -8
  11. data/lib/image_pack/version.rb +1 -1
  12. data/lib/image_pack.rb +65 -18
  13. metadata +13 -78
  14. data/ext/image_pack/vendor/mozjpeg/README.ijg +0 -258
  15. data/ext/image_pack/vendor/mozjpeg/cdjpeg.c +0 -156
  16. data/ext/image_pack/vendor/mozjpeg/cjpeg.c +0 -961
  17. data/ext/image_pack/vendor/mozjpeg/djpeg.c +0 -855
  18. data/ext/image_pack/vendor/mozjpeg/jaricom.c +0 -157
  19. data/ext/image_pack/vendor/mozjpeg/jcarith.c +0 -972
  20. data/ext/image_pack/vendor/mozjpeg/jcstest.c +0 -126
  21. data/ext/image_pack/vendor/mozjpeg/jdarith.c +0 -782
  22. data/ext/image_pack/vendor/mozjpeg/jdatadst-tj.c +0 -198
  23. data/ext/image_pack/vendor/mozjpeg/jdatasrc-tj.c +0 -194
  24. data/ext/image_pack/vendor/mozjpeg/jpegtran.c +0 -827
  25. data/ext/image_pack/vendor/mozjpeg/jpegyuv.c +0 -172
  26. data/ext/image_pack/vendor/mozjpeg/rdbmp.c +0 -690
  27. data/ext/image_pack/vendor/mozjpeg/rdcolmap.c +0 -253
  28. data/ext/image_pack/vendor/mozjpeg/rdgif.c +0 -720
  29. data/ext/image_pack/vendor/mozjpeg/rdjpeg.c +0 -160
  30. data/ext/image_pack/vendor/mozjpeg/rdjpgcom.c +0 -494
  31. data/ext/image_pack/vendor/mozjpeg/rdpng.c +0 -194
  32. data/ext/image_pack/vendor/mozjpeg/rdppm.c +0 -781
  33. data/ext/image_pack/vendor/mozjpeg/rdswitch.c +0 -642
  34. data/ext/image_pack/vendor/mozjpeg/rdtarga.c +0 -508
  35. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch32/jccolext-neon.c +0 -148
  36. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch32/jchuff-neon.c +0 -334
  37. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch32/jsimd.c +0 -976
  38. data/ext/image_pack/vendor/mozjpeg/simd/i386/jsimd.c +0 -1312
  39. data/ext/image_pack/vendor/mozjpeg/simd/mips/jsimd.c +0 -1143
  40. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jccolext-mmi.c +0 -455
  41. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jccolor-mmi.c +0 -148
  42. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jcgray-mmi.c +0 -132
  43. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jcgryext-mmi.c +0 -374
  44. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jcsample-mmi.c +0 -98
  45. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdcolext-mmi.c +0 -415
  46. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdcolor-mmi.c +0 -139
  47. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdmerge-mmi.c +0 -149
  48. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdmrgext-mmi.c +0 -615
  49. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdsample-mmi.c +0 -304
  50. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jfdctfst-mmi.c +0 -255
  51. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jfdctint-mmi.c +0 -398
  52. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jidctfst-mmi.c +0 -395
  53. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jidctint-mmi.c +0 -571
  54. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jquanti-mmi.c +0 -124
  55. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jsimd.c +0 -866
  56. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jccolext-altivec.c +0 -269
  57. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jccolor-altivec.c +0 -116
  58. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jcgray-altivec.c +0 -111
  59. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jcgryext-altivec.c +0 -228
  60. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jcsample-altivec.c +0 -159
  61. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdcolext-altivec.c +0 -276
  62. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdcolor-altivec.c +0 -106
  63. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdmerge-altivec.c +0 -130
  64. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdmrgext-altivec.c +0 -329
  65. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdsample-altivec.c +0 -400
  66. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jfdctfst-altivec.c +0 -154
  67. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jfdctint-altivec.c +0 -258
  68. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jidctfst-altivec.c +0 -255
  69. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jidctint-altivec.c +0 -357
  70. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jquanti-altivec.c +0 -250
  71. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jsimd.c +0 -884
  72. data/ext/image_pack/vendor/mozjpeg/strtest.c +0 -170
  73. data/ext/image_pack/vendor/mozjpeg/tjbench.c +0 -1044
  74. data/ext/image_pack/vendor/mozjpeg/tjexample.c +0 -406
  75. data/ext/image_pack/vendor/mozjpeg/tjunittest.c +0 -961
  76. data/ext/image_pack/vendor/mozjpeg/tjutil.c +0 -70
  77. data/ext/image_pack/vendor/mozjpeg/transupp.c +0 -2373
  78. data/ext/image_pack/vendor/mozjpeg/turbojpeg-jni.c +0 -1259
  79. data/ext/image_pack/vendor/mozjpeg/turbojpeg.c +0 -2320
  80. data/ext/image_pack/vendor/mozjpeg/wrbmp.c +0 -552
  81. data/ext/image_pack/vendor/mozjpeg/wrgif.c +0 -580
  82. data/ext/image_pack/vendor/mozjpeg/wrjpgcom.c +0 -577
  83. data/ext/image_pack/vendor/mozjpeg/wrppm.c +0 -366
  84. data/ext/image_pack/vendor/mozjpeg/wrtarga.c +0 -258
  85. data/ext/image_pack/vendor/mozjpeg/yuvjpeg.c +0 -268
@@ -0,0 +1,1996 @@
1
+ 2.1.6
2
+ =====
3
+
4
+ ### Significant changes relative to 2.1.5.1:
5
+
6
+ 1. Fixed an oversight in 1.4 beta1[8] that caused various segfaults and buffer
7
+ overruns when attempting to decompress various specially-crafted malformed
8
+ 12-bit-per-component JPEG images using a 12-bit-per-component build of djpeg
9
+ (`-DWITH_12BIT=1`) with both color quantization and RGB565 color conversion
10
+ enabled.
11
+
12
+ 2. Fixed an issue whereby `jpeg_crop_scanline()` sometimes miscalculated the
13
+ downsampled width for components with 4x2 or 2x4 subsampling factors if
14
+ decompression scaling was enabled. This caused the components to be upsampled
15
+ incompletely, which caused the color converter to read from uninitialized
16
+ memory. With 12-bit data precision, this caused a buffer overrun or underrun
17
+ and subsequent segfault if the sample value read from uninitialized memory was
18
+ outside of the valid sample range.
19
+
20
+ 3. Fixed a long-standing issue whereby the `tjTransform()` function, when used
21
+ with the `TJXOP_TRANSPOSE`, `TJXOP_TRANSVERSE`, `TJXOP_ROT90`, or
22
+ `TJXOP_ROT270` transform operation and without automatic JPEG destination
23
+ buffer (re)allocation or lossless cropping, computed the worst-case transformed
24
+ JPEG image size based on the source image dimensions rather than the
25
+ transformed image dimensions. If a calling program allocated the JPEG
26
+ destination buffer based on the transformed image dimensions, as the API
27
+ documentation instructs, and attempted to transform a specially-crafted 4:2:2,
28
+ 4:4:0, or 4:1:1 JPEG source image containing a large amount of metadata, the
29
+ issue caused `tjTransform()` to overflow the JPEG destination buffer rather
30
+ than fail gracefully. The issue could be worked around by setting
31
+ `TJXOPT_COPYNONE`. Note that, irrespective of this issue, `tjTransform()`
32
+ cannot reliably transform JPEG source images that contain a large amount of
33
+ metadata unless automatic JPEG destination buffer (re)allocation is used or
34
+ `TJXOPT_COPYNONE` is set.
35
+
36
+ 4. Fixed an issue that caused the C Huffman encoder (which is not used by
37
+ default on x86 and Arm CPUs) to read from uninitialized memory when attempting
38
+ to transform a specially-crafted malformed arithmetic-coded JPEG source image
39
+ into a baseline Huffman-coded JPEG destination image.
40
+
41
+ 5. Fixed two minor issues in the interblock smoothing algorithm that caused
42
+ mathematical (but not necessarily perceptible) edge block errors when
43
+ decompressing progressive JPEG images exactly two MCU blocks in width or that
44
+ use vertical chrominance subsampling.
45
+
46
+
47
+ 2.1.5.1
48
+ =======
49
+
50
+ ### Significant changes relative to 2.1.5:
51
+
52
+ 1. The SIMD dispatchers in libjpeg-turbo 2.1.4 and prior stored the list of
53
+ supported SIMD instruction sets in a global variable, which caused an innocuous
54
+ race condition whereby the variable could have been initialized multiple times
55
+ if `jpeg_start_*compress()` was called simultaneously in multiple threads.
56
+ libjpeg-turbo 2.1.5 included an undocumented attempt to fix this race condition
57
+ by making the SIMD support variable thread-local. However, that caused another
58
+ issue whereby, if `jpeg_start_*compress()` was called in one thread and
59
+ `jpeg_read_*()` or `jpeg_write_*()` was called in a second thread, the SIMD
60
+ support variable was never initialized in the second thread. On x86 systems,
61
+ this led the second thread to incorrectly assume that AVX2 instructions were
62
+ always available, and when it attempted to use those instructions on older x86
63
+ CPUs that do not support them, an illegal instruction error occurred. The SIMD
64
+ dispatchers now ensure that the SIMD support variable is initialized before
65
+ dispatching based on its value.
66
+
67
+
68
+ 2.1.5
69
+ =====
70
+
71
+ ### Significant changes relative to 2.1.4:
72
+
73
+ 1. Fixed issues in the build system whereby, when using the Ninja Multi-Config
74
+ CMake generator, a static build of libjpeg-turbo (a build in which
75
+ `ENABLE_SHARED` is `0`) could not be installed, a Windows installer could not
76
+ be built, and the Java regression tests failed.
77
+
78
+ 2. Fixed a regression introduced by 2.0 beta1[15] that caused a buffer overrun
79
+ in the progressive Huffman encoder when attempting to transform a
80
+ specially-crafted malformed 12-bit-per-component JPEG image into a progressive
81
+ 12-bit-per-component JPEG image using a 12-bit-per-component build of
82
+ libjpeg-turbo (`-DWITH_12BIT=1`.) Given that the buffer overrun was fully
83
+ contained within the progressive Huffman encoder structure and did not cause a
84
+ segfault or other user-visible errant behavior, given that the lossless
85
+ transformer (unlike the decompressor) is not generally exposed to arbitrary
86
+ data exploits, and given that 12-bit-per-component builds of libjpeg-turbo are
87
+ uncommon, this issue did not likely pose a security risk.
88
+
89
+ 3. Fixed an issue whereby, when using a 12-bit-per-component build of
90
+ libjpeg-turbo (`-DWITH_12BIT=1`), passing samples with values greater than 4095
91
+ or less than 0 to `jpeg_write_scanlines()` caused a buffer overrun or underrun
92
+ in the RGB-to-YCbCr color converter.
93
+
94
+ 4. Fixed a floating point exception that occurred when attempting to use the
95
+ jpegtran `-drop` and `-trim` options to losslessly transform a
96
+ specially-crafted malformed JPEG image.
97
+
98
+ 5. Fixed an issue in `tjBufSizeYUV2()` whereby it returned a bogus result,
99
+ rather than throwing an error, if the `align` parameter was not a power of 2.
100
+ Fixed a similar issue in `tjCompressFromYUV()` whereby it generated a corrupt
101
+ JPEG image in certain cases, rather than throwing an error, if the `align`
102
+ parameter was not a power of 2.
103
+
104
+ 6. Fixed an issue whereby `tjDecompressToYUV2()`, which is a wrapper for
105
+ `tjDecompressToYUVPlanes()`, used the desired YUV image dimensions rather than
106
+ the actual scaled image dimensions when computing the plane pointers and
107
+ strides to pass to `tjDecompressToYUVPlanes()`. This caused a buffer overrun
108
+ and subsequent segfault if the desired image dimensions exceeded the scaled
109
+ image dimensions.
110
+
111
+ 7. Fixed an issue whereby, when decompressing a 12-bit-per-component JPEG image
112
+ (`-DWITH_12BIT=1`) using an alpha-enabled output color space such as
113
+ `JCS_EXT_RGBA`, the alpha channel was set to 255 rather than 4095.
114
+
115
+ 8. Fixed an issue whereby the Java version of TJBench did not accept a range of
116
+ quality values.
117
+
118
+ 9. Fixed an issue whereby, when `-progressive` was passed to TJBench, the JPEG
119
+ input image was not transformed into a progressive JPEG image prior to
120
+ decompression.
121
+
122
+
123
+ 2.1.4
124
+ =====
125
+
126
+ ### Significant changes relative to 2.1.3:
127
+
128
+ 1. Fixed a regression introduced in 2.1.3 that caused build failures with
129
+ Visual Studio 2010.
130
+
131
+ 2. The `tjDecompressHeader3()` function in the TurboJPEG C API and the
132
+ `TJDecompressor.setSourceImage()` method in the TurboJPEG Java API now accept
133
+ "abbreviated table specification" (AKA "tables-only") datastreams, which can be
134
+ used to prime the decompressor with quantization and Huffman tables that can be
135
+ used when decompressing subsequent "abbreviated image" datastreams.
136
+
137
+ 3. libjpeg-turbo now performs run-time detection of AltiVec instructions on
138
+ OS X/PowerPC systems if AltiVec instructions are not enabled at compile time.
139
+ This allows both AltiVec-equipped (PowerPC G4 and G5) and non-AltiVec-equipped
140
+ (PowerPC G3) CPUs to be supported using the same build of libjpeg-turbo.
141
+
142
+ 4. Fixed an error ("Bogus virtual array access") that occurred when attempting
143
+ to decompress a progressive JPEG image with a height less than or equal to one
144
+ iMCU (8 * the vertical sampling factor) using buffered-image mode with
145
+ interblock smoothing enabled. This was a regression introduced by
146
+ 2.1 beta1[6(b)].
147
+
148
+ 5. Fixed two issues that prevented partial image decompression from working
149
+ properly with buffered-image mode:
150
+
151
+ - Attempting to call `jpeg_crop_scanline()` after
152
+ `jpeg_start_decompress()` but before `jpeg_start_output()` resulted in an error
153
+ ("Improper call to JPEG library in state 207".)
154
+ - Attempting to use `jpeg_skip_scanlines()` resulted in an error ("Bogus
155
+ virtual array access") under certain circumstances.
156
+
157
+
158
+ 2.1.3
159
+ =====
160
+
161
+ ### Significant changes relative to 2.1.2:
162
+
163
+ 1. Fixed a regression introduced by 2.0 beta1[7] whereby cjpeg compressed PGM
164
+ input files into full-color JPEG images unless the `-grayscale` option was
165
+ used.
166
+
167
+ 2. cjpeg now automatically compresses GIF and 8-bit BMP input files into
168
+ grayscale JPEG images if the input files contain only shades of gray.
169
+
170
+ 3. The build system now enables the intrinsics implementation of the AArch64
171
+ (Arm 64-bit) Neon SIMD extensions by default when using GCC 12 or later.
172
+
173
+ 4. Fixed a segfault that occurred while decompressing a 4:2:0 JPEG image using
174
+ the merged (non-fancy) upsampling algorithms (that is, with
175
+ `cinfo.do_fancy_upsampling` set to `FALSE`) along with `jpeg_crop_scanline()`.
176
+ Specifically, the segfault occurred if the number of bytes remaining in the
177
+ output buffer was less than the number of bytes required to represent one
178
+ uncropped scanline of the output image. For that reason, the issue could only
179
+ be reproduced using the libjpeg API, not using djpeg.
180
+
181
+
182
+ 2.1.2
183
+ =====
184
+
185
+ ### Significant changes relative to 2.1.1:
186
+
187
+ 1. Fixed a regression introduced by 2.1 beta1[13] that caused the remaining
188
+ GAS implementations of AArch64 (Arm 64-bit) Neon SIMD functions (which are used
189
+ by default with GCC for performance reasons) to be placed in the `.rodata`
190
+ section rather than in the `.text` section. This caused the GNU linker to
191
+ automatically place the `.rodata` section in an executable segment, which
192
+ prevented libjpeg-turbo from working properly with other linkers and also
193
+ represented a potential security risk.
194
+
195
+ 2. Fixed an issue whereby the `tjTransform()` function incorrectly computed the
196
+ MCU block size for 4:4:4 JPEG images with non-unary sampling factors and thus
197
+ unduly rejected some cropping regions, even though those regions aligned with
198
+ 8x8 MCU block boundaries.
199
+
200
+ 3. Fixed a regression introduced by 2.1 beta1[13] that caused the build system
201
+ to enable the Arm Neon SIMD extensions when targeting Armv6 and other legacy
202
+ architectures that do not support Neon instructions.
203
+
204
+ 4. libjpeg-turbo now performs run-time detection of AltiVec instructions on
205
+ FreeBSD/PowerPC systems if AltiVec instructions are not enabled at compile
206
+ time. This allows both AltiVec-equipped and non-AltiVec-equipped CPUs to be
207
+ supported using the same build of libjpeg-turbo.
208
+
209
+ 5. cjpeg now accepts a `-strict` argument similar to that of djpeg and
210
+ jpegtran, which causes the compressor to abort if an LZW-compressed GIF input
211
+ image contains incomplete or corrupt image data.
212
+
213
+
214
+ 2.1.1
215
+ =====
216
+
217
+ ### Significant changes relative to 2.1.0:
218
+
219
+ 1. Fixed a regression introduced in 2.1.0 that caused build failures with
220
+ non-GCC-compatible compilers for Un*x/Arm platforms.
221
+
222
+ 2. Fixed a regression introduced by 2.1 beta1[13] that prevented the Arm 32-bit
223
+ (AArch32) Neon SIMD extensions from building unless the C compiler flags
224
+ included `-mfloat-abi=softfp` or `-mfloat-abi=hard`.
225
+
226
+ 3. Fixed an issue in the AArch32 Neon SIMD Huffman encoder whereby reliance on
227
+ undefined C compiler behavior led to crashes ("SIGBUS: illegal alignment") on
228
+ Android systems when running AArch32/Thumb builds of libjpeg-turbo built with
229
+ recent versions of Clang.
230
+
231
+ 4. Added a command-line argument (`-copy icc`) to jpegtran that causes it to
232
+ copy only the ICC profile markers from the source file and discard any other
233
+ metadata.
234
+
235
+ 5. libjpeg-turbo should now build and run on CHERI-enabled architectures, which
236
+ use capability pointers that are larger than the size of `size_t`.
237
+
238
+ 6. Fixed a regression (CVE-2021-37972) introduced by 2.1 beta1[5] that caused a
239
+ segfault in the 64-bit SSE2 Huffman encoder when attempting to losslessly
240
+ transform a specially-crafted malformed JPEG image.
241
+
242
+
243
+ 2.1.0
244
+ =====
245
+
246
+ ### Significant changes relative to 2.1 beta1:
247
+
248
+ 1. Fixed a regression (CVE-2021-29390) introduced by 2.1 beta1[6(b)] whereby
249
+ attempting to decompress certain progressive JPEG images with one or more
250
+ component planes of width 8 or less caused a buffer overrun.
251
+
252
+ 2. Fixed a regression introduced by 2.1 beta1[6(b)] whereby attempting to
253
+ decompress a specially-crafted malformed progressive JPEG image caused the
254
+ block smoothing algorithm to read from uninitialized memory.
255
+
256
+ 3. Fixed an issue in the Arm Neon SIMD Huffman encoders that caused the
257
+ encoders to generate incorrect results when using the Clang compiler with
258
+ Visual Studio.
259
+
260
+ 4. Fixed a floating point exception (CVE-2021-20205) that occurred when
261
+ attempting to compress a specially-crafted malformed GIF image with a specified
262
+ image width of 0 using cjpeg.
263
+
264
+ 5. Fixed a regression introduced by 2.0 beta1[15] whereby attempting to
265
+ generate a progressive JPEG image on an SSE2-capable CPU using a scan script
266
+ containing one or more scans with lengths divisible by 32 and non-zero
267
+ successive approximation low bit positions would, under certain circumstances,
268
+ result in an error ("Missing Huffman code table entry") and an invalid JPEG
269
+ image.
270
+
271
+ 6. Introduced a new flag (`TJFLAG_LIMITSCANS` in the TurboJPEG C API and
272
+ `TJ.FLAG_LIMIT_SCANS` in the TurboJPEG Java API) and a corresponding TJBench
273
+ command-line argument (`-limitscans`) that causes the TurboJPEG decompression
274
+ and transform functions/operations to return/throw an error if a progressive
275
+ JPEG image contains an unreasonably large number of scans. This allows
276
+ applications that use the TurboJPEG API to guard against an exploit of the
277
+ progressive JPEG format described in the report
278
+ ["Two Issues with the JPEG Standard"](https://libjpeg-turbo.org/pmwiki/uploads/About/TwoIssueswiththeJPEGStandard.pdf).
279
+
280
+ 7. The PPM reader now throws an error, rather than segfaulting (due to a buffer
281
+ overrun, CVE-2021-46822) or generating incorrect pixels, if an application
282
+ attempts to use the `tjLoadImage()` function to load a 16-bit binary PPM file
283
+ (a binary PPM file with a maximum value greater than 255) into a grayscale
284
+ image buffer or to load a 16-bit binary PGM file into an RGB image buffer.
285
+
286
+ 8. Fixed an issue in the PPM reader that caused incorrect pixels to be
287
+ generated when using the `tjLoadImage()` function to load a 16-bit binary PPM
288
+ file into an extended RGB image buffer.
289
+
290
+ 9. Fixed an issue whereby, if a JPEG buffer was automatically re-allocated by
291
+ one of the TurboJPEG compression or transform functions and an error
292
+ subsequently occurred during compression or transformation, the JPEG buffer
293
+ pointer passed by the application was not updated when the function returned.
294
+
295
+
296
+ 2.0.90 (2.1 beta1)
297
+ ==================
298
+
299
+ ### Significant changes relative to 2.0.6:
300
+
301
+ 1. The build system, x86-64 SIMD extensions, and accelerated Huffman codec now
302
+ support the x32 ABI on Linux, which allows for using x86-64 instructions with
303
+ 32-bit pointers. The x32 ABI is generally enabled by adding `-mx32` to the
304
+ compiler flags.
305
+
306
+ Caveats:
307
+ - CMake 3.9.0 or later is required in order for the build system to
308
+ automatically detect an x32 build.
309
+ - Java does not support the x32 ABI, and thus the TurboJPEG Java API will
310
+ automatically be disabled with x32 builds.
311
+
312
+ 2. Added Loongson MMI SIMD implementations of the RGB-to-grayscale, 4:2:2 fancy
313
+ chroma upsampling, 4:2:2 and 4:2:0 merged chroma upsampling/color conversion,
314
+ and fast integer DCT/IDCT algorithms. Relative to libjpeg-turbo 2.0.x, this
315
+ speeds up:
316
+
317
+ - the compression of RGB source images into grayscale JPEG images by
318
+ approximately 20%
319
+ - the decompression of 4:2:2 JPEG images by approximately 40-60% when
320
+ using fancy upsampling
321
+ - the decompression of 4:2:2 and 4:2:0 JPEG images by approximately
322
+ 15-20% when using merged upsampling
323
+ - the compression of RGB source images by approximately 30-45% when using
324
+ the fast integer DCT
325
+ - the decompression of JPEG images into RGB destination images by
326
+ approximately 2x when using the fast integer IDCT
327
+
328
+ The overall decompression speedup for RGB images is now approximately
329
+ 2.3-3.7x (compared to 2-3.5x with libjpeg-turbo 2.0.x.)
330
+
331
+ 3. 32-bit (Armv7 or Armv7s) iOS builds of libjpeg-turbo are no longer
332
+ supported, and the libjpeg-turbo build system can no longer be used to package
333
+ such builds. 32-bit iOS apps cannot run in iOS 11 and later, and the App Store
334
+ no longer allows them.
335
+
336
+ 4. 32-bit (i386) OS X/macOS builds of libjpeg-turbo are no longer supported,
337
+ and the libjpeg-turbo build system can no longer be used to package such
338
+ builds. 32-bit Mac applications cannot run in macOS 10.15 "Catalina" and
339
+ later, and the App Store no longer allows them.
340
+
341
+ 5. The SSE2 (x86 SIMD) and C Huffman encoding algorithms have been
342
+ significantly optimized, resulting in a measured average overall compression
343
+ speedup of 12-28% for 64-bit code and 22-52% for 32-bit code on various Intel
344
+ and AMD CPUs, as well as a measured average overall compression speedup of
345
+ 0-23% on platforms that do not have a SIMD-accelerated Huffman encoding
346
+ implementation.
347
+
348
+ 6. The block smoothing algorithm that is applied by default when decompressing
349
+ progressive Huffman-encoded JPEG images has been improved in the following
350
+ ways:
351
+
352
+ - The algorithm is now more fault-tolerant. Previously, if a particular
353
+ scan was incomplete, then the smoothing parameters for the incomplete scan
354
+ would be applied to the entire output image, including the parts of the image
355
+ that were generated by the prior (complete) scan. Visually, this had the
356
+ effect of removing block smoothing from lower-frequency scans if they were
357
+ followed by an incomplete higher-frequency scan. libjpeg-turbo now applies
358
+ block smoothing parameters to each iMCU row based on which scan generated the
359
+ pixels in that row, rather than always using the block smoothing parameters for
360
+ the most recent scan.
361
+ - When applying block smoothing to DC scans, a Gaussian-like kernel with a
362
+ 5x5 window is used to reduce the "blocky" appearance.
363
+
364
+ 7. Added SIMD acceleration for progressive Huffman encoding on Arm platforms.
365
+ This speeds up the compression of full-color progressive JPEGs by about 30-40%
366
+ on average (relative to libjpeg-turbo 2.0.x) when using modern Arm CPUs.
367
+
368
+ 8. Added configure-time and run-time auto-detection of Loongson MMI SIMD
369
+ instructions, so that the Loongson MMI SIMD extensions can be included in any
370
+ MIPS64 libjpeg-turbo build.
371
+
372
+ 9. Added fault tolerance features to djpeg and jpegtran, mainly to demonstrate
373
+ methods by which applications can guard against the exploits of the JPEG format
374
+ described in the report
375
+ ["Two Issues with the JPEG Standard"](https://libjpeg-turbo.org/pmwiki/uploads/About/TwoIssueswiththeJPEGStandard.pdf).
376
+
377
+ - Both programs now accept a `-maxscans` argument, which can be used to
378
+ limit the number of allowable scans in the input file.
379
+ - Both programs now accept a `-strict` argument, which can be used to
380
+ treat all warnings as fatal.
381
+
382
+ 10. CMake package config files are now included for both the libjpeg and
383
+ TurboJPEG API libraries. This facilitates using libjpeg-turbo with CMake's
384
+ `find_package()` function. For example:
385
+
386
+ find_package(libjpeg-turbo CONFIG REQUIRED)
387
+
388
+ add_executable(libjpeg_program libjpeg_program.c)
389
+ target_link_libraries(libjpeg_program PUBLIC libjpeg-turbo::jpeg)
390
+
391
+ add_executable(libjpeg_program_static libjpeg_program.c)
392
+ target_link_libraries(libjpeg_program_static PUBLIC
393
+ libjpeg-turbo::jpeg-static)
394
+
395
+ add_executable(turbojpeg_program turbojpeg_program.c)
396
+ target_link_libraries(turbojpeg_program PUBLIC
397
+ libjpeg-turbo::turbojpeg)
398
+
399
+ add_executable(turbojpeg_program_static turbojpeg_program.c)
400
+ target_link_libraries(turbojpeg_program_static PUBLIC
401
+ libjpeg-turbo::turbojpeg-static)
402
+
403
+ 11. Since the Unisys LZW patent has long expired, cjpeg and djpeg can now
404
+ read/write both LZW-compressed and uncompressed GIF files (feature ported from
405
+ jpeg-6a and jpeg-9d.)
406
+
407
+ 12. jpegtran now includes the `-wipe` and `-drop` options from jpeg-9a and
408
+ jpeg-9d, as well as the ability to expand the image size using the `-crop`
409
+ option. Refer to jpegtran.1 or usage.txt for more details.
410
+
411
+ 13. Added a complete intrinsics implementation of the Arm Neon SIMD extensions,
412
+ thus providing SIMD acceleration on Arm platforms for all of the algorithms
413
+ that are SIMD-accelerated on x86 platforms. This new implementation is
414
+ significantly faster in some cases than the old GAS implementation--
415
+ depending on the algorithms used, the type of CPU core, and the compiler. GCC,
416
+ as of this writing, does not provide a full or optimal set of Neon intrinsics,
417
+ so for performance reasons, the default when building libjpeg-turbo with GCC is
418
+ to continue using the GAS implementation of the following algorithms:
419
+
420
+ - 32-bit RGB-to-YCbCr color conversion
421
+ - 32-bit fast and accurate inverse DCT
422
+ - 64-bit RGB-to-YCbCr and YCbCr-to-RGB color conversion
423
+ - 64-bit accurate forward and inverse DCT
424
+ - 64-bit Huffman encoding
425
+
426
+ A new CMake variable (`NEON_INTRINSICS`) can be used to override this
427
+ default.
428
+
429
+ Since the new intrinsics implementation includes SIMD acceleration
430
+ for merged upsampling/color conversion, 1.5.1[5] is no longer necessary and has
431
+ been reverted.
432
+
433
+ 14. The Arm Neon SIMD extensions can now be built using Visual Studio.
434
+
435
+ 15. The build system can now be used to generate a universal x86-64 + Armv8
436
+ libjpeg-turbo SDK package for both iOS and macOS.
437
+
438
+
439
+ 2.0.6
440
+ =====
441
+
442
+ ### Significant changes relative to 2.0.5:
443
+
444
+ 1. Fixed "using JNI after critical get" errors that occurred on Android
445
+ platforms when using any of the YUV encoding/compression/decompression/decoding
446
+ methods in the TurboJPEG Java API.
447
+
448
+ 2. Fixed or worked around multiple issues with `jpeg_skip_scanlines()`:
449
+
450
+ - Fixed segfaults (CVE-2020-35538) or "Corrupt JPEG data: premature end of
451
+ data segment" errors in `jpeg_skip_scanlines()` that occurred when
452
+ decompressing 4:2:2 or 4:2:0 JPEG images using merged (non-fancy)
453
+ upsampling/color conversion (that is, when setting `cinfo.do_fancy_upsampling`
454
+ to `FALSE`.) 2.0.0[6] was a similar fix, but it did not cover all cases.
455
+ - `jpeg_skip_scanlines()` now throws an error if two-pass color
456
+ quantization is enabled. Two-pass color quantization never worked properly
457
+ with `jpeg_skip_scanlines()`, and the issues could not readily be fixed.
458
+ - Fixed an issue whereby `jpeg_skip_scanlines()` always returned 0 when
459
+ skipping past the end of an image.
460
+
461
+ 3. The Arm 64-bit (Armv8) Neon SIMD extensions can now be built using MinGW
462
+ toolchains targeting Arm64 (AArch64) Windows binaries.
463
+
464
+ 4. Fixed unexpected visual artifacts that occurred when using
465
+ `jpeg_crop_scanline()` and interblock smoothing while decompressing only the DC
466
+ scan of a progressive JPEG image.
467
+
468
+ 5. Fixed an issue whereby libjpeg-turbo would not build if 12-bit-per-component
469
+ JPEG support (`WITH_12BIT`) was enabled along with libjpeg v7 or libjpeg v8
470
+ API/ABI emulation (`WITH_JPEG7` or `WITH_JPEG8`.)
471
+
472
+
473
+ 2.0.5
474
+ =====
475
+
476
+ ### Significant changes relative to 2.0.4:
477
+
478
+ 1. Worked around issues in the MIPS DSPr2 SIMD extensions that caused failures
479
+ in the libjpeg-turbo regression tests. Specifically, the
480
+ `jsimd_h2v1_downsample_dspr2()` and `jsimd_h2v2_downsample_dspr2()` functions
481
+ in the MIPS DSPr2 SIMD extensions are now disabled until/unless they can be
482
+ fixed, and other functions that are incompatible with big endian MIPS CPUs are
483
+ disabled when building libjpeg-turbo for such CPUs.
484
+
485
+ 2. Fixed an oversight in the `TJCompressor.compress(int)` method in the
486
+ TurboJPEG Java API that caused an error ("java.lang.IllegalStateException: No
487
+ source image is associated with this instance") when attempting to use that
488
+ method to compress a YUV image.
489
+
490
+ 3. Fixed an issue (CVE-2020-13790) in the PPM reader that caused a buffer
491
+ overrun in cjpeg, TJBench, or the `tjLoadImage()` function if one of the values
492
+ in a binary PPM/PGM input file exceeded the maximum value defined in the file's
493
+ header and that maximum value was less than 255. libjpeg-turbo 1.5.0 already
494
+ included a similar fix for binary PPM/PGM files with maximum values greater
495
+ than 255.
496
+
497
+ 4. The TurboJPEG API library's global error handler, which is used in functions
498
+ such as `tjBufSize()` and `tjLoadImage()` that do not require a TurboJPEG
499
+ instance handle, is now thread-safe on platforms that support thread-local
500
+ storage.
501
+
502
+
503
+ 2.0.4
504
+ =====
505
+
506
+ ### Significant changes relative to 2.0.3:
507
+
508
+ 1. Fixed a regression in the Windows packaging system (introduced by
509
+ 2.0 beta1[2]) whereby, if both the 64-bit libjpeg-turbo SDK for GCC and the
510
+ 64-bit libjpeg-turbo SDK for Visual C++ were installed on the same system, only
511
+ one of them could be uninstalled.
512
+
513
+ 2. Fixed a signed integer overflow and subsequent segfault that occurred when
514
+ attempting to decompress images with more than 715827882 pixels using the
515
+ 64-bit C version of TJBench.
516
+
517
+ 3. Fixed an out-of-bounds write in `tjDecompressToYUV2()` and
518
+ `tjDecompressToYUVPlanes()` (sometimes manifesting as a double free) that
519
+ occurred when attempting to decompress grayscale JPEG images that were
520
+ compressed with a sampling factor other than 1 (for instance, with
521
+ `cjpeg -grayscale -sample 2x2`).
522
+
523
+ 4. Fixed a regression introduced by 2.0.2[5] that caused the TurboJPEG API to
524
+ incorrectly identify some JPEG images with unusual sampling factors as 4:4:4
525
+ JPEG images. This was known to cause a buffer overflow when attempting to
526
+ decompress some such images using `tjDecompressToYUV2()` or
527
+ `tjDecompressToYUVPlanes()`.
528
+
529
+ 5. Fixed an issue (CVE-2020-17541), detected by ASan, whereby attempting to
530
+ losslessly transform a specially-crafted malformed JPEG image containing an
531
+ extremely-high-frequency coefficient block (junk image data that could never be
532
+ generated by a legitimate JPEG compressor) could cause the Huffman encoder's
533
+ local buffer to be overrun. (Refer to 1.4.0[9] and 1.4beta1[15].) Given that
534
+ the buffer overrun was fully contained within the stack and did not cause a
535
+ segfault or other user-visible errant behavior, and given that the lossless
536
+ transformer (unlike the decompressor) is not generally exposed to arbitrary
537
+ data exploits, this issue did not likely pose a security risk.
538
+
539
+ 6. The Arm 64-bit (Armv8) Neon SIMD assembly code now stores constants in a
540
+ separate read-only data section rather than in the text section, to support
541
+ execute-only memory layouts.
542
+
543
+
544
+ 2.0.3
545
+ =====
546
+
547
+ ### Significant changes relative to 2.0.2:
548
+
549
+ 1. Fixed "using JNI after critical get" errors that occurred on Android
550
+ platforms when passing invalid arguments to certain methods in the TurboJPEG
551
+ Java API.
552
+
553
+ 2. Fixed a regression in the SIMD feature detection code, introduced by
554
+ the AVX2 SIMD extensions (2.0 beta1[1]), that was known to cause an illegal
555
+ instruction exception, in rare cases, on CPUs that lack support for CPUID leaf
556
+ 07H (or on which the maximum CPUID leaf has been limited by way of a BIOS
557
+ setting.)
558
+
559
+ 3. The 4:4:0 (h1v2) fancy (smooth) chroma upsampling algorithm in the
560
+ decompressor now uses a similar bias pattern to that of the 4:2:2 (h2v1) fancy
561
+ chroma upsampling algorithm, rounding up or down the upsampled result for
562
+ alternate pixels rather than always rounding down. This ensures that,
563
+ regardless of whether a 4:2:2 JPEG image is rotated or transposed prior to
564
+ decompression (in the frequency domain) or after decompression (in the spatial
565
+ domain), the final image will be similar.
566
+
567
+ 4. Fixed an integer overflow and subsequent segfault that occurred when
568
+ attempting to compress or decompress images with more than 1 billion pixels
569
+ using the TurboJPEG API.
570
+
571
+ 5. Fixed a regression introduced by 2.0 beta1[15] whereby attempting to
572
+ generate a progressive JPEG image on an SSE2-capable CPU using a scan script
573
+ containing one or more scans with lengths divisible by 16 would result in an
574
+ error ("Missing Huffman code table entry") and an invalid JPEG image.
575
+
576
+ 6. Fixed an issue whereby `tjDecodeYUV()` and `tjDecodeYUVPlanes()` would throw
577
+ an error ("Invalid progressive parameters") or a warning ("Inconsistent
578
+ progression sequence") if passed a TurboJPEG instance that was previously used
579
+ to decompress a progressive JPEG image.
580
+
581
+
582
+ 2.0.2
583
+ =====
584
+
585
+ ### Significant changes relative to 2.0.1:
586
+
587
+ 1. Fixed a regression introduced by 2.0.1[5] that prevented a runtime search
588
+ path (rpath) from being embedded in the libjpeg-turbo shared libraries and
589
+ executables for macOS and iOS. This caused a fatal error of the form
590
+ "dyld: Library not loaded" when attempting to use one of the executables,
591
+ unless `DYLD_LIBRARY_PATH` was explicitly set to the location of the
592
+ libjpeg-turbo shared libraries.
593
+
594
+ 2. Fixed an integer overflow and subsequent segfault (CVE-2018-20330) that
595
+ occurred when attempting to load a BMP file with more than 1 billion pixels
596
+ using the `tjLoadImage()` function.
597
+
598
+ 3. Fixed a buffer overrun (CVE-2018-19664) that occurred when attempting to
599
+ decompress a specially-crafted malformed JPEG image to a 256-color BMP using
600
+ djpeg.
601
+
602
+ 4. Fixed a floating point exception that occurred when attempting to
603
+ decompress a specially-crafted malformed JPEG image with a specified image
604
+ width or height of 0 using the C version of TJBench.
605
+
606
+ 5. The TurboJPEG API will now decompress 4:4:4 JPEG images with 2x1, 1x2, 3x1,
607
+ or 1x3 luminance and chrominance sampling factors. This is a non-standard way
608
+ of specifying 1x subsampling (normally 4:4:4 JPEGs have 1x1 luminance and
609
+ chrominance sampling factors), but the JPEG format and the libjpeg API both
610
+ allow it.
611
+
612
+ 6. Fixed a regression introduced by 2.0 beta1[7] that caused djpeg to generate
613
+ incorrect PPM images when used with the `-colors` option.
614
+
615
+ 7. Fixed an issue whereby a static build of libjpeg-turbo (a build in which
616
+ `ENABLE_SHARED` is `0`) could not be installed using the Visual Studio IDE.
617
+
618
+ 8. Fixed a severe performance issue in the Loongson MMI SIMD extensions that
619
+ occurred when compressing RGB images whose image rows were not 64-bit-aligned.
620
+
621
+
622
+ 2.0.1
623
+ =====
624
+
625
+ ### Significant changes relative to 2.0.0:
626
+
627
+ 1. Fixed a regression introduced with the new CMake-based Un*x build system,
628
+ whereby jconfig.h could cause compiler warnings of the form
629
+ `"HAVE_*_H" redefined` if it was included by downstream Autotools-based
630
+ projects that used `AC_CHECK_HEADERS()` to check for the existence of locale.h,
631
+ stddef.h, or stdlib.h.
632
+
633
+ 2. The `jsimd_quantize_float_dspr2()` and `jsimd_convsamp_float_dspr2()`
634
+ functions in the MIPS DSPr2 SIMD extensions are now disabled at compile time
635
+ if the soft float ABI is enabled. Those functions use instructions that are
636
+ incompatible with the soft float ABI.
637
+
638
+ 3. Fixed a regression in the SIMD feature detection code, introduced by
639
+ the AVX2 SIMD extensions (2.0 beta1[1]), that caused libjpeg-turbo to crash on
640
+ Windows 7 if Service Pack 1 was not installed.
641
+
642
+ 4. Fixed an out-of-bounds read in cjpeg that occurred when attempting to compress
643
+ a specially-crafted malformed color-index (8-bit-per-sample) Targa file in
644
+ which some of the samples (color indices) exceeded the bounds of the Targa
645
+ file's color table.
646
+
647
+ 5. Fixed an issue whereby installing a fully static build of libjpeg-turbo
648
+ (a build in which `CFLAGS` contains `-static` and `ENABLE_SHARED` is `0`) would
649
+ fail with "No valid ELF RPATH or RUNPATH entry exists in the file."
650
+
651
+
652
+ 2.0.0
653
+ =====
654
+
655
+ ### Significant changes relative to 2.0 beta1:
656
+
657
+ 1. The TurboJPEG API can now decompress CMYK JPEG images that have subsampled M
658
+ and Y components (not to be confused with YCCK JPEG images, in which the C/M/Y
659
+ components have been transformed into luma and chroma.) Previously, an error
660
+ was generated ("Could not determine subsampling type for JPEG image") when such
661
+ an image was passed to `tjDecompressHeader3()`, `tjTransform()`,
662
+ `tjDecompressToYUVPlanes()`, `tjDecompressToYUV2()`, or the equivalent Java
663
+ methods.
664
+
665
+ 2. Fixed an issue (CVE-2018-11813) whereby a specially-crafted malformed input
666
+ file (specifically, a file with a valid Targa header but incomplete pixel data)
667
+ would cause cjpeg to generate a JPEG file that was potentially thousands of
668
+ times larger than the input file. The Targa reader in cjpeg was not properly
669
+ detecting that the end of the input file had been reached prematurely, so after
670
+ all valid pixels had been read from the input, the reader injected dummy pixels
671
+ with values of 255 into the JPEG compressor until the number of pixels
672
+ specified in the Targa header had been compressed. The Targa reader in cjpeg
673
+ now behaves like the PPM reader and aborts compression if the end of the input
674
+ file is reached prematurely. Because this issue only affected cjpeg and not
675
+ the underlying library, and because it did not involve any out-of-bounds reads
676
+ or other exploitable behaviors, it was not believed to represent a security
677
+ threat.
678
+
679
+ 3. Fixed an issue whereby the `tjLoadImage()` and `tjSaveImage()` functions
680
+ would produce a "Bogus message code" error message if the underlying bitmap and
681
+ PPM readers/writers threw an error that was specific to the readers/writers
682
+ (as opposed to a general libjpeg API error.)
683
+
684
+ 4. Fixed an issue (CVE-2018-1152) whereby a specially-crafted malformed BMP
685
+ file, one in which the header specified an image width of 1073741824 pixels,
686
+ would trigger a floating point exception (division by zero) in the
687
+ `tjLoadImage()` function when attempting to load the BMP file into a
688
+ 4-component image buffer.
689
+
690
+ 5. Fixed an issue whereby certain combinations of calls to
691
+ `jpeg_skip_scanlines()` and `jpeg_read_scanlines()` could trigger an infinite
692
+ loop when decompressing progressive JPEG images that use vertical chroma
693
+ subsampling (for instance, 4:2:0 or 4:4:0.)
694
+
695
+ 6. Fixed a segfault in `jpeg_skip_scanlines()` that occurred when decompressing
696
+ a 4:2:2 or 4:2:0 JPEG image using the merged (non-fancy) upsampling algorithms
697
+ (that is, when setting `cinfo.do_fancy_upsampling` to `FALSE`.)
698
+
699
+ 7. The new CMake-based build system will now disable the MIPS DSPr2 SIMD
700
+ extensions if it detects that the compiler does not support DSPr2 instructions.
701
+
702
+ 8. Fixed an out-of-bounds read in cjpeg (CVE-2018-14498) that occurred when
703
+ attempting to compress a specially-crafted malformed color-index
704
+ (8-bit-per-sample) BMP file in which some of the samples (color indices)
705
+ exceeded the bounds of the BMP file's color table.
706
+
707
+ 9. Fixed a signed integer overflow in the progressive Huffman decoder, detected
708
+ by the Clang and GCC undefined behavior sanitizers, that could be triggered by
709
+ attempting to decompress a specially-crafted malformed JPEG image. This issue
710
+ did not pose a security threat, but removing the warning made it easier to
711
+ detect actual security issues, should they arise in the future.
712
+
713
+
714
+ 1.5.90 (2.0 beta1)
715
+ ==================
716
+
717
+ ### Significant changes relative to 1.5.3:
718
+
719
+ 1. Added AVX2 SIMD implementations of the colorspace conversion, chroma
720
+ downsampling and upsampling, integer quantization and sample conversion, and
721
+ accurate integer DCT/IDCT algorithms. When using the accurate integer DCT/IDCT
722
+ algorithms on AVX2-equipped CPUs, the compression of RGB images is
723
+ approximately 13-36% (avg. 22%) faster (relative to libjpeg-turbo 1.5.x) with
724
+ 64-bit code and 11-21% (avg. 17%) faster with 32-bit code, and the
725
+ decompression of RGB images is approximately 9-35% (avg. 17%) faster with
726
+ 64-bit code and 7-17% (avg. 12%) faster with 32-bit code. (As tested on a
727
+ 3 GHz Intel Core i7. Actual mileage may vary.)
728
+
729
+ 2. Overhauled the build system to use CMake on all platforms, and removed the
730
+ autotools-based build system. This decision resulted from extensive
731
+ discussions within the libjpeg-turbo community. libjpeg-turbo traditionally
732
+ used CMake only for Windows builds, but there was an increasing amount of
733
+ demand to extend CMake support to other platforms. However, because of the
734
+ unique nature of our code base (the need to support different assemblers on
735
+ each platform, the need for Java support, etc.), providing dual build systems
736
+ as other OSS imaging libraries do (including libpng and libtiff) would have
737
+ created a maintenance burden. The use of CMake greatly simplifies some aspects
738
+ of our build system, owing to CMake's built-in support for various assemblers,
739
+ Java, and unit testing, as well as generally fewer quirks that have to be
740
+ worked around in order to implement our packaging system. Eliminating
741
+ autotools puts our project slightly at odds with the traditional practices of
742
+ the OSS community, since most "system libraries" tend to be built with
743
+ autotools, but it is believed that the benefits of this move outweigh the
744
+ risks. In addition to providing a unified build environment, switching to
745
+ CMake allows for the use of various build tools and IDEs that aren't supported
746
+ under autotools, including Xcode, Ninja, and Eclipse. It also eliminates the
747
+ need to install autotools via MacPorts/Homebrew on OS X and allows
748
+ libjpeg-turbo to be configured without the use of a terminal/command prompt.
749
+ Extensive testing was conducted to ensure that all features provided by the
750
+ autotools-based build system are provided by the new build system.
751
+
752
+ 3. The libjpeg API in this version of libjpeg-turbo now includes two additional
753
+ functions, `jpeg_read_icc_profile()` and `jpeg_write_icc_profile()`, that can
754
+ be used to extract ICC profile data from a JPEG file while decompressing or to
755
+ embed ICC profile data in a JPEG file while compressing or transforming. This
756
+ eliminates the need for downstream projects, such as color management libraries
757
+ and browsers, to include their own glueware for accomplishing this.
758
+
759
+ 4. Improved error handling in the TurboJPEG API library:
760
+
761
+ - Introduced a new function (`tjGetErrorStr2()`) in the TurboJPEG C API
762
+ that allows compression/decompression/transform error messages to be retrieved
763
+ in a thread-safe manner. Retrieving error messages from global functions, such
764
+ as `tjInitCompress()` or `tjBufSize()`, is still thread-unsafe, but since those
765
+ functions will only throw errors if passed an invalid argument or if a memory
766
+ allocation failure occurs, thread safety is not as much of a concern.
767
+ - Introduced a new function (`tjGetErrorCode()`) in the TurboJPEG C API
768
+ and a new method (`TJException.getErrorCode()`) in the TurboJPEG Java API that
769
+ can be used to determine the severity of the last
770
+ compression/decompression/transform error. This allows applications to
771
+ choose whether to ignore warnings (non-fatal errors) from the underlying
772
+ libjpeg API or to treat them as fatal.
773
+ - Introduced a new flag (`TJFLAG_STOPONWARNING` in the TurboJPEG C API and
774
+ `TJ.FLAG_STOPONWARNING` in the TurboJPEG Java API) that causes the library to
775
+ immediately halt a compression/decompression/transform operation if it
776
+ encounters a warning from the underlying libjpeg API (the default behavior is
777
+ to allow the operation to complete unless a fatal error is encountered.)
778
+
779
+ 5. Introduced a new flag in the TurboJPEG C and Java APIs (`TJFLAG_PROGRESSIVE`
780
+ and `TJ.FLAG_PROGRESSIVE`, respectively) that causes the library to use
781
+ progressive entropy coding in JPEG images generated by compression and
782
+ transform operations. Additionally, a new transform option
783
+ (`TJXOPT_PROGRESSIVE` in the C API and `TJTransform.OPT_PROGRESSIVE` in the
784
+ Java API) has been introduced, allowing progressive entropy coding to be
785
+ enabled for selected transforms in a multi-transform operation.
786
+
787
+ 6. Introduced a new transform option in the TurboJPEG API (`TJXOPT_COPYNONE` in
788
+ the C API and `TJTransform.OPT_COPYNONE` in the Java API) that allows the
789
+ copying of markers (including EXIF and ICC profile data) to be disabled for a
790
+ particular transform.
791
+
792
+ 7. Added two functions to the TurboJPEG C API (`tjLoadImage()` and
793
+ `tjSaveImage()`) that can be used to load/save a BMP or PPM/PGM image to/from a
794
+ memory buffer with a specified pixel format and layout. These functions
795
+ replace the project-private (and slow) bmp API, which was previously used by
796
+ TJBench, and they also provide a convenient way for first-time users of
797
+ libjpeg-turbo to quickly develop a complete JPEG compression/decompression
798
+ program.
799
+
800
+ 8. The TurboJPEG C API now includes a new convenience array (`tjAlphaOffset[]`)
801
+ that contains the alpha component index for each pixel format (or -1 if the
802
+ pixel format lacks an alpha component.) The TurboJPEG Java API now includes a
803
+ new method (`TJ.getAlphaOffset()`) that returns the same value. In addition,
804
+ the `tjRedOffset[]`, `tjGreenOffset[]`, and `tjBlueOffset[]` arrays-- and the
805
+ corresponding `TJ.getRedOffset()`, `TJ.getGreenOffset()`, and
806
+ `TJ.getBlueOffset()` methods-- now return -1 for `TJPF_GRAY`/`TJ.PF_GRAY`
807
+ rather than 0. This allows programs to easily determine whether a pixel format
808
+ has red, green, blue, and alpha components.
809
+
810
+ 9. Added a new example (tjexample.c) that demonstrates the basic usage of the
811
+ TurboJPEG C API. This example mirrors the functionality of TJExample.java.
812
+ Both files are now included in the libjpeg-turbo documentation.
813
+
814
+ 10. Fixed two signed integer overflows in the arithmetic decoder, detected by
815
+ the Clang undefined behavior sanitizer, that could be triggered by attempting
816
+ to decompress a specially-crafted malformed JPEG image. These issues did not
817
+ pose a security threat, but removing the warnings makes it easier to detect
818
+ actual security issues, should they arise in the future.
819
+
820
+ 11. Fixed a bug in the merged 4:2:0 upsampling/dithered RGB565 color conversion
821
+ algorithm that caused incorrect dithering in the output image. This algorithm
822
+ now produces bitwise-identical results to the unmerged algorithms.
823
+
824
+ 12. The SIMD function symbols for x86[-64]/ELF, MIPS/ELF, macOS/x86[-64] (if
825
+ libjpeg-turbo is built with Yasm), and iOS/Arm[64] builds are now private.
826
+ This prevents those symbols from being exposed in applications or shared
827
+ libraries that link statically with libjpeg-turbo.
828
+
829
+ 13. Added Loongson MMI SIMD implementations of the RGB-to-YCbCr and
830
+ YCbCr-to-RGB colorspace conversion, 4:2:0 chroma downsampling, 4:2:0 fancy
831
+ chroma upsampling, integer quantization, and accurate integer DCT/IDCT
832
+ algorithms. When using the accurate integer DCT/IDCT, this speeds up the
833
+ compression of RGB images by approximately 70-100% and the decompression of RGB
834
+ images by approximately 2-3.5x.
835
+
836
+ 14. Fixed a build error when building with older MinGW releases (regression
837
+ caused by 1.5.1[7].)
838
+
839
+ 15. Added SIMD acceleration for progressive Huffman encoding on SSE2-capable
840
+ x86 and x86-64 platforms. This speeds up the compression of full-color
841
+ progressive JPEGs by about 85-90% on average (relative to libjpeg-turbo 1.5.x)
842
+ when using modern Intel and AMD CPUs.
843
+
844
+
845
+ 1.5.3
846
+ =====
847
+
848
+ ### Significant changes relative to 1.5.2:
849
+
850
+ 1. Fixed a NullPointerException in the TurboJPEG Java wrapper that occurred
851
+ when using the YUVImage constructor that creates an instance backed by separate
852
+ image planes and allocates memory for the image planes.
853
+
854
+ 2. Fixed an issue whereby the Java version of TJUnitTest would fail when
855
+ testing BufferedImage encoding/decoding on big endian systems.
856
+
857
+ 3. Fixed a segfault in djpeg that would occur if an output format other than
858
+ PPM/PGM was selected along with the `-crop` option. The `-crop` option now
859
+ works with the GIF and Targa formats as well (unfortunately, it cannot be made
860
+ to work with the BMP and RLE formats due to the fact that those output engines
861
+ write scanlines in bottom-up order.) djpeg will now exit gracefully if an
862
+ output format other than PPM/PGM, GIF, or Targa is selected along with the
863
+ `-crop` option.
864
+
865
+ 4. Fixed an issue (CVE-2017-15232) whereby `jpeg_skip_scanlines()` would
866
+ segfault if color quantization was enabled.
867
+
868
+ 5. TJBench (both C and Java versions) will now display usage information if any
869
+ command-line argument is unrecognized. This prevents the program from silently
870
+ ignoring typos.
871
+
872
+ 6. Fixed an access violation in tjbench.exe (Windows) that occurred when the
873
+ program was used to decompress an existing JPEG image.
874
+
875
+ 7. Fixed an ArrayIndexOutOfBoundsException in the TJExample Java program that
876
+ occurred when attempting to decompress a JPEG image that had been compressed
877
+ with 4:1:1 chrominance subsampling.
878
+
879
+ 8. Fixed an issue whereby, when using `jpeg_skip_scanlines()` to skip to the
880
+ end of a single-scan (non-progressive) image, subsequent calls to
881
+ `jpeg_consume_input()` would return `JPEG_SUSPENDED` rather than
882
+ `JPEG_REACHED_EOI`.
883
+
884
+ 9. `jpeg_crop_scanline()` now works correctly when decompressing grayscale JPEG
885
+ images that were compressed with a sampling factor other than 1 (for instance,
886
+ with `cjpeg -grayscale -sample 2x2`).
887
+
888
+
889
+ 1.5.2
890
+ =====
891
+
892
+ ### Significant changes relative to 1.5.1:
893
+
894
+ 1. Fixed a regression introduced by 1.5.1[7] that prevented libjpeg-turbo from
895
+ building with Android NDK platforms prior to android-21 (5.0).
896
+
897
+ 2. Fixed a regression introduced by 1.5.1[1] that prevented the MIPS DSPr2 SIMD
898
+ code in libjpeg-turbo from building.
899
+
900
+ 3. Fixed a regression introduced by 1.5 beta1[11] that prevented the Java
901
+ version of TJBench from outputting any reference images (the `-nowrite` switch
902
+ was accidentally enabled by default.)
903
+
904
+ 4. libjpeg-turbo should now build and run with full AltiVec SIMD acceleration
905
+ on PowerPC-based AmigaOS 4 and OpenBSD systems.
906
+
907
+ 5. Fixed build and runtime errors on Windows that occurred when building
908
+ libjpeg-turbo with libjpeg v7 API/ABI emulation and the in-memory
909
+ source/destination managers. Due to an oversight, the `jpeg_skip_scanlines()`
910
+ and `jpeg_crop_scanline()` functions were not being included in jpeg7.dll when
911
+ libjpeg-turbo was built with `-DWITH_JPEG7=1` and `-DWITH_MEMSRCDST=1`.
912
+
913
+ 6. Fixed a "Bogus virtual array access" error that occurred when using the
914
+ lossless crop feature in jpegtran or the TurboJPEG API, if libjpeg-turbo was
915
+ built with libjpeg v7 API/ABI emulation. This was apparently a long-standing
916
+ bug that has existed since the introduction of libjpeg v7/v8 API/ABI emulation
917
+ in libjpeg-turbo v1.1.
918
+
919
+ 7. The lossless transform features in jpegtran and the TurboJPEG API will now
920
+ always attempt to adjust the EXIF image width and height tags if the image size
921
+ changed as a result of the transform. This behavior has always existed when
922
+ using libjpeg v8 API/ABI emulation. It was supposed to be available with
923
+ libjpeg v7 API/ABI emulation as well but did not work properly due to a bug.
924
+ Furthermore, there was never any good reason not to enable it with libjpeg v6b
925
+ API/ABI emulation, since the behavior is entirely internal. Note that
926
+ `-copy all` must be passed to jpegtran in order to transfer the EXIF tags from
927
+ the source image to the destination image.
928
+
929
+ 8. Fixed several memory leaks in the TurboJPEG API library that could occur
930
+ if the library was built with certain compilers and optimization levels
931
+ (known to occur with GCC 4.x and clang with `-O1` and higher but not with
932
+ GCC 5.x or 6.x) and one of the underlying libjpeg API functions threw an error
933
+ after a TurboJPEG API function allocated a local buffer.
934
+
935
+ 9. The libjpeg-turbo memory manager will now honor the `max_memory_to_use`
936
+ structure member in jpeg\_memory\_mgr, which can be set to the maximum amount
937
+ of memory (in bytes) that libjpeg-turbo should use during decompression or
938
+ multi-pass (including progressive) compression. This limit can also be set
939
+ using the `JPEGMEM` environment variable or using the `-maxmemory` switch in
940
+ cjpeg/djpeg/jpegtran (refer to the respective man pages for more details.)
941
+ This has been a documented feature of libjpeg since v5, but the
942
+ `malloc()`/`free()` implementation of the memory manager (jmemnobs.c) never
943
+ implemented the feature. Restricting libjpeg-turbo's memory usage is useful
944
+ for two reasons: it allows testers to more easily work around the 2 GB limit
945
+ in libFuzzer, and it allows developers of security-sensitive applications to
946
+ more easily defend against one of the progressive JPEG exploits (LJT-01-004)
947
+ identified in
948
+ [this report](http://www.libjpeg-turbo.org/pmwiki/uploads/About/TwoIssueswiththeJPEGStandard.pdf).
949
+
950
+ 10. TJBench will now run each benchmark for 1 second prior to starting the
951
+ timer, in order to improve the consistency of the results. Furthermore, the
952
+ `-warmup` option is now used to specify the amount of warmup time rather than
953
+ the number of warmup iterations.
954
+
955
+ 11. Fixed an error (`short jump is out of range`) that occurred when assembling
956
+ the 32-bit x86 SIMD extensions with NASM versions prior to 2.04. This was a
957
+ regression introduced by 1.5 beta1[12].
958
+
959
+
960
+ 1.5.1
961
+ =====
962
+
963
+ ### Significant changes relative to 1.5.0:
964
+
965
+ 1. Previously, the undocumented `JSIMD_FORCE*` environment variables could be
966
+ used to force-enable a particular SIMD instruction set if multiple instruction
967
+ sets were available on a particular platform. On x86 platforms, where CPU
968
+ feature detection is bulletproof and multiple SIMD instruction sets are
969
+ available, it makes sense for those environment variables to allow forcing the
970
+ use of an instruction set only if that instruction set is available. However,
971
+ since the ARM implementations of libjpeg-turbo can only use one SIMD
972
+ instruction set, and since their feature detection code is less bulletproof
973
+ (parsing /proc/cpuinfo), it makes sense for the `JSIMD_FORCENEON` environment
974
+ variable to bypass the feature detection code and really force the use of NEON
975
+ instructions. A new environment variable (`JSIMD_FORCEDSPR2`) was introduced
976
+ in the MIPS implementation for the same reasons, and the existing
977
+ `JSIMD_FORCENONE` environment variable was extended to that implementation.
978
+ These environment variables provide a workaround for those attempting to test
979
+ ARM and MIPS builds of libjpeg-turbo in QEMU, which passes through
980
+ /proc/cpuinfo from the host system.
981
+
982
+ 2. libjpeg-turbo previously assumed that AltiVec instructions were always
983
+ available on PowerPC platforms, which led to "illegal instruction" errors when
984
+ running on PowerPC chips that lack AltiVec support (such as the older 7xx/G3
985
+ and newer e5500 series.) libjpeg-turbo now examines /proc/cpuinfo on
986
+ Linux/Android systems and enables AltiVec instructions only if the CPU supports
987
+ them. It also now provides two environment variables, `JSIMD_FORCEALTIVEC` and
988
+ `JSIMD_FORCENONE`, to force-enable and force-disable AltiVec instructions in
989
+ environments where /proc/cpuinfo is an unreliable means of CPU feature
990
+ detection (such as when running in QEMU.) On OS X, libjpeg-turbo continues to
991
+ assume that AltiVec support is always available, which means that libjpeg-turbo
992
+ cannot be used with G3 Macs unless you set the environment variable
993
+ `JSIMD_FORCENONE` to `1`.
994
+
995
+ 3. Fixed an issue whereby 64-bit ARM (AArch64) builds of libjpeg-turbo would
996
+ crash when built with recent releases of the Clang/LLVM compiler. This was
997
+ caused by an ABI conformance issue in some of libjpeg-turbo's 64-bit NEON SIMD
998
+ routines. Those routines were incorrectly using 64-bit instructions to
999
+ transfer a 32-bit JDIMENSION argument, whereas the ABI allows the upper
1000
+ (unused) 32 bits of a 32-bit argument's register to be undefined. The new
1001
+ Clang/LLVM optimizer uses load combining to transfer multiple adjacent 32-bit
1002
+ structure members into a single 64-bit register, and this exposed the ABI
1003
+ conformance issue.
1004
+
1005
+ 4. Fancy upsampling is now supported when decompressing JPEG images that use
1006
+ 4:4:0 (h1v2) chroma subsampling. These images are generated when losslessly
1007
+ rotating or transposing JPEG images that use 4:2:2 (h2v1) chroma subsampling.
1008
+ The h1v2 fancy upsampling algorithm is not currently SIMD-accelerated.
1009
+
1010
+ 5. If merged upsampling isn't SIMD-accelerated but YCbCr-to-RGB conversion is,
1011
+ then libjpeg-turbo will now disable merged upsampling when decompressing YCbCr
1012
+ JPEG images into RGB or extended RGB output images. This significantly speeds
1013
+ up the decompression of 4:2:0 and 4:2:2 JPEGs on ARM platforms if fancy
1014
+ upsampling is not used (for example, if the `-nosmooth` option to djpeg is
1015
+ specified.)
1016
+
1017
+ 6. The TurboJPEG API will now decompress 4:2:2 and 4:4:0 JPEG images with
1018
+ 2x2 luminance sampling factors and 2x1 or 1x2 chrominance sampling factors.
1019
+ This is a non-standard way of specifying 2x subsampling (normally 4:2:2 JPEGs
1020
+ have 2x1 luminance and 1x1 chrominance sampling factors, and 4:4:0 JPEGs have
1021
+ 1x2 luminance and 1x1 chrominance sampling factors), but the JPEG format and
1022
+ the libjpeg API both allow it.
1023
+
1024
+ 7. Fixed an unsigned integer overflow in the libjpeg memory manager, detected
1025
+ by the Clang undefined behavior sanitizer, that could be triggered by
1026
+ attempting to decompress a specially-crafted malformed JPEG image. This issue
1027
+ affected only 32-bit code and did not pose a security threat, but removing the
1028
+ warning makes it easier to detect actual security issues, should they arise in
1029
+ the future.
1030
+
1031
+ 8. Fixed additional negative left shifts and other issues reported by the GCC
1032
+ and Clang undefined behavior sanitizers when attempting to decompress
1033
+ specially-crafted malformed JPEG images. None of these issues posed a security
1034
+ threat, but removing the warnings makes it easier to detect actual security
1035
+ issues, should they arise in the future.
1036
+
1037
+ 9. Fixed an out-of-bounds array reference, introduced by 1.4.90[2] (partial
1038
+ image decompression) and detected by the Clang undefined behavior sanitizer,
1039
+ that could be triggered by a specially-crafted malformed JPEG image with more
1040
+ than four components. Because the out-of-bounds reference was still within the
1041
+ same structure, it was not known to pose a security threat, but removing the
1042
+ warning makes it easier to detect actual security issues, should they arise in
1043
+ the future.
1044
+
1045
+ 10. Fixed another ABI conformance issue in the 64-bit ARM (AArch64) NEON SIMD
1046
+ code. Some of the routines were incorrectly reading and storing data below the
1047
+ stack pointer, which caused segfaults in certain applications under specific
1048
+ circumstances.
1049
+
1050
+
1051
+ 1.5.0
1052
+ =====
1053
+
1054
+ ### Significant changes relative to 1.5 beta1:
1055
+
1056
+ 1. Fixed an issue whereby a malformed motion-JPEG frame could cause the "fast
1057
+ path" of libjpeg-turbo's Huffman decoder to read from uninitialized memory.
1058
+
1059
+ 2. Added libjpeg-turbo version and build information to the global string table
1060
+ of the libjpeg and TurboJPEG API libraries. This is a common practice in other
1061
+ infrastructure libraries, such as OpenSSL and libpng, because it makes it easy
1062
+ to examine an application binary and determine which version of the library the
1063
+ application was linked against.
1064
+
1065
+ 3. Fixed a couple of issues in the PPM reader that would cause buffer overruns
1066
+ in cjpeg if one of the values in a binary PPM/PGM input file exceeded the
1067
+ maximum value defined in the file's header and that maximum value was greater
1068
+ than 255. libjpeg-turbo 1.4.2 already included a similar fix for ASCII PPM/PGM
1069
+ files. Note that these issues were not security bugs, since they were confined
1070
+ to the cjpeg program and did not affect any of the libjpeg-turbo libraries.
1071
+
1072
+ 4. Fixed an issue whereby attempting to decompress a JPEG file with a corrupt
1073
+ header using the `tjDecompressToYUV2()` function would cause the function to
1074
+ abort without returning an error and, under certain circumstances, corrupt the
1075
+ stack. This only occurred if `tjDecompressToYUV2()` was called prior to
1076
+ calling `tjDecompressHeader3()`, or if the return value from
1077
+ `tjDecompressHeader3()` was ignored (both cases represent incorrect usage of
1078
+ the TurboJPEG API.)
1079
+
1080
+ 5. Fixed an issue in the ARM 32-bit SIMD-accelerated Huffman encoder that
1081
+ prevented the code from assembling properly with clang.
1082
+
1083
+ 6. The `jpeg_stdio_src()`, `jpeg_mem_src()`, `jpeg_stdio_dest()`, and
1084
+ `jpeg_mem_dest()` functions in the libjpeg API will now throw an error if a
1085
+ source/destination manager has already been assigned to the compress or
1086
+ decompress object by a different function or by the calling program. This
1087
+ prevents these functions from attempting to reuse a source/destination manager
1088
+ structure that was allocated elsewhere, because there is no way to ensure that
1089
+ it would be big enough to accommodate the new source/destination manager.
1090
+
1091
+
1092
+ 1.4.90 (1.5 beta1)
1093
+ ==================
1094
+
1095
+ ### Significant changes relative to 1.4.2:
1096
+
1097
+ 1. Added full SIMD acceleration for PowerPC platforms using AltiVec VMX
1098
+ (128-bit SIMD) instructions. Although the performance of libjpeg-turbo on
1099
+ PowerPC was already good, due to the increased number of registers available
1100
+ to the compiler vs. x86, it was still possible to speed up compression by about
1101
+ 3-4x and decompression by about 2-2.5x (relative to libjpeg v6b) through the
1102
+ use of AltiVec instructions.
1103
+
1104
+ 2. Added two new libjpeg API functions (`jpeg_skip_scanlines()` and
1105
+ `jpeg_crop_scanline()`) that can be used to partially decode a JPEG image. See
1106
+ [libjpeg.txt](libjpeg.txt) for more details.
1107
+
1108
+ 3. The TJCompressor and TJDecompressor classes in the TurboJPEG Java API now
1109
+ implement the Closeable interface, so those classes can be used with a
1110
+ try-with-resources statement.
1111
+
1112
+ 4. The TurboJPEG Java classes now throw unchecked idiomatic exceptions
1113
+ (IllegalArgumentException, IllegalStateException) for unrecoverable errors
1114
+ caused by incorrect API usage, and those classes throw a new checked exception
1115
+ type (TJException) for errors that are passed through from the C library.
1116
+
1117
+ 5. Source buffers for the TurboJPEG C API functions, as well as the
1118
+ `jpeg_mem_src()` function in the libjpeg API, are now declared as const
1119
+ pointers. This facilitates passing read-only buffers to those functions and
1120
+ assures the caller that the source buffer will not be modified. This should
1121
+ not create any backward API or ABI incompatibilities with prior libjpeg-turbo
1122
+ releases.
1123
+
1124
+ 6. The MIPS DSPr2 SIMD code can now be compiled to support either FR=0 or FR=1
1125
+ FPUs.
1126
+
1127
+ 7. Fixed additional negative left shifts and other issues reported by the GCC
1128
+ and Clang undefined behavior sanitizers. Most of these issues affected only
1129
+ 32-bit code, and none of them was known to pose a security threat, but removing
1130
+ the warnings makes it easier to detect actual security issues, should they
1131
+ arise in the future.
1132
+
1133
+ 8. Removed the unnecessary `.arch` directive from the ARM64 NEON SIMD code.
1134
+ This directive was preventing the code from assembling using the clang
1135
+ integrated assembler.
1136
+
1137
+ 9. Fixed a regression caused by 1.4.1[6] that prevented 32-bit and 64-bit
1138
+ libjpeg-turbo RPMs from being installed simultaneously on recent Red Hat/Fedora
1139
+ distributions. This was due to the addition of a macro in jconfig.h that
1140
+ allows the Huffman codec to determine the word size at compile time. Since
1141
+ that macro differs between 32-bit and 64-bit builds, this caused a conflict
1142
+ between the i386 and x86_64 RPMs (any differing files, other than executables,
1143
+ are not allowed when 32-bit and 64-bit RPMs are installed simultaneously.)
1144
+ Since the macro is used only internally, it has been moved into jconfigint.h.
1145
+
1146
+ 10. The x86-64 SIMD code can now be disabled at run time by setting the
1147
+ `JSIMD_FORCENONE` environment variable to `1` (the other SIMD implementations
1148
+ already had this capability.)
1149
+
1150
+ 11. Added a new command-line argument to TJBench (`-nowrite`) that prevents the
1151
+ benchmark from outputting any images. This removes any potential operating
1152
+ system overhead that might be caused by lazy writes to disk and thus improves
1153
+ the consistency of the performance measurements.
1154
+
1155
+ 12. Added SIMD acceleration for Huffman encoding on SSE2-capable x86 and x86-64
1156
+ platforms. This speeds up the compression of full-color JPEGs by about 10-15%
1157
+ on average (relative to libjpeg-turbo 1.4.x) when using modern Intel and AMD
1158
+ CPUs. Additionally, this works around an issue in the clang optimizer that
1159
+ prevents it (as of this writing) from achieving the same performance as GCC
1160
+ when compiling the C version of the Huffman encoder
1161
+ (<https://llvm.org/bugs/show_bug.cgi?id=16035>). For the purposes of
1162
+ benchmarking or regression testing, SIMD-accelerated Huffman encoding can be
1163
+ disabled by setting the `JSIMD_NOHUFFENC` environment variable to `1`.
1164
+
1165
+ 13. Added ARM 64-bit (ARMv8) NEON SIMD implementations of the commonly-used
1166
+ compression algorithms (including the accurate integer forward DCT and h2v2 &
1167
+ h2v1 downsampling algorithms, which are not accelerated in the 32-bit NEON
1168
+ implementation.) This speeds up the compression of full-color JPEGs by about
1169
+ 75% on average on a Cavium ThunderX processor and by about 2-2.5x on average on
1170
+ Cortex-A53 and Cortex-A57 cores.
1171
+
1172
+ 14. Added SIMD acceleration for Huffman encoding on NEON-capable ARM 32-bit
1173
+ and 64-bit platforms.
1174
+
1175
+ For 32-bit code, this speeds up the compression of full-color JPEGs by
1176
+ about 30% on average on a typical iOS device (iPhone 4S, Cortex-A9) and by
1177
+ about 6-7% on average on a typical Android device (Nexus 5X, Cortex-A53 and
1178
+ Cortex-A57), relative to libjpeg-turbo 1.4.x. Note that the larger speedup
1179
+ under iOS is due to the fact that iOS builds use LLVM, which does not optimize
1180
+ the C Huffman encoder as well as GCC does.
1181
+
1182
+ For 64-bit code, NEON-accelerated Huffman encoding speeds up the
1183
+ compression of full-color JPEGs by about 40% on average on a typical iOS device
1184
+ (iPhone 5S, Apple A7) and by about 7-8% on average on a typical Android device
1185
+ (Nexus 5X, Cortex-A53 and Cortex-A57), in addition to the speedup described in
1186
+ [13] above.
1187
+
1188
+ For the purposes of benchmarking or regression testing, SIMD-accelerated
1189
+ Huffman encoding can be disabled by setting the `JSIMD_NOHUFFENC` environment
1190
+ variable to `1`.
1191
+
1192
+ 15. pkg-config (.pc) scripts are now included for both the libjpeg and
1193
+ TurboJPEG API libraries on Un*x systems. Note that if a project's build system
1194
+ relies on these scripts, then it will not be possible to build that project
1195
+ with libjpeg or with a prior version of libjpeg-turbo.
1196
+
1197
+ 16. Optimized the ARM 64-bit (ARMv8) NEON SIMD decompression routines to
1198
+ improve performance on CPUs with in-order pipelines. This speeds up the
1199
+ decompression of full-color JPEGs by nearly 2x on average on a Cavium ThunderX
1200
+ processor and by about 15% on average on a Cortex-A53 core.
1201
+
1202
+ 17. Fixed an issue in the accelerated Huffman decoder that could have caused
1203
+ the decoder to read past the end of the input buffer when a malformed,
1204
+ specially-crafted JPEG image was being decompressed. In prior versions of
1205
+ libjpeg-turbo, the accelerated Huffman decoder was invoked (in most cases) only
1206
+ if there were > 128 bytes of data in the input buffer. However, it is possible
1207
+ to construct a JPEG image in which a single Huffman block is over 430 bytes
1208
+ long, so this version of libjpeg-turbo activates the accelerated Huffman
1209
+ decoder only if there are > 512 bytes of data in the input buffer.
1210
+
1211
+ 18. Fixed a memory leak in tjunittest encountered when running the program
1212
+ with the `-yuv` option.
1213
+
1214
+
1215
+ 1.4.2
1216
+ =====
1217
+
1218
+ ### Significant changes relative to 1.4.1:
1219
+
1220
+ 1. Fixed an issue whereby cjpeg would segfault if a Windows bitmap with a
1221
+ negative width or height was used as an input image (Windows bitmaps can have
1222
+ a negative height if they are stored in top-down order, but such files are
1223
+ rare and not supported by libjpeg-turbo.)
1224
+
1225
+ 2. Fixed an issue whereby, under certain circumstances, libjpeg-turbo would
1226
+ incorrectly encode certain JPEG images when quality=100 and the fast integer
1227
+ forward DCT were used. This was known to cause `make test` to fail when the
1228
+ library was built with `-march=haswell` on x86 systems.
1229
+
1230
+ 3. Fixed an issue whereby libjpeg-turbo would crash when built with the latest
1231
+ & greatest development version of the Clang/LLVM compiler. This was caused by
1232
+ an x86-64 ABI conformance issue in some of libjpeg-turbo's 64-bit SSE2 SIMD
1233
+ routines. Those routines were incorrectly using a 64-bit `mov` instruction to
1234
+ transfer a 32-bit JDIMENSION argument, whereas the x86-64 ABI allows the upper
1235
+ (unused) 32 bits of a 32-bit argument's register to be undefined. The new
1236
+ Clang/LLVM optimizer uses load combining to transfer multiple adjacent 32-bit
1237
+ structure members into a single 64-bit register, and this exposed the ABI
1238
+ conformance issue.
1239
+
1240
+ 4. Fixed a bug in the MIPS DSPr2 4:2:0 "plain" (non-fancy and non-merged)
1241
+ upsampling routine that caused a buffer overflow (and subsequent segfault) when
1242
+ decompressing a 4:2:0 JPEG image whose scaled output width was less than 16
1243
+ pixels. The "plain" upsampling routines are normally only used when
1244
+ decompressing a non-YCbCr JPEG image, but they are also used when decompressing
1245
+ a JPEG image whose scaled output height is 1.
1246
+
1247
+ 5. Fixed various negative left shifts and other issues reported by the GCC and
1248
+ Clang undefined behavior sanitizers. None of these was known to pose a
1249
+ security threat, but removing the warnings makes it easier to detect actual
1250
+ security issues, should they arise in the future.
1251
+
1252
+
1253
+ 1.4.1
1254
+ =====
1255
+
1256
+ ### Significant changes relative to 1.4.0:
1257
+
1258
+ 1. tjbench now properly handles CMYK/YCCK JPEG files. Passing an argument of
1259
+ `-cmyk` (instead of, for instance, `-rgb`) will cause tjbench to internally
1260
+ convert the source bitmap to CMYK prior to compression, to generate YCCK JPEG
1261
+ files, and to internally convert the decompressed CMYK pixels back to RGB after
1262
+ decompression (the latter is done automatically if a CMYK or YCCK JPEG is
1263
+ passed to tjbench as a source image.) The CMYK<->RGB conversion operation is
1264
+ not benchmarked. NOTE: The quick & dirty CMYK<->RGB conversions that tjbench
1265
+ uses are suitable for testing only. Proper conversion between CMYK and RGB
1266
+ requires a color management system.
1267
+
1268
+ 2. `make test` now performs additional bitwise regression tests using tjbench,
1269
+ mainly for the purpose of testing compression from/decompression to a subregion
1270
+ of a larger image buffer.
1271
+
1272
+ 3. `make test` no longer tests the regression of the floating point DCT/IDCT
1273
+ by default, since the results of those tests can vary if the algorithms in
1274
+ question are not implemented using SIMD instructions on a particular platform.
1275
+ See the comments in [Makefile.am](Makefile.am) for information on how to
1276
+ re-enable the tests and to specify an expected result for them based on the
1277
+ particulars of your platform.
1278
+
1279
+ 4. The NULL color conversion routines have been significantly optimized,
1280
+ which speeds up the compression of RGB and CMYK JPEGs by 5-20% when using
1281
+ 64-bit code and 0-3% when using 32-bit code, and the decompression of those
1282
+ images by 10-30% when using 64-bit code and 3-12% when using 32-bit code.
1283
+
1284
+ 5. Fixed an "illegal instruction" error that occurred when djpeg from a
1285
+ SIMD-enabled libjpeg-turbo MIPS build was executed with the `-nosmooth` option
1286
+ on a MIPS machine that lacked DSPr2 support. The MIPS SIMD routines for h2v1
1287
+ and h2v2 merged upsampling were not properly checking for the existence of
1288
+ DSPr2.
1289
+
1290
+ 6. Performance has been improved significantly on 64-bit non-Linux and
1291
+ non-Windows platforms (generally 10-20% faster compression and 5-10% faster
1292
+ decompression.) Due to an oversight, the 64-bit version of the accelerated
1293
+ Huffman codec was not being compiled in when libjpeg-turbo was built on
1294
+ platforms other than Windows or Linux. Oops.
1295
+
1296
+ 7. Fixed an extremely rare bug in the Huffman encoder that caused 64-bit
1297
+ builds of libjpeg-turbo to incorrectly encode a few specific test images when
1298
+ quality=98, an optimized Huffman table, and the accurate integer forward DCT
1299
+ were used.
1300
+
1301
+ 8. The Windows (CMake) build system now supports building only static or only
1302
+ shared libraries. This is accomplished by adding either `-DENABLE_STATIC=0` or
1303
+ `-DENABLE_SHARED=0` to the CMake command line.
1304
+
1305
+ 9. TurboJPEG API functions will now return an error code if a warning is
1306
+ triggered in the underlying libjpeg API. For instance, if a JPEG file is
1307
+ corrupt, the TurboJPEG decompression functions will attempt to decompress
1308
+ as much of the image as possible, but those functions will now return -1 to
1309
+ indicate that the decompression was not entirely successful.
1310
+
1311
+ 10. Fixed a bug in the MIPS DSPr2 4:2:2 fancy upsampling routine that caused a
1312
+ buffer overflow (and subsequent segfault) when decompressing a 4:2:2 JPEG image
1313
+ in which the right-most MCU was 5 or 6 pixels wide.
1314
+
1315
+
1316
+ 1.4.0
1317
+ =====
1318
+
1319
+ ### Significant changes relative to 1.4 beta1:
1320
+
1321
+ 1. Fixed a build issue on OS X PowerPC platforms (md5cmp failed to build
1322
+ because OS X does not provide the `le32toh()` and `htole32()` functions.)
1323
+
1324
+ 2. The non-SIMD RGB565 color conversion code did not work correctly on big
1325
+ endian machines. This has been fixed.
1326
+
1327
+ 3. Fixed an issue in `tjPlaneSizeYUV()` whereby it would erroneously return 1
1328
+ instead of -1 if `componentID` was > 0 and `subsamp` was `TJSAMP_GRAY`.
1329
+
1330
+ 4. Fixed an issue in `tjBufSizeYUV2()` whereby it would erroneously return 0
1331
+ instead of -1 if `width` was < 1.
1332
+
1333
+ 5. The Huffman encoder now uses `clz` and `bsr` instructions for bit counting
1334
+ on ARM64 platforms (see 1.4 beta1[5].)
1335
+
1336
+ 6. The `close()` method in the TJCompressor and TJDecompressor Java classes is
1337
+ now idempotent. Previously, that method would call the native `tjDestroy()`
1338
+ function even if the TurboJPEG instance had already been destroyed. This
1339
+ caused an exception to be thrown during finalization, if the `close()` method
1340
+ had already been called. The exception was caught, but it was still an
1341
+ expensive operation.
1342
+
1343
+ 7. The TurboJPEG API previously generated an error (`Could not determine
1344
+ subsampling type for JPEG image`) when attempting to decompress grayscale JPEG
1345
+ images that were compressed with a sampling factor other than 1 (for instance,
1346
+ with `cjpeg -grayscale -sample 2x2`). Subsampling technically has no meaning
1347
+ with grayscale JPEGs, and thus the horizontal and vertical sampling factors
1348
+ for such images are ignored by the decompressor. However, the TurboJPEG API
1349
+ was being too rigid and was expecting the sampling factors to be equal to 1
1350
+ before it treated the image as a grayscale JPEG.
1351
+
1352
+ 8. cjpeg, djpeg, and jpegtran now accept an argument of `-version`, which will
1353
+ print the library version and exit.
1354
+
1355
+ 9. Referring to 1.4 beta1[15], another extremely rare circumstance was
1356
+ discovered under which the Huffman encoder's local buffer can be overrun
1357
+ when a buffered destination manager is being used and an
1358
+ extremely-high-frequency block (basically junk image data) is being encoded.
1359
+ Even though the Huffman local buffer was increased from 128 bytes to 136 bytes
1360
+ to address the previous issue, the new issue caused even the larger buffer to
1361
+ be overrun. Further analysis reveals that, in the absolute worst case (such as
1362
+ setting alternating AC coefficients to 32767 and -32768 in the JPEG scanning
1363
+ order), the Huffman encoder can produce encoded blocks that approach double the
1364
+ size of the unencoded blocks. Thus, the Huffman local buffer was increased to
1365
+ 256 bytes, which should prevent any such issue from re-occurring in the future.
1366
+
1367
+ 10. The new `tjPlaneSizeYUV()`, `tjPlaneWidth()`, and `tjPlaneHeight()`
1368
+ functions were not actually usable on any platform except OS X and Windows,
1369
+ because those functions were not included in the libturbojpeg mapfile. This
1370
+ has been fixed.
1371
+
1372
+ 11. Restored the `JPP()`, `JMETHOD()`, and `FAR` macros in the libjpeg-turbo
1373
+ header files. The `JPP()` and `JMETHOD()` macros were originally implemented
1374
+ in libjpeg as a way of supporting non-ANSI compilers that lacked support for
1375
+ prototype parameters. libjpeg-turbo has never supported such compilers, but
1376
+ some software packages still use the macros to define their own prototypes.
1377
+ Similarly, libjpeg-turbo has never supported MS-DOS and other platforms that
1378
+ have far symbols, but some software packages still use the `FAR` macro. A
1379
+ pretty good argument can be made that this is a bad practice on the part of the
1380
+ software in question, but since this affects more than one package, it's just
1381
+ easier to fix it here.
1382
+
1383
+ 12. Fixed issues that were preventing the ARM 64-bit SIMD code from compiling
1384
+ for iOS, and included an ARMv8 architecture in all of the binaries installed by
1385
+ the "official" libjpeg-turbo SDK for OS X.
1386
+
1387
+
1388
+ 1.3.90 (1.4 beta1)
1389
+ ==================
1390
+
1391
+ ### Significant changes relative to 1.3.1:
1392
+
1393
+ 1. New features in the TurboJPEG API:
1394
+
1395
+ - YUV planar images can now be generated with an arbitrary line padding
1396
+ (previously only 4-byte padding, which was compatible with X Video, was
1397
+ supported.)
1398
+ - The decompress-to-YUV function has been extended to support image
1399
+ scaling.
1400
+ - JPEG images can now be compressed from YUV planar source images.
1401
+ - YUV planar images can now be decoded into RGB or grayscale images.
1402
+ - 4:1:1 subsampling is now supported. This is mainly included for
1403
+ compatibility, since 4:1:1 is not fully accelerated in libjpeg-turbo and has no
1404
+ significant advantages relative to 4:2:0.
1405
+ - CMYK images are now supported. This feature allows CMYK source images
1406
+ to be compressed to YCCK JPEGs and YCCK or CMYK JPEGs to be decompressed to
1407
+ CMYK destination images. Conversion between CMYK/YCCK and RGB or YUV images is
1408
+ not supported. Such conversion requires a color management system and is thus
1409
+ out of scope for a codec library.
1410
+ - The handling of YUV images in the Java API has been significantly
1411
+ refactored and should now be much more intuitive.
1412
+ - The Java API now supports encoding a YUV image from an arbitrary
1413
+ position in a large image buffer.
1414
+ - All of the YUV functions now have a corresponding function that operates
1415
+ on separate image planes instead of a unified image buffer. This allows for
1416
+ compressing/decoding from or decompressing/encoding to a subregion of a larger
1417
+ YUV image. It also allows for handling YUV formats that swap the order of the
1418
+ U and V planes.
1419
+
1420
+ 2. Added SIMD acceleration for DSPr2-capable MIPS platforms. This speeds up
1421
+ the compression of full-color JPEGs by 70-80% on such platforms and
1422
+ decompression by 25-35%.
1423
+
1424
+ 3. If an application attempts to decompress a Huffman-coded JPEG image whose
1425
+ header does not contain Huffman tables, libjpeg-turbo will now insert the
1426
+ default Huffman tables. In order to save space, many motion JPEG video frames
1427
+ are encoded without the default Huffman tables, so these frames can now be
1428
+ successfully decompressed by libjpeg-turbo without additional work on the part
1429
+ of the application. An application can still override the Huffman tables, for
1430
+ instance to re-use tables from a previous frame of the same video.
1431
+
1432
+ 4. The Mac packaging system now uses pkgbuild and productbuild rather than
1433
+ PackageMaker (which is obsolete and no longer supported.) This means that
1434
+ OS X 10.6 "Snow Leopard" or later must be used when packaging libjpeg-turbo,
1435
+ although the packages produced can be installed on OS X 10.5 "Leopard" or
1436
+ later. OS X 10.4 "Tiger" is no longer supported.
1437
+
1438
+ 5. The Huffman encoder now uses `clz` and `bsr` instructions for bit counting
1439
+ on ARM platforms rather than a lookup table. This reduces the memory footprint
1440
+ by 64k, which may be important for some mobile applications. Out of four
1441
+ Android devices that were tested, two demonstrated a small overall performance
1442
+ loss (~3-4% on average) with ARMv6 code and a small gain (also ~3-4%) with
1443
+ ARMv7 code when enabling this new feature, but the other two devices
1444
+ demonstrated a significant overall performance gain with both ARMv6 and ARMv7
1445
+ code (~10-20%) when enabling the feature. Actual mileage may vary.
1446
+
1447
+ 6. Worked around an issue with Visual C++ 2010 and later that caused incorrect
1448
+ pixels to be generated when decompressing a JPEG image to a 256-color bitmap,
1449
+ if compiler optimization was enabled when libjpeg-turbo was built. This caused
1450
+ the regression tests to fail when doing a release build under Visual C++ 2010
1451
+ and later.
1452
+
1453
+ 7. Improved the accuracy and performance of the non-SIMD implementation of the
1454
+ floating point inverse DCT (using code borrowed from libjpeg v8a and later.)
1455
+ The accuracy of this implementation now matches the accuracy of the SSE/SSE2
1456
+ implementation. Note, however, that the floating point DCT/IDCT algorithms are
1457
+ mainly a legacy feature. They generally do not produce significantly better
1458
+ accuracy than the accurate integer DCT/IDCT algorithms, and they are quite a
1459
+ bit slower.
1460
+
1461
+ 8. Added a new output colorspace (`JCS_RGB565`) to the libjpeg API that allows
1462
+ for decompressing JPEG images into RGB565 (16-bit) pixels. If dithering is not
1463
+ used, then this code path is SIMD-accelerated on ARM platforms.
1464
+
1465
+ 9. Numerous obsolete features, such as support for non-ANSI compilers and
1466
+ support for the MS-DOS memory model, were removed from the libjpeg code,
1467
+ greatly improving its readability and making it easier to maintain and extend.
1468
+
1469
+ 10. Fixed a segfault that occurred when calling `output_message()` with
1470
+ `msg_code` set to `JMSG_COPYRIGHT`.
1471
+
1472
+ 11. Fixed an issue whereby wrjpgcom was allowing comments longer than 65k
1473
+ characters to be passed on the command line, which was causing it to generate
1474
+ incorrect JPEG files.
1475
+
1476
+ 12. Fixed a bug in the build system that was causing the Windows version of
1477
+ wrjpgcom to be built using the rdjpgcom source code.
1478
+
1479
+ 13. Restored 12-bit-per-component JPEG support. A 12-bit version of
1480
+ libjpeg-turbo can now be built by passing an argument of `--with-12bit` to
1481
+ configure (Unix) or `-DWITH_12BIT=1` to cmake (Windows.) 12-bit JPEG support
1482
+ is included only for convenience. Enabling this feature disables all of the
1483
+ performance features in libjpeg-turbo, as well as arithmetic coding and the
1484
+ TurboJPEG API. The resulting library still contains the other libjpeg-turbo
1485
+ features (such as the colorspace extensions), but in general, it performs no
1486
+ faster than libjpeg v6b.
1487
+
1488
+ 14. Added ARM 64-bit SIMD acceleration for the YCC-to-RGB color conversion
1489
+ and IDCT algorithms (both are used during JPEG decompression.) For unknown
1490
+ reasons (probably related to clang), this code cannot currently be compiled for
1491
+ iOS.
1492
+
1493
+ 15. Fixed an extremely rare bug (CVE-2014-9092) that could cause the Huffman
1494
+ encoder's local buffer to overrun when a very high-frequency MCU is compressed
1495
+ using quality 100 and no subsampling, and when the JPEG output buffer is being
1496
+ dynamically resized by the destination manager. This issue was so rare that,
1497
+ even with a test program specifically designed to make the bug occur (by
1498
+ injecting random high-frequency YUV data into the compressor), it was
1499
+ reproducible only once in about every 25 million iterations.
1500
+
1501
+ 16. Fixed an oversight in the TurboJPEG C wrapper: if any of the JPEG
1502
+ compression functions was called repeatedly with the same
1503
+ automatically-allocated destination buffer, then TurboJPEG would erroneously
1504
+ assume that the `jpegSize` parameter was equal to the size of the buffer, when
1505
+ in fact that parameter was probably equal to the size of the most recently
1506
+ compressed JPEG image. If the size of the previous JPEG image was not as large
1507
+ as the current JPEG image, then TurboJPEG would unnecessarily reallocate the
1508
+ destination buffer.
1509
+
1510
+
1511
+ 1.3.1
1512
+ =====
1513
+
1514
+ ### Significant changes relative to 1.3.0:
1515
+
1516
+ 1. On Un*x systems, `make install` now installs the libjpeg-turbo libraries
1517
+ into /opt/libjpeg-turbo/lib32 by default on any 32-bit system, not just x86,
1518
+ and into /opt/libjpeg-turbo/lib64 by default on any 64-bit system, not just
1519
+ x86-64. You can override this by overriding either the `prefix` or `libdir`
1520
+ configure variables.
1521
+
1522
+ 2. The Windows installer now places a copy of the TurboJPEG DLLs in the same
1523
+ directory as the rest of the libjpeg-turbo binaries. This was mainly done
1524
+ to support TurboVNC 1.3, which bundles the DLLs in its Windows installation.
1525
+ When using a 32-bit version of CMake on 64-bit Windows, it is impossible to
1526
+ access the c:\WINDOWS\system32 directory, which made it impossible for the
1527
+ TurboVNC build scripts to bundle the 64-bit TurboJPEG DLL.
1528
+
1529
+ 3. Fixed a bug whereby attempting to encode a progressive JPEG with arithmetic
1530
+ entropy coding (by passing arguments of `-progressive -arithmetic` to cjpeg or
1531
+ jpegtran, for instance) would result in an error, `Requested feature was
1532
+ omitted at compile time`.
1533
+
1534
+ 4. Fixed a couple of issues (CVE-2013-6629 and CVE-2013-6630) whereby malformed
1535
+ JPEG images would cause libjpeg-turbo to use uninitialized memory during
1536
+ decompression.
1537
+
1538
+ 5. Fixed an error (`Buffer passed to JPEG library is too small`) that occurred
1539
+ when calling the TurboJPEG YUV encoding function with a very small (< 5x5)
1540
+ source image, and added a unit test to check for this error.
1541
+
1542
+ 6. The Java classes should now build properly under Visual Studio 2010 and
1543
+ later.
1544
+
1545
+ 7. Fixed an issue that prevented SRPMs generated using the in-tree packaging
1546
+ tools from being rebuilt on certain newer Linux distributions.
1547
+
1548
+ 8. Numerous minor fixes to eliminate compilation and build/packaging system
1549
+ warnings, fix cosmetic issues, improve documentation clarity, and other general
1550
+ source cleanup.
1551
+
1552
+
1553
+ 1.3.0
1554
+ =====
1555
+
1556
+ ### Significant changes relative to 1.3 beta1:
1557
+
1558
+ 1. `make test` now works properly on FreeBSD, and it no longer requires the
1559
+ md5sum executable to be present on other Un*x platforms.
1560
+
1561
+ 2. Overhauled the packaging system:
1562
+
1563
+ - To avoid conflict with vendor-supplied libjpeg-turbo packages, the
1564
+ official RPMs and DEBs for libjpeg-turbo have been renamed to
1565
+ "libjpeg-turbo-official".
1566
+ - The TurboJPEG libraries are now located under /opt/libjpeg-turbo in the
1567
+ official Linux and Mac packages, to avoid conflict with vendor-supplied
1568
+ packages and also to streamline the packaging system.
1569
+ - Release packages are now created with the directory structure defined
1570
+ by the configure variables `prefix`, `bindir`, `libdir`, etc. (Un\*x) or by the
1571
+ `CMAKE_INSTALL_PREFIX` variable (Windows.) The exception is that the docs are
1572
+ always located under the system default documentation directory on Un\*x and
1573
+ Mac systems, and on Windows, the TurboJPEG DLL is always located in the Windows
1574
+ system directory.
1575
+ - To avoid confusion, official libjpeg-turbo packages on Linux/Unix
1576
+ platforms (except for Mac) will always install the 32-bit libraries in
1577
+ /opt/libjpeg-turbo/lib32 and the 64-bit libraries in /opt/libjpeg-turbo/lib64.
1578
+ - Fixed an issue whereby, in some cases, the libjpeg-turbo executables on
1579
+ Un*x systems were not properly linking with the shared libraries installed by
1580
+ the same package.
1581
+ - Fixed an issue whereby building the "installer" target on Windows when
1582
+ `WITH_JAVA=1` would fail if the TurboJPEG JAR had not been previously built.
1583
+ - Building the "install" target on Windows now installs files into the
1584
+ same places that the installer does.
1585
+
1586
+ 3. Fixed a Huffman encoder bug that prevented I/O suspension from working
1587
+ properly.
1588
+
1589
+
1590
+ 1.2.90 (1.3 beta1)
1591
+ ==================
1592
+
1593
+ ### Significant changes relative to 1.2.1:
1594
+
1595
+ 1. Added support for additional scaling factors (3/8, 5/8, 3/4, 7/8, 9/8, 5/4,
1596
+ 11/8, 3/2, 13/8, 7/4, 15/8, and 2) when decompressing. Note that the IDCT will
1597
+ not be SIMD-accelerated when using any of these new scaling factors.
1598
+
1599
+ 2. The TurboJPEG dynamic library is now versioned. It was not strictly
1600
+ necessary to do so, because TurboJPEG uses versioned symbols, and if a function
1601
+ changes in an ABI-incompatible way, that function is renamed and a legacy
1602
+ function is provided to maintain backward compatibility. However, certain
1603
+ Linux distro maintainers have a policy against accepting any library that isn't
1604
+ versioned.
1605
+
1606
+ 3. Extended the TurboJPEG Java API so that it can be used to compress a JPEG
1607
+ image from and decompress a JPEG image to an arbitrary position in a large
1608
+ image buffer.
1609
+
1610
+ 4. The `tjDecompressToYUV()` function now supports the `TJFLAG_FASTDCT` flag.
1611
+
1612
+ 5. The 32-bit supplementary package for amd64 Debian systems now provides
1613
+ symlinks in /usr/lib/i386-linux-gnu for the TurboJPEG libraries in /usr/lib32.
1614
+ This allows those libraries to be used on MultiArch-compatible systems (such as
1615
+ Ubuntu 11 and later) without setting the linker path.
1616
+
1617
+ 6. The TurboJPEG Java wrapper should now find the JNI library on Mac systems
1618
+ without having to pass `-Djava.library.path=/usr/lib` to java.
1619
+
1620
+ 7. TJBench has been ported to Java to provide a convenient way of validating
1621
+ the performance of the TurboJPEG Java API. It can be run with
1622
+ `java -cp turbojpeg.jar TJBench`.
1623
+
1624
+ 8. cjpeg can now be used to generate JPEG files with the RGB colorspace
1625
+ (feature ported from jpeg-8d.)
1626
+
1627
+ 9. The width and height in the `-crop` argument passed to jpegtran can now be
1628
+ suffixed with `f` to indicate that, when the upper left corner of the cropping
1629
+ region is automatically moved to the nearest iMCU boundary, the bottom right
1630
+ corner should be moved by the same amount. In other words, this feature causes
1631
+ jpegtran to strictly honor the specified width/height rather than the specified
1632
+ bottom right corner (feature ported from jpeg-8d.)
1633
+
1634
+ 10. JPEG files using the RGB colorspace can now be decompressed into grayscale
1635
+ images (feature ported from jpeg-8d.)
1636
+
1637
+ 11. Fixed a regression caused by 1.2.1[7] whereby the build would fail with
1638
+ multiple "Mismatch in operand sizes" errors when attempting to build the x86
1639
+ SIMD code with NASM 0.98.
1640
+
1641
+ 12. The in-memory source/destination managers (`jpeg_mem_src()` and
1642
+ `jpeg_mem_dest()`) are now included by default when building libjpeg-turbo with
1643
+ libjpeg v6b or v7 emulation, so that programs can take advantage of these
1644
+ functions without requiring the use of the backward-incompatible libjpeg v8
1645
+ ABI. The "age number" of the libjpeg-turbo library on Un\*x systems has been
1646
+ incremented by 1 to reflect this. You can disable this feature with a
1647
+ configure/CMake switch in order to retain strict API/ABI compatibility with the
1648
+ libjpeg v6b or v7 API/ABI (or with previous versions of libjpeg-turbo.) See
1649
+ [README.md](README.md) for more details.
1650
+
1651
+ 13. Added ARMv7s architecture to libjpeg.a and libturbojpeg.a in the official
1652
+ libjpeg-turbo binary package for OS X, so that those libraries can be used to
1653
+ build applications that leverage the faster CPUs in the iPhone 5 and iPad 4.
1654
+
1655
+
1656
+ 1.2.1
1657
+ =====
1658
+
1659
+ ### Significant changes relative to 1.2.0:
1660
+
1661
+ 1. Creating or decoding a JPEG file that uses the RGB colorspace should now
1662
+ properly work when the input or output colorspace is one of the libjpeg-turbo
1663
+ colorspace extensions.
1664
+
1665
+ 2. When libjpeg-turbo was built without SIMD support and merged (non-fancy)
1666
+ upsampling was used along with an alpha-enabled colorspace during
1667
+ decompression, the unused byte of the decompressed pixels was not being set to
1668
+ 0xFF. This has been fixed. TJUnitTest has also been extended to test for the
1669
+ correct behavior of the colorspace extensions when merged upsampling is used.
1670
+
1671
+ 3. Fixed a bug whereby the libjpeg-turbo SSE2 SIMD code would not preserve the
1672
+ upper 64 bits of xmm6 and xmm7 on Win64 platforms, which violated the Win64
1673
+ calling conventions.
1674
+
1675
+ 4. Fixed a regression (CVE-2012-2806) caused by 1.2.0[6] whereby decompressing
1676
+ corrupt JPEG images (specifically, images in which the component count was
1677
+ erroneously set to a large value) would cause libjpeg-turbo to segfault.
1678
+
1679
+ 5. Worked around a severe performance issue with "Bobcat" (AMD Embedded APU)
1680
+ processors. The `MASKMOVDQU` instruction, which was used by the libjpeg-turbo
1681
+ SSE2 SIMD code, is apparently implemented in microcode on AMD processors, and
1682
+ it is painfully slow on Bobcat processors in particular. Eliminating the use
1683
+ of this instruction improved performance by an order of magnitude on Bobcat
1684
+ processors and by a small amount (typically 5%) on AMD desktop processors.
1685
+
1686
+ 6. Added SIMD acceleration for performing 4:2:2 upsampling on NEON-capable ARM
1687
+ platforms. This speeds up the decompression of 4:2:2 JPEGs by 20-25% on such
1688
+ platforms.
1689
+
1690
+ 7. Fixed a regression caused by 1.2.0[2] whereby, on Linux/x86 platforms
1691
+ running the 32-bit SSE2 SIMD code in libjpeg-turbo, decompressing a 4:2:0 or
1692
+ 4:2:2 JPEG image into a 32-bit (RGBX, BGRX, etc.) buffer without using fancy
1693
+ upsampling would produce several incorrect columns of pixels at the right-hand
1694
+ side of the output image if each row in the output image was not evenly
1695
+ divisible by 16 bytes.
1696
+
1697
+ 8. Fixed an issue whereby attempting to build the SIMD extensions with Xcode
1698
+ 4.3 on OS X platforms would cause NASM to return numerous errors of the form
1699
+ "'%define' expects a macro identifier".
1700
+
1701
+ 9. Added flags to the TurboJPEG API that allow the caller to force the use of
1702
+ either the fast or the accurate DCT/IDCT algorithms in the underlying codec.
1703
+
1704
+
1705
+ 1.2.0
1706
+ =====
1707
+
1708
+ ### Significant changes relative to 1.2 beta1:
1709
+
1710
+ 1. Fixed build issue with Yasm on Unix systems (the libjpeg-turbo build system
1711
+ was not adding the current directory to the assembler include path, so Yasm
1712
+ was not able to find jsimdcfg.inc.)
1713
+
1714
+ 2. Fixed out-of-bounds read in SSE2 SIMD code that occurred when decompressing
1715
+ a JPEG image to a bitmap buffer whose size was not a multiple of 16 bytes.
1716
+ This was more of an annoyance than an actual bug, since it did not cause any
1717
+ actual run-time problems, but the issue showed up when running libjpeg-turbo in
1718
+ valgrind. See <http://crbug.com/72399> for more information.
1719
+
1720
+ 3. Added a compile-time macro (`LIBJPEG_TURBO_VERSION`) that can be used to
1721
+ check the version of libjpeg-turbo against which an application was compiled.
1722
+
1723
+ 4. Added new RGBA/BGRA/ABGR/ARGB colorspace extension constants (libjpeg API)
1724
+ and pixel formats (TurboJPEG API), which allow applications to specify that,
1725
+ when decompressing to a 4-component RGB buffer, the unused byte should be set
1726
+ to 0xFF so that it can be interpreted as an opaque alpha channel.
1727
+
1728
+ 5. Fixed regression issue whereby DevIL failed to build against libjpeg-turbo
1729
+ because libjpeg-turbo's distributed version of jconfig.h contained an `INLINE`
1730
+ macro, which conflicted with a similar macro in DevIL. This macro is used only
1731
+ internally when building libjpeg-turbo, so it was moved into config.h.
1732
+
1733
+ 6. libjpeg-turbo will now correctly decompress erroneous CMYK/YCCK JPEGs whose
1734
+ K component is assigned a component ID of 1 instead of 4. Although these files
1735
+ are in violation of the spec, other JPEG implementations handle them
1736
+ correctly.
1737
+
1738
+ 7. Added ARMv6 and ARMv7 architectures to libjpeg.a and libturbojpeg.a in
1739
+ the official libjpeg-turbo binary package for OS X, so that those libraries can
1740
+ be used to build both OS X and iOS applications.
1741
+
1742
+
1743
+ 1.1.90 (1.2 beta1)
1744
+ ==================
1745
+
1746
+ ### Significant changes relative to 1.1.1:
1747
+
1748
+ 1. Added a Java wrapper for the TurboJPEG API. See [java/README](java/README)
1749
+ for more details.
1750
+
1751
+ 2. The TurboJPEG API can now be used to scale down images during
1752
+ decompression.
1753
+
1754
+ 3. Added SIMD routines for RGB-to-grayscale color conversion, which
1755
+ significantly improves the performance of grayscale JPEG compression from an
1756
+ RGB source image.
1757
+
1758
+ 4. Improved the performance of the C color conversion routines, which are used
1759
+ on platforms for which SIMD acceleration is not available.
1760
+
1761
+ 5. Added a function to the TurboJPEG API that performs lossless transforms.
1762
+ This function is implemented using the same back end as jpegtran, but it
1763
+ performs transcoding entirely in memory and allows multiple transforms and/or
1764
+ crop operations to be batched together, so the source coefficients only need to
1765
+ be read once. This is useful when generating image tiles from a single source
1766
+ JPEG.
1767
+
1768
+ 6. Added tests for the new TurboJPEG scaled decompression and lossless
1769
+ transform features to tjbench (the TurboJPEG benchmark, formerly called
1770
+ "jpgtest".)
1771
+
1772
+ 7. Added support for 4:4:0 (transposed 4:2:2) subsampling in TurboJPEG, which
1773
+ was necessary in order for it to read 4:2:2 JPEG files that had been losslessly
1774
+ transposed or rotated 90 degrees.
1775
+
1776
+ 8. All legacy VirtualGL code has been refactored, and this has allowed
1777
+ libjpeg-turbo, in its entirety, to be re-licensed under a BSD-style license.
1778
+
1779
+ 9. libjpeg-turbo can now be built with Yasm.
1780
+
1781
+ 10. Added SIMD acceleration for ARM Linux and iOS platforms that support
1782
+ NEON instructions.
1783
+
1784
+ 11. Refactored the TurboJPEG C API and documented it using Doxygen. The
1785
+ TurboJPEG 1.2 API uses pixel formats to define the size and component order of
1786
+ the uncompressed source/destination images, and it includes a more efficient
1787
+ version of `TJBUFSIZE()` that computes a worst-case JPEG size based on the
1788
+ level of chrominance subsampling. The refactored implementation of the
1789
+ TurboJPEG API now uses the libjpeg memory source and destination managers,
1790
+ which allows the TurboJPEG compressor to grow the JPEG buffer as necessary.
1791
+
1792
+ 12. Eliminated errors in the output of jpegtran on Windows that occurred when
1793
+ the application was invoked using I/O redirection
1794
+ (`jpegtran <input.jpg >output.jpg`.)
1795
+
1796
+ 13. The inclusion of libjpeg v7 and v8 emulation as well as arithmetic coding
1797
+ support in libjpeg-turbo v1.1.0 introduced several new error constants in
1798
+ jerror.h, and these were mistakenly enabled for all emulation modes, causing
1799
+ the error enum in libjpeg-turbo to sometimes have different values than the
1800
+ same enum in libjpeg. This represents an ABI incompatibility, and it caused
1801
+ problems with rare applications that took specific action based on a particular
1802
+ error value. The fix was to include the new error constants conditionally
1803
+ based on whether libjpeg v7 or v8 emulation was enabled.
1804
+
1805
+ 14. Fixed an issue whereby Windows applications that used libjpeg-turbo would
1806
+ fail to compile if the Windows system headers were included before jpeglib.h.
1807
+ This issue was caused by a conflict in the definition of the INT32 type.
1808
+
1809
+ 15. Fixed 32-bit supplementary package for amd64 Debian systems, which was
1810
+ broken by enhancements to the packaging system in 1.1.
1811
+
1812
+ 16. When decompressing a JPEG image using an output colorspace of
1813
+ `JCS_EXT_RGBX`, `JCS_EXT_BGRX`, `JCS_EXT_XBGR`, or `JCS_EXT_XRGB`,
1814
+ libjpeg-turbo will now set the unused byte to 0xFF, which allows applications
1815
+ to interpret that byte as an alpha channel (0xFF = opaque).
1816
+
1817
+
1818
+ 1.1.1
1819
+ =====
1820
+
1821
+ ### Significant changes relative to 1.1.0:
1822
+
1823
+ 1. Fixed a 1-pixel error in row 0, column 21 of the luminance plane generated
1824
+ by `tjEncodeYUV()`.
1825
+
1826
+ 2. libjpeg-turbo's accelerated Huffman decoder previously ignored unexpected
1827
+ markers found in the middle of the JPEG data stream during decompression. It
1828
+ will now hand off decoding of a particular block to the unaccelerated Huffman
1829
+ decoder if an unexpected marker is found, so that the unaccelerated Huffman
1830
+ decoder can generate an appropriate warning.
1831
+
1832
+ 3. Older versions of MinGW64 prefixed symbol names with underscores by
1833
+ default, which differed from the behavior of 64-bit Visual C++. MinGW64 1.0
1834
+ has adopted the behavior of 64-bit Visual C++ as the default, so to accommodate
1835
+ this, the libjpeg-turbo SIMD function names are no longer prefixed with an
1836
+ underscore when building with MinGW64. This means that, when building
1837
+ libjpeg-turbo with older versions of MinGW64, you will now have to add
1838
+ `-fno-leading-underscore` to the `CFLAGS`.
1839
+
1840
+ 4. Fixed a regression bug in the NSIS script that caused the Windows installer
1841
+ build to fail when using the Visual Studio IDE.
1842
+
1843
+ 5. Fixed a bug in `jpeg_read_coefficients()` whereby it would not initialize
1844
+ `cinfo->image_width` and `cinfo->image_height` if libjpeg v7 or v8 emulation
1845
+ was enabled. This specifically caused the jpegoptim program to fail if it was
1846
+ linked against a version of libjpeg-turbo that was built with libjpeg v7 or v8
1847
+ emulation.
1848
+
1849
+ 6. Eliminated excessive I/O overhead that occurred when reading BMP files in
1850
+ cjpeg.
1851
+
1852
+ 7. Eliminated errors in the output of cjpeg on Windows that occurred when the
1853
+ application was invoked using I/O redirection (`cjpeg <inputfile >output.jpg`.)
1854
+
1855
+
1856
+ 1.1.0
1857
+ =====
1858
+
1859
+ ### Significant changes relative to 1.1 beta1:
1860
+
1861
+ 1. The algorithm used by the SIMD quantization function cannot produce correct
1862
+ results when the JPEG quality is >= 98 and the fast integer forward DCT is
1863
+ used. Thus, the non-SIMD quantization function is now used for those cases,
1864
+ and libjpeg-turbo should now produce identical output to libjpeg v6b in all
1865
+ cases.
1866
+
1867
+ 2. Despite the above, the fast integer forward DCT still degrades somewhat for
1868
+ JPEG qualities greater than 95, so the TurboJPEG wrapper will now automatically
1869
+ use the accurate integer forward DCT when generating JPEG images of quality 96
1870
+ or greater. This reduces compression performance by as much as 15% for these
1871
+ high-quality images but is necessary to ensure that the images are perceptually
1872
+ lossless. It also ensures that the library can avoid the performance pitfall
1873
+ created by [1].
1874
+
1875
+ 3. Ported jpgtest.cxx to pure C to avoid the need for a C++ compiler.
1876
+
1877
+ 4. Fixed visual artifacts in grayscale JPEG compression caused by a typo in
1878
+ the RGB-to-luminance lookup tables.
1879
+
1880
+ 5. The Windows distribution packages now include the libjpeg run-time programs
1881
+ (cjpeg, etc.)
1882
+
1883
+ 6. All packages now include jpgtest.
1884
+
1885
+ 7. The TurboJPEG dynamic library now uses versioned symbols.
1886
+
1887
+ 8. Added two new TurboJPEG API functions, `tjEncodeYUV()` and
1888
+ `tjDecompressToYUV()`, to replace the somewhat hackish `TJ_YUV` flag.
1889
+
1890
+
1891
+ 1.0.90 (1.1 beta1)
1892
+ ==================
1893
+
1894
+ ### Significant changes relative to 1.0.1:
1895
+
1896
+ 1. Added emulation of the libjpeg v7 and v8 APIs and ABIs. See
1897
+ [README.md](README.md) for more details. This feature was sponsored by
1898
+ CamTrace SAS.
1899
+
1900
+ 2. Created a new CMake-based build system for the Visual C++ and MinGW builds.
1901
+
1902
+ 3. The TurboJPEG API can now be used to compress from and decompress to
1903
+ grayscale bitmaps.
1904
+
1905
+ 4. jpgtest can now be used to test decompression performance with existing
1906
+ JPEG images.
1907
+
1908
+ 5. If the default install prefix (/opt/libjpeg-turbo) is used, then
1909
+ `make install` now creates /opt/libjpeg-turbo/lib32 and
1910
+ /opt/libjpeg-turbo/lib64 symlinks to duplicate the behavior of the binary
1911
+ packages.
1912
+
1913
+ 6. All symbols in the libjpeg-turbo dynamic library are now versioned, even
1914
+ when the library is built with libjpeg v6b emulation.
1915
+
1916
+ 7. Added arithmetic encoding and decoding support (can be disabled with
1917
+ configure or CMake options.)
1918
+
1919
+ 8. Added a `TJ_YUV` flag to the TurboJPEG API, which causes both the compressor
1920
+ and decompressor to output planar YUV images.
1921
+
1922
+ 9. Added an extended version of `tjDecompressHeader()` to the TurboJPEG API,
1923
+ which allows the caller to determine the type of subsampling used in a JPEG
1924
+ image.
1925
+
1926
+ 10. Added further protections against invalid Huffman codes.
1927
+
1928
+
1929
+ 1.0.1
1930
+ =====
1931
+
1932
+ ### Significant changes relative to 1.0.0:
1933
+
1934
+ 1. The Huffman decoder will now handle erroneous Huffman codes (for instance,
1935
+ from a corrupt JPEG image.) Previously, these would cause libjpeg-turbo to
1936
+ crash under certain circumstances.
1937
+
1938
+ 2. Fixed typo in SIMD dispatch routines that was causing 4:2:2 upsampling to
1939
+ be used instead of 4:2:0 when decompressing JPEG images using SSE2 code.
1940
+
1941
+ 3. The configure script will now automatically determine whether the
1942
+ `INCOMPLETE_TYPES_BROKEN` macro should be defined.
1943
+
1944
+
1945
+ 1.0.0
1946
+ =====
1947
+
1948
+ ### Significant changes relative to 0.0.93:
1949
+
1950
+ 1. 2983700: Further FreeBSD build tweaks (no longer necessary to specify
1951
+ `--host` when configuring on a 64-bit system)
1952
+
1953
+ 2. Created symlinks in the Unix/Linux packages so that the TurboJPEG
1954
+ include file can always be found in /opt/libjpeg-turbo/include, the 32-bit
1955
+ static libraries can always be found in /opt/libjpeg-turbo/lib32, and the
1956
+ 64-bit static libraries can always be found in /opt/libjpeg-turbo/lib64.
1957
+
1958
+ 3. The Unix/Linux distribution packages now include the libjpeg run-time
1959
+ programs (cjpeg, etc.) and man pages.
1960
+
1961
+ 4. Created a 32-bit supplementary package for amd64 Debian systems, which
1962
+ contains just the 32-bit libjpeg-turbo libraries.
1963
+
1964
+ 5. Moved the libraries from */lib32 to */lib in the i386 Debian package.
1965
+
1966
+ 6. Included a distribution package for Cygwin
1967
+
1968
+ 7. No longer necessary to specify `--without-simd` on non-x86 architectures,
1969
+ and unit tests now work on those architectures.
1970
+
1971
+
1972
+ 0.0.93
1973
+ ======
1974
+
1975
+ ### Significant changes relative to 0.0.91:
1976
+
1977
+ 1. 2982659: Fixed x86-64 build on FreeBSD systems
1978
+
1979
+ 2. 2988188: Added support for Windows 64-bit systems
1980
+
1981
+
1982
+ 0.0.91
1983
+ ======
1984
+
1985
+ ### Significant changes relative to 0.0.90:
1986
+
1987
+ 1. Added documentation to .deb packages
1988
+
1989
+ 2. 2968313: Fixed data corruption issues when decompressing large JPEG images
1990
+ and/or using buffered I/O with the libjpeg-turbo decompressor
1991
+
1992
+
1993
+ 0.0.90
1994
+ ======
1995
+
1996
+ Initial release