image_pack 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (319) hide show
  1. checksums.yaml +7 -0
  2. data/CHANGELOG.md +18 -0
  3. data/LICENSE.txt +21 -0
  4. data/README.md +140 -0
  5. data/THIRD_PARTY_NOTICES.md +8 -0
  6. data/ext/image_pack/extconf.rb +515 -0
  7. data/ext/image_pack/image_pack.c +1618 -0
  8. data/ext/image_pack/vendor/.vendored +1 -0
  9. data/ext/image_pack/vendor/mozjpeg/BUILDING.txt +902 -0
  10. data/ext/image_pack/vendor/mozjpeg/CMakeLists.txt +1593 -0
  11. data/ext/image_pack/vendor/mozjpeg/LICENSE.md +132 -0
  12. data/ext/image_pack/vendor/mozjpeg/README-mozilla.txt +194 -0
  13. data/ext/image_pack/vendor/mozjpeg/README-turbo.txt +346 -0
  14. data/ext/image_pack/vendor/mozjpeg/README.ijg +258 -0
  15. data/ext/image_pack/vendor/mozjpeg/README.md +29 -0
  16. data/ext/image_pack/vendor/mozjpeg/cderror.h +128 -0
  17. data/ext/image_pack/vendor/mozjpeg/cdjpeg.c +156 -0
  18. data/ext/image_pack/vendor/mozjpeg/cdjpeg.h +171 -0
  19. data/ext/image_pack/vendor/mozjpeg/cjpeg.c +961 -0
  20. data/ext/image_pack/vendor/mozjpeg/cmyk.h +60 -0
  21. data/ext/image_pack/vendor/mozjpeg/coderules.txt +78 -0
  22. data/ext/image_pack/vendor/mozjpeg/croptest.in +95 -0
  23. data/ext/image_pack/vendor/mozjpeg/djpeg.c +855 -0
  24. data/ext/image_pack/vendor/mozjpeg/example.txt +464 -0
  25. data/ext/image_pack/vendor/mozjpeg/jaricom.c +157 -0
  26. data/ext/image_pack/vendor/mozjpeg/jcapimin.c +307 -0
  27. data/ext/image_pack/vendor/mozjpeg/jcapistd.c +168 -0
  28. data/ext/image_pack/vendor/mozjpeg/jcarith.c +972 -0
  29. data/ext/image_pack/vendor/mozjpeg/jccoefct.c +609 -0
  30. data/ext/image_pack/vendor/mozjpeg/jccolext.c +144 -0
  31. data/ext/image_pack/vendor/mozjpeg/jccolor.c +721 -0
  32. data/ext/image_pack/vendor/mozjpeg/jcdctmgr.c +1776 -0
  33. data/ext/image_pack/vendor/mozjpeg/jcext.c +219 -0
  34. data/ext/image_pack/vendor/mozjpeg/jchuff.c +1146 -0
  35. data/ext/image_pack/vendor/mozjpeg/jchuff.h +57 -0
  36. data/ext/image_pack/vendor/mozjpeg/jcicc.c +105 -0
  37. data/ext/image_pack/vendor/mozjpeg/jcinit.c +82 -0
  38. data/ext/image_pack/vendor/mozjpeg/jcmainct.c +162 -0
  39. data/ext/image_pack/vendor/mozjpeg/jcmarker.c +844 -0
  40. data/ext/image_pack/vendor/mozjpeg/jcmaster.c +958 -0
  41. data/ext/image_pack/vendor/mozjpeg/jcmaster.h +56 -0
  42. data/ext/image_pack/vendor/mozjpeg/jcomapi.c +109 -0
  43. data/ext/image_pack/vendor/mozjpeg/jconfig.h.in +37 -0
  44. data/ext/image_pack/vendor/mozjpeg/jconfig.txt +93 -0
  45. data/ext/image_pack/vendor/mozjpeg/jconfigint.h.in +44 -0
  46. data/ext/image_pack/vendor/mozjpeg/jcparam.c +991 -0
  47. data/ext/image_pack/vendor/mozjpeg/jcphuff.c +1123 -0
  48. data/ext/image_pack/vendor/mozjpeg/jcprepct.c +351 -0
  49. data/ext/image_pack/vendor/mozjpeg/jcsample.c +522 -0
  50. data/ext/image_pack/vendor/mozjpeg/jcstest.c +126 -0
  51. data/ext/image_pack/vendor/mozjpeg/jctrans.c +408 -0
  52. data/ext/image_pack/vendor/mozjpeg/jdapimin.c +407 -0
  53. data/ext/image_pack/vendor/mozjpeg/jdapistd.c +691 -0
  54. data/ext/image_pack/vendor/mozjpeg/jdarith.c +782 -0
  55. data/ext/image_pack/vendor/mozjpeg/jdatadst-tj.c +198 -0
  56. data/ext/image_pack/vendor/mozjpeg/jdatadst.c +299 -0
  57. data/ext/image_pack/vendor/mozjpeg/jdatasrc-tj.c +194 -0
  58. data/ext/image_pack/vendor/mozjpeg/jdatasrc.c +295 -0
  59. data/ext/image_pack/vendor/mozjpeg/jdcoefct.c +881 -0
  60. data/ext/image_pack/vendor/mozjpeg/jdcoefct.h +83 -0
  61. data/ext/image_pack/vendor/mozjpeg/jdcol565.c +384 -0
  62. data/ext/image_pack/vendor/mozjpeg/jdcolext.c +141 -0
  63. data/ext/image_pack/vendor/mozjpeg/jdcolor.c +881 -0
  64. data/ext/image_pack/vendor/mozjpeg/jdct.h +208 -0
  65. data/ext/image_pack/vendor/mozjpeg/jddctmgr.c +367 -0
  66. data/ext/image_pack/vendor/mozjpeg/jdhuff.c +834 -0
  67. data/ext/image_pack/vendor/mozjpeg/jdhuff.h +247 -0
  68. data/ext/image_pack/vendor/mozjpeg/jdicc.c +167 -0
  69. data/ext/image_pack/vendor/mozjpeg/jdinput.c +408 -0
  70. data/ext/image_pack/vendor/mozjpeg/jdmainct.c +460 -0
  71. data/ext/image_pack/vendor/mozjpeg/jdmainct.h +71 -0
  72. data/ext/image_pack/vendor/mozjpeg/jdmarker.c +1374 -0
  73. data/ext/image_pack/vendor/mozjpeg/jdmaster.c +727 -0
  74. data/ext/image_pack/vendor/mozjpeg/jdmaster.h +33 -0
  75. data/ext/image_pack/vendor/mozjpeg/jdmerge.c +587 -0
  76. data/ext/image_pack/vendor/mozjpeg/jdmerge.h +47 -0
  77. data/ext/image_pack/vendor/mozjpeg/jdmrg565.c +354 -0
  78. data/ext/image_pack/vendor/mozjpeg/jdmrgext.c +184 -0
  79. data/ext/image_pack/vendor/mozjpeg/jdphuff.c +679 -0
  80. data/ext/image_pack/vendor/mozjpeg/jdpostct.c +294 -0
  81. data/ext/image_pack/vendor/mozjpeg/jdsample.c +524 -0
  82. data/ext/image_pack/vendor/mozjpeg/jdsample.h +50 -0
  83. data/ext/image_pack/vendor/mozjpeg/jdtrans.c +156 -0
  84. data/ext/image_pack/vendor/mozjpeg/jerror.c +251 -0
  85. data/ext/image_pack/vendor/mozjpeg/jerror.h +335 -0
  86. data/ext/image_pack/vendor/mozjpeg/jfdctflt.c +169 -0
  87. data/ext/image_pack/vendor/mozjpeg/jfdctfst.c +227 -0
  88. data/ext/image_pack/vendor/mozjpeg/jfdctint.c +288 -0
  89. data/ext/image_pack/vendor/mozjpeg/jidctflt.c +240 -0
  90. data/ext/image_pack/vendor/mozjpeg/jidctfst.c +371 -0
  91. data/ext/image_pack/vendor/mozjpeg/jidctint.c +2627 -0
  92. data/ext/image_pack/vendor/mozjpeg/jidctred.c +409 -0
  93. data/ext/image_pack/vendor/mozjpeg/jinclude.h +147 -0
  94. data/ext/image_pack/vendor/mozjpeg/jmemmgr.c +1180 -0
  95. data/ext/image_pack/vendor/mozjpeg/jmemnobs.c +110 -0
  96. data/ext/image_pack/vendor/mozjpeg/jmemsys.h +178 -0
  97. data/ext/image_pack/vendor/mozjpeg/jmorecfg.h +382 -0
  98. data/ext/image_pack/vendor/mozjpeg/jpeg_nbits_table.h +4098 -0
  99. data/ext/image_pack/vendor/mozjpeg/jpegcomp.h +32 -0
  100. data/ext/image_pack/vendor/mozjpeg/jpegint.h +453 -0
  101. data/ext/image_pack/vendor/mozjpeg/jpeglib.h +1211 -0
  102. data/ext/image_pack/vendor/mozjpeg/jpegtran.c +827 -0
  103. data/ext/image_pack/vendor/mozjpeg/jpegyuv.c +172 -0
  104. data/ext/image_pack/vendor/mozjpeg/jquant1.c +856 -0
  105. data/ext/image_pack/vendor/mozjpeg/jquant2.c +1286 -0
  106. data/ext/image_pack/vendor/mozjpeg/jsimd.h +123 -0
  107. data/ext/image_pack/vendor/mozjpeg/jsimd_none.c +431 -0
  108. data/ext/image_pack/vendor/mozjpeg/jsimddct.h +70 -0
  109. data/ext/image_pack/vendor/mozjpeg/jstdhuff.c +144 -0
  110. data/ext/image_pack/vendor/mozjpeg/jutils.c +133 -0
  111. data/ext/image_pack/vendor/mozjpeg/jversion.h.in +56 -0
  112. data/ext/image_pack/vendor/mozjpeg/libjpeg.map.in +11 -0
  113. data/ext/image_pack/vendor/mozjpeg/libjpeg.txt +3150 -0
  114. data/ext/image_pack/vendor/mozjpeg/rdbmp.c +690 -0
  115. data/ext/image_pack/vendor/mozjpeg/rdcolmap.c +253 -0
  116. data/ext/image_pack/vendor/mozjpeg/rdgif.c +720 -0
  117. data/ext/image_pack/vendor/mozjpeg/rdjpeg.c +160 -0
  118. data/ext/image_pack/vendor/mozjpeg/rdjpgcom.c +494 -0
  119. data/ext/image_pack/vendor/mozjpeg/rdpng.c +194 -0
  120. data/ext/image_pack/vendor/mozjpeg/rdppm.c +781 -0
  121. data/ext/image_pack/vendor/mozjpeg/rdswitch.c +642 -0
  122. data/ext/image_pack/vendor/mozjpeg/rdtarga.c +508 -0
  123. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch32/jccolext-neon.c +148 -0
  124. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch32/jchuff-neon.c +334 -0
  125. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch32/jsimd.c +976 -0
  126. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch32/jsimd_neon.S +1200 -0
  127. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch64/jccolext-neon.c +316 -0
  128. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch64/jchuff-neon.c +411 -0
  129. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch64/jsimd.c +1053 -0
  130. data/ext/image_pack/vendor/mozjpeg/simd/arm/aarch64/jsimd_neon.S +2254 -0
  131. data/ext/image_pack/vendor/mozjpeg/simd/arm/align.h +28 -0
  132. data/ext/image_pack/vendor/mozjpeg/simd/arm/jccolor-neon.c +160 -0
  133. data/ext/image_pack/vendor/mozjpeg/simd/arm/jcgray-neon.c +120 -0
  134. data/ext/image_pack/vendor/mozjpeg/simd/arm/jcgryext-neon.c +106 -0
  135. data/ext/image_pack/vendor/mozjpeg/simd/arm/jchuff.h +131 -0
  136. data/ext/image_pack/vendor/mozjpeg/simd/arm/jcphuff-neon.c +623 -0
  137. data/ext/image_pack/vendor/mozjpeg/simd/arm/jcsample-neon.c +192 -0
  138. data/ext/image_pack/vendor/mozjpeg/simd/arm/jdcolext-neon.c +374 -0
  139. data/ext/image_pack/vendor/mozjpeg/simd/arm/jdcolor-neon.c +141 -0
  140. data/ext/image_pack/vendor/mozjpeg/simd/arm/jdmerge-neon.c +144 -0
  141. data/ext/image_pack/vendor/mozjpeg/simd/arm/jdmrgext-neon.c +723 -0
  142. data/ext/image_pack/vendor/mozjpeg/simd/arm/jdsample-neon.c +569 -0
  143. data/ext/image_pack/vendor/mozjpeg/simd/arm/jfdctfst-neon.c +214 -0
  144. data/ext/image_pack/vendor/mozjpeg/simd/arm/jfdctint-neon.c +376 -0
  145. data/ext/image_pack/vendor/mozjpeg/simd/arm/jidctfst-neon.c +472 -0
  146. data/ext/image_pack/vendor/mozjpeg/simd/arm/jidctint-neon.c +801 -0
  147. data/ext/image_pack/vendor/mozjpeg/simd/arm/jidctred-neon.c +486 -0
  148. data/ext/image_pack/vendor/mozjpeg/simd/arm/jquanti-neon.c +193 -0
  149. data/ext/image_pack/vendor/mozjpeg/simd/arm/neon-compat.h +26 -0
  150. data/ext/image_pack/vendor/mozjpeg/simd/arm/neon-compat.h.in +37 -0
  151. data/ext/image_pack/vendor/mozjpeg/simd/i386/jccolext-avx2.asm +578 -0
  152. data/ext/image_pack/vendor/mozjpeg/simd/i386/jccolext-mmx.asm +476 -0
  153. data/ext/image_pack/vendor/mozjpeg/simd/i386/jccolext-sse2.asm +503 -0
  154. data/ext/image_pack/vendor/mozjpeg/simd/i386/jccolor-avx2.asm +121 -0
  155. data/ext/image_pack/vendor/mozjpeg/simd/i386/jccolor-mmx.asm +121 -0
  156. data/ext/image_pack/vendor/mozjpeg/simd/i386/jccolor-sse2.asm +120 -0
  157. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcgray-avx2.asm +113 -0
  158. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcgray-mmx.asm +113 -0
  159. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcgray-sse2.asm +112 -0
  160. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcgryext-avx2.asm +457 -0
  161. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcgryext-mmx.asm +355 -0
  162. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcgryext-sse2.asm +382 -0
  163. data/ext/image_pack/vendor/mozjpeg/simd/i386/jchuff-sse2.asm +761 -0
  164. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcphuff-sse2.asm +662 -0
  165. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcsample-avx2.asm +388 -0
  166. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcsample-mmx.asm +324 -0
  167. data/ext/image_pack/vendor/mozjpeg/simd/i386/jcsample-sse2.asm +351 -0
  168. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdcolext-avx2.asm +515 -0
  169. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdcolext-mmx.asm +404 -0
  170. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdcolext-sse2.asm +458 -0
  171. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdcolor-avx2.asm +118 -0
  172. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdcolor-mmx.asm +117 -0
  173. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdcolor-sse2.asm +117 -0
  174. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdmerge-avx2.asm +136 -0
  175. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdmerge-mmx.asm +123 -0
  176. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdmerge-sse2.asm +135 -0
  177. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdmrgext-avx2.asm +575 -0
  178. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdmrgext-mmx.asm +460 -0
  179. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdmrgext-sse2.asm +517 -0
  180. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdsample-avx2.asm +760 -0
  181. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdsample-mmx.asm +731 -0
  182. data/ext/image_pack/vendor/mozjpeg/simd/i386/jdsample-sse2.asm +724 -0
  183. data/ext/image_pack/vendor/mozjpeg/simd/i386/jfdctflt-3dn.asm +318 -0
  184. data/ext/image_pack/vendor/mozjpeg/simd/i386/jfdctflt-sse.asm +369 -0
  185. data/ext/image_pack/vendor/mozjpeg/simd/i386/jfdctfst-mmx.asm +395 -0
  186. data/ext/image_pack/vendor/mozjpeg/simd/i386/jfdctfst-sse2.asm +403 -0
  187. data/ext/image_pack/vendor/mozjpeg/simd/i386/jfdctint-avx2.asm +331 -0
  188. data/ext/image_pack/vendor/mozjpeg/simd/i386/jfdctint-mmx.asm +620 -0
  189. data/ext/image_pack/vendor/mozjpeg/simd/i386/jfdctint-sse2.asm +633 -0
  190. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctflt-3dn.asm +451 -0
  191. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctflt-sse.asm +571 -0
  192. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctflt-sse2.asm +497 -0
  193. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctfst-mmx.asm +499 -0
  194. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctfst-sse2.asm +501 -0
  195. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctint-avx2.asm +453 -0
  196. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctint-mmx.asm +851 -0
  197. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctint-sse2.asm +858 -0
  198. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctred-mmx.asm +704 -0
  199. data/ext/image_pack/vendor/mozjpeg/simd/i386/jidctred-sse2.asm +592 -0
  200. data/ext/image_pack/vendor/mozjpeg/simd/i386/jquant-3dn.asm +230 -0
  201. data/ext/image_pack/vendor/mozjpeg/simd/i386/jquant-mmx.asm +276 -0
  202. data/ext/image_pack/vendor/mozjpeg/simd/i386/jquant-sse.asm +208 -0
  203. data/ext/image_pack/vendor/mozjpeg/simd/i386/jquantf-sse2.asm +168 -0
  204. data/ext/image_pack/vendor/mozjpeg/simd/i386/jquanti-avx2.asm +188 -0
  205. data/ext/image_pack/vendor/mozjpeg/simd/i386/jquanti-sse2.asm +201 -0
  206. data/ext/image_pack/vendor/mozjpeg/simd/i386/jsimd.c +1312 -0
  207. data/ext/image_pack/vendor/mozjpeg/simd/i386/jsimdcpu.asm +135 -0
  208. data/ext/image_pack/vendor/mozjpeg/simd/jsimd.h +1258 -0
  209. data/ext/image_pack/vendor/mozjpeg/simd/mips/jsimd.c +1143 -0
  210. data/ext/image_pack/vendor/mozjpeg/simd/mips/jsimd_dspr2.S +4543 -0
  211. data/ext/image_pack/vendor/mozjpeg/simd/mips/jsimd_dspr2_asm.h +292 -0
  212. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jccolext-mmi.c +455 -0
  213. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jccolor-mmi.c +148 -0
  214. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jcgray-mmi.c +132 -0
  215. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jcgryext-mmi.c +374 -0
  216. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jcsample-mmi.c +98 -0
  217. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jcsample.h +28 -0
  218. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdcolext-mmi.c +415 -0
  219. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdcolor-mmi.c +139 -0
  220. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdmerge-mmi.c +149 -0
  221. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdmrgext-mmi.c +615 -0
  222. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jdsample-mmi.c +304 -0
  223. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jfdctfst-mmi.c +255 -0
  224. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jfdctint-mmi.c +398 -0
  225. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jidctfst-mmi.c +395 -0
  226. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jidctint-mmi.c +571 -0
  227. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jquanti-mmi.c +124 -0
  228. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jsimd.c +866 -0
  229. data/ext/image_pack/vendor/mozjpeg/simd/mips64/jsimd_mmi.h +69 -0
  230. data/ext/image_pack/vendor/mozjpeg/simd/mips64/loongson-mmintrin.h +1334 -0
  231. data/ext/image_pack/vendor/mozjpeg/simd/nasm/jcolsamp.inc +135 -0
  232. data/ext/image_pack/vendor/mozjpeg/simd/nasm/jdct.inc +31 -0
  233. data/ext/image_pack/vendor/mozjpeg/simd/nasm/jsimdcfg.inc +93 -0
  234. data/ext/image_pack/vendor/mozjpeg/simd/nasm/jsimdcfg.inc.h +133 -0
  235. data/ext/image_pack/vendor/mozjpeg/simd/nasm/jsimdext.inc +520 -0
  236. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jccolext-altivec.c +269 -0
  237. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jccolor-altivec.c +116 -0
  238. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jcgray-altivec.c +111 -0
  239. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jcgryext-altivec.c +228 -0
  240. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jcsample-altivec.c +159 -0
  241. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jcsample.h +28 -0
  242. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdcolext-altivec.c +276 -0
  243. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdcolor-altivec.c +106 -0
  244. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdmerge-altivec.c +130 -0
  245. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdmrgext-altivec.c +329 -0
  246. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jdsample-altivec.c +400 -0
  247. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jfdctfst-altivec.c +154 -0
  248. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jfdctint-altivec.c +258 -0
  249. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jidctfst-altivec.c +255 -0
  250. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jidctint-altivec.c +357 -0
  251. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jquanti-altivec.c +250 -0
  252. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jsimd.c +884 -0
  253. data/ext/image_pack/vendor/mozjpeg/simd/powerpc/jsimd_altivec.h +98 -0
  254. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jccolext-avx2.asm +559 -0
  255. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jccolext-sse2.asm +484 -0
  256. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jccolor-avx2.asm +121 -0
  257. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jccolor-sse2.asm +120 -0
  258. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jcgray-avx2.asm +113 -0
  259. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jcgray-sse2.asm +112 -0
  260. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jcgryext-avx2.asm +438 -0
  261. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jcgryext-sse2.asm +363 -0
  262. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jchuff-sse2.asm +583 -0
  263. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jcphuff-sse2.asm +639 -0
  264. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jcsample-avx2.asm +367 -0
  265. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jcsample-sse2.asm +330 -0
  266. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdcolext-avx2.asm +496 -0
  267. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdcolext-sse2.asm +439 -0
  268. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdcolor-avx2.asm +118 -0
  269. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdcolor-sse2.asm +117 -0
  270. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdmerge-avx2.asm +136 -0
  271. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdmerge-sse2.asm +135 -0
  272. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdmrgext-avx2.asm +596 -0
  273. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdmrgext-sse2.asm +538 -0
  274. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdsample-avx2.asm +696 -0
  275. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jdsample-sse2.asm +665 -0
  276. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jfdctflt-sse.asm +355 -0
  277. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jfdctfst-sse2.asm +389 -0
  278. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jfdctint-avx2.asm +320 -0
  279. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jfdctint-sse2.asm +619 -0
  280. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jidctflt-sse2.asm +482 -0
  281. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jidctfst-sse2.asm +491 -0
  282. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jidctint-avx2.asm +418 -0
  283. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jidctint-sse2.asm +847 -0
  284. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jidctred-sse2.asm +574 -0
  285. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jquantf-sse2.asm +155 -0
  286. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jquanti-avx2.asm +163 -0
  287. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jquanti-sse2.asm +188 -0
  288. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jsimd.c +1110 -0
  289. data/ext/image_pack/vendor/mozjpeg/simd/x86_64/jsimdcpu.asm +86 -0
  290. data/ext/image_pack/vendor/mozjpeg/strtest.c +170 -0
  291. data/ext/image_pack/vendor/mozjpeg/structure.txt +900 -0
  292. data/ext/image_pack/vendor/mozjpeg/tjbench.c +1044 -0
  293. data/ext/image_pack/vendor/mozjpeg/tjbenchtest.in +256 -0
  294. data/ext/image_pack/vendor/mozjpeg/tjbenchtest.java.in +215 -0
  295. data/ext/image_pack/vendor/mozjpeg/tjexample.c +406 -0
  296. data/ext/image_pack/vendor/mozjpeg/tjexampletest.in +149 -0
  297. data/ext/image_pack/vendor/mozjpeg/tjexampletest.java.in +151 -0
  298. data/ext/image_pack/vendor/mozjpeg/tjunittest.c +961 -0
  299. data/ext/image_pack/vendor/mozjpeg/tjutil.c +70 -0
  300. data/ext/image_pack/vendor/mozjpeg/tjutil.h +53 -0
  301. data/ext/image_pack/vendor/mozjpeg/transupp.c +2373 -0
  302. data/ext/image_pack/vendor/mozjpeg/transupp.h +243 -0
  303. data/ext/image_pack/vendor/mozjpeg/turbojpeg-jni.c +1259 -0
  304. data/ext/image_pack/vendor/mozjpeg/turbojpeg.c +2320 -0
  305. data/ext/image_pack/vendor/mozjpeg/turbojpeg.h +1784 -0
  306. data/ext/image_pack/vendor/mozjpeg/usage.txt +679 -0
  307. data/ext/image_pack/vendor/mozjpeg/wizard.txt +220 -0
  308. data/ext/image_pack/vendor/mozjpeg/wrbmp.c +552 -0
  309. data/ext/image_pack/vendor/mozjpeg/wrgif.c +580 -0
  310. data/ext/image_pack/vendor/mozjpeg/wrjpgcom.c +577 -0
  311. data/ext/image_pack/vendor/mozjpeg/wrppm.c +366 -0
  312. data/ext/image_pack/vendor/mozjpeg/wrtarga.c +258 -0
  313. data/ext/image_pack/vendor/mozjpeg/yuvjpeg.c +268 -0
  314. data/lib/image_pack/backend.rb +8 -0
  315. data/lib/image_pack/configuration.rb +23 -0
  316. data/lib/image_pack/errors.rb +13 -0
  317. data/lib/image_pack/version.rb +5 -0
  318. data/lib/image_pack.rb +208 -0
  319. metadata +433 -0
@@ -0,0 +1,439 @@
1
+ ;
2
+ ; jdcolext.asm - colorspace conversion (64-bit SSE2)
3
+ ;
4
+ ; Copyright 2009, 2012 Pierre Ossman <ossman@cendio.se> for Cendio AB
5
+ ; Copyright (C) 2009, 2012, 2016, D. R. Commander.
6
+ ; Copyright (C) 2018, Matthias Räncker.
7
+ ;
8
+ ; Based on the x86 SIMD extension for IJG JPEG library
9
+ ; Copyright (C) 1999-2006, MIYASAKA Masaru.
10
+ ; For conditions of distribution and use, see copyright notice in jsimdext.inc
11
+ ;
12
+ ; This file should be assembled with NASM (Netwide Assembler),
13
+ ; can *not* be assembled with Microsoft's MASM or any compatible
14
+ ; assembler (including Borland's Turbo Assembler).
15
+ ; NASM is available from http://nasm.sourceforge.net/ or
16
+ ; http://sourceforge.net/project/showfiles.php?group_id=6208
17
+
18
+ %include "jcolsamp.inc"
19
+
20
+ ; --------------------------------------------------------------------------
21
+ ;
22
+ ; Convert some rows of samples to the output colorspace.
23
+ ;
24
+ ; GLOBAL(void)
25
+ ; jsimd_ycc_rgb_convert_sse2(JDIMENSION out_width, JSAMPIMAGE input_buf,
26
+ ; JDIMENSION input_row, JSAMPARRAY output_buf,
27
+ ; int num_rows)
28
+ ;
29
+
30
+ ; r10d = JDIMENSION out_width
31
+ ; r11 = JSAMPIMAGE input_buf
32
+ ; r12d = JDIMENSION input_row
33
+ ; r13 = JSAMPARRAY output_buf
34
+ ; r14d = int num_rows
35
+
36
+ %define wk(i) rbp - (WK_NUM - (i)) * SIZEOF_XMMWORD ; xmmword wk[WK_NUM]
37
+ %define WK_NUM 2
38
+
39
+ align 32
40
+ GLOBAL_FUNCTION(jsimd_ycc_rgb_convert_sse2)
41
+
42
+ EXTN(jsimd_ycc_rgb_convert_sse2):
43
+ push rbp
44
+ mov rax, rsp ; rax = original rbp
45
+ sub rsp, byte 4
46
+ and rsp, byte (-SIZEOF_XMMWORD) ; align to 128 bits
47
+ mov [rsp], rax
48
+ mov rbp, rsp ; rbp = aligned rbp
49
+ lea rsp, [wk(0)]
50
+ collect_args 5
51
+ push rbx
52
+
53
+ mov ecx, r10d ; num_cols
54
+ test rcx, rcx
55
+ jz near .return
56
+
57
+ push rcx
58
+
59
+ mov rdi, r11
60
+ mov ecx, r12d
61
+ mov rsip, JSAMPARRAY [rdi+0*SIZEOF_JSAMPARRAY]
62
+ mov rbxp, JSAMPARRAY [rdi+1*SIZEOF_JSAMPARRAY]
63
+ mov rdxp, JSAMPARRAY [rdi+2*SIZEOF_JSAMPARRAY]
64
+ lea rsi, [rsi+rcx*SIZEOF_JSAMPROW]
65
+ lea rbx, [rbx+rcx*SIZEOF_JSAMPROW]
66
+ lea rdx, [rdx+rcx*SIZEOF_JSAMPROW]
67
+
68
+ pop rcx
69
+
70
+ mov rdi, r13
71
+ mov eax, r14d
72
+ test rax, rax
73
+ jle near .return
74
+ .rowloop:
75
+ push rax
76
+ push rdi
77
+ push rdx
78
+ push rbx
79
+ push rsi
80
+ push rcx ; col
81
+
82
+ mov rsip, JSAMPROW [rsi] ; inptr0
83
+ mov rbxp, JSAMPROW [rbx] ; inptr1
84
+ mov rdxp, JSAMPROW [rdx] ; inptr2
85
+ mov rdip, JSAMPROW [rdi] ; outptr
86
+ .columnloop:
87
+
88
+ movdqa xmm5, XMMWORD [rbx] ; xmm5=Cb(0123456789ABCDEF)
89
+ movdqa xmm1, XMMWORD [rdx] ; xmm1=Cr(0123456789ABCDEF)
90
+
91
+ pcmpeqw xmm4, xmm4
92
+ pcmpeqw xmm7, xmm7
93
+ psrlw xmm4, BYTE_BIT
94
+ psllw xmm7, 7 ; xmm7={0xFF80 0xFF80 0xFF80 0xFF80 ..}
95
+ movdqa xmm0, xmm4 ; xmm0=xmm4={0xFF 0x00 0xFF 0x00 ..}
96
+
97
+ pand xmm4, xmm5 ; xmm4=Cb(02468ACE)=CbE
98
+ psrlw xmm5, BYTE_BIT ; xmm5=Cb(13579BDF)=CbO
99
+ pand xmm0, xmm1 ; xmm0=Cr(02468ACE)=CrE
100
+ psrlw xmm1, BYTE_BIT ; xmm1=Cr(13579BDF)=CrO
101
+
102
+ paddw xmm4, xmm7
103
+ paddw xmm5, xmm7
104
+ paddw xmm0, xmm7
105
+ paddw xmm1, xmm7
106
+
107
+ ; (Original)
108
+ ; R = Y + 1.40200 * Cr
109
+ ; G = Y - 0.34414 * Cb - 0.71414 * Cr
110
+ ; B = Y + 1.77200 * Cb
111
+ ;
112
+ ; (This implementation)
113
+ ; R = Y + 0.40200 * Cr + Cr
114
+ ; G = Y - 0.34414 * Cb + 0.28586 * Cr - Cr
115
+ ; B = Y - 0.22800 * Cb + Cb + Cb
116
+
117
+ movdqa xmm2, xmm4 ; xmm2=CbE
118
+ movdqa xmm3, xmm5 ; xmm3=CbO
119
+ paddw xmm4, xmm4 ; xmm4=2*CbE
120
+ paddw xmm5, xmm5 ; xmm5=2*CbO
121
+ movdqa xmm6, xmm0 ; xmm6=CrE
122
+ movdqa xmm7, xmm1 ; xmm7=CrO
123
+ paddw xmm0, xmm0 ; xmm0=2*CrE
124
+ paddw xmm1, xmm1 ; xmm1=2*CrO
125
+
126
+ pmulhw xmm4, [rel PW_MF0228] ; xmm4=(2*CbE * -FIX(0.22800))
127
+ pmulhw xmm5, [rel PW_MF0228] ; xmm5=(2*CbO * -FIX(0.22800))
128
+ pmulhw xmm0, [rel PW_F0402] ; xmm0=(2*CrE * FIX(0.40200))
129
+ pmulhw xmm1, [rel PW_F0402] ; xmm1=(2*CrO * FIX(0.40200))
130
+
131
+ paddw xmm4, [rel PW_ONE]
132
+ paddw xmm5, [rel PW_ONE]
133
+ psraw xmm4, 1 ; xmm4=(CbE * -FIX(0.22800))
134
+ psraw xmm5, 1 ; xmm5=(CbO * -FIX(0.22800))
135
+ paddw xmm0, [rel PW_ONE]
136
+ paddw xmm1, [rel PW_ONE]
137
+ psraw xmm0, 1 ; xmm0=(CrE * FIX(0.40200))
138
+ psraw xmm1, 1 ; xmm1=(CrO * FIX(0.40200))
139
+
140
+ paddw xmm4, xmm2
141
+ paddw xmm5, xmm3
142
+ paddw xmm4, xmm2 ; xmm4=(CbE * FIX(1.77200))=(B-Y)E
143
+ paddw xmm5, xmm3 ; xmm5=(CbO * FIX(1.77200))=(B-Y)O
144
+ paddw xmm0, xmm6 ; xmm0=(CrE * FIX(1.40200))=(R-Y)E
145
+ paddw xmm1, xmm7 ; xmm1=(CrO * FIX(1.40200))=(R-Y)O
146
+
147
+ movdqa XMMWORD [wk(0)], xmm4 ; wk(0)=(B-Y)E
148
+ movdqa XMMWORD [wk(1)], xmm5 ; wk(1)=(B-Y)O
149
+
150
+ movdqa xmm4, xmm2
151
+ movdqa xmm5, xmm3
152
+ punpcklwd xmm2, xmm6
153
+ punpckhwd xmm4, xmm6
154
+ pmaddwd xmm2, [rel PW_MF0344_F0285]
155
+ pmaddwd xmm4, [rel PW_MF0344_F0285]
156
+ punpcklwd xmm3, xmm7
157
+ punpckhwd xmm5, xmm7
158
+ pmaddwd xmm3, [rel PW_MF0344_F0285]
159
+ pmaddwd xmm5, [rel PW_MF0344_F0285]
160
+
161
+ paddd xmm2, [rel PD_ONEHALF]
162
+ paddd xmm4, [rel PD_ONEHALF]
163
+ psrad xmm2, SCALEBITS
164
+ psrad xmm4, SCALEBITS
165
+ paddd xmm3, [rel PD_ONEHALF]
166
+ paddd xmm5, [rel PD_ONEHALF]
167
+ psrad xmm3, SCALEBITS
168
+ psrad xmm5, SCALEBITS
169
+
170
+ packssdw xmm2, xmm4 ; xmm2=CbE*-FIX(0.344)+CrE*FIX(0.285)
171
+ packssdw xmm3, xmm5 ; xmm3=CbO*-FIX(0.344)+CrO*FIX(0.285)
172
+ psubw xmm2, xmm6 ; xmm2=CbE*-FIX(0.344)+CrE*-FIX(0.714)=(G-Y)E
173
+ psubw xmm3, xmm7 ; xmm3=CbO*-FIX(0.344)+CrO*-FIX(0.714)=(G-Y)O
174
+
175
+ movdqa xmm5, XMMWORD [rsi] ; xmm5=Y(0123456789ABCDEF)
176
+
177
+ pcmpeqw xmm4, xmm4
178
+ psrlw xmm4, BYTE_BIT ; xmm4={0xFF 0x00 0xFF 0x00 ..}
179
+ pand xmm4, xmm5 ; xmm4=Y(02468ACE)=YE
180
+ psrlw xmm5, BYTE_BIT ; xmm5=Y(13579BDF)=YO
181
+
182
+ paddw xmm0, xmm4 ; xmm0=((R-Y)E+YE)=RE=R(02468ACE)
183
+ paddw xmm1, xmm5 ; xmm1=((R-Y)O+YO)=RO=R(13579BDF)
184
+ packuswb xmm0, xmm0 ; xmm0=R(02468ACE********)
185
+ packuswb xmm1, xmm1 ; xmm1=R(13579BDF********)
186
+
187
+ paddw xmm2, xmm4 ; xmm2=((G-Y)E+YE)=GE=G(02468ACE)
188
+ paddw xmm3, xmm5 ; xmm3=((G-Y)O+YO)=GO=G(13579BDF)
189
+ packuswb xmm2, xmm2 ; xmm2=G(02468ACE********)
190
+ packuswb xmm3, xmm3 ; xmm3=G(13579BDF********)
191
+
192
+ paddw xmm4, XMMWORD [wk(0)] ; xmm4=(YE+(B-Y)E)=BE=B(02468ACE)
193
+ paddw xmm5, XMMWORD [wk(1)] ; xmm5=(YO+(B-Y)O)=BO=B(13579BDF)
194
+ packuswb xmm4, xmm4 ; xmm4=B(02468ACE********)
195
+ packuswb xmm5, xmm5 ; xmm5=B(13579BDF********)
196
+
197
+ %if RGB_PIXELSIZE == 3 ; ---------------
198
+
199
+ ; xmmA=(00 02 04 06 08 0A 0C 0E **), xmmB=(01 03 05 07 09 0B 0D 0F **)
200
+ ; xmmC=(10 12 14 16 18 1A 1C 1E **), xmmD=(11 13 15 17 19 1B 1D 1F **)
201
+ ; xmmE=(20 22 24 26 28 2A 2C 2E **), xmmF=(21 23 25 27 29 2B 2D 2F **)
202
+ ; xmmG=(** ** ** ** ** ** ** ** **), xmmH=(** ** ** ** ** ** ** ** **)
203
+
204
+ punpcklbw xmmA, xmmC ; xmmA=(00 10 02 12 04 14 06 16 08 18 0A 1A 0C 1C 0E 1E)
205
+ punpcklbw xmmE, xmmB ; xmmE=(20 01 22 03 24 05 26 07 28 09 2A 0B 2C 0D 2E 0F)
206
+ punpcklbw xmmD, xmmF ; xmmD=(11 21 13 23 15 25 17 27 19 29 1B 2B 1D 2D 1F 2F)
207
+
208
+ movdqa xmmG, xmmA
209
+ movdqa xmmH, xmmA
210
+ punpcklwd xmmA, xmmE ; xmmA=(00 10 20 01 02 12 22 03 04 14 24 05 06 16 26 07)
211
+ punpckhwd xmmG, xmmE ; xmmG=(08 18 28 09 0A 1A 2A 0B 0C 1C 2C 0D 0E 1E 2E 0F)
212
+
213
+ psrldq xmmH, 2 ; xmmH=(02 12 04 14 06 16 08 18 0A 1A 0C 1C 0E 1E -- --)
214
+ psrldq xmmE, 2 ; xmmE=(22 03 24 05 26 07 28 09 2A 0B 2C 0D 2E 0F -- --)
215
+
216
+ movdqa xmmC, xmmD
217
+ movdqa xmmB, xmmD
218
+ punpcklwd xmmD, xmmH ; xmmD=(11 21 02 12 13 23 04 14 15 25 06 16 17 27 08 18)
219
+ punpckhwd xmmC, xmmH ; xmmC=(19 29 0A 1A 1B 2B 0C 1C 1D 2D 0E 1E 1F 2F -- --)
220
+
221
+ psrldq xmmB, 2 ; xmmB=(13 23 15 25 17 27 19 29 1B 2B 1D 2D 1F 2F -- --)
222
+
223
+ movdqa xmmF, xmmE
224
+ punpcklwd xmmE, xmmB ; xmmE=(22 03 13 23 24 05 15 25 26 07 17 27 28 09 19 29)
225
+ punpckhwd xmmF, xmmB ; xmmF=(2A 0B 1B 2B 2C 0D 1D 2D 2E 0F 1F 2F -- -- -- --)
226
+
227
+ pshufd xmmH, xmmA, 0x4E ; xmmH=(04 14 24 05 06 16 26 07 00 10 20 01 02 12 22 03)
228
+ movdqa xmmB, xmmE
229
+ punpckldq xmmA, xmmD ; xmmA=(00 10 20 01 11 21 02 12 02 12 22 03 13 23 04 14)
230
+ punpckldq xmmE, xmmH ; xmmE=(22 03 13 23 04 14 24 05 24 05 15 25 06 16 26 07)
231
+ punpckhdq xmmD, xmmB ; xmmD=(15 25 06 16 26 07 17 27 17 27 08 18 28 09 19 29)
232
+
233
+ pshufd xmmH, xmmG, 0x4E ; xmmH=(0C 1C 2C 0D 0E 1E 2E 0F 08 18 28 09 0A 1A 2A 0B)
234
+ movdqa xmmB, xmmF
235
+ punpckldq xmmG, xmmC ; xmmG=(08 18 28 09 19 29 0A 1A 0A 1A 2A 0B 1B 2B 0C 1C)
236
+ punpckldq xmmF, xmmH ; xmmF=(2A 0B 1B 2B 0C 1C 2C 0D 2C 0D 1D 2D 0E 1E 2E 0F)
237
+ punpckhdq xmmC, xmmB ; xmmC=(1D 2D 0E 1E 2E 0F 1F 2F 1F 2F -- -- -- -- -- --)
238
+
239
+ punpcklqdq xmmA, xmmE ; xmmA=(00 10 20 01 11 21 02 12 22 03 13 23 04 14 24 05)
240
+ punpcklqdq xmmD, xmmG ; xmmD=(15 25 06 16 26 07 17 27 08 18 28 09 19 29 0A 1A)
241
+ punpcklqdq xmmF, xmmC ; xmmF=(2A 0B 1B 2B 0C 1C 2C 0D 1D 2D 0E 1E 2E 0F 1F 2F)
242
+
243
+ cmp rcx, byte SIZEOF_XMMWORD
244
+ jb short .column_st32
245
+
246
+ test rdi, SIZEOF_XMMWORD-1
247
+ jnz short .out1
248
+ ; --(aligned)-------------------
249
+ movntdq XMMWORD [rdi+0*SIZEOF_XMMWORD], xmmA
250
+ movntdq XMMWORD [rdi+1*SIZEOF_XMMWORD], xmmD
251
+ movntdq XMMWORD [rdi+2*SIZEOF_XMMWORD], xmmF
252
+ jmp short .out0
253
+ .out1: ; --(unaligned)-----------------
254
+ movdqu XMMWORD [rdi+0*SIZEOF_XMMWORD], xmmA
255
+ movdqu XMMWORD [rdi+1*SIZEOF_XMMWORD], xmmD
256
+ movdqu XMMWORD [rdi+2*SIZEOF_XMMWORD], xmmF
257
+ .out0:
258
+ add rdi, byte RGB_PIXELSIZE*SIZEOF_XMMWORD ; outptr
259
+ sub rcx, byte SIZEOF_XMMWORD
260
+ jz near .nextrow
261
+
262
+ add rsi, byte SIZEOF_XMMWORD ; inptr0
263
+ add rbx, byte SIZEOF_XMMWORD ; inptr1
264
+ add rdx, byte SIZEOF_XMMWORD ; inptr2
265
+ jmp near .columnloop
266
+
267
+ .column_st32:
268
+ lea rcx, [rcx+rcx*2] ; imul ecx, RGB_PIXELSIZE
269
+ cmp rcx, byte 2*SIZEOF_XMMWORD
270
+ jb short .column_st16
271
+ movdqu XMMWORD [rdi+0*SIZEOF_XMMWORD], xmmA
272
+ movdqu XMMWORD [rdi+1*SIZEOF_XMMWORD], xmmD
273
+ add rdi, byte 2*SIZEOF_XMMWORD ; outptr
274
+ movdqa xmmA, xmmF
275
+ sub rcx, byte 2*SIZEOF_XMMWORD
276
+ jmp short .column_st15
277
+ .column_st16:
278
+ cmp rcx, byte SIZEOF_XMMWORD
279
+ jb short .column_st15
280
+ movdqu XMMWORD [rdi+0*SIZEOF_XMMWORD], xmmA
281
+ add rdi, byte SIZEOF_XMMWORD ; outptr
282
+ movdqa xmmA, xmmD
283
+ sub rcx, byte SIZEOF_XMMWORD
284
+ .column_st15:
285
+ ; Store the lower 8 bytes of xmmA to the output when it has enough
286
+ ; space.
287
+ cmp rcx, byte SIZEOF_MMWORD
288
+ jb short .column_st7
289
+ movq XMM_MMWORD [rdi], xmmA
290
+ add rdi, byte SIZEOF_MMWORD
291
+ sub rcx, byte SIZEOF_MMWORD
292
+ psrldq xmmA, SIZEOF_MMWORD
293
+ .column_st7:
294
+ ; Store the lower 4 bytes of xmmA to the output when it has enough
295
+ ; space.
296
+ cmp rcx, byte SIZEOF_DWORD
297
+ jb short .column_st3
298
+ movd XMM_DWORD [rdi], xmmA
299
+ add rdi, byte SIZEOF_DWORD
300
+ sub rcx, byte SIZEOF_DWORD
301
+ psrldq xmmA, SIZEOF_DWORD
302
+ .column_st3:
303
+ ; Store the lower 2 bytes of rax to the output when it has enough
304
+ ; space.
305
+ movd eax, xmmA
306
+ cmp rcx, byte SIZEOF_WORD
307
+ jb short .column_st1
308
+ mov word [rdi], ax
309
+ add rdi, byte SIZEOF_WORD
310
+ sub rcx, byte SIZEOF_WORD
311
+ shr rax, 16
312
+ .column_st1:
313
+ ; Store the lower 1 byte of rax to the output when it has enough
314
+ ; space.
315
+ test rcx, rcx
316
+ jz short .nextrow
317
+ mov byte [rdi], al
318
+
319
+ %else ; RGB_PIXELSIZE == 4 ; -----------
320
+
321
+ %ifdef RGBX_FILLER_0XFF
322
+ pcmpeqb xmm6, xmm6 ; xmm6=XE=X(02468ACE********)
323
+ pcmpeqb xmm7, xmm7 ; xmm7=XO=X(13579BDF********)
324
+ %else
325
+ pxor xmm6, xmm6 ; xmm6=XE=X(02468ACE********)
326
+ pxor xmm7, xmm7 ; xmm7=XO=X(13579BDF********)
327
+ %endif
328
+ ; xmmA=(00 02 04 06 08 0A 0C 0E **), xmmB=(01 03 05 07 09 0B 0D 0F **)
329
+ ; xmmC=(10 12 14 16 18 1A 1C 1E **), xmmD=(11 13 15 17 19 1B 1D 1F **)
330
+ ; xmmE=(20 22 24 26 28 2A 2C 2E **), xmmF=(21 23 25 27 29 2B 2D 2F **)
331
+ ; xmmG=(30 32 34 36 38 3A 3C 3E **), xmmH=(31 33 35 37 39 3B 3D 3F **)
332
+
333
+ punpcklbw xmmA, xmmC ; xmmA=(00 10 02 12 04 14 06 16 08 18 0A 1A 0C 1C 0E 1E)
334
+ punpcklbw xmmE, xmmG ; xmmE=(20 30 22 32 24 34 26 36 28 38 2A 3A 2C 3C 2E 3E)
335
+ punpcklbw xmmB, xmmD ; xmmB=(01 11 03 13 05 15 07 17 09 19 0B 1B 0D 1D 0F 1F)
336
+ punpcklbw xmmF, xmmH ; xmmF=(21 31 23 33 25 35 27 37 29 39 2B 3B 2D 3D 2F 3F)
337
+
338
+ movdqa xmmC, xmmA
339
+ punpcklwd xmmA, xmmE ; xmmA=(00 10 20 30 02 12 22 32 04 14 24 34 06 16 26 36)
340
+ punpckhwd xmmC, xmmE ; xmmC=(08 18 28 38 0A 1A 2A 3A 0C 1C 2C 3C 0E 1E 2E 3E)
341
+ movdqa xmmG, xmmB
342
+ punpcklwd xmmB, xmmF ; xmmB=(01 11 21 31 03 13 23 33 05 15 25 35 07 17 27 37)
343
+ punpckhwd xmmG, xmmF ; xmmG=(09 19 29 39 0B 1B 2B 3B 0D 1D 2D 3D 0F 1F 2F 3F)
344
+
345
+ movdqa xmmD, xmmA
346
+ punpckldq xmmA, xmmB ; xmmA=(00 10 20 30 01 11 21 31 02 12 22 32 03 13 23 33)
347
+ punpckhdq xmmD, xmmB ; xmmD=(04 14 24 34 05 15 25 35 06 16 26 36 07 17 27 37)
348
+ movdqa xmmH, xmmC
349
+ punpckldq xmmC, xmmG ; xmmC=(08 18 28 38 09 19 29 39 0A 1A 2A 3A 0B 1B 2B 3B)
350
+ punpckhdq xmmH, xmmG ; xmmH=(0C 1C 2C 3C 0D 1D 2D 3D 0E 1E 2E 3E 0F 1F 2F 3F)
351
+
352
+ cmp rcx, byte SIZEOF_XMMWORD
353
+ jb short .column_st32
354
+
355
+ test rdi, SIZEOF_XMMWORD-1
356
+ jnz short .out1
357
+ ; --(aligned)-------------------
358
+ movntdq XMMWORD [rdi+0*SIZEOF_XMMWORD], xmmA
359
+ movntdq XMMWORD [rdi+1*SIZEOF_XMMWORD], xmmD
360
+ movntdq XMMWORD [rdi+2*SIZEOF_XMMWORD], xmmC
361
+ movntdq XMMWORD [rdi+3*SIZEOF_XMMWORD], xmmH
362
+ jmp short .out0
363
+ .out1: ; --(unaligned)-----------------
364
+ movdqu XMMWORD [rdi+0*SIZEOF_XMMWORD], xmmA
365
+ movdqu XMMWORD [rdi+1*SIZEOF_XMMWORD], xmmD
366
+ movdqu XMMWORD [rdi+2*SIZEOF_XMMWORD], xmmC
367
+ movdqu XMMWORD [rdi+3*SIZEOF_XMMWORD], xmmH
368
+ .out0:
369
+ add rdi, byte RGB_PIXELSIZE*SIZEOF_XMMWORD ; outptr
370
+ sub rcx, byte SIZEOF_XMMWORD
371
+ jz near .nextrow
372
+
373
+ add rsi, byte SIZEOF_XMMWORD ; inptr0
374
+ add rbx, byte SIZEOF_XMMWORD ; inptr1
375
+ add rdx, byte SIZEOF_XMMWORD ; inptr2
376
+ jmp near .columnloop
377
+
378
+ .column_st32:
379
+ cmp rcx, byte SIZEOF_XMMWORD/2
380
+ jb short .column_st16
381
+ movdqu XMMWORD [rdi+0*SIZEOF_XMMWORD], xmmA
382
+ movdqu XMMWORD [rdi+1*SIZEOF_XMMWORD], xmmD
383
+ add rdi, byte 2*SIZEOF_XMMWORD ; outptr
384
+ movdqa xmmA, xmmC
385
+ movdqa xmmD, xmmH
386
+ sub rcx, byte SIZEOF_XMMWORD/2
387
+ .column_st16:
388
+ cmp rcx, byte SIZEOF_XMMWORD/4
389
+ jb short .column_st15
390
+ movdqu XMMWORD [rdi+0*SIZEOF_XMMWORD], xmmA
391
+ add rdi, byte SIZEOF_XMMWORD ; outptr
392
+ movdqa xmmA, xmmD
393
+ sub rcx, byte SIZEOF_XMMWORD/4
394
+ .column_st15:
395
+ ; Store two pixels (8 bytes) of xmmA to the output when it has enough
396
+ ; space.
397
+ cmp rcx, byte SIZEOF_XMMWORD/8
398
+ jb short .column_st7
399
+ movq MMWORD [rdi], xmmA
400
+ add rdi, byte SIZEOF_XMMWORD/8*4
401
+ sub rcx, byte SIZEOF_XMMWORD/8
402
+ psrldq xmmA, SIZEOF_XMMWORD/8*4
403
+ .column_st7:
404
+ ; Store one pixel (4 bytes) of xmmA to the output when it has enough
405
+ ; space.
406
+ test rcx, rcx
407
+ jz short .nextrow
408
+ movd XMM_DWORD [rdi], xmmA
409
+
410
+ %endif ; RGB_PIXELSIZE ; ---------------
411
+
412
+ .nextrow:
413
+ pop rcx
414
+ pop rsi
415
+ pop rbx
416
+ pop rdx
417
+ pop rdi
418
+ pop rax
419
+
420
+ add rsi, byte SIZEOF_JSAMPROW
421
+ add rbx, byte SIZEOF_JSAMPROW
422
+ add rdx, byte SIZEOF_JSAMPROW
423
+ add rdi, byte SIZEOF_JSAMPROW ; output_buf
424
+ dec rax ; num_rows
425
+ jg near .rowloop
426
+
427
+ sfence ; flush the write buffer
428
+
429
+ .return:
430
+ pop rbx
431
+ uncollect_args 5
432
+ mov rsp, rbp ; rsp <- aligned rbp
433
+ pop rsp ; rsp <- original rbp
434
+ pop rbp
435
+ ret
436
+
437
+ ; For some reason, the OS X linker does not honor the request to align the
438
+ ; segment unless we do this.
439
+ align 32
@@ -0,0 +1,118 @@
1
+ ;
2
+ ; jdcolor.asm - colorspace conversion (64-bit AVX2)
3
+ ;
4
+ ; Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
5
+ ; Copyright (C) 2009, 2016, D. R. Commander.
6
+ ; Copyright (C) 2015, Intel Corporation.
7
+ ;
8
+ ; Based on the x86 SIMD extension for IJG JPEG library
9
+ ; Copyright (C) 1999-2006, MIYASAKA Masaru.
10
+ ; For conditions of distribution and use, see copyright notice in jsimdext.inc
11
+ ;
12
+ ; This file should be assembled with NASM (Netwide Assembler),
13
+ ; can *not* be assembled with Microsoft's MASM or any compatible
14
+ ; assembler (including Borland's Turbo Assembler).
15
+ ; NASM is available from http://nasm.sourceforge.net/ or
16
+ ; http://sourceforge.net/project/showfiles.php?group_id=6208
17
+
18
+ %include "jsimdext.inc"
19
+
20
+ ; --------------------------------------------------------------------------
21
+
22
+ %define SCALEBITS 16
23
+
24
+ F_0_344 equ 22554 ; FIX(0.34414)
25
+ F_0_714 equ 46802 ; FIX(0.71414)
26
+ F_1_402 equ 91881 ; FIX(1.40200)
27
+ F_1_772 equ 116130 ; FIX(1.77200)
28
+ F_0_402 equ (F_1_402 - 65536) ; FIX(1.40200) - FIX(1)
29
+ F_0_285 equ ( 65536 - F_0_714) ; FIX(1) - FIX(0.71414)
30
+ F_0_228 equ (131072 - F_1_772) ; FIX(2) - FIX(1.77200)
31
+
32
+ ; --------------------------------------------------------------------------
33
+ SECTION SEG_CONST
34
+
35
+ alignz 32
36
+ GLOBAL_DATA(jconst_ycc_rgb_convert_avx2)
37
+
38
+ EXTN(jconst_ycc_rgb_convert_avx2):
39
+
40
+ PW_F0402 times 16 dw F_0_402
41
+ PW_MF0228 times 16 dw -F_0_228
42
+ PW_MF0344_F0285 times 8 dw -F_0_344, F_0_285
43
+ PW_ONE times 16 dw 1
44
+ PD_ONEHALF times 8 dd 1 << (SCALEBITS - 1)
45
+
46
+ alignz 32
47
+
48
+ ; --------------------------------------------------------------------------
49
+ SECTION SEG_TEXT
50
+ BITS 64
51
+
52
+ %include "jdcolext-avx2.asm"
53
+
54
+ %undef RGB_RED
55
+ %undef RGB_GREEN
56
+ %undef RGB_BLUE
57
+ %undef RGB_PIXELSIZE
58
+ %define RGB_RED EXT_RGB_RED
59
+ %define RGB_GREEN EXT_RGB_GREEN
60
+ %define RGB_BLUE EXT_RGB_BLUE
61
+ %define RGB_PIXELSIZE EXT_RGB_PIXELSIZE
62
+ %define jsimd_ycc_rgb_convert_avx2 jsimd_ycc_extrgb_convert_avx2
63
+ %include "jdcolext-avx2.asm"
64
+
65
+ %undef RGB_RED
66
+ %undef RGB_GREEN
67
+ %undef RGB_BLUE
68
+ %undef RGB_PIXELSIZE
69
+ %define RGB_RED EXT_RGBX_RED
70
+ %define RGB_GREEN EXT_RGBX_GREEN
71
+ %define RGB_BLUE EXT_RGBX_BLUE
72
+ %define RGB_PIXELSIZE EXT_RGBX_PIXELSIZE
73
+ %define jsimd_ycc_rgb_convert_avx2 jsimd_ycc_extrgbx_convert_avx2
74
+ %include "jdcolext-avx2.asm"
75
+
76
+ %undef RGB_RED
77
+ %undef RGB_GREEN
78
+ %undef RGB_BLUE
79
+ %undef RGB_PIXELSIZE
80
+ %define RGB_RED EXT_BGR_RED
81
+ %define RGB_GREEN EXT_BGR_GREEN
82
+ %define RGB_BLUE EXT_BGR_BLUE
83
+ %define RGB_PIXELSIZE EXT_BGR_PIXELSIZE
84
+ %define jsimd_ycc_rgb_convert_avx2 jsimd_ycc_extbgr_convert_avx2
85
+ %include "jdcolext-avx2.asm"
86
+
87
+ %undef RGB_RED
88
+ %undef RGB_GREEN
89
+ %undef RGB_BLUE
90
+ %undef RGB_PIXELSIZE
91
+ %define RGB_RED EXT_BGRX_RED
92
+ %define RGB_GREEN EXT_BGRX_GREEN
93
+ %define RGB_BLUE EXT_BGRX_BLUE
94
+ %define RGB_PIXELSIZE EXT_BGRX_PIXELSIZE
95
+ %define jsimd_ycc_rgb_convert_avx2 jsimd_ycc_extbgrx_convert_avx2
96
+ %include "jdcolext-avx2.asm"
97
+
98
+ %undef RGB_RED
99
+ %undef RGB_GREEN
100
+ %undef RGB_BLUE
101
+ %undef RGB_PIXELSIZE
102
+ %define RGB_RED EXT_XBGR_RED
103
+ %define RGB_GREEN EXT_XBGR_GREEN
104
+ %define RGB_BLUE EXT_XBGR_BLUE
105
+ %define RGB_PIXELSIZE EXT_XBGR_PIXELSIZE
106
+ %define jsimd_ycc_rgb_convert_avx2 jsimd_ycc_extxbgr_convert_avx2
107
+ %include "jdcolext-avx2.asm"
108
+
109
+ %undef RGB_RED
110
+ %undef RGB_GREEN
111
+ %undef RGB_BLUE
112
+ %undef RGB_PIXELSIZE
113
+ %define RGB_RED EXT_XRGB_RED
114
+ %define RGB_GREEN EXT_XRGB_GREEN
115
+ %define RGB_BLUE EXT_XRGB_BLUE
116
+ %define RGB_PIXELSIZE EXT_XRGB_PIXELSIZE
117
+ %define jsimd_ycc_rgb_convert_avx2 jsimd_ycc_extxrgb_convert_avx2
118
+ %include "jdcolext-avx2.asm"
@@ -0,0 +1,117 @@
1
+ ;
2
+ ; jdcolor.asm - colorspace conversion (64-bit SSE2)
3
+ ;
4
+ ; Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
5
+ ; Copyright (C) 2009, 2016, D. R. Commander.
6
+ ;
7
+ ; Based on the x86 SIMD extension for IJG JPEG library
8
+ ; Copyright (C) 1999-2006, MIYASAKA Masaru.
9
+ ; For conditions of distribution and use, see copyright notice in jsimdext.inc
10
+ ;
11
+ ; This file should be assembled with NASM (Netwide Assembler),
12
+ ; can *not* be assembled with Microsoft's MASM or any compatible
13
+ ; assembler (including Borland's Turbo Assembler).
14
+ ; NASM is available from http://nasm.sourceforge.net/ or
15
+ ; http://sourceforge.net/project/showfiles.php?group_id=6208
16
+
17
+ %include "jsimdext.inc"
18
+
19
+ ; --------------------------------------------------------------------------
20
+
21
+ %define SCALEBITS 16
22
+
23
+ F_0_344 equ 22554 ; FIX(0.34414)
24
+ F_0_714 equ 46802 ; FIX(0.71414)
25
+ F_1_402 equ 91881 ; FIX(1.40200)
26
+ F_1_772 equ 116130 ; FIX(1.77200)
27
+ F_0_402 equ (F_1_402 - 65536) ; FIX(1.40200) - FIX(1)
28
+ F_0_285 equ ( 65536 - F_0_714) ; FIX(1) - FIX(0.71414)
29
+ F_0_228 equ (131072 - F_1_772) ; FIX(2) - FIX(1.77200)
30
+
31
+ ; --------------------------------------------------------------------------
32
+ SECTION SEG_CONST
33
+
34
+ alignz 32
35
+ GLOBAL_DATA(jconst_ycc_rgb_convert_sse2)
36
+
37
+ EXTN(jconst_ycc_rgb_convert_sse2):
38
+
39
+ PW_F0402 times 8 dw F_0_402
40
+ PW_MF0228 times 8 dw -F_0_228
41
+ PW_MF0344_F0285 times 4 dw -F_0_344, F_0_285
42
+ PW_ONE times 8 dw 1
43
+ PD_ONEHALF times 4 dd 1 << (SCALEBITS - 1)
44
+
45
+ alignz 32
46
+
47
+ ; --------------------------------------------------------------------------
48
+ SECTION SEG_TEXT
49
+ BITS 64
50
+
51
+ %include "jdcolext-sse2.asm"
52
+
53
+ %undef RGB_RED
54
+ %undef RGB_GREEN
55
+ %undef RGB_BLUE
56
+ %undef RGB_PIXELSIZE
57
+ %define RGB_RED EXT_RGB_RED
58
+ %define RGB_GREEN EXT_RGB_GREEN
59
+ %define RGB_BLUE EXT_RGB_BLUE
60
+ %define RGB_PIXELSIZE EXT_RGB_PIXELSIZE
61
+ %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extrgb_convert_sse2
62
+ %include "jdcolext-sse2.asm"
63
+
64
+ %undef RGB_RED
65
+ %undef RGB_GREEN
66
+ %undef RGB_BLUE
67
+ %undef RGB_PIXELSIZE
68
+ %define RGB_RED EXT_RGBX_RED
69
+ %define RGB_GREEN EXT_RGBX_GREEN
70
+ %define RGB_BLUE EXT_RGBX_BLUE
71
+ %define RGB_PIXELSIZE EXT_RGBX_PIXELSIZE
72
+ %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extrgbx_convert_sse2
73
+ %include "jdcolext-sse2.asm"
74
+
75
+ %undef RGB_RED
76
+ %undef RGB_GREEN
77
+ %undef RGB_BLUE
78
+ %undef RGB_PIXELSIZE
79
+ %define RGB_RED EXT_BGR_RED
80
+ %define RGB_GREEN EXT_BGR_GREEN
81
+ %define RGB_BLUE EXT_BGR_BLUE
82
+ %define RGB_PIXELSIZE EXT_BGR_PIXELSIZE
83
+ %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extbgr_convert_sse2
84
+ %include "jdcolext-sse2.asm"
85
+
86
+ %undef RGB_RED
87
+ %undef RGB_GREEN
88
+ %undef RGB_BLUE
89
+ %undef RGB_PIXELSIZE
90
+ %define RGB_RED EXT_BGRX_RED
91
+ %define RGB_GREEN EXT_BGRX_GREEN
92
+ %define RGB_BLUE EXT_BGRX_BLUE
93
+ %define RGB_PIXELSIZE EXT_BGRX_PIXELSIZE
94
+ %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extbgrx_convert_sse2
95
+ %include "jdcolext-sse2.asm"
96
+
97
+ %undef RGB_RED
98
+ %undef RGB_GREEN
99
+ %undef RGB_BLUE
100
+ %undef RGB_PIXELSIZE
101
+ %define RGB_RED EXT_XBGR_RED
102
+ %define RGB_GREEN EXT_XBGR_GREEN
103
+ %define RGB_BLUE EXT_XBGR_BLUE
104
+ %define RGB_PIXELSIZE EXT_XBGR_PIXELSIZE
105
+ %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extxbgr_convert_sse2
106
+ %include "jdcolext-sse2.asm"
107
+
108
+ %undef RGB_RED
109
+ %undef RGB_GREEN
110
+ %undef RGB_BLUE
111
+ %undef RGB_PIXELSIZE
112
+ %define RGB_RED EXT_XRGB_RED
113
+ %define RGB_GREEN EXT_XRGB_GREEN
114
+ %define RGB_BLUE EXT_XRGB_BLUE
115
+ %define RGB_PIXELSIZE EXT_XRGB_PIXELSIZE
116
+ %define jsimd_ycc_rgb_convert_sse2 jsimd_ycc_extxrgb_convert_sse2
117
+ %include "jdcolext-sse2.asm"