pango 2.2.4-x64-mingw32
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +7 -0
- data/README +33 -0
- data/Rakefile +65 -0
- data/ext/pango/depend +12 -0
- data/ext/pango/extconf.rb +90 -0
- data/ext/pango/pango.def +18 -0
- data/ext/pango/rbpango.c +318 -0
- data/ext/pango/rbpango.h +96 -0
- data/ext/pango/rbpangoanalysis.c +218 -0
- data/ext/pango/rbpangoattribute.c +499 -0
- data/ext/pango/rbpangoattriterator.c +141 -0
- data/ext/pango/rbpangoattrlist.c +101 -0
- data/ext/pango/rbpangocairo.c +122 -0
- data/ext/pango/rbpangocairocontext.c +131 -0
- data/ext/pango/rbpangocolor.c +120 -0
- data/ext/pango/rbpangocontext.c +309 -0
- data/ext/pango/rbpangoconversions.h +111 -0
- data/ext/pango/rbpangocoverage.c +106 -0
- data/ext/pango/rbpangoengine.c +73 -0
- data/ext/pango/rbpangofont.c +110 -0
- data/ext/pango/rbpangofontdescription.c +282 -0
- data/ext/pango/rbpangofontface.c +73 -0
- data/ext/pango/rbpangofontfamily.c +79 -0
- data/ext/pango/rbpangofontmap.c +102 -0
- data/ext/pango/rbpangofontmetrics.c +85 -0
- data/ext/pango/rbpangofontset.c +69 -0
- data/ext/pango/rbpangofontsetsimple.c +60 -0
- data/ext/pango/rbpangoglyphinfo.c +123 -0
- data/ext/pango/rbpangoglyphitem.c +125 -0
- data/ext/pango/rbpangoglyphstring.c +151 -0
- data/ext/pango/rbpangogravity.c +54 -0
- data/ext/pango/rbpangoitem.c +95 -0
- data/ext/pango/rbpangolanguage.c +86 -0
- data/ext/pango/rbpangolayout.c +572 -0
- data/ext/pango/rbpangolayoutiter.c +189 -0
- data/ext/pango/rbpangolayoutline.c +239 -0
- data/ext/pango/rbpangologattr.c +109 -0
- data/ext/pango/rbpangomatrix.c +143 -0
- data/ext/pango/rbpangoprivate.h +49 -0
- data/ext/pango/rbpangorectangle.c +170 -0
- data/ext/pango/rbpangorenderer.c +193 -0
- data/ext/pango/rbpangoscript.c +84 -0
- data/ext/pango/rbpangoscriptiter.c +92 -0
- data/ext/pango/rbpangotabarray.c +128 -0
- data/extconf.rb +49 -0
- data/lib/2.0/pango.so +0 -0
- data/lib/2.1/pango.so +0 -0
- data/lib/2.2/pango.so +0 -0
- data/lib/pango.rb +79 -0
- data/sample/attribute.rb +82 -0
- data/sample/break.rb +28 -0
- data/sample/gdk_layout.rb +27 -0
- data/sample/glyphstring.rb +61 -0
- data/sample/item.rb +37 -0
- data/sample/label.rb +23 -0
- data/sample/layout.rb +102 -0
- data/sample/pango_cairo.rb +66 -0
- data/sample/parse.rb +33 -0
- data/sample/sample.txt +10 -0
- data/sample/script.rb +23 -0
- data/test/pango-test-utils.rb +9 -0
- data/test/run-test.rb +28 -0
- data/test/test-analysis.rb +26 -0
- data/test/test-attribute.rb +19 -0
- data/test/test-color.rb +47 -0
- data/test/test-language.rb +7 -0
- data/test/test-layout.rb +34 -0
- data/test/test-log-attr.rb +26 -0
- data/test/test-matrix.rb +26 -0
- data/test/test-rectangle.rb +26 -0
- data/vendor/local/bin/derb.exe +0 -0
- data/vendor/local/bin/genbrk.exe +0 -0
- data/vendor/local/bin/genccode.exe +0 -0
- data/vendor/local/bin/gencfu.exe +0 -0
- data/vendor/local/bin/gencmn.exe +0 -0
- data/vendor/local/bin/gencnval.exe +0 -0
- data/vendor/local/bin/gendict.exe +0 -0
- data/vendor/local/bin/gennorm2.exe +0 -0
- data/vendor/local/bin/genrb.exe +0 -0
- data/vendor/local/bin/gensprep.exe +0 -0
- data/vendor/local/bin/hb-ot-shape-closure.exe +0 -0
- data/vendor/local/bin/hb-shape.exe +0 -0
- data/vendor/local/bin/hb-view.exe +0 -0
- data/vendor/local/bin/icu-config +820 -0
- data/vendor/local/bin/icuinfo.exe +0 -0
- data/vendor/local/bin/icupkg.exe +0 -0
- data/vendor/local/bin/libharfbuzz-0.dll +0 -0
- data/vendor/local/bin/libpango-1.0-0.dll +0 -0
- data/vendor/local/bin/libpangocairo-1.0-0.dll +0 -0
- data/vendor/local/bin/libpangoft2-1.0-0.dll +0 -0
- data/vendor/local/bin/libpangowin32-1.0-0.dll +0 -0
- data/vendor/local/bin/makeconv.exe +0 -0
- data/vendor/local/bin/pango-querymodules.exe +0 -0
- data/vendor/local/bin/pango-view.exe +0 -0
- data/vendor/local/bin/pkgdata.exe +0 -0
- data/vendor/local/bin/uconv.exe +0 -0
- data/vendor/local/etc/pango/pango.modules +19 -0
- data/vendor/local/include/harfbuzz/hb-blob.h +126 -0
- data/vendor/local/include/harfbuzz/hb-buffer.h +344 -0
- data/vendor/local/include/harfbuzz/hb-common.h +344 -0
- data/vendor/local/include/harfbuzz/hb-deprecated.h +51 -0
- data/vendor/local/include/harfbuzz/hb-face.h +117 -0
- data/vendor/local/include/harfbuzz/hb-font.h +507 -0
- data/vendor/local/include/harfbuzz/hb-ft.h +62 -0
- data/vendor/local/include/harfbuzz/hb-glib.h +52 -0
- data/vendor/local/include/harfbuzz/hb-icu.h +52 -0
- data/vendor/local/include/harfbuzz/hb-ot-font.h +41 -0
- data/vendor/local/include/harfbuzz/hb-ot-layout.h +302 -0
- data/vendor/local/include/harfbuzz/hb-ot-shape.h +53 -0
- data/vendor/local/include/harfbuzz/hb-ot-tag.h +59 -0
- data/vendor/local/include/harfbuzz/hb-ot.h +43 -0
- data/vendor/local/include/harfbuzz/hb-set.h +154 -0
- data/vendor/local/include/harfbuzz/hb-shape-plan.h +89 -0
- data/vendor/local/include/harfbuzz/hb-shape.h +81 -0
- data/vendor/local/include/harfbuzz/hb-unicode.h +445 -0
- data/vendor/local/include/harfbuzz/hb-version.h +66 -0
- data/vendor/local/include/harfbuzz/hb.h +47 -0
- data/vendor/local/include/layout/LEFontInstance.h +550 -0
- data/vendor/local/include/layout/LEGlyphFilter.h +45 -0
- data/vendor/local/include/layout/LEGlyphStorage.h +546 -0
- data/vendor/local/include/layout/LEInsertionList.h +177 -0
- data/vendor/local/include/layout/LELanguages.h +112 -0
- data/vendor/local/include/layout/LEScripts.h +263 -0
- data/vendor/local/include/layout/LESwaps.h +100 -0
- data/vendor/local/include/layout/LETableReference.h +418 -0
- data/vendor/local/include/layout/LETypes.h +728 -0
- data/vendor/local/include/layout/LayoutEngine.h +518 -0
- data/vendor/local/include/layout/ParagraphLayout.h +747 -0
- data/vendor/local/include/layout/RunArrays.h +676 -0
- data/vendor/local/include/layout/loengine.h +225 -0
- data/vendor/local/include/layout/playout.h +466 -0
- data/vendor/local/include/layout/plruns.h +441 -0
- data/vendor/local/include/pango-1.0/pango/pango-attributes.h +514 -0
- data/vendor/local/include/pango-1.0/pango/pango-bidi-type.h +136 -0
- data/vendor/local/include/pango-1.0/pango/pango-break.h +173 -0
- data/vendor/local/include/pango-1.0/pango/pango-context.h +112 -0
- data/vendor/local/include/pango-1.0/pango/pango-coverage.h +79 -0
- data/vendor/local/include/pango-1.0/pango/pango-engine.h +429 -0
- data/vendor/local/include/pango-1.0/pango/pango-enum-types.h +69 -0
- data/vendor/local/include/pango-1.0/pango/pango-features.h +12 -0
- data/vendor/local/include/pango-1.0/pango/pango-font.h +622 -0
- data/vendor/local/include/pango-1.0/pango/pango-fontmap.h +167 -0
- data/vendor/local/include/pango-1.0/pango/pango-fontset.h +169 -0
- data/vendor/local/include/pango-1.0/pango/pango-glyph-item.h +158 -0
- data/vendor/local/include/pango-1.0/pango/pango-glyph.h +197 -0
- data/vendor/local/include/pango-1.0/pango/pango-gravity.h +128 -0
- data/vendor/local/include/pango-1.0/pango/pango-item.h +109 -0
- data/vendor/local/include/pango-1.0/pango/pango-language.h +61 -0
- data/vendor/local/include/pango-1.0/pango/pango-layout.h +340 -0
- data/vendor/local/include/pango-1.0/pango/pango-matrix.h +117 -0
- data/vendor/local/include/pango-1.0/pango/pango-modules.h +71 -0
- data/vendor/local/include/pango-1.0/pango/pango-ot.h +391 -0
- data/vendor/local/include/pango-1.0/pango/pango-renderer.h +260 -0
- data/vendor/local/include/pango-1.0/pango/pango-script.h +260 -0
- data/vendor/local/include/pango-1.0/pango/pango-tabs.h +87 -0
- data/vendor/local/include/pango-1.0/pango/pango-types.h +200 -0
- data/vendor/local/include/pango-1.0/pango/pango-utils.h +189 -0
- data/vendor/local/include/pango-1.0/pango/pango.h +48 -0
- data/vendor/local/include/pango-1.0/pango/pangocairo.h +169 -0
- data/vendor/local/include/pango-1.0/pango/pangofc-decoder.h +110 -0
- data/vendor/local/include/pango-1.0/pango/pangofc-font.h +153 -0
- data/vendor/local/include/pango-1.0/pango/pangofc-fontmap.h +289 -0
- data/vendor/local/include/pango-1.0/pango/pangoft2.h +133 -0
- data/vendor/local/include/pango-1.0/pango/pangowin32.h +128 -0
- data/vendor/local/include/unicode/alphaindex.h +752 -0
- data/vendor/local/include/unicode/appendable.h +232 -0
- data/vendor/local/include/unicode/basictz.h +214 -0
- data/vendor/local/include/unicode/brkiter.h +655 -0
- data/vendor/local/include/unicode/bytestream.h +257 -0
- data/vendor/local/include/unicode/bytestrie.h +519 -0
- data/vendor/local/include/unicode/bytestriebuilder.h +181 -0
- data/vendor/local/include/unicode/calendar.h +2519 -0
- data/vendor/local/include/unicode/caniter.h +208 -0
- data/vendor/local/include/unicode/chariter.h +722 -0
- data/vendor/local/include/unicode/choicfmt.h +594 -0
- data/vendor/local/include/unicode/coleitr.h +404 -0
- data/vendor/local/include/unicode/coll.h +1267 -0
- data/vendor/local/include/unicode/compactdecimalformat.h +330 -0
- data/vendor/local/include/unicode/curramt.h +130 -0
- data/vendor/local/include/unicode/currpinf.h +258 -0
- data/vendor/local/include/unicode/currunit.h +110 -0
- data/vendor/local/include/unicode/datefmt.h +883 -0
- data/vendor/local/include/unicode/dbbi.h +40 -0
- data/vendor/local/include/unicode/dcfmtsym.h +482 -0
- data/vendor/local/include/unicode/decimfmt.h +2479 -0
- data/vendor/local/include/unicode/docmain.h +215 -0
- data/vendor/local/include/unicode/dtfmtsym.h +912 -0
- data/vendor/local/include/unicode/dtintrv.h +158 -0
- data/vendor/local/include/unicode/dtitvfmt.h +985 -0
- data/vendor/local/include/unicode/dtitvinf.h +514 -0
- data/vendor/local/include/unicode/dtptngen.h +498 -0
- data/vendor/local/include/unicode/dtrule.h +250 -0
- data/vendor/local/include/unicode/enumset.h +64 -0
- data/vendor/local/include/unicode/errorcode.h +137 -0
- data/vendor/local/include/unicode/fieldpos.h +291 -0
- data/vendor/local/include/unicode/filteredbrk.h +131 -0
- data/vendor/local/include/unicode/fmtable.h +760 -0
- data/vendor/local/include/unicode/format.h +305 -0
- data/vendor/local/include/unicode/fpositer.h +117 -0
- data/vendor/local/include/unicode/gender.h +111 -0
- data/vendor/local/include/unicode/gregocal.h +777 -0
- data/vendor/local/include/unicode/icudataver.h +41 -0
- data/vendor/local/include/unicode/icuplug.h +371 -0
- data/vendor/local/include/unicode/idna.h +323 -0
- data/vendor/local/include/unicode/listformatter.h +167 -0
- data/vendor/local/include/unicode/localpointer.h +304 -0
- data/vendor/local/include/unicode/locdspnm.h +204 -0
- data/vendor/local/include/unicode/locid.h +815 -0
- data/vendor/local/include/unicode/measfmt.h +389 -0
- data/vendor/local/include/unicode/measunit.h +1443 -0
- data/vendor/local/include/unicode/measure.h +159 -0
- data/vendor/local/include/unicode/messagepattern.h +943 -0
- data/vendor/local/include/unicode/msgfmt.h +1093 -0
- data/vendor/local/include/unicode/normalizer2.h +658 -0
- data/vendor/local/include/unicode/normlzr.h +797 -0
- data/vendor/local/include/unicode/numfmt.h +1187 -0
- data/vendor/local/include/unicode/numsys.h +208 -0
- data/vendor/local/include/unicode/parseerr.h +92 -0
- data/vendor/local/include/unicode/parsepos.h +230 -0
- data/vendor/local/include/unicode/platform.h +751 -0
- data/vendor/local/include/unicode/plurfmt.h +615 -0
- data/vendor/local/include/unicode/plurrule.h +501 -0
- data/vendor/local/include/unicode/ptypes.h +126 -0
- data/vendor/local/include/unicode/putil.h +181 -0
- data/vendor/local/include/unicode/rbbi.h +782 -0
- data/vendor/local/include/unicode/rbnf.h +1032 -0
- data/vendor/local/include/unicode/rbtz.h +362 -0
- data/vendor/local/include/unicode/regex.h +1857 -0
- data/vendor/local/include/unicode/region.h +228 -0
- data/vendor/local/include/unicode/reldatefmt.h +498 -0
- data/vendor/local/include/unicode/rep.h +261 -0
- data/vendor/local/include/unicode/resbund.h +490 -0
- data/vendor/local/include/unicode/schriter.h +187 -0
- data/vendor/local/include/unicode/scientificformathelper.h +139 -0
- data/vendor/local/include/unicode/search.h +575 -0
- data/vendor/local/include/unicode/selfmt.h +367 -0
- data/vendor/local/include/unicode/simpletz.h +928 -0
- data/vendor/local/include/unicode/smpdtfmt.h +1592 -0
- data/vendor/local/include/unicode/sortkey.h +338 -0
- data/vendor/local/include/unicode/std_string.h +37 -0
- data/vendor/local/include/unicode/strenum.h +276 -0
- data/vendor/local/include/unicode/stringpiece.h +224 -0
- data/vendor/local/include/unicode/stringtriebuilder.h +402 -0
- data/vendor/local/include/unicode/stsearch.h +504 -0
- data/vendor/local/include/unicode/symtable.h +112 -0
- data/vendor/local/include/unicode/tblcoll.h +873 -0
- data/vendor/local/include/unicode/timezone.h +948 -0
- data/vendor/local/include/unicode/tmunit.h +129 -0
- data/vendor/local/include/unicode/tmutamt.h +168 -0
- data/vendor/local/include/unicode/tmutfmt.h +243 -0
- data/vendor/local/include/unicode/translit.h +1342 -0
- data/vendor/local/include/unicode/tzfmt.h +1098 -0
- data/vendor/local/include/unicode/tznames.h +404 -0
- data/vendor/local/include/unicode/tzrule.h +828 -0
- data/vendor/local/include/unicode/tztrans.h +195 -0
- data/vendor/local/include/unicode/ubidi.h +2186 -0
- data/vendor/local/include/unicode/ubrk.h +540 -0
- data/vendor/local/include/unicode/ucal.h +1560 -0
- data/vendor/local/include/unicode/ucasemap.h +423 -0
- data/vendor/local/include/unicode/ucat.h +158 -0
- data/vendor/local/include/unicode/uchar.h +3426 -0
- data/vendor/local/include/unicode/ucharstrie.h +576 -0
- data/vendor/local/include/unicode/ucharstriebuilder.h +185 -0
- data/vendor/local/include/unicode/uchriter.h +381 -0
- data/vendor/local/include/unicode/uclean.h +258 -0
- data/vendor/local/include/unicode/ucnv.h +2036 -0
- data/vendor/local/include/unicode/ucnv_cb.h +162 -0
- data/vendor/local/include/unicode/ucnv_err.h +463 -0
- data/vendor/local/include/unicode/ucnvsel.h +187 -0
- data/vendor/local/include/unicode/ucol.h +1474 -0
- data/vendor/local/include/unicode/ucoleitr.h +266 -0
- data/vendor/local/include/unicode/uconfig.h +430 -0
- data/vendor/local/include/unicode/ucsdet.h +413 -0
- data/vendor/local/include/unicode/ucurr.h +424 -0
- data/vendor/local/include/unicode/udat.h +1536 -0
- data/vendor/local/include/unicode/udata.h +430 -0
- data/vendor/local/include/unicode/udateintervalformat.h +181 -0
- data/vendor/local/include/unicode/udatpg.h +588 -0
- data/vendor/local/include/unicode/udisplaycontext.h +150 -0
- data/vendor/local/include/unicode/uenum.h +206 -0
- data/vendor/local/include/unicode/uformattable.h +280 -0
- data/vendor/local/include/unicode/ugender.h +82 -0
- data/vendor/local/include/unicode/uidna.h +762 -0
- data/vendor/local/include/unicode/uiter.h +707 -0
- data/vendor/local/include/unicode/uldnames.h +302 -0
- data/vendor/local/include/unicode/uloc.h +1256 -0
- data/vendor/local/include/unicode/ulocdata.h +277 -0
- data/vendor/local/include/unicode/umachine.h +356 -0
- data/vendor/local/include/unicode/umisc.h +60 -0
- data/vendor/local/include/unicode/umsg.h +623 -0
- data/vendor/local/include/unicode/unifilt.h +120 -0
- data/vendor/local/include/unicode/unifunct.h +125 -0
- data/vendor/local/include/unicode/unimatch.h +163 -0
- data/vendor/local/include/unicode/unirepl.h +97 -0
- data/vendor/local/include/unicode/uniset.h +1691 -0
- data/vendor/local/include/unicode/unistr.h +4470 -0
- data/vendor/local/include/unicode/unorm.h +561 -0
- data/vendor/local/include/unicode/unorm2.h +528 -0
- data/vendor/local/include/unicode/unum.h +1328 -0
- data/vendor/local/include/unicode/unumsys.h +170 -0
- data/vendor/local/include/unicode/uobject.h +320 -0
- data/vendor/local/include/unicode/upluralrules.h +145 -0
- data/vendor/local/include/unicode/uregex.h +1591 -0
- data/vendor/local/include/unicode/uregion.h +248 -0
- data/vendor/local/include/unicode/urename.h +1784 -0
- data/vendor/local/include/unicode/urep.h +155 -0
- data/vendor/local/include/unicode/ures.h +887 -0
- data/vendor/local/include/unicode/uscript.h +642 -0
- data/vendor/local/include/unicode/usearch.h +885 -0
- data/vendor/local/include/unicode/uset.h +1126 -0
- data/vendor/local/include/unicode/usetiter.h +318 -0
- data/vendor/local/include/unicode/ushape.h +474 -0
- data/vendor/local/include/unicode/uspoof.h +1064 -0
- data/vendor/local/include/unicode/usprep.h +269 -0
- data/vendor/local/include/unicode/ustdio.h +1018 -0
- data/vendor/local/include/unicode/ustream.h +68 -0
- data/vendor/local/include/unicode/ustring.h +1700 -0
- data/vendor/local/include/unicode/ustringtrie.h +95 -0
- data/vendor/local/include/unicode/utext.h +1600 -0
- data/vendor/local/include/unicode/utf.h +223 -0
- data/vendor/local/include/unicode/utf16.h +623 -0
- data/vendor/local/include/unicode/utf32.h +23 -0
- data/vendor/local/include/unicode/utf8.h +824 -0
- data/vendor/local/include/unicode/utf_old.h +1169 -0
- data/vendor/local/include/unicode/utmscale.h +481 -0
- data/vendor/local/include/unicode/utrace.h +359 -0
- data/vendor/local/include/unicode/utrans.h +658 -0
- data/vendor/local/include/unicode/utypes.h +723 -0
- data/vendor/local/include/unicode/uvernum.h +170 -0
- data/vendor/local/include/unicode/uversion.h +193 -0
- data/vendor/local/include/unicode/vtzone.h +455 -0
- data/vendor/local/lib/girepository-1.0/Pango-1.0.typelib +0 -0
- data/vendor/local/lib/girepository-1.0/PangoCairo-1.0.typelib +0 -0
- data/vendor/local/lib/girepository-1.0/PangoFT2-1.0.typelib +0 -0
- data/vendor/local/lib/icu/54.1/Makefile.inc +293 -0
- data/vendor/local/lib/icu/54.1/pkgdata.inc +17 -0
- data/vendor/local/lib/icu/Makefile.inc +293 -0
- data/vendor/local/lib/icu/pkgdata.inc +17 -0
- data/vendor/local/lib/icudt.dll +0 -0
- data/vendor/local/lib/icudt54.dll +0 -0
- data/vendor/local/lib/icuin.dll +0 -0
- data/vendor/local/lib/icuin54.dll +0 -0
- data/vendor/local/lib/icuio.dll +0 -0
- data/vendor/local/lib/icuio54.dll +0 -0
- data/vendor/local/lib/icule.dll +0 -0
- data/vendor/local/lib/icule54.dll +0 -0
- data/vendor/local/lib/iculx.dll +0 -0
- data/vendor/local/lib/iculx54.dll +0 -0
- data/vendor/local/lib/icutest.dll +0 -0
- data/vendor/local/lib/icutest54.dll +0 -0
- data/vendor/local/lib/icutu.dll +0 -0
- data/vendor/local/lib/icutu54.dll +0 -0
- data/vendor/local/lib/icuuc.dll +0 -0
- data/vendor/local/lib/icuuc54.dll +0 -0
- data/vendor/local/lib/libharfbuzz-icu.a +0 -0
- data/vendor/local/lib/libharfbuzz-icu.la +41 -0
- data/vendor/local/lib/libharfbuzz.dll.a +0 -0
- data/vendor/local/lib/libharfbuzz.la +41 -0
- data/vendor/local/lib/libicudt.dll.a +0 -0
- data/vendor/local/lib/libicuin.dll.a +0 -0
- data/vendor/local/lib/libicuio.dll.a +0 -0
- data/vendor/local/lib/libicule.dll.a +0 -0
- data/vendor/local/lib/libiculx.dll.a +0 -0
- data/vendor/local/lib/libicutest.dll.a +0 -0
- data/vendor/local/lib/libicutu.dll.a +0 -0
- data/vendor/local/lib/libicuuc.dll.a +0 -0
- data/vendor/local/lib/libpango-1.0.dll.a +0 -0
- data/vendor/local/lib/libpango-1.0.la +41 -0
- data/vendor/local/lib/libpangocairo-1.0.dll.a +0 -0
- data/vendor/local/lib/libpangocairo-1.0.la +41 -0
- data/vendor/local/lib/libpangoft2-1.0.dll.a +0 -0
- data/vendor/local/lib/libpangoft2-1.0.la +41 -0
- data/vendor/local/lib/libpangowin32-1.0.dll.a +0 -0
- data/vendor/local/lib/libpangowin32-1.0.la +41 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-arabic-lang.dll +0 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-arabic-lang.dll.a +0 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-arabic-lang.la +41 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-basic-fc.dll +0 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-basic-fc.dll.a +0 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-basic-fc.la +41 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-basic-win32.dll +0 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-basic-win32.dll.a +0 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-basic-win32.la +41 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-indic-lang.dll +0 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-indic-lang.dll.a +0 -0
- data/vendor/local/lib/pango/1.8.0/modules/pango-indic-lang.la +41 -0
- data/vendor/local/lib/pkgconfig/harfbuzz-icu.pc +13 -0
- data/vendor/local/lib/pkgconfig/harfbuzz.pc +11 -0
- data/vendor/local/lib/pkgconfig/icu-i18n.pc +38 -0
- data/vendor/local/lib/pkgconfig/icu-io.pc +38 -0
- data/vendor/local/lib/pkgconfig/icu-le.pc +38 -0
- data/vendor/local/lib/pkgconfig/icu-lx.pc +38 -0
- data/vendor/local/lib/pkgconfig/icu-uc.pc +38 -0
- data/vendor/local/lib/pkgconfig/pango.pc +14 -0
- data/vendor/local/lib/pkgconfig/pangocairo.pc +11 -0
- data/vendor/local/lib/pkgconfig/pangoft2.pc +12 -0
- data/vendor/local/lib/pkgconfig/pangowin32.pc +11 -0
- data/vendor/local/share/gir-1.0/Pango-1.0.gir +13329 -0
- data/vendor/local/share/gir-1.0/PangoCairo-1.0.gir +833 -0
- data/vendor/local/share/gir-1.0/PangoFT2-1.0.gir +354 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/annotation-glossary.html +75 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/api-index-full.html +1449 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/ch01.html +98 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/deprecated-api-index.html +46 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-blob.html +610 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-buffer.html +1780 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-common.html +1337 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-coretext.html +144 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-deprecated.html +99 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-face.html +630 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-font.html +2529 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-ft.html +188 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-glib.html +120 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-gobject.html +50 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-graphite2.html +120 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-icu.html +120 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-ot-layout.html +771 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-ot-tag.html +172 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-ot.html +50 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-set.html +966 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-shape-plan.html +405 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-shape.html +286 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-unicode.html +1523 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-uniscribe.html +100 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb-version.html +182 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz-hb.html +50 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/harfbuzz.devhelp2 +378 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/home.png +0 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/index.html +105 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/index.sgml +496 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/left-insensitive.png +0 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/left.png +0 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/object-tree.html +59 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/right-insensitive.png +0 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/right.png +0 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/style.css +476 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/up-insensitive.png +0 -0
- data/vendor/local/share/gtk-doc/html/harfbuzz/up.png +0 -0
- data/vendor/local/share/gtk-doc/html/pango/PangoEngineLang.html +224 -0
- data/vendor/local/share/gtk-doc/html/pango/PangoEngineShape.html +255 -0
- data/vendor/local/share/gtk-doc/html/pango/PangoFcDecoder.html +246 -0
- data/vendor/local/share/gtk-doc/html/pango/PangoFcFont.html +500 -0
- data/vendor/local/share/gtk-doc/html/pango/PangoFcFontMap.html +1001 -0
- data/vendor/local/share/gtk-doc/html/pango/PangoMarkupFormat.html +301 -0
- data/vendor/local/share/gtk-doc/html/pango/PangoRenderer.html +1219 -0
- data/vendor/local/share/gtk-doc/html/pango/annotation-glossary.html +89 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-10.html +135 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-12.html +49 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-14.html +64 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-16.html +228 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-18.html +152 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-2.html +122 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-20.html +87 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-22.html +124 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-24.html +97 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-26.html +46 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-30.html +39 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-31-0.html +39 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-32-4.html +53 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-32.html +42 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-34.html +38 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-4.html +201 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-6.html +165 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-1-8.html +171 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-deprecated.html +284 -0
- data/vendor/local/share/gtk-doc/html/pango/api-index-full.html +2968 -0
- data/vendor/local/share/gtk-doc/html/pango/home.png +0 -0
- data/vendor/local/share/gtk-doc/html/pango/index.html +146 -0
- data/vendor/local/share/gtk-doc/html/pango/index.sgml +957 -0
- data/vendor/local/share/gtk-doc/html/pango/layout.gif +0 -0
- data/vendor/local/share/gtk-doc/html/pango/left-insensitive.png +0 -0
- data/vendor/local/share/gtk-doc/html/pango/left.png +0 -0
- data/vendor/local/share/gtk-doc/html/pango/lowlevel.html +68 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Bidirectional-Text.html +514 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Cairo-Rendering.html +1632 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-CoreText-Fonts.html +115 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Coverage-Maps.html +508 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Engines.html +358 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Fonts.html +4154 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-FreeType-Fonts-and-Rendering.html +956 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Glyph-Storage.html +2627 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Layout-Objects.html +4153 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Miscellaneous-Utilities.html +965 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Modules.html +331 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-OpenType-Font-Handling.html +2202 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Scripts-and-Languages.html +1430 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Tab-Stops.html +582 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Text-Attributes.html +3356 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Text-Processing.html +2079 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Version-Checking.html +325 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Vertical-Text.html +523 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Win32-Fonts-and-Rendering.html +1028 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-Xft-Fonts-and-Rendering.html +1275 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-hierarchy.html +91 -0
- data/vendor/local/share/gtk-doc/html/pango/pango-querymodules.html +131 -0
- data/vendor/local/share/gtk-doc/html/pango/pango.devhelp2 +786 -0
- data/vendor/local/share/gtk-doc/html/pango/pango.html +63 -0
- data/vendor/local/share/gtk-doc/html/pango/rendering.html +47 -0
- data/vendor/local/share/gtk-doc/html/pango/right-insensitive.png +0 -0
- data/vendor/local/share/gtk-doc/html/pango/right.png +0 -0
- data/vendor/local/share/gtk-doc/html/pango/rotated-text.png +0 -0
- data/vendor/local/share/gtk-doc/html/pango/style.css +476 -0
- data/vendor/local/share/gtk-doc/html/pango/tools.html +33 -0
- data/vendor/local/share/gtk-doc/html/pango/up-insensitive.png +0 -0
- data/vendor/local/share/gtk-doc/html/pango/up.png +0 -0
- data/vendor/local/share/icu/54.1/config/mh-mingw64 +158 -0
- data/vendor/local/share/icu/54.1/install-sh +251 -0
- data/vendor/local/share/icu/54.1/license.html +385 -0
- data/vendor/local/share/icu/54.1/mkinstalldirs +43 -0
- data/vendor/local/share/license/harfbuzz/AUTHORS +9 -0
- data/vendor/local/share/license/harfbuzz/COPYING +36 -0
- data/vendor/local/share/license/pango/AUTHORS +2 -0
- data/vendor/local/share/license/pango/COPYING +482 -0
- data/vendor/local/share/man/man1/derb.1 +196 -0
- data/vendor/local/share/man/man1/genbrk.1 +112 -0
- data/vendor/local/share/man/man1/gencfu.1 +91 -0
- data/vendor/local/share/man/man1/gencnval.1 +91 -0
- data/vendor/local/share/man/man1/gendict.1 +131 -0
- data/vendor/local/share/man/man1/genrb.1 +146 -0
- data/vendor/local/share/man/man1/icu-config.1 +288 -0
- data/vendor/local/share/man/man1/makeconv.1 +112 -0
- data/vendor/local/share/man/man1/pango-querymodules.1 +106 -0
- data/vendor/local/share/man/man1/pango-view.1 +1 -0
- data/vendor/local/share/man/man1/pkgdata.1 +258 -0
- data/vendor/local/share/man/man1/uconv.1 +443 -0
- data/vendor/local/share/man/man8/genccode.8 +106 -0
- data/vendor/local/share/man/man8/gencmn.8 +129 -0
- data/vendor/local/share/man/man8/gensprep.8 +102 -0
- data/vendor/local/share/man/man8/icupkg.8 +204 -0
- metadata +599 -0
@@ -0,0 +1,824 @@
|
|
1
|
+
/*
|
2
|
+
*******************************************************************************
|
3
|
+
*
|
4
|
+
* Copyright (C) 1999-2014, International Business Machines
|
5
|
+
* Corporation and others. All Rights Reserved.
|
6
|
+
*
|
7
|
+
*******************************************************************************
|
8
|
+
* file name: utf8.h
|
9
|
+
* encoding: US-ASCII
|
10
|
+
* tab size: 8 (not used)
|
11
|
+
* indentation:4
|
12
|
+
*
|
13
|
+
* created on: 1999sep13
|
14
|
+
* created by: Markus W. Scherer
|
15
|
+
*/
|
16
|
+
|
17
|
+
/**
|
18
|
+
* \file
|
19
|
+
* \brief C API: 8-bit Unicode handling macros
|
20
|
+
*
|
21
|
+
* This file defines macros to deal with 8-bit Unicode (UTF-8) code units (bytes) and strings.
|
22
|
+
*
|
23
|
+
* For more information see utf.h and the ICU User Guide Strings chapter
|
24
|
+
* (http://userguide.icu-project.org/strings).
|
25
|
+
*
|
26
|
+
* <em>Usage:</em>
|
27
|
+
* ICU coding guidelines for if() statements should be followed when using these macros.
|
28
|
+
* Compound statements (curly braces {}) must be used for if-else-while...
|
29
|
+
* bodies and all macro statements should be terminated with semicolon.
|
30
|
+
*/
|
31
|
+
|
32
|
+
#ifndef __UTF8_H__
|
33
|
+
#define __UTF8_H__
|
34
|
+
|
35
|
+
#include "unicode/umachine.h"
|
36
|
+
#ifndef __UTF_H__
|
37
|
+
# include "unicode/utf.h"
|
38
|
+
#endif
|
39
|
+
|
40
|
+
/* internal definitions ----------------------------------------------------- */
|
41
|
+
|
42
|
+
/**
|
43
|
+
* \var utf8_countTrailBytes
|
44
|
+
* Internal array with numbers of trail bytes for any given byte used in
|
45
|
+
* lead byte position.
|
46
|
+
*
|
47
|
+
* This is internal since it is not meant to be called directly by external clients;
|
48
|
+
* however it is called by public macros in this file and thus must remain stable,
|
49
|
+
* and should not be hidden when other internal functions are hidden (otherwise
|
50
|
+
* public macros would fail to compile).
|
51
|
+
* @internal
|
52
|
+
*/
|
53
|
+
#ifdef U_UTF8_IMPL
|
54
|
+
U_EXPORT const uint8_t
|
55
|
+
#elif defined(U_STATIC_IMPLEMENTATION) || defined(U_COMMON_IMPLEMENTATION)
|
56
|
+
U_CFUNC const uint8_t
|
57
|
+
#else
|
58
|
+
U_CFUNC U_IMPORT const uint8_t /* U_IMPORT2? */ /*U_IMPORT*/
|
59
|
+
#endif
|
60
|
+
utf8_countTrailBytes[256];
|
61
|
+
|
62
|
+
/**
|
63
|
+
* Counts the trail bytes for a UTF-8 lead byte.
|
64
|
+
* Returns 0 for 0..0xbf as well as for 0xfe and 0xff.
|
65
|
+
*
|
66
|
+
* This is internal since it is not meant to be called directly by external clients;
|
67
|
+
* however it is called by public macros in this file and thus must remain stable.
|
68
|
+
*
|
69
|
+
* Note: Beginning with ICU 50, the implementation uses a multi-condition expression
|
70
|
+
* which was shown in 2012 (on x86-64) to compile to fast, branch-free code.
|
71
|
+
* leadByte is evaluated multiple times.
|
72
|
+
*
|
73
|
+
* The pre-ICU 50 implementation used the exported array utf8_countTrailBytes:
|
74
|
+
* #define U8_COUNT_TRAIL_BYTES(leadByte) (utf8_countTrailBytes[leadByte])
|
75
|
+
* leadByte was evaluated exactly once.
|
76
|
+
*
|
77
|
+
* @param leadByte The first byte of a UTF-8 sequence. Must be 0..0xff.
|
78
|
+
* @internal
|
79
|
+
*/
|
80
|
+
#define U8_COUNT_TRAIL_BYTES(leadByte) \
|
81
|
+
((uint8_t)(leadByte)<0xf0 ? \
|
82
|
+
((uint8_t)(leadByte)>=0xc0)+((uint8_t)(leadByte)>=0xe0) : \
|
83
|
+
(uint8_t)(leadByte)<0xfe ? 3+((uint8_t)(leadByte)>=0xf8)+((uint8_t)(leadByte)>=0xfc) : 0)
|
84
|
+
|
85
|
+
/**
|
86
|
+
* Counts the trail bytes for a UTF-8 lead byte of a valid UTF-8 sequence.
|
87
|
+
* The maximum supported lead byte is 0xf4 corresponding to U+10FFFF.
|
88
|
+
* leadByte might be evaluated multiple times.
|
89
|
+
*
|
90
|
+
* This is internal since it is not meant to be called directly by external clients;
|
91
|
+
* however it is called by public macros in this file and thus must remain stable.
|
92
|
+
*
|
93
|
+
* @param leadByte The first byte of a UTF-8 sequence. Must be 0..0xff.
|
94
|
+
* @internal
|
95
|
+
*/
|
96
|
+
#define U8_COUNT_TRAIL_BYTES_UNSAFE(leadByte) \
|
97
|
+
(((leadByte)>=0xc0)+((leadByte)>=0xe0)+((leadByte)>=0xf0))
|
98
|
+
|
99
|
+
/**
|
100
|
+
* Mask a UTF-8 lead byte, leave only the lower bits that form part of the code point value.
|
101
|
+
*
|
102
|
+
* This is internal since it is not meant to be called directly by external clients;
|
103
|
+
* however it is called by public macros in this file and thus must remain stable.
|
104
|
+
* @internal
|
105
|
+
*/
|
106
|
+
#define U8_MASK_LEAD_BYTE(leadByte, countTrailBytes) ((leadByte)&=(1<<(6-(countTrailBytes)))-1)
|
107
|
+
|
108
|
+
/**
|
109
|
+
* Function for handling "next code point" with error-checking.
|
110
|
+
*
|
111
|
+
* This is internal since it is not meant to be called directly by external clients;
|
112
|
+
* however it is U_STABLE (not U_INTERNAL) since it is called by public macros in this
|
113
|
+
* file and thus must remain stable, and should not be hidden when other internal
|
114
|
+
* functions are hidden (otherwise public macros would fail to compile).
|
115
|
+
* @internal
|
116
|
+
*/
|
117
|
+
U_STABLE UChar32 U_EXPORT2
|
118
|
+
utf8_nextCharSafeBody(const uint8_t *s, int32_t *pi, int32_t length, UChar32 c, UBool strict);
|
119
|
+
|
120
|
+
/**
|
121
|
+
* Function for handling "append code point" with error-checking.
|
122
|
+
*
|
123
|
+
* This is internal since it is not meant to be called directly by external clients;
|
124
|
+
* however it is U_STABLE (not U_INTERNAL) since it is called by public macros in this
|
125
|
+
* file and thus must remain stable, and should not be hidden when other internal
|
126
|
+
* functions are hidden (otherwise public macros would fail to compile).
|
127
|
+
* @internal
|
128
|
+
*/
|
129
|
+
U_STABLE int32_t U_EXPORT2
|
130
|
+
utf8_appendCharSafeBody(uint8_t *s, int32_t i, int32_t length, UChar32 c, UBool *pIsError);
|
131
|
+
|
132
|
+
/**
|
133
|
+
* Function for handling "previous code point" with error-checking.
|
134
|
+
*
|
135
|
+
* This is internal since it is not meant to be called directly by external clients;
|
136
|
+
* however it is U_STABLE (not U_INTERNAL) since it is called by public macros in this
|
137
|
+
* file and thus must remain stable, and should not be hidden when other internal
|
138
|
+
* functions are hidden (otherwise public macros would fail to compile).
|
139
|
+
* @internal
|
140
|
+
*/
|
141
|
+
U_STABLE UChar32 U_EXPORT2
|
142
|
+
utf8_prevCharSafeBody(const uint8_t *s, int32_t start, int32_t *pi, UChar32 c, UBool strict);
|
143
|
+
|
144
|
+
/**
|
145
|
+
* Function for handling "skip backward one code point" with error-checking.
|
146
|
+
*
|
147
|
+
* This is internal since it is not meant to be called directly by external clients;
|
148
|
+
* however it is U_STABLE (not U_INTERNAL) since it is called by public macros in this
|
149
|
+
* file and thus must remain stable, and should not be hidden when other internal
|
150
|
+
* functions are hidden (otherwise public macros would fail to compile).
|
151
|
+
* @internal
|
152
|
+
*/
|
153
|
+
U_STABLE int32_t U_EXPORT2
|
154
|
+
utf8_back1SafeBody(const uint8_t *s, int32_t start, int32_t i);
|
155
|
+
|
156
|
+
/* single-code point definitions -------------------------------------------- */
|
157
|
+
|
158
|
+
/**
|
159
|
+
* Does this code unit (byte) encode a code point by itself (US-ASCII 0..0x7f)?
|
160
|
+
* @param c 8-bit code unit (byte)
|
161
|
+
* @return TRUE or FALSE
|
162
|
+
* @stable ICU 2.4
|
163
|
+
*/
|
164
|
+
#define U8_IS_SINGLE(c) (((c)&0x80)==0)
|
165
|
+
|
166
|
+
/**
|
167
|
+
* Is this code unit (byte) a UTF-8 lead byte?
|
168
|
+
* @param c 8-bit code unit (byte)
|
169
|
+
* @return TRUE or FALSE
|
170
|
+
* @stable ICU 2.4
|
171
|
+
*/
|
172
|
+
#define U8_IS_LEAD(c) ((uint8_t)((c)-0xc0)<0x3e)
|
173
|
+
|
174
|
+
/**
|
175
|
+
* Is this code unit (byte) a UTF-8 trail byte?
|
176
|
+
* @param c 8-bit code unit (byte)
|
177
|
+
* @return TRUE or FALSE
|
178
|
+
* @stable ICU 2.4
|
179
|
+
*/
|
180
|
+
#define U8_IS_TRAIL(c) (((c)&0xc0)==0x80)
|
181
|
+
|
182
|
+
/**
|
183
|
+
* How many code units (bytes) are used for the UTF-8 encoding
|
184
|
+
* of this Unicode code point?
|
185
|
+
* @param c 32-bit code point
|
186
|
+
* @return 1..4, or 0 if c is a surrogate or not a Unicode code point
|
187
|
+
* @stable ICU 2.4
|
188
|
+
*/
|
189
|
+
#define U8_LENGTH(c) \
|
190
|
+
((uint32_t)(c)<=0x7f ? 1 : \
|
191
|
+
((uint32_t)(c)<=0x7ff ? 2 : \
|
192
|
+
((uint32_t)(c)<=0xd7ff ? 3 : \
|
193
|
+
((uint32_t)(c)<=0xdfff || (uint32_t)(c)>0x10ffff ? 0 : \
|
194
|
+
((uint32_t)(c)<=0xffff ? 3 : 4)\
|
195
|
+
) \
|
196
|
+
) \
|
197
|
+
) \
|
198
|
+
)
|
199
|
+
|
200
|
+
/**
|
201
|
+
* The maximum number of UTF-8 code units (bytes) per Unicode code point (U+0000..U+10ffff).
|
202
|
+
* @return 4
|
203
|
+
* @stable ICU 2.4
|
204
|
+
*/
|
205
|
+
#define U8_MAX_LENGTH 4
|
206
|
+
|
207
|
+
/**
|
208
|
+
* Get a code point from a string at a random-access offset,
|
209
|
+
* without changing the offset.
|
210
|
+
* The offset may point to either the lead byte or one of the trail bytes
|
211
|
+
* for a code point, in which case the macro will read all of the bytes
|
212
|
+
* for the code point.
|
213
|
+
* The result is undefined if the offset points to an illegal UTF-8
|
214
|
+
* byte sequence.
|
215
|
+
* Iteration through a string is more efficient with U8_NEXT_UNSAFE or U8_NEXT.
|
216
|
+
*
|
217
|
+
* @param s const uint8_t * string
|
218
|
+
* @param i string offset
|
219
|
+
* @param c output UChar32 variable
|
220
|
+
* @see U8_GET
|
221
|
+
* @stable ICU 2.4
|
222
|
+
*/
|
223
|
+
#define U8_GET_UNSAFE(s, i, c) { \
|
224
|
+
int32_t _u8_get_unsafe_index=(int32_t)(i); \
|
225
|
+
U8_SET_CP_START_UNSAFE(s, _u8_get_unsafe_index); \
|
226
|
+
U8_NEXT_UNSAFE(s, _u8_get_unsafe_index, c); \
|
227
|
+
}
|
228
|
+
|
229
|
+
/**
|
230
|
+
* Get a code point from a string at a random-access offset,
|
231
|
+
* without changing the offset.
|
232
|
+
* The offset may point to either the lead byte or one of the trail bytes
|
233
|
+
* for a code point, in which case the macro will read all of the bytes
|
234
|
+
* for the code point.
|
235
|
+
*
|
236
|
+
* The length can be negative for a NUL-terminated string.
|
237
|
+
*
|
238
|
+
* If the offset points to an illegal UTF-8 byte sequence, then
|
239
|
+
* c is set to a negative value.
|
240
|
+
* Iteration through a string is more efficient with U8_NEXT_UNSAFE or U8_NEXT.
|
241
|
+
*
|
242
|
+
* @param s const uint8_t * string
|
243
|
+
* @param start int32_t starting string offset
|
244
|
+
* @param i int32_t string offset, must be start<=i<length
|
245
|
+
* @param length int32_t string length
|
246
|
+
* @param c output UChar32 variable, set to <0 in case of an error
|
247
|
+
* @see U8_GET_UNSAFE
|
248
|
+
* @stable ICU 2.4
|
249
|
+
*/
|
250
|
+
#define U8_GET(s, start, i, length, c) { \
|
251
|
+
int32_t _u8_get_index=(i); \
|
252
|
+
U8_SET_CP_START(s, start, _u8_get_index); \
|
253
|
+
U8_NEXT(s, _u8_get_index, length, c); \
|
254
|
+
}
|
255
|
+
|
256
|
+
/**
|
257
|
+
* Get a code point from a string at a random-access offset,
|
258
|
+
* without changing the offset.
|
259
|
+
* The offset may point to either the lead byte or one of the trail bytes
|
260
|
+
* for a code point, in which case the macro will read all of the bytes
|
261
|
+
* for the code point.
|
262
|
+
*
|
263
|
+
* The length can be negative for a NUL-terminated string.
|
264
|
+
*
|
265
|
+
* If the offset points to an illegal UTF-8 byte sequence, then
|
266
|
+
* c is set to U+FFFD.
|
267
|
+
* Iteration through a string is more efficient with U8_NEXT_UNSAFE or U8_NEXT_OR_FFFD.
|
268
|
+
*
|
269
|
+
* This macro does not distinguish between a real U+FFFD in the text
|
270
|
+
* and U+FFFD returned for an ill-formed sequence.
|
271
|
+
* Use U8_GET() if that distinction is important.
|
272
|
+
*
|
273
|
+
* @param s const uint8_t * string
|
274
|
+
* @param start int32_t starting string offset
|
275
|
+
* @param i int32_t string offset, must be start<=i<length
|
276
|
+
* @param length int32_t string length
|
277
|
+
* @param c output UChar32 variable, set to U+FFFD in case of an error
|
278
|
+
* @see U8_GET
|
279
|
+
* @stable ICU 51
|
280
|
+
*/
|
281
|
+
#define U8_GET_OR_FFFD(s, start, i, length, c) { \
|
282
|
+
int32_t _u8_get_index=(i); \
|
283
|
+
U8_SET_CP_START(s, start, _u8_get_index); \
|
284
|
+
U8_NEXT_OR_FFFD(s, _u8_get_index, length, c); \
|
285
|
+
}
|
286
|
+
|
287
|
+
/* definitions with forward iteration --------------------------------------- */
|
288
|
+
|
289
|
+
/**
|
290
|
+
* Get a code point from a string at a code point boundary offset,
|
291
|
+
* and advance the offset to the next code point boundary.
|
292
|
+
* (Post-incrementing forward iteration.)
|
293
|
+
* "Unsafe" macro, assumes well-formed UTF-8.
|
294
|
+
*
|
295
|
+
* The offset may point to the lead byte of a multi-byte sequence,
|
296
|
+
* in which case the macro will read the whole sequence.
|
297
|
+
* The result is undefined if the offset points to a trail byte
|
298
|
+
* or an illegal UTF-8 sequence.
|
299
|
+
*
|
300
|
+
* @param s const uint8_t * string
|
301
|
+
* @param i string offset
|
302
|
+
* @param c output UChar32 variable
|
303
|
+
* @see U8_NEXT
|
304
|
+
* @stable ICU 2.4
|
305
|
+
*/
|
306
|
+
#define U8_NEXT_UNSAFE(s, i, c) { \
|
307
|
+
(c)=(uint8_t)(s)[(i)++]; \
|
308
|
+
if((c)>=0x80) { \
|
309
|
+
if((c)<0xe0) { \
|
310
|
+
(c)=(((c)&0x1f)<<6)|((s)[(i)++]&0x3f); \
|
311
|
+
} else if((c)<0xf0) { \
|
312
|
+
/* no need for (c&0xf) because the upper bits are truncated after <<12 in the cast to (UChar) */ \
|
313
|
+
(c)=(UChar)(((c)<<12)|(((s)[i]&0x3f)<<6)|((s)[(i)+1]&0x3f)); \
|
314
|
+
(i)+=2; \
|
315
|
+
} else { \
|
316
|
+
(c)=(((c)&7)<<18)|(((s)[i]&0x3f)<<12)|(((s)[(i)+1]&0x3f)<<6)|((s)[(i)+2]&0x3f); \
|
317
|
+
(i)+=3; \
|
318
|
+
} \
|
319
|
+
} \
|
320
|
+
}
|
321
|
+
|
322
|
+
/**
|
323
|
+
* Get a code point from a string at a code point boundary offset,
|
324
|
+
* and advance the offset to the next code point boundary.
|
325
|
+
* (Post-incrementing forward iteration.)
|
326
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
327
|
+
*
|
328
|
+
* The length can be negative for a NUL-terminated string.
|
329
|
+
*
|
330
|
+
* The offset may point to the lead byte of a multi-byte sequence,
|
331
|
+
* in which case the macro will read the whole sequence.
|
332
|
+
* If the offset points to a trail byte or an illegal UTF-8 sequence, then
|
333
|
+
* c is set to a negative value.
|
334
|
+
*
|
335
|
+
* @param s const uint8_t * string
|
336
|
+
* @param i int32_t string offset, must be i<length
|
337
|
+
* @param length int32_t string length
|
338
|
+
* @param c output UChar32 variable, set to <0 in case of an error
|
339
|
+
* @see U8_NEXT_UNSAFE
|
340
|
+
* @stable ICU 2.4
|
341
|
+
*/
|
342
|
+
#define U8_NEXT(s, i, length, c) { \
|
343
|
+
(c)=(uint8_t)(s)[(i)++]; \
|
344
|
+
if((c)>=0x80) { \
|
345
|
+
uint8_t __t1, __t2; \
|
346
|
+
if( /* handle U+1000..U+CFFF inline */ \
|
347
|
+
(0xe0<(c) && (c)<=0xec) && \
|
348
|
+
(((i)+1)<(length) || (length)<0) && \
|
349
|
+
(__t1=(uint8_t)((s)[i]-0x80))<=0x3f && \
|
350
|
+
(__t2=(uint8_t)((s)[(i)+1]-0x80))<= 0x3f \
|
351
|
+
) { \
|
352
|
+
/* no need for (c&0xf) because the upper bits are truncated after <<12 in the cast to (UChar) */ \
|
353
|
+
(c)=(UChar)(((c)<<12)|(__t1<<6)|__t2); \
|
354
|
+
(i)+=2; \
|
355
|
+
} else if( /* handle U+0080..U+07FF inline */ \
|
356
|
+
((c)<0xe0 && (c)>=0xc2) && \
|
357
|
+
((i)!=(length)) && \
|
358
|
+
(__t1=(uint8_t)((s)[i]-0x80))<=0x3f \
|
359
|
+
) { \
|
360
|
+
(c)=(((c)&0x1f)<<6)|__t1; \
|
361
|
+
++(i); \
|
362
|
+
} else { \
|
363
|
+
/* function call for "complicated" and error cases */ \
|
364
|
+
(c)=utf8_nextCharSafeBody((const uint8_t *)s, &(i), (length), c, -1); \
|
365
|
+
} \
|
366
|
+
} \
|
367
|
+
}
|
368
|
+
|
369
|
+
/**
|
370
|
+
* Get a code point from a string at a code point boundary offset,
|
371
|
+
* and advance the offset to the next code point boundary.
|
372
|
+
* (Post-incrementing forward iteration.)
|
373
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
374
|
+
*
|
375
|
+
* The length can be negative for a NUL-terminated string.
|
376
|
+
*
|
377
|
+
* The offset may point to the lead byte of a multi-byte sequence,
|
378
|
+
* in which case the macro will read the whole sequence.
|
379
|
+
* If the offset points to a trail byte or an illegal UTF-8 sequence, then
|
380
|
+
* c is set to U+FFFD.
|
381
|
+
*
|
382
|
+
* This macro does not distinguish between a real U+FFFD in the text
|
383
|
+
* and U+FFFD returned for an ill-formed sequence.
|
384
|
+
* Use U8_NEXT() if that distinction is important.
|
385
|
+
*
|
386
|
+
* @param s const uint8_t * string
|
387
|
+
* @param i int32_t string offset, must be i<length
|
388
|
+
* @param length int32_t string length
|
389
|
+
* @param c output UChar32 variable, set to U+FFFD in case of an error
|
390
|
+
* @see U8_NEXT
|
391
|
+
* @stable ICU 51
|
392
|
+
*/
|
393
|
+
#define U8_NEXT_OR_FFFD(s, i, length, c) { \
|
394
|
+
(c)=(uint8_t)(s)[(i)++]; \
|
395
|
+
if((c)>=0x80) { \
|
396
|
+
uint8_t __t1, __t2; \
|
397
|
+
if( /* handle U+1000..U+CFFF inline */ \
|
398
|
+
(0xe0<(c) && (c)<=0xec) && \
|
399
|
+
(((i)+1)<(length) || (length)<0) && \
|
400
|
+
(__t1=(uint8_t)((s)[i]-0x80))<=0x3f && \
|
401
|
+
(__t2=(uint8_t)((s)[(i)+1]-0x80))<= 0x3f \
|
402
|
+
) { \
|
403
|
+
/* no need for (c&0xf) because the upper bits are truncated after <<12 in the cast to (UChar) */ \
|
404
|
+
(c)=(UChar)(((c)<<12)|(__t1<<6)|__t2); \
|
405
|
+
(i)+=2; \
|
406
|
+
} else if( /* handle U+0080..U+07FF inline */ \
|
407
|
+
((c)<0xe0 && (c)>=0xc2) && \
|
408
|
+
((i)!=(length)) && \
|
409
|
+
(__t1=(uint8_t)((s)[i]-0x80))<=0x3f \
|
410
|
+
) { \
|
411
|
+
(c)=(((c)&0x1f)<<6)|__t1; \
|
412
|
+
++(i); \
|
413
|
+
} else { \
|
414
|
+
/* function call for "complicated" and error cases */ \
|
415
|
+
(c)=utf8_nextCharSafeBody((const uint8_t *)s, &(i), (length), c, -3); \
|
416
|
+
} \
|
417
|
+
} \
|
418
|
+
}
|
419
|
+
|
420
|
+
/**
|
421
|
+
* Append a code point to a string, overwriting 1 to 4 bytes.
|
422
|
+
* The offset points to the current end of the string contents
|
423
|
+
* and is advanced (post-increment).
|
424
|
+
* "Unsafe" macro, assumes a valid code point and sufficient space in the string.
|
425
|
+
* Otherwise, the result is undefined.
|
426
|
+
*
|
427
|
+
* @param s const uint8_t * string buffer
|
428
|
+
* @param i string offset
|
429
|
+
* @param c code point to append
|
430
|
+
* @see U8_APPEND
|
431
|
+
* @stable ICU 2.4
|
432
|
+
*/
|
433
|
+
#define U8_APPEND_UNSAFE(s, i, c) { \
|
434
|
+
if((uint32_t)(c)<=0x7f) { \
|
435
|
+
(s)[(i)++]=(uint8_t)(c); \
|
436
|
+
} else { \
|
437
|
+
if((uint32_t)(c)<=0x7ff) { \
|
438
|
+
(s)[(i)++]=(uint8_t)(((c)>>6)|0xc0); \
|
439
|
+
} else { \
|
440
|
+
if((uint32_t)(c)<=0xffff) { \
|
441
|
+
(s)[(i)++]=(uint8_t)(((c)>>12)|0xe0); \
|
442
|
+
} else { \
|
443
|
+
(s)[(i)++]=(uint8_t)(((c)>>18)|0xf0); \
|
444
|
+
(s)[(i)++]=(uint8_t)((((c)>>12)&0x3f)|0x80); \
|
445
|
+
} \
|
446
|
+
(s)[(i)++]=(uint8_t)((((c)>>6)&0x3f)|0x80); \
|
447
|
+
} \
|
448
|
+
(s)[(i)++]=(uint8_t)(((c)&0x3f)|0x80); \
|
449
|
+
} \
|
450
|
+
}
|
451
|
+
|
452
|
+
/**
|
453
|
+
* Append a code point to a string, overwriting 1 to 4 bytes.
|
454
|
+
* The offset points to the current end of the string contents
|
455
|
+
* and is advanced (post-increment).
|
456
|
+
* "Safe" macro, checks for a valid code point.
|
457
|
+
* If a non-ASCII code point is written, checks for sufficient space in the string.
|
458
|
+
* If the code point is not valid or trail bytes do not fit,
|
459
|
+
* then isError is set to TRUE.
|
460
|
+
*
|
461
|
+
* @param s const uint8_t * string buffer
|
462
|
+
* @param i int32_t string offset, must be i<capacity
|
463
|
+
* @param capacity int32_t size of the string buffer
|
464
|
+
* @param c UChar32 code point to append
|
465
|
+
* @param isError output UBool set to TRUE if an error occurs, otherwise not modified
|
466
|
+
* @see U8_APPEND_UNSAFE
|
467
|
+
* @stable ICU 2.4
|
468
|
+
*/
|
469
|
+
#define U8_APPEND(s, i, capacity, c, isError) { \
|
470
|
+
if((uint32_t)(c)<=0x7f) { \
|
471
|
+
(s)[(i)++]=(uint8_t)(c); \
|
472
|
+
} else if((uint32_t)(c)<=0x7ff && (i)+1<(capacity)) { \
|
473
|
+
(s)[(i)++]=(uint8_t)(((c)>>6)|0xc0); \
|
474
|
+
(s)[(i)++]=(uint8_t)(((c)&0x3f)|0x80); \
|
475
|
+
} else if((uint32_t)(c)<=0xd7ff && (i)+2<(capacity)) { \
|
476
|
+
(s)[(i)++]=(uint8_t)(((c)>>12)|0xe0); \
|
477
|
+
(s)[(i)++]=(uint8_t)((((c)>>6)&0x3f)|0x80); \
|
478
|
+
(s)[(i)++]=(uint8_t)(((c)&0x3f)|0x80); \
|
479
|
+
} else { \
|
480
|
+
(i)=utf8_appendCharSafeBody(s, (i), (capacity), c, &(isError)); \
|
481
|
+
} \
|
482
|
+
}
|
483
|
+
|
484
|
+
/**
|
485
|
+
* Advance the string offset from one code point boundary to the next.
|
486
|
+
* (Post-incrementing iteration.)
|
487
|
+
* "Unsafe" macro, assumes well-formed UTF-8.
|
488
|
+
*
|
489
|
+
* @param s const uint8_t * string
|
490
|
+
* @param i string offset
|
491
|
+
* @see U8_FWD_1
|
492
|
+
* @stable ICU 2.4
|
493
|
+
*/
|
494
|
+
#define U8_FWD_1_UNSAFE(s, i) { \
|
495
|
+
(i)+=1+U8_COUNT_TRAIL_BYTES_UNSAFE((uint8_t)(s)[i]); \
|
496
|
+
}
|
497
|
+
|
498
|
+
/**
|
499
|
+
* Advance the string offset from one code point boundary to the next.
|
500
|
+
* (Post-incrementing iteration.)
|
501
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
502
|
+
*
|
503
|
+
* The length can be negative for a NUL-terminated string.
|
504
|
+
*
|
505
|
+
* @param s const uint8_t * string
|
506
|
+
* @param i int32_t string offset, must be i<length
|
507
|
+
* @param length int32_t string length
|
508
|
+
* @see U8_FWD_1_UNSAFE
|
509
|
+
* @stable ICU 2.4
|
510
|
+
*/
|
511
|
+
#define U8_FWD_1(s, i, length) { \
|
512
|
+
uint8_t __b=(uint8_t)(s)[(i)++]; \
|
513
|
+
if(U8_IS_LEAD(__b)) { \
|
514
|
+
uint8_t __count=U8_COUNT_TRAIL_BYTES(__b); \
|
515
|
+
if((i)+__count>(length) && (length)>=0) { \
|
516
|
+
__count=(uint8_t)((length)-(i)); \
|
517
|
+
} \
|
518
|
+
while(__count>0 && U8_IS_TRAIL((s)[i])) { \
|
519
|
+
++(i); \
|
520
|
+
--__count; \
|
521
|
+
} \
|
522
|
+
} \
|
523
|
+
}
|
524
|
+
|
525
|
+
/**
|
526
|
+
* Advance the string offset from one code point boundary to the n-th next one,
|
527
|
+
* i.e., move forward by n code points.
|
528
|
+
* (Post-incrementing iteration.)
|
529
|
+
* "Unsafe" macro, assumes well-formed UTF-8.
|
530
|
+
*
|
531
|
+
* @param s const uint8_t * string
|
532
|
+
* @param i string offset
|
533
|
+
* @param n number of code points to skip
|
534
|
+
* @see U8_FWD_N
|
535
|
+
* @stable ICU 2.4
|
536
|
+
*/
|
537
|
+
#define U8_FWD_N_UNSAFE(s, i, n) { \
|
538
|
+
int32_t __N=(n); \
|
539
|
+
while(__N>0) { \
|
540
|
+
U8_FWD_1_UNSAFE(s, i); \
|
541
|
+
--__N; \
|
542
|
+
} \
|
543
|
+
}
|
544
|
+
|
545
|
+
/**
|
546
|
+
* Advance the string offset from one code point boundary to the n-th next one,
|
547
|
+
* i.e., move forward by n code points.
|
548
|
+
* (Post-incrementing iteration.)
|
549
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
550
|
+
*
|
551
|
+
* The length can be negative for a NUL-terminated string.
|
552
|
+
*
|
553
|
+
* @param s const uint8_t * string
|
554
|
+
* @param i int32_t string offset, must be i<length
|
555
|
+
* @param length int32_t string length
|
556
|
+
* @param n number of code points to skip
|
557
|
+
* @see U8_FWD_N_UNSAFE
|
558
|
+
* @stable ICU 2.4
|
559
|
+
*/
|
560
|
+
#define U8_FWD_N(s, i, length, n) { \
|
561
|
+
int32_t __N=(n); \
|
562
|
+
while(__N>0 && ((i)<(length) || ((length)<0 && (s)[i]!=0))) { \
|
563
|
+
U8_FWD_1(s, i, length); \
|
564
|
+
--__N; \
|
565
|
+
} \
|
566
|
+
}
|
567
|
+
|
568
|
+
/**
|
569
|
+
* Adjust a random-access offset to a code point boundary
|
570
|
+
* at the start of a code point.
|
571
|
+
* If the offset points to a UTF-8 trail byte,
|
572
|
+
* then the offset is moved backward to the corresponding lead byte.
|
573
|
+
* Otherwise, it is not modified.
|
574
|
+
* "Unsafe" macro, assumes well-formed UTF-8.
|
575
|
+
*
|
576
|
+
* @param s const uint8_t * string
|
577
|
+
* @param i string offset
|
578
|
+
* @see U8_SET_CP_START
|
579
|
+
* @stable ICU 2.4
|
580
|
+
*/
|
581
|
+
#define U8_SET_CP_START_UNSAFE(s, i) { \
|
582
|
+
while(U8_IS_TRAIL((s)[i])) { --(i); } \
|
583
|
+
}
|
584
|
+
|
585
|
+
/**
|
586
|
+
* Adjust a random-access offset to a code point boundary
|
587
|
+
* at the start of a code point.
|
588
|
+
* If the offset points to a UTF-8 trail byte,
|
589
|
+
* then the offset is moved backward to the corresponding lead byte.
|
590
|
+
* Otherwise, it is not modified.
|
591
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
592
|
+
*
|
593
|
+
* @param s const uint8_t * string
|
594
|
+
* @param start int32_t starting string offset (usually 0)
|
595
|
+
* @param i int32_t string offset, must be start<=i
|
596
|
+
* @see U8_SET_CP_START_UNSAFE
|
597
|
+
* @stable ICU 2.4
|
598
|
+
*/
|
599
|
+
#define U8_SET_CP_START(s, start, i) { \
|
600
|
+
if(U8_IS_TRAIL((s)[(i)])) { \
|
601
|
+
(i)=utf8_back1SafeBody(s, start, (i)); \
|
602
|
+
} \
|
603
|
+
}
|
604
|
+
|
605
|
+
/* definitions with backward iteration -------------------------------------- */
|
606
|
+
|
607
|
+
/**
|
608
|
+
* Move the string offset from one code point boundary to the previous one
|
609
|
+
* and get the code point between them.
|
610
|
+
* (Pre-decrementing backward iteration.)
|
611
|
+
* "Unsafe" macro, assumes well-formed UTF-8.
|
612
|
+
*
|
613
|
+
* The input offset may be the same as the string length.
|
614
|
+
* If the offset is behind a multi-byte sequence, then the macro will read
|
615
|
+
* the whole sequence.
|
616
|
+
* If the offset is behind a lead byte, then that itself
|
617
|
+
* will be returned as the code point.
|
618
|
+
* The result is undefined if the offset is behind an illegal UTF-8 sequence.
|
619
|
+
*
|
620
|
+
* @param s const uint8_t * string
|
621
|
+
* @param i string offset
|
622
|
+
* @param c output UChar32 variable
|
623
|
+
* @see U8_PREV
|
624
|
+
* @stable ICU 2.4
|
625
|
+
*/
|
626
|
+
#define U8_PREV_UNSAFE(s, i, c) { \
|
627
|
+
(c)=(uint8_t)(s)[--(i)]; \
|
628
|
+
if(U8_IS_TRAIL(c)) { \
|
629
|
+
uint8_t __b, __count=1, __shift=6; \
|
630
|
+
\
|
631
|
+
/* c is a trail byte */ \
|
632
|
+
(c)&=0x3f; \
|
633
|
+
for(;;) { \
|
634
|
+
__b=(uint8_t)(s)[--(i)]; \
|
635
|
+
if(__b>=0xc0) { \
|
636
|
+
U8_MASK_LEAD_BYTE(__b, __count); \
|
637
|
+
(c)|=(UChar32)__b<<__shift; \
|
638
|
+
break; \
|
639
|
+
} else { \
|
640
|
+
(c)|=(UChar32)(__b&0x3f)<<__shift; \
|
641
|
+
++__count; \
|
642
|
+
__shift+=6; \
|
643
|
+
} \
|
644
|
+
} \
|
645
|
+
} \
|
646
|
+
}
|
647
|
+
|
648
|
+
/**
|
649
|
+
* Move the string offset from one code point boundary to the previous one
|
650
|
+
* and get the code point between them.
|
651
|
+
* (Pre-decrementing backward iteration.)
|
652
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
653
|
+
*
|
654
|
+
* The input offset may be the same as the string length.
|
655
|
+
* If the offset is behind a multi-byte sequence, then the macro will read
|
656
|
+
* the whole sequence.
|
657
|
+
* If the offset is behind a lead byte, then that itself
|
658
|
+
* will be returned as the code point.
|
659
|
+
* If the offset is behind an illegal UTF-8 sequence, then c is set to a negative value.
|
660
|
+
*
|
661
|
+
* @param s const uint8_t * string
|
662
|
+
* @param start int32_t starting string offset (usually 0)
|
663
|
+
* @param i int32_t string offset, must be start<i
|
664
|
+
* @param c output UChar32 variable, set to <0 in case of an error
|
665
|
+
* @see U8_PREV_UNSAFE
|
666
|
+
* @stable ICU 2.4
|
667
|
+
*/
|
668
|
+
#define U8_PREV(s, start, i, c) { \
|
669
|
+
(c)=(uint8_t)(s)[--(i)]; \
|
670
|
+
if((c)>=0x80) { \
|
671
|
+
(c)=utf8_prevCharSafeBody((const uint8_t *)s, start, &(i), c, -1); \
|
672
|
+
} \
|
673
|
+
}
|
674
|
+
|
675
|
+
/**
|
676
|
+
* Move the string offset from one code point boundary to the previous one
|
677
|
+
* and get the code point between them.
|
678
|
+
* (Pre-decrementing backward iteration.)
|
679
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
680
|
+
*
|
681
|
+
* The input offset may be the same as the string length.
|
682
|
+
* If the offset is behind a multi-byte sequence, then the macro will read
|
683
|
+
* the whole sequence.
|
684
|
+
* If the offset is behind a lead byte, then that itself
|
685
|
+
* will be returned as the code point.
|
686
|
+
* If the offset is behind an illegal UTF-8 sequence, then c is set to U+FFFD.
|
687
|
+
*
|
688
|
+
* This macro does not distinguish between a real U+FFFD in the text
|
689
|
+
* and U+FFFD returned for an ill-formed sequence.
|
690
|
+
* Use U8_PREV() if that distinction is important.
|
691
|
+
*
|
692
|
+
* @param s const uint8_t * string
|
693
|
+
* @param start int32_t starting string offset (usually 0)
|
694
|
+
* @param i int32_t string offset, must be start<i
|
695
|
+
* @param c output UChar32 variable, set to U+FFFD in case of an error
|
696
|
+
* @see U8_PREV
|
697
|
+
* @stable ICU 51
|
698
|
+
*/
|
699
|
+
#define U8_PREV_OR_FFFD(s, start, i, c) { \
|
700
|
+
(c)=(uint8_t)(s)[--(i)]; \
|
701
|
+
if((c)>=0x80) { \
|
702
|
+
(c)=utf8_prevCharSafeBody((const uint8_t *)s, start, &(i), c, -3); \
|
703
|
+
} \
|
704
|
+
}
|
705
|
+
|
706
|
+
/**
|
707
|
+
* Move the string offset from one code point boundary to the previous one.
|
708
|
+
* (Pre-decrementing backward iteration.)
|
709
|
+
* The input offset may be the same as the string length.
|
710
|
+
* "Unsafe" macro, assumes well-formed UTF-8.
|
711
|
+
*
|
712
|
+
* @param s const uint8_t * string
|
713
|
+
* @param i string offset
|
714
|
+
* @see U8_BACK_1
|
715
|
+
* @stable ICU 2.4
|
716
|
+
*/
|
717
|
+
#define U8_BACK_1_UNSAFE(s, i) { \
|
718
|
+
while(U8_IS_TRAIL((s)[--(i)])) {} \
|
719
|
+
}
|
720
|
+
|
721
|
+
/**
|
722
|
+
* Move the string offset from one code point boundary to the previous one.
|
723
|
+
* (Pre-decrementing backward iteration.)
|
724
|
+
* The input offset may be the same as the string length.
|
725
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
726
|
+
*
|
727
|
+
* @param s const uint8_t * string
|
728
|
+
* @param start int32_t starting string offset (usually 0)
|
729
|
+
* @param i int32_t string offset, must be start<i
|
730
|
+
* @see U8_BACK_1_UNSAFE
|
731
|
+
* @stable ICU 2.4
|
732
|
+
*/
|
733
|
+
#define U8_BACK_1(s, start, i) { \
|
734
|
+
if(U8_IS_TRAIL((s)[--(i)])) { \
|
735
|
+
(i)=utf8_back1SafeBody(s, start, (i)); \
|
736
|
+
} \
|
737
|
+
}
|
738
|
+
|
739
|
+
/**
|
740
|
+
* Move the string offset from one code point boundary to the n-th one before it,
|
741
|
+
* i.e., move backward by n code points.
|
742
|
+
* (Pre-decrementing backward iteration.)
|
743
|
+
* The input offset may be the same as the string length.
|
744
|
+
* "Unsafe" macro, assumes well-formed UTF-8.
|
745
|
+
*
|
746
|
+
* @param s const uint8_t * string
|
747
|
+
* @param i string offset
|
748
|
+
* @param n number of code points to skip
|
749
|
+
* @see U8_BACK_N
|
750
|
+
* @stable ICU 2.4
|
751
|
+
*/
|
752
|
+
#define U8_BACK_N_UNSAFE(s, i, n) { \
|
753
|
+
int32_t __N=(n); \
|
754
|
+
while(__N>0) { \
|
755
|
+
U8_BACK_1_UNSAFE(s, i); \
|
756
|
+
--__N; \
|
757
|
+
} \
|
758
|
+
}
|
759
|
+
|
760
|
+
/**
|
761
|
+
* Move the string offset from one code point boundary to the n-th one before it,
|
762
|
+
* i.e., move backward by n code points.
|
763
|
+
* (Pre-decrementing backward iteration.)
|
764
|
+
* The input offset may be the same as the string length.
|
765
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
766
|
+
*
|
767
|
+
* @param s const uint8_t * string
|
768
|
+
* @param start int32_t index of the start of the string
|
769
|
+
* @param i int32_t string offset, must be start<i
|
770
|
+
* @param n number of code points to skip
|
771
|
+
* @see U8_BACK_N_UNSAFE
|
772
|
+
* @stable ICU 2.4
|
773
|
+
*/
|
774
|
+
#define U8_BACK_N(s, start, i, n) { \
|
775
|
+
int32_t __N=(n); \
|
776
|
+
while(__N>0 && (i)>(start)) { \
|
777
|
+
U8_BACK_1(s, start, i); \
|
778
|
+
--__N; \
|
779
|
+
} \
|
780
|
+
}
|
781
|
+
|
782
|
+
/**
|
783
|
+
* Adjust a random-access offset to a code point boundary after a code point.
|
784
|
+
* If the offset is behind a partial multi-byte sequence,
|
785
|
+
* then the offset is incremented to behind the whole sequence.
|
786
|
+
* Otherwise, it is not modified.
|
787
|
+
* The input offset may be the same as the string length.
|
788
|
+
* "Unsafe" macro, assumes well-formed UTF-8.
|
789
|
+
*
|
790
|
+
* @param s const uint8_t * string
|
791
|
+
* @param i string offset
|
792
|
+
* @see U8_SET_CP_LIMIT
|
793
|
+
* @stable ICU 2.4
|
794
|
+
*/
|
795
|
+
#define U8_SET_CP_LIMIT_UNSAFE(s, i) { \
|
796
|
+
U8_BACK_1_UNSAFE(s, i); \
|
797
|
+
U8_FWD_1_UNSAFE(s, i); \
|
798
|
+
}
|
799
|
+
|
800
|
+
/**
|
801
|
+
* Adjust a random-access offset to a code point boundary after a code point.
|
802
|
+
* If the offset is behind a partial multi-byte sequence,
|
803
|
+
* then the offset is incremented to behind the whole sequence.
|
804
|
+
* Otherwise, it is not modified.
|
805
|
+
* The input offset may be the same as the string length.
|
806
|
+
* "Safe" macro, checks for illegal sequences and for string boundaries.
|
807
|
+
*
|
808
|
+
* The length can be negative for a NUL-terminated string.
|
809
|
+
*
|
810
|
+
* @param s const uint8_t * string
|
811
|
+
* @param start int32_t starting string offset (usually 0)
|
812
|
+
* @param i int32_t string offset, must be start<=i<=length
|
813
|
+
* @param length int32_t string length
|
814
|
+
* @see U8_SET_CP_LIMIT_UNSAFE
|
815
|
+
* @stable ICU 2.4
|
816
|
+
*/
|
817
|
+
#define U8_SET_CP_LIMIT(s, start, i, length) { \
|
818
|
+
if((start)<(i) && ((i)<(length) || ((length)<0 && (s)[i]!=0))) { \
|
819
|
+
U8_BACK_1(s, start, i); \
|
820
|
+
U8_FWD_1(s, i, length); \
|
821
|
+
} \
|
822
|
+
}
|
823
|
+
|
824
|
+
#endif
|