rugged 0.28.3.1 → 0.28.4
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/lib/rugged/version.rb +1 -1
- data/vendor/libgit2/AUTHORS +1 -0
- data/vendor/libgit2/CMakeLists.txt +36 -16
- data/vendor/libgit2/COPYING +28 -0
- data/vendor/libgit2/cmake/Modules/EnableWarnings.cmake +5 -1
- data/vendor/libgit2/cmake/Modules/FindCoreFoundation.cmake +2 -2
- data/vendor/libgit2/cmake/Modules/FindGSSAPI.cmake +1 -1
- data/vendor/libgit2/cmake/Modules/FindGSSFramework.cmake +28 -0
- data/vendor/libgit2/cmake/Modules/FindPCRE.cmake +38 -0
- data/vendor/libgit2/cmake/Modules/FindPCRE2.cmake +37 -0
- data/vendor/libgit2/cmake/Modules/FindSecurity.cmake +2 -2
- data/vendor/libgit2/cmake/Modules/FindStatNsec.cmake +6 -0
- data/vendor/libgit2/cmake/Modules/PkgBuildConfig.cmake +110 -0
- data/vendor/libgit2/cmake/Modules/SelectGSSAPI.cmake +53 -0
- data/vendor/libgit2/cmake/Modules/SelectHTTPSBackend.cmake +124 -0
- data/vendor/libgit2/cmake/Modules/SelectHashes.cmake +66 -0
- data/vendor/libgit2/deps/http-parser/http_parser.c +11 -6
- data/vendor/libgit2/deps/ntlmclient/CMakeLists.txt +21 -0
- data/vendor/libgit2/deps/ntlmclient/compat.h +33 -0
- data/vendor/libgit2/deps/ntlmclient/crypt.h +64 -0
- data/vendor/libgit2/deps/ntlmclient/crypt_commoncrypto.c +120 -0
- data/vendor/libgit2/deps/ntlmclient/crypt_commoncrypto.h +18 -0
- data/vendor/libgit2/deps/ntlmclient/crypt_mbedtls.c +145 -0
- data/vendor/libgit2/deps/ntlmclient/crypt_mbedtls.h +18 -0
- data/vendor/libgit2/deps/ntlmclient/crypt_openssl.c +130 -0
- data/vendor/libgit2/deps/ntlmclient/crypt_openssl.h +21 -0
- data/vendor/libgit2/deps/ntlmclient/ntlm.c +1420 -0
- data/vendor/libgit2/deps/ntlmclient/ntlm.h +174 -0
- data/vendor/libgit2/deps/ntlmclient/ntlmclient.h +320 -0
- data/vendor/libgit2/deps/ntlmclient/unicode.h +36 -0
- data/vendor/libgit2/deps/ntlmclient/unicode_builtin.c +445 -0
- data/vendor/libgit2/deps/ntlmclient/unicode_iconv.c +201 -0
- data/vendor/libgit2/deps/ntlmclient/utf8.h +1257 -0
- data/vendor/libgit2/deps/ntlmclient/util.c +21 -0
- data/vendor/libgit2/deps/ntlmclient/util.h +14 -0
- data/vendor/libgit2/deps/pcre/CMakeLists.txt +140 -0
- data/vendor/libgit2/deps/pcre/COPYING +5 -0
- data/vendor/libgit2/deps/pcre/cmake/COPYING-CMAKE-SCRIPTS +22 -0
- data/vendor/libgit2/deps/pcre/cmake/FindEditline.cmake +17 -0
- data/vendor/libgit2/deps/pcre/cmake/FindPackageHandleStandardArgs.cmake +58 -0
- data/vendor/libgit2/deps/pcre/cmake/FindReadline.cmake +29 -0
- data/vendor/libgit2/deps/pcre/config.h.in +57 -0
- data/vendor/libgit2/deps/pcre/pcre.h +641 -0
- data/vendor/libgit2/deps/pcre/pcre_byte_order.c +319 -0
- data/vendor/libgit2/deps/pcre/pcre_chartables.c +198 -0
- data/vendor/libgit2/deps/pcre/pcre_compile.c +9800 -0
- data/vendor/libgit2/deps/pcre/pcre_config.c +190 -0
- data/vendor/libgit2/deps/pcre/pcre_dfa_exec.c +3676 -0
- data/vendor/libgit2/deps/pcre/pcre_exec.c +7173 -0
- data/vendor/libgit2/deps/pcre/pcre_fullinfo.c +245 -0
- data/vendor/libgit2/deps/pcre/pcre_get.c +669 -0
- data/vendor/libgit2/deps/pcre/pcre_globals.c +86 -0
- data/vendor/libgit2/deps/pcre/pcre_internal.h +2787 -0
- data/vendor/libgit2/deps/pcre/pcre_jit_compile.c +11913 -0
- data/vendor/libgit2/deps/pcre/pcre_maketables.c +156 -0
- data/vendor/libgit2/deps/pcre/pcre_newline.c +210 -0
- data/vendor/libgit2/deps/pcre/pcre_ord2utf8.c +94 -0
- data/vendor/libgit2/deps/pcre/pcre_printint.c +834 -0
- data/vendor/libgit2/deps/pcre/pcre_refcount.c +92 -0
- data/vendor/libgit2/deps/pcre/pcre_string_utils.c +211 -0
- data/vendor/libgit2/deps/pcre/pcre_study.c +1686 -0
- data/vendor/libgit2/deps/pcre/pcre_tables.c +727 -0
- data/vendor/libgit2/deps/pcre/pcre_ucd.c +3644 -0
- data/vendor/libgit2/deps/pcre/pcre_valid_utf8.c +301 -0
- data/vendor/libgit2/deps/pcre/pcre_version.c +98 -0
- data/vendor/libgit2/deps/pcre/pcre_xclass.c +268 -0
- data/vendor/libgit2/deps/pcre/pcreposix.c +421 -0
- data/vendor/libgit2/deps/pcre/pcreposix.h +117 -0
- data/vendor/libgit2/deps/pcre/ucp.h +224 -0
- data/vendor/libgit2/deps/zlib/adler32.c +0 -7
- data/vendor/libgit2/deps/zlib/crc32.c +0 -7
- data/vendor/libgit2/include/git2.h +2 -0
- data/vendor/libgit2/include/git2/apply.h +22 -2
- data/vendor/libgit2/include/git2/attr.h +19 -12
- data/vendor/libgit2/include/git2/blame.h +2 -2
- data/vendor/libgit2/include/git2/blob.h +44 -12
- data/vendor/libgit2/include/git2/buffer.h +20 -14
- data/vendor/libgit2/include/git2/cert.h +135 -0
- data/vendor/libgit2/include/git2/checkout.h +46 -14
- data/vendor/libgit2/include/git2/cherrypick.h +3 -3
- data/vendor/libgit2/include/git2/clone.h +2 -2
- data/vendor/libgit2/include/git2/commit.h +23 -1
- data/vendor/libgit2/include/git2/common.h +7 -5
- data/vendor/libgit2/include/git2/config.h +12 -12
- data/vendor/libgit2/include/git2/cred.h +308 -0
- data/vendor/libgit2/include/git2/deprecated.h +243 -3
- data/vendor/libgit2/include/git2/describe.h +4 -4
- data/vendor/libgit2/include/git2/diff.h +16 -14
- data/vendor/libgit2/include/git2/filter.h +8 -0
- data/vendor/libgit2/include/git2/index.h +2 -1
- data/vendor/libgit2/include/git2/indexer.h +48 -4
- data/vendor/libgit2/include/git2/merge.h +6 -10
- data/vendor/libgit2/include/git2/net.h +0 -5
- data/vendor/libgit2/include/git2/object.h +2 -14
- data/vendor/libgit2/include/git2/odb.h +3 -2
- data/vendor/libgit2/include/git2/odb_backend.h +5 -4
- data/vendor/libgit2/include/git2/oid.h +1 -1
- data/vendor/libgit2/include/git2/pack.h +12 -1
- data/vendor/libgit2/include/git2/proxy.h +5 -3
- data/vendor/libgit2/include/git2/rebase.h +46 -2
- data/vendor/libgit2/include/git2/refs.h +19 -0
- data/vendor/libgit2/include/git2/remote.h +35 -12
- data/vendor/libgit2/include/git2/repository.h +24 -2
- data/vendor/libgit2/include/git2/revert.h +1 -1
- data/vendor/libgit2/include/git2/stash.h +3 -3
- data/vendor/libgit2/include/git2/status.h +25 -16
- data/vendor/libgit2/include/git2/submodule.h +20 -3
- data/vendor/libgit2/include/git2/sys/alloc.h +9 -9
- data/vendor/libgit2/include/git2/sys/cred.h +90 -0
- data/vendor/libgit2/include/git2/sys/odb_backend.h +48 -4
- data/vendor/libgit2/include/git2/sys/refdb_backend.h +57 -21
- data/vendor/libgit2/include/git2/sys/repository.h +5 -1
- data/vendor/libgit2/include/git2/sys/transport.h +2 -2
- data/vendor/libgit2/include/git2/tag.h +11 -2
- data/vendor/libgit2/include/git2/trace.h +2 -2
- data/vendor/libgit2/include/git2/transport.h +11 -340
- data/vendor/libgit2/include/git2/tree.h +1 -1
- data/vendor/libgit2/include/git2/types.h +4 -89
- data/vendor/libgit2/include/git2/version.h +2 -2
- data/vendor/libgit2/include/git2/worktree.h +5 -5
- data/vendor/libgit2/src/CMakeLists.txt +88 -222
- data/vendor/libgit2/src/alloc.c +2 -14
- data/vendor/libgit2/src/{stdalloc.c → allocators/stdalloc.c} +3 -4
- data/vendor/libgit2/src/{stdalloc.h → allocators/stdalloc.h} +4 -4
- data/vendor/libgit2/src/allocators/win32_crtdbg.c +118 -0
- data/vendor/libgit2/src/{transports/cred.h → allocators/win32_crtdbg.h} +5 -4
- data/vendor/libgit2/src/apply.c +60 -30
- data/vendor/libgit2/src/attr.c +70 -64
- data/vendor/libgit2/src/attr_file.c +189 -96
- data/vendor/libgit2/src/attr_file.h +9 -9
- data/vendor/libgit2/src/attrcache.c +44 -46
- data/vendor/libgit2/src/attrcache.h +2 -1
- data/vendor/libgit2/src/blame.c +17 -5
- data/vendor/libgit2/src/blame.h +1 -1
- data/vendor/libgit2/src/blame_git.c +21 -7
- data/vendor/libgit2/src/blob.c +81 -17
- data/vendor/libgit2/src/blob.h +2 -2
- data/vendor/libgit2/src/branch.c +29 -5
- data/vendor/libgit2/src/buffer.c +14 -7
- data/vendor/libgit2/src/cache.c +26 -33
- data/vendor/libgit2/src/cache.h +1 -1
- data/vendor/libgit2/src/cc-compat.h +5 -0
- data/vendor/libgit2/src/checkout.c +26 -16
- data/vendor/libgit2/src/cherrypick.c +9 -3
- data/vendor/libgit2/src/clone.c +29 -7
- data/vendor/libgit2/src/clone.h +4 -0
- data/vendor/libgit2/src/commit.c +69 -21
- data/vendor/libgit2/src/commit.h +6 -0
- data/vendor/libgit2/src/commit_list.c +28 -76
- data/vendor/libgit2/src/commit_list.h +2 -2
- data/vendor/libgit2/src/common.h +3 -75
- data/vendor/libgit2/src/config.c +31 -40
- data/vendor/libgit2/src/config.h +7 -6
- data/vendor/libgit2/src/config_backend.h +12 -0
- data/vendor/libgit2/src/config_cache.c +39 -39
- data/vendor/libgit2/src/config_entries.c +69 -99
- data/vendor/libgit2/src/config_entries.h +1 -0
- data/vendor/libgit2/src/config_file.c +337 -380
- data/vendor/libgit2/src/config_mem.c +12 -16
- data/vendor/libgit2/src/config_parse.c +49 -29
- data/vendor/libgit2/src/config_parse.h +13 -12
- data/vendor/libgit2/src/config_snapshot.c +206 -0
- data/vendor/libgit2/src/crlf.c +14 -14
- data/vendor/libgit2/src/describe.c +21 -20
- data/vendor/libgit2/src/diff.c +43 -58
- data/vendor/libgit2/src/diff.h +2 -1
- data/vendor/libgit2/src/diff_driver.c +37 -38
- data/vendor/libgit2/src/diff_file.c +9 -7
- data/vendor/libgit2/src/diff_file.h +1 -1
- data/vendor/libgit2/src/diff_generate.c +135 -85
- data/vendor/libgit2/src/diff_generate.h +2 -2
- data/vendor/libgit2/src/diff_parse.c +1 -1
- data/vendor/libgit2/src/diff_print.c +25 -13
- data/vendor/libgit2/src/diff_stats.c +1 -1
- data/vendor/libgit2/src/diff_tform.c +4 -4
- data/vendor/libgit2/src/errors.c +12 -22
- data/vendor/libgit2/src/errors.h +81 -0
- data/vendor/libgit2/src/features.h.in +9 -2
- data/vendor/libgit2/src/fetch.c +7 -2
- data/vendor/libgit2/src/fetchhead.c +1 -1
- data/vendor/libgit2/src/filebuf.c +6 -10
- data/vendor/libgit2/src/filebuf.h +2 -2
- data/vendor/libgit2/src/filter.c +16 -8
- data/vendor/libgit2/src/{fileops.c → futils.c} +21 -17
- data/vendor/libgit2/src/{fileops.h → futils.h} +5 -5
- data/vendor/libgit2/src/global.c +12 -40
- data/vendor/libgit2/src/global.h +0 -2
- data/vendor/libgit2/src/hash.c +61 -0
- data/vendor/libgit2/src/hash.h +19 -21
- data/vendor/libgit2/src/hash/sha1.h +38 -0
- data/vendor/libgit2/src/hash/{hash_collisiondetect.h → sha1/collisiondetect.c} +14 -17
- data/vendor/libgit2/src/hash/sha1/collisiondetect.h +19 -0
- data/vendor/libgit2/src/hash/{hash_common_crypto.h → sha1/common_crypto.c} +15 -19
- data/vendor/libgit2/src/hash/sha1/common_crypto.h +19 -0
- data/vendor/libgit2/src/hash/{hash_generic.c → sha1/generic.c} +22 -10
- data/vendor/libgit2/src/hash/{hash_generic.h → sha1/generic.h} +4 -14
- data/vendor/libgit2/src/hash/{hash_mbedtls.c → sha1/mbedtls.c} +15 -7
- data/vendor/libgit2/src/hash/{hash_mbedtls.h → sha1/mbedtls.h} +6 -11
- data/vendor/libgit2/src/hash/{hash_openssl.h → sha1/openssl.c} +14 -18
- data/vendor/libgit2/src/hash/sha1/openssl.h +19 -0
- data/vendor/libgit2/src/hash/{sha1dc → sha1/sha1dc}/sha1.c +14 -3
- data/vendor/libgit2/src/hash/{sha1dc → sha1/sha1dc}/sha1.h +0 -0
- data/vendor/libgit2/src/hash/{sha1dc → sha1/sha1dc}/ubc_check.c +0 -0
- data/vendor/libgit2/src/hash/{sha1dc → sha1/sha1dc}/ubc_check.h +0 -0
- data/vendor/libgit2/src/hash/{hash_win32.c → sha1/win32.c} +34 -24
- data/vendor/libgit2/src/hash/{hash_win32.h → sha1/win32.h} +6 -19
- data/vendor/libgit2/src/hashsig.c +1 -1
- data/vendor/libgit2/src/idxmap.c +91 -65
- data/vendor/libgit2/src/idxmap.h +151 -15
- data/vendor/libgit2/src/ignore.c +32 -38
- data/vendor/libgit2/src/index.c +66 -43
- data/vendor/libgit2/src/index.h +1 -1
- data/vendor/libgit2/src/indexer.c +69 -70
- data/vendor/libgit2/src/integer.h +39 -4
- data/vendor/libgit2/src/iterator.c +27 -22
- data/vendor/libgit2/src/map.h +1 -1
- data/vendor/libgit2/src/merge.c +58 -44
- data/vendor/libgit2/src/merge_driver.c +4 -4
- data/vendor/libgit2/src/merge_file.c +1 -1
- data/vendor/libgit2/src/mwindow.c +18 -23
- data/vendor/libgit2/src/mwindow.h +4 -4
- data/vendor/libgit2/src/net.c +184 -0
- data/vendor/libgit2/src/net.h +36 -0
- data/vendor/libgit2/src/netops.c +55 -165
- data/vendor/libgit2/src/netops.h +3 -25
- data/vendor/libgit2/src/notes.c +2 -2
- data/vendor/libgit2/src/object.c +2 -2
- data/vendor/libgit2/src/object.h +2 -0
- data/vendor/libgit2/src/odb.c +41 -23
- data/vendor/libgit2/src/odb.h +3 -2
- data/vendor/libgit2/src/odb_loose.c +17 -10
- data/vendor/libgit2/src/odb_mempack.c +10 -23
- data/vendor/libgit2/src/odb_pack.c +4 -4
- data/vendor/libgit2/src/offmap.c +43 -55
- data/vendor/libgit2/src/offmap.h +102 -24
- data/vendor/libgit2/src/oid.c +6 -1
- data/vendor/libgit2/src/oidmap.c +39 -57
- data/vendor/libgit2/src/oidmap.h +99 -19
- data/vendor/libgit2/src/pack-objects.c +25 -32
- data/vendor/libgit2/src/pack-objects.h +1 -1
- data/vendor/libgit2/src/pack.c +45 -47
- data/vendor/libgit2/src/pack.h +12 -14
- data/vendor/libgit2/src/parse.c +10 -0
- data/vendor/libgit2/src/parse.h +3 -3
- data/vendor/libgit2/src/patch.c +1 -1
- data/vendor/libgit2/src/patch_generate.c +2 -2
- data/vendor/libgit2/src/patch_parse.c +124 -31
- data/vendor/libgit2/src/path.c +95 -27
- data/vendor/libgit2/src/path.h +2 -0
- data/vendor/libgit2/src/pathspec.c +13 -13
- data/vendor/libgit2/src/pool.c +26 -22
- data/vendor/libgit2/src/pool.h +7 -7
- data/vendor/libgit2/src/posix.c +7 -7
- data/vendor/libgit2/src/posix.h +12 -1
- data/vendor/libgit2/src/proxy.c +7 -2
- data/vendor/libgit2/src/push.c +10 -5
- data/vendor/libgit2/src/reader.c +2 -2
- data/vendor/libgit2/src/rebase.c +66 -7
- data/vendor/libgit2/src/refdb.c +12 -0
- data/vendor/libgit2/src/refdb_fs.c +214 -165
- data/vendor/libgit2/src/reflog.c +11 -13
- data/vendor/libgit2/src/refs.c +24 -18
- data/vendor/libgit2/src/refspec.c +9 -16
- data/vendor/libgit2/src/regexp.c +221 -0
- data/vendor/libgit2/src/regexp.h +97 -0
- data/vendor/libgit2/src/remote.c +50 -52
- data/vendor/libgit2/src/remote.h +2 -2
- data/vendor/libgit2/src/repository.c +115 -100
- data/vendor/libgit2/src/repository.h +49 -40
- data/vendor/libgit2/src/revert.c +8 -3
- data/vendor/libgit2/src/revparse.c +18 -19
- data/vendor/libgit2/src/revwalk.c +63 -30
- data/vendor/libgit2/src/revwalk.h +20 -0
- data/vendor/libgit2/src/settings.c +5 -0
- data/vendor/libgit2/src/sortedcache.c +12 -26
- data/vendor/libgit2/src/sortedcache.h +1 -1
- data/vendor/libgit2/src/stash.c +45 -65
- data/vendor/libgit2/src/status.c +15 -9
- data/vendor/libgit2/src/streams/openssl.c +20 -0
- data/vendor/libgit2/src/streams/socket.c +2 -2
- data/vendor/libgit2/src/strmap.c +37 -84
- data/vendor/libgit2/src/strmap.h +105 -33
- data/vendor/libgit2/src/submodule.c +102 -70
- data/vendor/libgit2/src/submodule.h +1 -1
- data/vendor/libgit2/src/sysdir.c +11 -1
- data/vendor/libgit2/src/tag.c +10 -2
- data/vendor/libgit2/src/trace.c +1 -1
- data/vendor/libgit2/src/trace.h +2 -2
- data/vendor/libgit2/src/trailer.c +46 -32
- data/vendor/libgit2/src/transaction.c +10 -9
- data/vendor/libgit2/src/transports/auth.c +10 -9
- data/vendor/libgit2/src/transports/auth.h +11 -4
- data/vendor/libgit2/src/transports/auth_negotiate.c +23 -9
- data/vendor/libgit2/src/transports/auth_negotiate.h +2 -2
- data/vendor/libgit2/src/transports/auth_ntlm.c +223 -0
- data/vendor/libgit2/src/transports/auth_ntlm.h +35 -0
- data/vendor/libgit2/src/transports/cred.c +6 -6
- data/vendor/libgit2/src/transports/git.c +11 -16
- data/vendor/libgit2/src/transports/http.c +419 -276
- data/vendor/libgit2/src/transports/http.h +1 -1
- data/vendor/libgit2/src/transports/local.c +9 -9
- data/vendor/libgit2/src/transports/smart.c +17 -17
- data/vendor/libgit2/src/transports/smart.h +2 -2
- data/vendor/libgit2/src/transports/smart_protocol.c +36 -60
- data/vendor/libgit2/src/transports/ssh.c +46 -36
- data/vendor/libgit2/src/transports/winhttp.c +231 -207
- data/vendor/libgit2/src/tree-cache.c +14 -7
- data/vendor/libgit2/src/tree.c +10 -24
- data/vendor/libgit2/src/unix/map.c +1 -1
- data/vendor/libgit2/src/unix/posix.h +1 -11
- data/vendor/libgit2/src/userdiff.h +3 -1
- data/vendor/libgit2/src/util.c +51 -53
- data/vendor/libgit2/src/util.h +16 -21
- data/vendor/libgit2/src/wildmatch.c +320 -0
- data/vendor/libgit2/src/wildmatch.h +23 -0
- data/vendor/libgit2/src/win32/map.c +3 -5
- data/vendor/libgit2/src/win32/path_w32.c +12 -2
- data/vendor/libgit2/src/win32/path_w32.h +0 -29
- data/vendor/libgit2/src/win32/posix.h +1 -4
- data/vendor/libgit2/src/win32/posix_w32.c +40 -5
- data/vendor/libgit2/src/win32/precompiled.h +0 -2
- data/vendor/libgit2/src/win32/thread.c +5 -10
- data/vendor/libgit2/src/win32/w32_buffer.c +7 -3
- data/vendor/libgit2/src/win32/w32_common.h +39 -0
- data/vendor/libgit2/src/win32/w32_crtdbg_stacktrace.c +0 -93
- data/vendor/libgit2/src/win32/w32_crtdbg_stacktrace.h +0 -2
- data/vendor/libgit2/src/win32/w32_stack.c +4 -9
- data/vendor/libgit2/src/win32/w32_stack.h +3 -3
- data/vendor/libgit2/src/win32/w32_util.c +31 -0
- data/vendor/libgit2/src/win32/w32_util.h +6 -32
- data/vendor/libgit2/src/worktree.c +36 -22
- data/vendor/libgit2/src/xdiff/xdiffi.c +1 -1
- data/vendor/libgit2/src/xdiff/xmerge.c +12 -0
- data/vendor/libgit2/src/xdiff/xpatience.c +3 -0
- metadata +98 -34
- data/vendor/libgit2/deps/regex/CMakeLists.txt +0 -2
- data/vendor/libgit2/deps/regex/COPYING +0 -502
- data/vendor/libgit2/deps/regex/config.h +0 -7
- data/vendor/libgit2/deps/regex/regcomp.c +0 -3857
- data/vendor/libgit2/deps/regex/regex.c +0 -92
- data/vendor/libgit2/deps/regex/regex.h +0 -582
- data/vendor/libgit2/deps/regex/regex_internal.c +0 -1744
- data/vendor/libgit2/deps/regex/regex_internal.h +0 -819
- data/vendor/libgit2/deps/regex/regexec.c +0 -4369
- data/vendor/libgit2/include/git2/inttypes.h +0 -309
- data/vendor/libgit2/include/git2/sys/time.h +0 -31
- data/vendor/libgit2/libgit2.pc.in +0 -13
- data/vendor/libgit2/src/fnmatch.c +0 -248
- data/vendor/libgit2/src/fnmatch.h +0 -48
@@ -0,0 +1,301 @@
|
|
1
|
+
/*************************************************
|
2
|
+
* Perl-Compatible Regular Expressions *
|
3
|
+
*************************************************/
|
4
|
+
|
5
|
+
/* PCRE is a library of functions to support regular expressions whose syntax
|
6
|
+
and semantics are as close as possible to those of the Perl 5 language.
|
7
|
+
|
8
|
+
Written by Philip Hazel
|
9
|
+
Copyright (c) 1997-2013 University of Cambridge
|
10
|
+
|
11
|
+
-----------------------------------------------------------------------------
|
12
|
+
Redistribution and use in source and binary forms, with or without
|
13
|
+
modification, are permitted provided that the following conditions are met:
|
14
|
+
|
15
|
+
* Redistributions of source code must retain the above copyright notice,
|
16
|
+
this list of conditions and the following disclaimer.
|
17
|
+
|
18
|
+
* Redistributions in binary form must reproduce the above copyright
|
19
|
+
notice, this list of conditions and the following disclaimer in the
|
20
|
+
documentation and/or other materials provided with the distribution.
|
21
|
+
|
22
|
+
* Neither the name of the University of Cambridge nor the names of its
|
23
|
+
contributors may be used to endorse or promote products derived from
|
24
|
+
this software without specific prior written permission.
|
25
|
+
|
26
|
+
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
27
|
+
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
28
|
+
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
29
|
+
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
30
|
+
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
31
|
+
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
32
|
+
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
33
|
+
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
34
|
+
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
35
|
+
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
36
|
+
POSSIBILITY OF SUCH DAMAGE.
|
37
|
+
-----------------------------------------------------------------------------
|
38
|
+
*/
|
39
|
+
|
40
|
+
|
41
|
+
/* This module contains an internal function for validating UTF-8 character
|
42
|
+
strings. */
|
43
|
+
|
44
|
+
|
45
|
+
#ifdef HAVE_CONFIG_H
|
46
|
+
#include "config.h"
|
47
|
+
#endif
|
48
|
+
|
49
|
+
#include "pcre_internal.h"
|
50
|
+
|
51
|
+
|
52
|
+
/*************************************************
|
53
|
+
* Validate a UTF-8 string *
|
54
|
+
*************************************************/
|
55
|
+
|
56
|
+
/* This function is called (optionally) at the start of compile or match, to
|
57
|
+
check that a supposed UTF-8 string is actually valid. The early check means
|
58
|
+
that subsequent code can assume it is dealing with a valid string. The check
|
59
|
+
can be turned off for maximum performance, but the consequences of supplying an
|
60
|
+
invalid string are then undefined.
|
61
|
+
|
62
|
+
Originally, this function checked according to RFC 2279, allowing for values in
|
63
|
+
the range 0 to 0x7fffffff, up to 6 bytes long, but ensuring that they were in
|
64
|
+
the canonical format. Once somebody had pointed out RFC 3629 to me (it
|
65
|
+
obsoletes 2279), additional restrictions were applied. The values are now
|
66
|
+
limited to be between 0 and 0x0010ffff, no more than 4 bytes long, and the
|
67
|
+
subrange 0xd800 to 0xdfff is excluded. However, the format of 5-byte and 6-byte
|
68
|
+
characters is still checked.
|
69
|
+
|
70
|
+
From release 8.13 more information about the details of the error is passed
|
71
|
+
back in the returned value:
|
72
|
+
|
73
|
+
PCRE_UTF8_ERR0 No error
|
74
|
+
PCRE_UTF8_ERR1 Missing 1 byte at the end of the string
|
75
|
+
PCRE_UTF8_ERR2 Missing 2 bytes at the end of the string
|
76
|
+
PCRE_UTF8_ERR3 Missing 3 bytes at the end of the string
|
77
|
+
PCRE_UTF8_ERR4 Missing 4 bytes at the end of the string
|
78
|
+
PCRE_UTF8_ERR5 Missing 5 bytes at the end of the string
|
79
|
+
PCRE_UTF8_ERR6 2nd-byte's two top bits are not 0x80
|
80
|
+
PCRE_UTF8_ERR7 3rd-byte's two top bits are not 0x80
|
81
|
+
PCRE_UTF8_ERR8 4th-byte's two top bits are not 0x80
|
82
|
+
PCRE_UTF8_ERR9 5th-byte's two top bits are not 0x80
|
83
|
+
PCRE_UTF8_ERR10 6th-byte's two top bits are not 0x80
|
84
|
+
PCRE_UTF8_ERR11 5-byte character is not permitted by RFC 3629
|
85
|
+
PCRE_UTF8_ERR12 6-byte character is not permitted by RFC 3629
|
86
|
+
PCRE_UTF8_ERR13 4-byte character with value > 0x10ffff is not permitted
|
87
|
+
PCRE_UTF8_ERR14 3-byte character with value 0xd800-0xdfff is not permitted
|
88
|
+
PCRE_UTF8_ERR15 Overlong 2-byte sequence
|
89
|
+
PCRE_UTF8_ERR16 Overlong 3-byte sequence
|
90
|
+
PCRE_UTF8_ERR17 Overlong 4-byte sequence
|
91
|
+
PCRE_UTF8_ERR18 Overlong 5-byte sequence (won't ever occur)
|
92
|
+
PCRE_UTF8_ERR19 Overlong 6-byte sequence (won't ever occur)
|
93
|
+
PCRE_UTF8_ERR20 Isolated 0x80 byte (not within UTF-8 character)
|
94
|
+
PCRE_UTF8_ERR21 Byte with the illegal value 0xfe or 0xff
|
95
|
+
PCRE_UTF8_ERR22 Unused (was non-character)
|
96
|
+
|
97
|
+
Arguments:
|
98
|
+
string points to the string
|
99
|
+
length length of string, or -1 if the string is zero-terminated
|
100
|
+
erroroffset pointer to an error position offset variable
|
101
|
+
|
102
|
+
Returns: = 0 if the string is a valid UTF-8 string
|
103
|
+
> 0 otherwise, setting the offset of the bad character
|
104
|
+
*/
|
105
|
+
|
106
|
+
int
|
107
|
+
PRIV(valid_utf)(PCRE_PUCHAR string, int length, int *erroroffset)
|
108
|
+
{
|
109
|
+
#ifdef SUPPORT_UTF
|
110
|
+
register PCRE_PUCHAR p;
|
111
|
+
|
112
|
+
if (length < 0)
|
113
|
+
{
|
114
|
+
for (p = string; *p != 0; p++);
|
115
|
+
length = (int)(p - string);
|
116
|
+
}
|
117
|
+
|
118
|
+
for (p = string; length-- > 0; p++)
|
119
|
+
{
|
120
|
+
register pcre_uchar ab, c, d;
|
121
|
+
|
122
|
+
c = *p;
|
123
|
+
if (c < 128) continue; /* ASCII character */
|
124
|
+
|
125
|
+
if (c < 0xc0) /* Isolated 10xx xxxx byte */
|
126
|
+
{
|
127
|
+
*erroroffset = (int)(p - string);
|
128
|
+
return PCRE_UTF8_ERR20;
|
129
|
+
}
|
130
|
+
|
131
|
+
if (c >= 0xfe) /* Invalid 0xfe or 0xff bytes */
|
132
|
+
{
|
133
|
+
*erroroffset = (int)(p - string);
|
134
|
+
return PCRE_UTF8_ERR21;
|
135
|
+
}
|
136
|
+
|
137
|
+
ab = PRIV(utf8_table4)[c & 0x3f]; /* Number of additional bytes */
|
138
|
+
if (length < ab)
|
139
|
+
{
|
140
|
+
*erroroffset = (int)(p - string); /* Missing bytes */
|
141
|
+
return ab - length; /* Codes ERR1 to ERR5 */
|
142
|
+
}
|
143
|
+
length -= ab; /* Length remaining */
|
144
|
+
|
145
|
+
/* Check top bits in the second byte */
|
146
|
+
|
147
|
+
if (((d = *(++p)) & 0xc0) != 0x80)
|
148
|
+
{
|
149
|
+
*erroroffset = (int)(p - string) - 1;
|
150
|
+
return PCRE_UTF8_ERR6;
|
151
|
+
}
|
152
|
+
|
153
|
+
/* For each length, check that the remaining bytes start with the 0x80 bit
|
154
|
+
set and not the 0x40 bit. Then check for an overlong sequence, and for the
|
155
|
+
excluded range 0xd800 to 0xdfff. */
|
156
|
+
|
157
|
+
switch (ab)
|
158
|
+
{
|
159
|
+
/* 2-byte character. No further bytes to check for 0x80. Check first byte
|
160
|
+
for xx00 000x (overlong sequence). */
|
161
|
+
|
162
|
+
case 1: if ((c & 0x3e) == 0)
|
163
|
+
{
|
164
|
+
*erroroffset = (int)(p - string) - 1;
|
165
|
+
return PCRE_UTF8_ERR15;
|
166
|
+
}
|
167
|
+
break;
|
168
|
+
|
169
|
+
/* 3-byte character. Check third byte for 0x80. Then check first 2 bytes
|
170
|
+
for 1110 0000, xx0x xxxx (overlong sequence) or
|
171
|
+
1110 1101, 101x xxxx (0xd800 - 0xdfff) */
|
172
|
+
|
173
|
+
case 2:
|
174
|
+
if ((*(++p) & 0xc0) != 0x80) /* Third byte */
|
175
|
+
{
|
176
|
+
*erroroffset = (int)(p - string) - 2;
|
177
|
+
return PCRE_UTF8_ERR7;
|
178
|
+
}
|
179
|
+
if (c == 0xe0 && (d & 0x20) == 0)
|
180
|
+
{
|
181
|
+
*erroroffset = (int)(p - string) - 2;
|
182
|
+
return PCRE_UTF8_ERR16;
|
183
|
+
}
|
184
|
+
if (c == 0xed && d >= 0xa0)
|
185
|
+
{
|
186
|
+
*erroroffset = (int)(p - string) - 2;
|
187
|
+
return PCRE_UTF8_ERR14;
|
188
|
+
}
|
189
|
+
break;
|
190
|
+
|
191
|
+
/* 4-byte character. Check 3rd and 4th bytes for 0x80. Then check first 2
|
192
|
+
bytes for 1111 0000, xx00 xxxx (overlong sequence), then check for a
|
193
|
+
character greater than 0x0010ffff (f4 8f bf bf) */
|
194
|
+
|
195
|
+
case 3:
|
196
|
+
if ((*(++p) & 0xc0) != 0x80) /* Third byte */
|
197
|
+
{
|
198
|
+
*erroroffset = (int)(p - string) - 2;
|
199
|
+
return PCRE_UTF8_ERR7;
|
200
|
+
}
|
201
|
+
if ((*(++p) & 0xc0) != 0x80) /* Fourth byte */
|
202
|
+
{
|
203
|
+
*erroroffset = (int)(p - string) - 3;
|
204
|
+
return PCRE_UTF8_ERR8;
|
205
|
+
}
|
206
|
+
if (c == 0xf0 && (d & 0x30) == 0)
|
207
|
+
{
|
208
|
+
*erroroffset = (int)(p - string) - 3;
|
209
|
+
return PCRE_UTF8_ERR17;
|
210
|
+
}
|
211
|
+
if (c > 0xf4 || (c == 0xf4 && d > 0x8f))
|
212
|
+
{
|
213
|
+
*erroroffset = (int)(p - string) - 3;
|
214
|
+
return PCRE_UTF8_ERR13;
|
215
|
+
}
|
216
|
+
break;
|
217
|
+
|
218
|
+
/* 5-byte and 6-byte characters are not allowed by RFC 3629, and will be
|
219
|
+
rejected by the length test below. However, we do the appropriate tests
|
220
|
+
here so that overlong sequences get diagnosed, and also in case there is
|
221
|
+
ever an option for handling these larger code points. */
|
222
|
+
|
223
|
+
/* 5-byte character. Check 3rd, 4th, and 5th bytes for 0x80. Then check for
|
224
|
+
1111 1000, xx00 0xxx */
|
225
|
+
|
226
|
+
case 4:
|
227
|
+
if ((*(++p) & 0xc0) != 0x80) /* Third byte */
|
228
|
+
{
|
229
|
+
*erroroffset = (int)(p - string) - 2;
|
230
|
+
return PCRE_UTF8_ERR7;
|
231
|
+
}
|
232
|
+
if ((*(++p) & 0xc0) != 0x80) /* Fourth byte */
|
233
|
+
{
|
234
|
+
*erroroffset = (int)(p - string) - 3;
|
235
|
+
return PCRE_UTF8_ERR8;
|
236
|
+
}
|
237
|
+
if ((*(++p) & 0xc0) != 0x80) /* Fifth byte */
|
238
|
+
{
|
239
|
+
*erroroffset = (int)(p - string) - 4;
|
240
|
+
return PCRE_UTF8_ERR9;
|
241
|
+
}
|
242
|
+
if (c == 0xf8 && (d & 0x38) == 0)
|
243
|
+
{
|
244
|
+
*erroroffset = (int)(p - string) - 4;
|
245
|
+
return PCRE_UTF8_ERR18;
|
246
|
+
}
|
247
|
+
break;
|
248
|
+
|
249
|
+
/* 6-byte character. Check 3rd-6th bytes for 0x80. Then check for
|
250
|
+
1111 1100, xx00 00xx. */
|
251
|
+
|
252
|
+
case 5:
|
253
|
+
if ((*(++p) & 0xc0) != 0x80) /* Third byte */
|
254
|
+
{
|
255
|
+
*erroroffset = (int)(p - string) - 2;
|
256
|
+
return PCRE_UTF8_ERR7;
|
257
|
+
}
|
258
|
+
if ((*(++p) & 0xc0) != 0x80) /* Fourth byte */
|
259
|
+
{
|
260
|
+
*erroroffset = (int)(p - string) - 3;
|
261
|
+
return PCRE_UTF8_ERR8;
|
262
|
+
}
|
263
|
+
if ((*(++p) & 0xc0) != 0x80) /* Fifth byte */
|
264
|
+
{
|
265
|
+
*erroroffset = (int)(p - string) - 4;
|
266
|
+
return PCRE_UTF8_ERR9;
|
267
|
+
}
|
268
|
+
if ((*(++p) & 0xc0) != 0x80) /* Sixth byte */
|
269
|
+
{
|
270
|
+
*erroroffset = (int)(p - string) - 5;
|
271
|
+
return PCRE_UTF8_ERR10;
|
272
|
+
}
|
273
|
+
if (c == 0xfc && (d & 0x3c) == 0)
|
274
|
+
{
|
275
|
+
*erroroffset = (int)(p - string) - 5;
|
276
|
+
return PCRE_UTF8_ERR19;
|
277
|
+
}
|
278
|
+
break;
|
279
|
+
}
|
280
|
+
|
281
|
+
/* Character is valid under RFC 2279, but 5-byte and 6-byte characters are
|
282
|
+
excluded by RFC 3629. The pointer p is currently at the last byte of the
|
283
|
+
character. */
|
284
|
+
|
285
|
+
if (ab > 3)
|
286
|
+
{
|
287
|
+
*erroroffset = (int)(p - string) - ab;
|
288
|
+
return (ab == 4)? PCRE_UTF8_ERR11 : PCRE_UTF8_ERR12;
|
289
|
+
}
|
290
|
+
}
|
291
|
+
|
292
|
+
#else /* Not SUPPORT_UTF */
|
293
|
+
(void)(string); /* Keep picky compilers happy */
|
294
|
+
(void)(length);
|
295
|
+
(void)(erroroffset);
|
296
|
+
#endif
|
297
|
+
|
298
|
+
return PCRE_UTF8_ERR0; /* This indicates success */
|
299
|
+
}
|
300
|
+
|
301
|
+
/* End of pcre_valid_utf8.c */
|
@@ -0,0 +1,98 @@
|
|
1
|
+
/*************************************************
|
2
|
+
* Perl-Compatible Regular Expressions *
|
3
|
+
*************************************************/
|
4
|
+
|
5
|
+
/* PCRE is a library of functions to support regular expressions whose syntax
|
6
|
+
and semantics are as close as possible to those of the Perl 5 language.
|
7
|
+
|
8
|
+
Written by Philip Hazel
|
9
|
+
Copyright (c) 1997-2012 University of Cambridge
|
10
|
+
|
11
|
+
-----------------------------------------------------------------------------
|
12
|
+
Redistribution and use in source and binary forms, with or without
|
13
|
+
modification, are permitted provided that the following conditions are met:
|
14
|
+
|
15
|
+
* Redistributions of source code must retain the above copyright notice,
|
16
|
+
this list of conditions and the following disclaimer.
|
17
|
+
|
18
|
+
* Redistributions in binary form must reproduce the above copyright
|
19
|
+
notice, this list of conditions and the following disclaimer in the
|
20
|
+
documentation and/or other materials provided with the distribution.
|
21
|
+
|
22
|
+
* Neither the name of the University of Cambridge nor the names of its
|
23
|
+
contributors may be used to endorse or promote products derived from
|
24
|
+
this software without specific prior written permission.
|
25
|
+
|
26
|
+
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
27
|
+
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
28
|
+
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
29
|
+
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
30
|
+
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
31
|
+
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
32
|
+
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
33
|
+
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
34
|
+
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
35
|
+
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
36
|
+
POSSIBILITY OF SUCH DAMAGE.
|
37
|
+
-----------------------------------------------------------------------------
|
38
|
+
*/
|
39
|
+
|
40
|
+
|
41
|
+
/* This module contains the external function pcre_version(), which returns a
|
42
|
+
string that identifies the PCRE version that is in use. */
|
43
|
+
|
44
|
+
|
45
|
+
#ifdef HAVE_CONFIG_H
|
46
|
+
#include "config.h"
|
47
|
+
#endif
|
48
|
+
|
49
|
+
#include "pcre_internal.h"
|
50
|
+
|
51
|
+
|
52
|
+
/*************************************************
|
53
|
+
* Return version string *
|
54
|
+
*************************************************/
|
55
|
+
|
56
|
+
/* These macros are the standard way of turning unquoted text into C strings.
|
57
|
+
They allow macros like PCRE_MAJOR to be defined without quotes, which is
|
58
|
+
convenient for user programs that want to test its value. */
|
59
|
+
|
60
|
+
/* Two-step stringification. STRING quotes its argument exactly as written;
XSTRING lets the preprocessor expand any macros in its argument first and only
then hands the result to STRING for quoting. */

#define STRING(text) #text
#define XSTRING(text) STRING(text)
|
62
|
+
|
63
|
+
/* A problem turned up with PCRE_PRERELEASE, which is defined empty for
|
64
|
+
production releases. Originally, it was used naively in this code:
|
65
|
+
|
66
|
+
return XSTRING(PCRE_MAJOR)
|
67
|
+
"." XSTRING(PCRE_MINOR)
|
68
|
+
XSTRING(PCRE_PRERELEASE)
|
69
|
+
" " XSTRING(PCRE_DATE);
|
70
|
+
|
71
|
+
However, when PCRE_PRERELEASE is empty, this leads to an attempted expansion of
|
72
|
+
STRING(). The C standard states: "If (before argument substitution) any
|
73
|
+
argument consists of no preprocessing tokens, the behavior is undefined." It
|
74
|
+
turns out that gcc treats this case as a single empty string - which is what we
|
75
|
+
really want - but Visual C grumbles about the lack of an argument for the
|
76
|
+
macro. Unfortunately, both are within their rights. To cope with both ways of
|
77
|
+
handling this, I had to resort to some messy hackery that does a test at run time.
|
78
|
+
I could find no way of detecting that a macro is defined as an empty string at
|
79
|
+
pre-processor time. This hack uses a standard trick for avoiding calling
|
80
|
+
the STRING macro with an empty argument when doing the test. */
|
81
|
+
|
82
|
+
#if defined COMPILE_PCRE8
|
83
|
+
PCRE_EXP_DEFN const char * PCRE_CALL_CONVENTION
|
84
|
+
pcre_version(void)
|
85
|
+
#elif defined COMPILE_PCRE16
|
86
|
+
PCRE_EXP_DEFN const char * PCRE_CALL_CONVENTION
|
87
|
+
pcre16_version(void)
|
88
|
+
#elif defined COMPILE_PCRE32
|
89
|
+
PCRE_EXP_DEFN const char * PCRE_CALL_CONVENTION
|
90
|
+
pcre32_version(void)
|
91
|
+
#endif
|
92
|
+
{
|
93
|
+
return (XSTRING(Z PCRE_PRERELEASE)[1] == 0)?
|
94
|
+
XSTRING(PCRE_MAJOR.PCRE_MINOR PCRE_DATE) :
|
95
|
+
XSTRING(PCRE_MAJOR.PCRE_MINOR) XSTRING(PCRE_PRERELEASE PCRE_DATE);
|
96
|
+
}
|
97
|
+
|
98
|
+
/* End of pcre_version.c */
|
@@ -0,0 +1,268 @@
|
|
1
|
+
/*************************************************
|
2
|
+
* Perl-Compatible Regular Expressions *
|
3
|
+
*************************************************/
|
4
|
+
|
5
|
+
/* PCRE is a library of functions to support regular expressions whose syntax
|
6
|
+
and semantics are as close as possible to those of the Perl 5 language.
|
7
|
+
|
8
|
+
Written by Philip Hazel
|
9
|
+
Copyright (c) 1997-2013 University of Cambridge
|
10
|
+
|
11
|
+
-----------------------------------------------------------------------------
|
12
|
+
Redistribution and use in source and binary forms, with or without
|
13
|
+
modification, are permitted provided that the following conditions are met:
|
14
|
+
|
15
|
+
* Redistributions of source code must retain the above copyright notice,
|
16
|
+
this list of conditions and the following disclaimer.
|
17
|
+
|
18
|
+
* Redistributions in binary form must reproduce the above copyright
|
19
|
+
notice, this list of conditions and the following disclaimer in the
|
20
|
+
documentation and/or other materials provided with the distribution.
|
21
|
+
|
22
|
+
* Neither the name of the University of Cambridge nor the names of its
|
23
|
+
contributors may be used to endorse or promote products derived from
|
24
|
+
this software without specific prior written permission.
|
25
|
+
|
26
|
+
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
27
|
+
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
28
|
+
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
29
|
+
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
30
|
+
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
31
|
+
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
32
|
+
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
33
|
+
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
34
|
+
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
35
|
+
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
36
|
+
POSSIBILITY OF SUCH DAMAGE.
|
37
|
+
-----------------------------------------------------------------------------
|
38
|
+
*/
|
39
|
+
|
40
|
+
|
41
|
+
/* This module contains an internal function that is used to match an extended
|
42
|
+
class. It is used by both pcre_exec() and pcre_dfa_exec(). */
|
43
|
+
|
44
|
+
|
45
|
+
#ifdef HAVE_CONFIG_H
|
46
|
+
#include "config.h"
|
47
|
+
#endif
|
48
|
+
|
49
|
+
#include "pcre_internal.h"
|
50
|
+
|
51
|
+
|
52
|
+
/*************************************************
|
53
|
+
* Match character against an XCLASS *
|
54
|
+
*************************************************/
|
55
|
+
|
56
|
+
/* This function is called to match a character against an extended class that
|
57
|
+
might contain values > 255 and/or Unicode properties.
|
58
|
+
|
59
|
+
Arguments:
|
60
|
+
c the character
|
61
|
+
data points to the flag byte of the XCLASS data
|
62
|
+
|
63
|
+
Returns: TRUE if character matches, else FALSE
|
64
|
+
*/
|
65
|
+
|
66
|
+
BOOL
|
67
|
+
PRIV(xclass)(pcre_uint32 c, const pcre_uchar *data, BOOL utf)
|
68
|
+
{
|
69
|
+
pcre_uchar t;
|
70
|
+
BOOL negated = (*data & XCL_NOT) != 0;
|
71
|
+
|
72
|
+
(void)utf;
|
73
|
+
#ifdef COMPILE_PCRE8
|
74
|
+
/* In 8 bit mode, this must always be TRUE. Help the compiler to know that. */
|
75
|
+
utf = TRUE;
|
76
|
+
#endif
|
77
|
+
|
78
|
+
/* Character values < 256 are matched against a bitmap, if one is present. If
|
79
|
+
not, we still carry on, because there may be ranges that start below 256 in the
|
80
|
+
additional data. */
|
81
|
+
|
82
|
+
if (c < 256)
|
83
|
+
{
|
84
|
+
if ((*data & XCL_HASPROP) == 0)
|
85
|
+
{
|
86
|
+
if ((*data & XCL_MAP) == 0) return negated;
|
87
|
+
return (((pcre_uint8 *)(data + 1))[c/8] & (1 << (c&7))) != 0;
|
88
|
+
}
|
89
|
+
if ((*data & XCL_MAP) != 0 &&
|
90
|
+
(((pcre_uint8 *)(data + 1))[c/8] & (1 << (c&7))) != 0)
|
91
|
+
return !negated; /* char found */
|
92
|
+
}
|
93
|
+
|
94
|
+
/* First skip the bit map if present. Then match against the list of Unicode
|
95
|
+
properties or large chars or ranges that end with a large char. We won't ever
|
96
|
+
encounter XCL_PROP or XCL_NOTPROP when UCP support is not compiled. */
|
97
|
+
|
98
|
+
if ((*data++ & XCL_MAP) != 0) data += 32 / sizeof(pcre_uchar);
|
99
|
+
|
100
|
+
while ((t = *data++) != XCL_END)
|
101
|
+
{
|
102
|
+
pcre_uint32 x, y;
|
103
|
+
if (t == XCL_SINGLE)
|
104
|
+
{
|
105
|
+
#ifdef SUPPORT_UTF
|
106
|
+
if (utf)
|
107
|
+
{
|
108
|
+
GETCHARINC(x, data); /* macro generates multiple statements */
|
109
|
+
}
|
110
|
+
else
|
111
|
+
#endif
|
112
|
+
x = *data++;
|
113
|
+
if (c == x) return !negated;
|
114
|
+
}
|
115
|
+
else if (t == XCL_RANGE)
|
116
|
+
{
|
117
|
+
#ifdef SUPPORT_UTF
|
118
|
+
if (utf)
|
119
|
+
{
|
120
|
+
GETCHARINC(x, data); /* macro generates multiple statements */
|
121
|
+
GETCHARINC(y, data); /* macro generates multiple statements */
|
122
|
+
}
|
123
|
+
else
|
124
|
+
#endif
|
125
|
+
{
|
126
|
+
x = *data++;
|
127
|
+
y = *data++;
|
128
|
+
}
|
129
|
+
if (c >= x && c <= y) return !negated;
|
130
|
+
}
|
131
|
+
|
132
|
+
#ifdef SUPPORT_UCP
|
133
|
+
else /* XCL_PROP & XCL_NOTPROP */
|
134
|
+
{
|
135
|
+
const ucd_record *prop = GET_UCD(c);
|
136
|
+
BOOL isprop = t == XCL_PROP;
|
137
|
+
|
138
|
+
switch(*data)
|
139
|
+
{
|
140
|
+
case PT_ANY:
|
141
|
+
if (isprop) return !negated;
|
142
|
+
break;
|
143
|
+
|
144
|
+
case PT_LAMP:
|
145
|
+
if ((prop->chartype == ucp_Lu || prop->chartype == ucp_Ll ||
|
146
|
+
prop->chartype == ucp_Lt) == isprop) return !negated;
|
147
|
+
break;
|
148
|
+
|
149
|
+
case PT_GC:
|
150
|
+
if ((data[1] == PRIV(ucp_gentype)[prop->chartype]) == isprop)
|
151
|
+
return !negated;
|
152
|
+
break;
|
153
|
+
|
154
|
+
case PT_PC:
|
155
|
+
if ((data[1] == prop->chartype) == isprop) return !negated;
|
156
|
+
break;
|
157
|
+
|
158
|
+
case PT_SC:
|
159
|
+
if ((data[1] == prop->script) == isprop) return !negated;
|
160
|
+
break;
|
161
|
+
|
162
|
+
case PT_ALNUM:
|
163
|
+
if ((PRIV(ucp_gentype)[prop->chartype] == ucp_L ||
|
164
|
+
PRIV(ucp_gentype)[prop->chartype] == ucp_N) == isprop)
|
165
|
+
return !negated;
|
166
|
+
break;
|
167
|
+
|
168
|
+
/* Perl space used to exclude VT, but from Perl 5.18 it is included,
|
169
|
+
which means that Perl space and POSIX space are now identical. PCRE
|
170
|
+
was changed at release 8.34. */
|
171
|
+
|
172
|
+
case PT_SPACE: /* Perl space */
|
173
|
+
case PT_PXSPACE: /* POSIX space */
|
174
|
+
switch(c)
|
175
|
+
{
|
176
|
+
HSPACE_CASES:
|
177
|
+
VSPACE_CASES:
|
178
|
+
if (isprop) return !negated;
|
179
|
+
break;
|
180
|
+
|
181
|
+
default:
|
182
|
+
if ((PRIV(ucp_gentype)[prop->chartype] == ucp_Z) == isprop)
|
183
|
+
return !negated;
|
184
|
+
break;
|
185
|
+
}
|
186
|
+
break;
|
187
|
+
|
188
|
+
case PT_WORD:
|
189
|
+
if ((PRIV(ucp_gentype)[prop->chartype] == ucp_L ||
|
190
|
+
PRIV(ucp_gentype)[prop->chartype] == ucp_N || c == CHAR_UNDERSCORE)
|
191
|
+
== isprop)
|
192
|
+
return !negated;
|
193
|
+
break;
|
194
|
+
|
195
|
+
case PT_UCNC:
|
196
|
+
if (c < 0xa0)
|
197
|
+
{
|
198
|
+
if ((c == CHAR_DOLLAR_SIGN || c == CHAR_COMMERCIAL_AT ||
|
199
|
+
c == CHAR_GRAVE_ACCENT) == isprop)
|
200
|
+
return !negated;
|
201
|
+
}
|
202
|
+
else
|
203
|
+
{
|
204
|
+
if ((c < 0xd800 || c > 0xdfff) == isprop)
|
205
|
+
return !negated;
|
206
|
+
}
|
207
|
+
break;
|
208
|
+
|
209
|
+
/* The following three properties can occur only in an XCLASS, as there
|
210
|
+
is no \p or \P coding for them. */
|
211
|
+
|
212
|
+
/* Graphic character. Implement this as not Z (space or separator) and
|
213
|
+
not C (other), except for Cf (format) with a few exceptions. This seems
|
214
|
+
to be what Perl does. The exceptional characters are:
|
215
|
+
|
216
|
+
U+061C Arabic Letter Mark
|
217
|
+
U+180E Mongolian Vowel Separator
|
218
|
+
U+2066 - U+2069 Various "isolate"s
|
219
|
+
*/
|
220
|
+
|
221
|
+
case PT_PXGRAPH:
|
222
|
+
if ((PRIV(ucp_gentype)[prop->chartype] != ucp_Z &&
|
223
|
+
(PRIV(ucp_gentype)[prop->chartype] != ucp_C ||
|
224
|
+
(prop->chartype == ucp_Cf &&
|
225
|
+
c != 0x061c && c != 0x180e && (c < 0x2066 || c > 0x2069))
|
226
|
+
)) == isprop)
|
227
|
+
return !negated;
|
228
|
+
break;
|
229
|
+
|
230
|
+
/* Printable character: same as graphic, with the addition of Zs, i.e.
|
231
|
+
not Zl and not Zp, and U+180E. */
|
232
|
+
|
233
|
+
case PT_PXPRINT:
|
234
|
+
if ((prop->chartype != ucp_Zl &&
|
235
|
+
prop->chartype != ucp_Zp &&
|
236
|
+
(PRIV(ucp_gentype)[prop->chartype] != ucp_C ||
|
237
|
+
(prop->chartype == ucp_Cf &&
|
238
|
+
c != 0x061c && (c < 0x2066 || c > 0x2069))
|
239
|
+
)) == isprop)
|
240
|
+
return !negated;
|
241
|
+
break;
|
242
|
+
|
243
|
+
/* Punctuation: all Unicode punctuation, plus ASCII characters that
|
244
|
+
Unicode treats as symbols rather than punctuation, for Perl
|
245
|
+
compatibility (these are $+<=>^`|~). */
|
246
|
+
|
247
|
+
case PT_PXPUNCT:
|
248
|
+
if ((PRIV(ucp_gentype)[prop->chartype] == ucp_P ||
|
249
|
+
(c < 128 && PRIV(ucp_gentype)[prop->chartype] == ucp_S)) == isprop)
|
250
|
+
return !negated;
|
251
|
+
break;
|
252
|
+
|
253
|
+
/* This should never occur, but compilers may mutter if there is no
|
254
|
+
default. */
|
255
|
+
|
256
|
+
default:
|
257
|
+
return FALSE;
|
258
|
+
}
|
259
|
+
|
260
|
+
data += 2;
|
261
|
+
}
|
262
|
+
#endif /* SUPPORT_UCP */
|
263
|
+
}
|
264
|
+
|
265
|
+
return negated; /* char did not match */
|
266
|
+
}
|
267
|
+
|
268
|
+
/* End of pcre_xclass.c */
|