debase-ruby_core_source 0.7.9 → 0.7.10

Sign up to get free protection for your applications and to get access to all the features.
Files changed (127) hide show
  1. checksums.yaml +4 -4
  2. data/CHANGELOG.md +6 -0
  3. data/README.md +2 -0
  4. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/addr2line.h +21 -0
  5. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/constant.h +36 -0
  6. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/dln.h +50 -0
  7. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/encdb.h +169 -0
  8. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/eval_intern.h +241 -0
  9. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/gc.h +104 -0
  10. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/id.h +135 -0
  11. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/insns.inc +187 -0
  12. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/insns_info.inc +724 -0
  13. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/internal.h +395 -0
  14. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/iseq.h +140 -0
  15. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/known_errors.inc +731 -0
  16. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/method.h +141 -0
  17. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/node.h +541 -0
  18. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/node_name.inc +212 -0
  19. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/opt_sc.inc +702 -0
  20. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/optinsn.inc +83 -0
  21. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/optunifs.inc +120 -0
  22. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/parse.h +181 -0
  23. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/probes_helper.h +67 -0
  24. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/regenc.h +227 -0
  25. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/regint.h +915 -0
  26. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/regparse.h +367 -0
  27. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/revision.h +1 -0
  28. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/ruby_atomic.h +170 -0
  29. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/siphash.h +48 -0
  30. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/thread_pthread.h +56 -0
  31. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/thread_win32.h +45 -0
  32. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/timev.h +21 -0
  33. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/transcode_data.h +127 -0
  34. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/transdb.h +193 -0
  35. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/version.h +52 -0
  36. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/vm.inc +3196 -0
  37. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/vm_core.h +1020 -0
  38. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/vm_debug.h +41 -0
  39. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/vm_exec.h +173 -0
  40. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/vm_insnhelper.h +274 -0
  41. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/vm_opts.h +56 -0
  42. data/lib/debase/ruby_core_source/ruby-2.0.0-p647/vmtc.inc +101 -0
  43. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/addr2line.h +21 -0
  44. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/constant.h +36 -0
  45. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/dln.h +51 -0
  46. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/encdb.h +170 -0
  47. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/eval_intern.h +270 -0
  48. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/gc.h +101 -0
  49. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/id.h +171 -0
  50. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/insns.inc +189 -0
  51. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/insns_info.inc +731 -0
  52. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/internal.h +894 -0
  53. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/iseq.h +136 -0
  54. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/known_errors.inc +731 -0
  55. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/method.h +145 -0
  56. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/node.h +543 -0
  57. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/node_name.inc +212 -0
  58. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/opt_sc.inc +710 -0
  59. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/optinsn.inc +83 -0
  60. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/optunifs.inc +121 -0
  61. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/parse.h +183 -0
  62. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/probes_helper.h +67 -0
  63. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/regenc.h +223 -0
  64. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/regint.h +911 -0
  65. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/regparse.h +363 -0
  66. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/revision.h +1 -0
  67. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/ruby_atomic.h +170 -0
  68. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/siphash.h +48 -0
  69. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/thread_native.h +23 -0
  70. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/thread_pthread.h +56 -0
  71. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/thread_win32.h +45 -0
  72. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/timev.h +42 -0
  73. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/transcode_data.h +123 -0
  74. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/transdb.h +190 -0
  75. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/version.h +52 -0
  76. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/vm.inc +3243 -0
  77. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/vm_core.h +1057 -0
  78. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/vm_debug.h +37 -0
  79. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/vm_exec.h +182 -0
  80. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/vm_insnhelper.h +273 -0
  81. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/vm_opts.h +56 -0
  82. data/lib/debase/ruby_core_source/ruby-2.1.7-p400/vmtc.inc +102 -0
  83. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/addr2line.h +21 -0
  84. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/ccan/build_assert/build_assert.h +40 -0
  85. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/ccan/check_type/check_type.h +63 -0
  86. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/ccan/container_of/container_of.h +142 -0
  87. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/ccan/list/list.h +635 -0
  88. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/ccan/str/str.h +16 -0
  89. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/constant.h +43 -0
  90. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/dln.h +51 -0
  91. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/eval_intern.h +275 -0
  92. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/gc.h +107 -0
  93. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/id.h +210 -0
  94. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/insns.inc +107 -0
  95. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/insns_info.inc +752 -0
  96. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/internal.h +1187 -0
  97. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/iseq.h +158 -0
  98. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/known_errors.inc +746 -0
  99. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/method.h +144 -0
  100. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/node.h +544 -0
  101. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/node_name.inc +212 -0
  102. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/opt_sc.inc +734 -0
  103. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/optinsn.inc +83 -0
  104. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/optunifs.inc +124 -0
  105. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/parse.h +184 -0
  106. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/probes_helper.h +67 -0
  107. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/regenc.h +234 -0
  108. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/regint.h +972 -0
  109. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/regparse.h +363 -0
  110. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/revision.h +1 -0
  111. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/ruby_atomic.h +170 -0
  112. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/siphash.h +48 -0
  113. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/symbol.h +88 -0
  114. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/thread_pthread.h +54 -0
  115. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/thread_win32.h +36 -0
  116. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/timev.h +42 -0
  117. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/transcode_data.h +123 -0
  118. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/version.h +52 -0
  119. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/vm.inc +3353 -0
  120. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/vm_core.h +1160 -0
  121. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/vm_debug.h +37 -0
  122. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/vm_exec.h +182 -0
  123. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/vm_insnhelper.h +233 -0
  124. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/vm_opts.h +56 -0
  125. data/lib/debase/ruby_core_source/ruby-2.2.3-p173/vmtc.inc +105 -0
  126. data/lib/debase/ruby_core_source/version.rb +1 -1
  127. metadata +124 -2
@@ -0,0 +1,48 @@
1
+ #ifndef SIPHASH_H
2
+ #define SIPHASH_H 1
3
+ #include <stdlib.h>
4
+ #ifdef HAVE_STDINT_H
5
+ #include <stdint.h>
6
+ #endif
7
+ #ifdef HAVE_INTTYPES_H
8
+ #include <inttypes.h>
9
+ #endif
10
+
11
+ #ifndef HAVE_UINT64_T
12
+ typedef struct {
13
+ uint32_t u32[2];
14
+ } sip_uint64_t;
15
+ #define uint64_t sip_uint64_t
16
+ #else
17
+ typedef uint64_t sip_uint64_t;
18
+ #endif
19
+
20
+ typedef struct {
21
+ int c;
22
+ int d;
23
+ uint64_t v[4];
24
+ uint8_t buf[sizeof(uint64_t)];
25
+ uint8_t buflen;
26
+ uint8_t msglen_byte;
27
+ } sip_state;
28
+
29
+ typedef struct sip_interface_st sip_interface;
30
+
31
+ typedef struct {
32
+ sip_state state[1];
33
+ const sip_interface *methods;
34
+ } sip_hash;
35
+
36
+ sip_hash *sip_hash_new(const uint8_t key[16], int c, int d);
37
+ sip_hash *sip_hash_init(sip_hash *h, const uint8_t key[16], int c, int d);
38
+ int sip_hash_update(sip_hash *h, const uint8_t *data, size_t len);
39
+ int sip_hash_final(sip_hash *h, uint8_t **digest, size_t *len);
40
+ int sip_hash_final_integer(sip_hash *h, uint64_t *digest);
41
+ int sip_hash_digest(sip_hash *h, const uint8_t *data, size_t data_len, uint8_t **digest, size_t *digest_len);
42
+ int sip_hash_digest_integer(sip_hash *h, const uint8_t *data, size_t data_len, uint64_t *digest);
43
+ void sip_hash_free(sip_hash *h);
44
+ void sip_hash_dump(sip_hash *h);
45
+
46
+ uint64_t sip_hash24(const uint8_t key[16], const uint8_t *data, size_t len);
47
+
48
+ #endif
@@ -0,0 +1,23 @@
1
+ #ifndef RUBY_THREAD_NATIVE_H
2
+ #define RUBY_THREAD_NATIVE_H
3
+
4
+ #if defined(_WIN32)
5
+ #include "thread_win32.h"
6
+ #elif defined(HAVE_PTHREAD_H)
7
+ #include "thread_pthread.h"
8
+ #else
9
+ #error "unsupported thread type"
10
+ #endif
11
+
12
+ RUBY_SYMBOL_EXPORT_BEGIN
13
+
14
+ rb_nativethread_id_t rb_nativethread_self();
15
+
16
+ void rb_nativethread_lock_initialize(rb_nativethread_lock_t *lock);
17
+ void rb_nativethread_lock_destroy(rb_nativethread_lock_t *lock);
18
+ void rb_nativethread_lock_lock(rb_nativethread_lock_t *lock);
19
+ void rb_nativethread_lock_unlock(rb_nativethread_lock_t *lock);
20
+
21
+ RUBY_SYMBOL_EXPORT_END
22
+
23
+ #endif
@@ -0,0 +1,56 @@
1
+ /**********************************************************************
2
+
3
+ thread_pthread.h -
4
+
5
+ $Author: ko1 $
6
+
7
+ Copyright (C) 2004-2007 Koichi Sasada
8
+
9
+ **********************************************************************/
10
+
11
+ #ifndef RUBY_THREAD_PTHREAD_H
12
+ #define RUBY_THREAD_PTHREAD_H
13
+
14
+ #include <pthread.h>
15
+ #ifdef HAVE_PTHREAD_NP_H
16
+ #include <pthread_np.h>
17
+ #endif
18
+ typedef pthread_t rb_nativethread_id_t;
19
+ typedef pthread_mutex_t rb_nativethread_lock_t;
20
+
21
+ typedef struct rb_thread_cond_struct {
22
+ pthread_cond_t cond;
23
+ #ifdef HAVE_CLOCKID_T
24
+ clockid_t clockid;
25
+ #endif
26
+ } rb_nativethread_cond_t;
27
+
28
+ typedef struct native_thread_data_struct {
29
+ void *signal_thread_list;
30
+ rb_nativethread_cond_t sleep_cond;
31
+ } native_thread_data_t;
32
+
33
+ #include <semaphore.h>
34
+
35
+ #undef except
36
+ #undef try
37
+ #undef leave
38
+ #undef finally
39
+
40
+ typedef struct rb_global_vm_lock_struct {
41
+ /* fast path */
42
+ unsigned long acquired;
43
+ pthread_mutex_t lock;
44
+
45
+ /* slow path */
46
+ volatile unsigned long waiting;
47
+ rb_nativethread_cond_t cond;
48
+
49
+ /* yield */
50
+ rb_nativethread_cond_t switch_cond;
51
+ rb_nativethread_cond_t switch_wait_cond;
52
+ int need_yield;
53
+ int wait_yield;
54
+ } rb_global_vm_lock_t;
55
+
56
+ #endif /* RUBY_THREAD_PTHREAD_H */
@@ -0,0 +1,45 @@
1
+ /**********************************************************************
2
+
3
+ thread_win32.h -
4
+
5
+ $Author: ko1 $
6
+
7
+ Copyright (C) 2004-2007 Koichi Sasada
8
+
9
+ **********************************************************************/
10
+
11
+ /* interface */
12
+ #ifndef RUBY_THREAD_WIN32_H
13
+ #define RUBY_THREAD_WIN32_H
14
+
15
+ #include <windows.h>
16
+
17
+ # ifdef __CYGWIN__
18
+ # undef _WIN32
19
+ # endif
20
+
21
+ WINBASEAPI BOOL WINAPI
22
+ TryEnterCriticalSection(IN OUT LPCRITICAL_SECTION lpCriticalSection);
23
+
24
+ typedef HANDLE rb_nativethread_id_t;
25
+
26
+ typedef union rb_thread_lock_union {
27
+ HANDLE mutex;
28
+ CRITICAL_SECTION crit;
29
+ } rb_nativethread_lock_t;
30
+
31
+ typedef struct rb_thread_cond_struct {
32
+ struct cond_event_entry *next;
33
+ struct cond_event_entry *prev;
34
+ } rb_nativethread_cond_t;
35
+
36
+ typedef struct native_thread_data_struct {
37
+ HANDLE interrupt_event;
38
+ } native_thread_data_t;
39
+
40
+ typedef struct rb_global_vm_lock_struct {
41
+ HANDLE lock;
42
+ } rb_global_vm_lock_t;
43
+
44
+ #endif /* RUBY_THREAD_WIN32_H */
45
+
@@ -0,0 +1,42 @@
1
+ #ifndef RUBY_TIMEV_H
2
+ #define RUBY_TIMEV_H
3
+
4
+ struct vtm {
5
+ VALUE year; /* 2000 for example. Integer. */
6
+ int mon; /* 1..12 */
7
+ int mday; /* 1..31 */
8
+ int hour; /* 0..23 */
9
+ int min; /* 0..59 */
10
+ int sec; /* 0..60 */
11
+ VALUE subsecx; /* 0 <= subsecx < TIME_SCALE. possibly Rational. */
12
+ VALUE utc_offset; /* -3600 as -01:00 for example. possibly Rational. */
13
+ int wday; /* 0:Sunday, 1:Monday, ..., 6:Saturday */
14
+ int yday; /* 1..366 */
15
+ int isdst; /* 0:StandardTime 1:DayLightSavingTime */
16
+ const char *zone; /* "JST", "EST", "EDT", etc. */
17
+ };
18
+
19
+ #define TIME_SCALE 1000000000
20
+
21
+ #ifndef TYPEOF_TIMEVAL_TV_SEC
22
+ # define TYPEOF_TIMEVAL_TV_SEC time_t
23
+ #endif
24
+ #ifndef TYPEOF_TIMEVAL_TV_USEC
25
+ # if INT_MAX >= 1000000
26
+ # define TYPEOF_TIMEVAL_TV_USEC int
27
+ # else
28
+ # define TYPEOF_TIMEVAL_TV_USEC long
29
+ # endif
30
+ #endif
31
+
32
+ #if SIZEOF_TIME_T == SIZEOF_LONG
33
+ typedef unsigned long unsigned_time_t;
34
+ #elif SIZEOF_TIME_T == SIZEOF_INT
35
+ typedef unsigned int unsigned_time_t;
36
+ #elif SIZEOF_TIME_T == SIZEOF_LONG_LONG
37
+ typedef unsigned LONG_LONG unsigned_time_t;
38
+ #else
39
+ # error cannot find integer type which size is same as time_t.
40
+ #endif
41
+
42
+ #endif
@@ -0,0 +1,123 @@
1
+ /**********************************************************************
2
+
3
+ transcode_data.h -
4
+
5
+ $Author: nobu $
6
+ created at: Mon 10 Dec 2007 14:01:47 JST 2007
7
+
8
+ Copyright (C) 2007 Martin Duerst
9
+
10
+ **********************************************************************/
11
+
12
+ #include "ruby/ruby.h"
13
+
14
+ #ifndef RUBY_TRANSCODE_DATA_H
15
+ #define RUBY_TRANSCODE_DATA_H 1
16
+
17
+ RUBY_SYMBOL_EXPORT_BEGIN
18
+
19
+ #define WORDINDEX_SHIFT_BITS 2
20
+ #define WORDINDEX2INFO(widx) ((widx) << WORDINDEX_SHIFT_BITS)
21
+ #define INFO2WORDINDEX(info) ((info) >> WORDINDEX_SHIFT_BITS)
22
+ #define BYTE_LOOKUP_BASE(bl) ((bl)[0])
23
+ #define BYTE_LOOKUP_INFO(bl) ((bl)[1])
24
+
25
+ #define PType (unsigned int)
26
+
27
+ #define NOMAP (PType 0x01) /* direct map */
28
+ #define ONEbt (0x02) /* one byte payload */
29
+ #define TWObt (0x03) /* two bytes payload */
30
+ #define THREEbt (0x05) /* three bytes payload */
31
+ #define FOURbt (0x06) /* four bytes payload, UTF-8 only, macros start at getBT0 */
32
+ #define INVALID (PType 0x07) /* invalid byte sequence */
33
+ #define UNDEF (PType 0x09) /* legal but undefined */
34
+ #define ZERObt (PType 0x0A) /* zero bytes of payload, i.e. remove */
35
+ #define FUNii (PType 0x0B) /* function from info to info */
36
+ #define FUNsi (PType 0x0D) /* function from start to info */
37
+ #define FUNio (PType 0x0E) /* function from info to output */
38
+ #define FUNso (PType 0x0F) /* function from start to output */
39
+ #define STR1 (PType 0x11) /* string 4 <= len <= 259 bytes: 1byte length + content */
40
+ #define GB4bt (PType 0x12) /* GB18030 four bytes payload */
41
+ #define FUNsio (PType 0x13) /* function from start and info to output */
42
+
43
+ #define STR1_LENGTH(byte_addr) (unsigned int)(*(byte_addr) + 4)
44
+ #define STR1_BYTEINDEX(w) ((w) >> 6)
45
+ #define makeSTR1(bi) (((bi) << 6) | STR1)
46
+ #define makeSTR1LEN(len) ((len)-4)
47
+
48
+ #define o1(b1) (PType((((unsigned char)(b1))<<8)|ONEbt))
49
+ #define o2(b1,b2) (PType((((unsigned char)(b1))<<8)|(((unsigned char)(b2))<<16)|TWObt))
50
+ #define o3(b1,b2,b3) (PType(((((unsigned char)(b1))<<8)|(((unsigned char)(b2))<<16)|(((unsigned int)(unsigned char)(b3))<<24)|THREEbt)&0xffffffffU))
51
+ #define o4(b0,b1,b2,b3) (PType(((((unsigned char)(b1))<<8)|(((unsigned char)(b2))<<16)|(((unsigned char)(b3))<<24)|((((unsigned char)(b0))&0x07)<<5)|FOURbt)&0xffffffffU))
52
+ #define g4(b0,b1,b2,b3) (PType(((((unsigned char)(b0))<<8)|(((unsigned char)(b2))<<16)|((((unsigned char)(b1))&0x0f)<<24)|((((unsigned int)(unsigned char)(b3))&0x0f)<<28)|GB4bt)&0xffffffffU))
53
+ #define funsio(diff) (PType((((unsigned int)(diff))<<8)|FUNsio))
54
+
55
+ #define getBT1(a) ((unsigned char)((a)>> 8))
56
+ #define getBT2(a) ((unsigned char)((a)>>16))
57
+ #define getBT3(a) ((unsigned char)((a)>>24))
58
+ #define getBT0(a) (((unsigned char)((a)>> 5)&0x07)|0xF0) /* for UTF-8 only!!! */
59
+
60
+ #define getGB4bt0(a) ((unsigned char)((a)>> 8))
61
+ #define getGB4bt1(a) (((unsigned char)((a)>>24)&0x0F)|0x30)
62
+ #define getGB4bt2(a) ((unsigned char)((a)>>16))
63
+ #define getGB4bt3(a) (((unsigned char)((a)>>28)&0x0F)|0x30)
64
+
65
+ #define o2FUNii(b1,b2) (PType((((unsigned char)(b1))<<8)|(((unsigned char)(b2))<<16)|FUNii))
66
+
67
+ /* do we need these??? maybe not, can be done with simple tables */
68
+ #define ONETRAIL /* legal but undefined if one more trailing UTF-8 */
69
+ #define TWOTRAIL /* legal but undefined if two more trailing UTF-8 */
70
+ #define THREETRAIL /* legal but undefined if three more trailing UTF-8 */
71
+
72
+ typedef enum {
73
+ asciicompat_converter, /* ASCII-compatible -> ASCII-compatible */
74
+ asciicompat_decoder, /* ASCII-incompatible -> ASCII-compatible */
75
+ asciicompat_encoder /* ASCII-compatible -> ASCII-incompatible */
76
+ /* ASCII-incompatible -> ASCII-incompatible is intentionally omitted. */
77
+ } rb_transcoder_asciicompat_type_t;
78
+
79
+ typedef struct rb_transcoder rb_transcoder;
80
+
81
+ /* static structure, one per supported encoding pair */
82
+ struct rb_transcoder {
83
+ const char *src_encoding;
84
+ const char *dst_encoding;
85
+ unsigned int conv_tree_start;
86
+ const unsigned char *byte_array;
87
+ unsigned int byte_array_length;
88
+ const unsigned int *word_array;
89
+ unsigned int word_array_length;
90
+ int word_size;
91
+ int input_unit_length;
92
+ int max_input;
93
+ int max_output;
94
+ rb_transcoder_asciicompat_type_t asciicompat_type;
95
+ size_t state_size;
96
+ int (*state_init_func)(void*); /* ret==0:success ret!=0:failure(errno) */
97
+ int (*state_fini_func)(void*); /* ret==0:success ret!=0:failure(errno) */
98
+ VALUE (*func_ii)(void*, VALUE); /* info -> info */
99
+ VALUE (*func_si)(void*, const unsigned char*, size_t); /* start -> info */
100
+ ssize_t (*func_io)(void*, VALUE, const unsigned char*, size_t); /* info -> output */
101
+ ssize_t (*func_so)(void*, const unsigned char*, size_t, unsigned char*, size_t); /* start -> output */
102
+ ssize_t (*finish_func)(void*, unsigned char*, size_t); /* -> output */
103
+ ssize_t (*resetsize_func)(void*); /* -> len */
104
+ ssize_t (*resetstate_func)(void*, unsigned char*, size_t); /* -> output */
105
+ ssize_t (*func_sio)(void*, const unsigned char*, size_t, VALUE, unsigned char*, size_t); /* start -> output */
106
+ };
107
+
108
+ void rb_declare_transcoder(const char *enc1, const char *enc2, const char *lib);
109
+ void rb_register_transcoder(const rb_transcoder *);
110
+
111
+ /*
112
+ * To get rid of collision of initializer symbols in statically-linked encodings
113
+ * and transcoders
114
+ */
115
+ #if defined(EXTSTATIC) && EXTSTATIC
116
+ # define TRANS_INIT(name) void Init_trans_ ## name(void)
117
+ #else
118
+ # define TRANS_INIT(name) void Init_ ## name(void)
119
+ #endif
120
+
121
+ RUBY_SYMBOL_EXPORT_END
122
+
123
+ #endif /* RUBY_TRANSCODE_DATA_H */
@@ -0,0 +1,190 @@
1
+ rb_declare_transcoder("Big5", "UTF-8", "big5");
2
+ rb_declare_transcoder("UTF-8", "Big5", "big5");
3
+ rb_declare_transcoder("CP950", "UTF-8", "big5");
4
+ rb_declare_transcoder("UTF-8", "CP950", "big5");
5
+ rb_declare_transcoder("Big5-HKSCS", "UTF-8", "big5");
6
+ rb_declare_transcoder("UTF-8", "Big5-HKSCS", "big5");
7
+ rb_declare_transcoder("CP951", "UTF-8", "big5");
8
+ rb_declare_transcoder("UTF-8", "CP951", "big5");
9
+ rb_declare_transcoder("Big5-UAO", "UTF-8", "big5");
10
+ rb_declare_transcoder("UTF-8", "Big5-UAO", "big5");
11
+ rb_declare_transcoder("GB2312", "UTF-8", "chinese");
12
+ rb_declare_transcoder("GB12345", "UTF-8", "chinese");
13
+ rb_declare_transcoder("UTF-8", "GB2312", "chinese");
14
+ rb_declare_transcoder("UTF-8", "GB12345", "chinese");
15
+ rb_declare_transcoder("UTF8-DoCoMo", "UTF8-KDDI", "emoji");
16
+ rb_declare_transcoder("UTF8-DoCoMo", "UTF8-SoftBank", "emoji");
17
+ rb_declare_transcoder("UTF8-DoCoMo", "UTF-8", "emoji");
18
+ rb_declare_transcoder("UTF8-KDDI", "UTF8-DoCoMo", "emoji");
19
+ rb_declare_transcoder("UTF8-KDDI", "UTF8-SoftBank", "emoji");
20
+ rb_declare_transcoder("UTF8-KDDI", "UTF-8", "emoji");
21
+ rb_declare_transcoder("UTF8-SoftBank", "UTF8-DoCoMo", "emoji");
22
+ rb_declare_transcoder("UTF8-SoftBank", "UTF8-KDDI", "emoji");
23
+ rb_declare_transcoder("UTF8-SoftBank", "UTF-8", "emoji");
24
+ rb_declare_transcoder("UTF-8", "UTF8-DoCoMo", "emoji");
25
+ rb_declare_transcoder("UTF-8", "UTF8-KDDI", "emoji");
26
+ rb_declare_transcoder("UTF-8", "UTF8-SoftBank", "emoji");
27
+ rb_declare_transcoder("stateless-ISO-2022-JP-KDDI", "UTF8-KDDI", "emoji_iso2022_kddi");
28
+ rb_declare_transcoder("UTF8-KDDI", "stateless-ISO-2022-JP-KDDI", "emoji_iso2022_kddi");
29
+ rb_declare_transcoder("ISO-2022-JP-KDDI", "stateless-ISO-2022-JP-KDDI", "emoji_iso2022_kddi");
30
+ rb_declare_transcoder("stateless-ISO-2022-JP-KDDI", "ISO-2022-JP-KDDI", "emoji_iso2022_kddi");
31
+ rb_declare_transcoder("SJIS-DOCOMO", "UTF8-DOCOMO", "emoji_sjis_docomo");
32
+ rb_declare_transcoder("UTF8-DOCOMO", "SJIS-DOCOMO", "emoji_sjis_docomo");
33
+ rb_declare_transcoder("SJIS-KDDI", "UTF8-KDDI", "emoji_sjis_kddi");
34
+ rb_declare_transcoder("UTF8-KDDI", "SJIS-KDDI", "emoji_sjis_kddi");
35
+ rb_declare_transcoder("SJIS-SoftBank", "UTF8-SoftBank", "emoji_sjis_softbank");
36
+ rb_declare_transcoder("UTF8-SoftBank", "SJIS-SoftBank", "emoji_sjis_softbank");
37
+ rb_declare_transcoder("", "amp_escape", "escape");
38
+ rb_declare_transcoder("", "xml_text_escape", "escape");
39
+ rb_declare_transcoder("", "xml_attr_content_escape", "escape");
40
+ rb_declare_transcoder("", "xml_attr_quote", "escape");
41
+ rb_declare_transcoder("GB18030", "UTF-8", "gb18030");
42
+ rb_declare_transcoder("UTF-8", "GB18030", "gb18030");
43
+ rb_declare_transcoder("GBK", "UTF-8", "gbk");
44
+ rb_declare_transcoder("UTF-8", "GBK", "gbk");
45
+ rb_declare_transcoder("ISO-2022-JP", "stateless-ISO-2022-JP", "iso2022");
46
+ rb_declare_transcoder("stateless-ISO-2022-JP", "ISO-2022-JP", "iso2022");
47
+ rb_declare_transcoder("stateless-ISO-2022-JP", "EUC-JP", "iso2022");
48
+ rb_declare_transcoder("EUC-JP", "stateless-ISO-2022-JP", "iso2022");
49
+ rb_declare_transcoder("CP50220", "cp51932", "iso2022");
50
+ rb_declare_transcoder("CP50221", "cp51932", "iso2022");
51
+ rb_declare_transcoder("CP51932", "CP50221", "iso2022");
52
+ rb_declare_transcoder("CP51932", "CP50220", "iso2022");
53
+ rb_declare_transcoder("EUC-JP", "Shift_JIS", "japanese");
54
+ rb_declare_transcoder("Shift_JIS", "EUC-JP", "japanese");
55
+ rb_declare_transcoder("EUC-JP", "UTF-8", "japanese_euc");
56
+ rb_declare_transcoder("eucJP-ms", "UTF-8", "japanese_euc");
57
+ rb_declare_transcoder("CP51932", "UTF-8", "japanese_euc");
58
+ rb_declare_transcoder("EUC-JIS-2004", "UTF-8", "japanese_euc");
59
+ rb_declare_transcoder("UTF-8", "EUC-JP", "japanese_euc");
60
+ rb_declare_transcoder("UTF-8", "eucJP-ms", "japanese_euc");
61
+ rb_declare_transcoder("UTF-8", "CP51932", "japanese_euc");
62
+ rb_declare_transcoder("UTF-8", "EUC-JIS-2004", "japanese_euc");
63
+ rb_declare_transcoder("Shift_JIS", "UTF-8", "japanese_sjis");
64
+ rb_declare_transcoder("Windows-31J", "UTF-8", "japanese_sjis");
65
+ rb_declare_transcoder("UTF-8", "Shift_JIS", "japanese_sjis");
66
+ rb_declare_transcoder("UTF-8", "Windows-31J", "japanese_sjis");
67
+ rb_declare_transcoder("UTF-8", "EUC-KR", "korean");
68
+ rb_declare_transcoder("EUC-KR", "UTF-8", "korean");
69
+ rb_declare_transcoder("UTF-8", "CP949", "korean");
70
+ rb_declare_transcoder("CP949", "UTF-8", "korean");
71
+ rb_declare_transcoder("US-ASCII", "UTF-8", "single_byte");
72
+ rb_declare_transcoder("UTF-8", "US-ASCII", "single_byte");
73
+ rb_declare_transcoder("ASCII-8BIT", "UTF-8", "single_byte");
74
+ rb_declare_transcoder("UTF-8", "ASCII-8BIT", "single_byte");
75
+ rb_declare_transcoder("ISO-8859-1", "UTF-8", "single_byte");
76
+ rb_declare_transcoder("UTF-8", "ISO-8859-1", "single_byte");
77
+ rb_declare_transcoder("ISO-8859-2", "UTF-8", "single_byte");
78
+ rb_declare_transcoder("UTF-8", "ISO-8859-2", "single_byte");
79
+ rb_declare_transcoder("ISO-8859-3", "UTF-8", "single_byte");
80
+ rb_declare_transcoder("UTF-8", "ISO-8859-3", "single_byte");
81
+ rb_declare_transcoder("ISO-8859-4", "UTF-8", "single_byte");
82
+ rb_declare_transcoder("UTF-8", "ISO-8859-4", "single_byte");
83
+ rb_declare_transcoder("ISO-8859-5", "UTF-8", "single_byte");
84
+ rb_declare_transcoder("UTF-8", "ISO-8859-5", "single_byte");
85
+ rb_declare_transcoder("ISO-8859-6", "UTF-8", "single_byte");
86
+ rb_declare_transcoder("UTF-8", "ISO-8859-6", "single_byte");
87
+ rb_declare_transcoder("ISO-8859-7", "UTF-8", "single_byte");
88
+ rb_declare_transcoder("UTF-8", "ISO-8859-7", "single_byte");
89
+ rb_declare_transcoder("ISO-8859-8", "UTF-8", "single_byte");
90
+ rb_declare_transcoder("UTF-8", "ISO-8859-8", "single_byte");
91
+ rb_declare_transcoder("ISO-8859-9", "UTF-8", "single_byte");
92
+ rb_declare_transcoder("UTF-8", "ISO-8859-9", "single_byte");
93
+ rb_declare_transcoder("ISO-8859-10", "UTF-8", "single_byte");
94
+ rb_declare_transcoder("UTF-8", "ISO-8859-10", "single_byte");
95
+ rb_declare_transcoder("ISO-8859-11", "UTF-8", "single_byte");
96
+ rb_declare_transcoder("UTF-8", "ISO-8859-11", "single_byte");
97
+ rb_declare_transcoder("ISO-8859-13", "UTF-8", "single_byte");
98
+ rb_declare_transcoder("UTF-8", "ISO-8859-13", "single_byte");
99
+ rb_declare_transcoder("ISO-8859-14", "UTF-8", "single_byte");
100
+ rb_declare_transcoder("UTF-8", "ISO-8859-14", "single_byte");
101
+ rb_declare_transcoder("ISO-8859-15", "UTF-8", "single_byte");
102
+ rb_declare_transcoder("UTF-8", "ISO-8859-15", "single_byte");
103
+ rb_declare_transcoder("ISO-8859-16", "UTF-8", "single_byte");
104
+ rb_declare_transcoder("UTF-8", "ISO-8859-16", "single_byte");
105
+ rb_declare_transcoder("WINDOWS-874", "UTF-8", "single_byte");
106
+ rb_declare_transcoder("UTF-8", "WINDOWS-874", "single_byte");
107
+ rb_declare_transcoder("WINDOWS-1250", "UTF-8", "single_byte");
108
+ rb_declare_transcoder("UTF-8", "WINDOWS-1250", "single_byte");
109
+ rb_declare_transcoder("WINDOWS-1251", "UTF-8", "single_byte");
110
+ rb_declare_transcoder("UTF-8", "WINDOWS-1251", "single_byte");
111
+ rb_declare_transcoder("WINDOWS-1252", "UTF-8", "single_byte");
112
+ rb_declare_transcoder("UTF-8", "WINDOWS-1252", "single_byte");
113
+ rb_declare_transcoder("WINDOWS-1253", "UTF-8", "single_byte");
114
+ rb_declare_transcoder("UTF-8", "WINDOWS-1253", "single_byte");
115
+ rb_declare_transcoder("WINDOWS-1254", "UTF-8", "single_byte");
116
+ rb_declare_transcoder("UTF-8", "WINDOWS-1254", "single_byte");
117
+ rb_declare_transcoder("WINDOWS-1255", "UTF-8", "single_byte");
118
+ rb_declare_transcoder("UTF-8", "WINDOWS-1255", "single_byte");
119
+ rb_declare_transcoder("WINDOWS-1256", "UTF-8", "single_byte");
120
+ rb_declare_transcoder("UTF-8", "WINDOWS-1256", "single_byte");
121
+ rb_declare_transcoder("WINDOWS-1257", "UTF-8", "single_byte");
122
+ rb_declare_transcoder("UTF-8", "WINDOWS-1257", "single_byte");
123
+ rb_declare_transcoder("IBM437", "UTF-8", "single_byte");
124
+ rb_declare_transcoder("UTF-8", "IBM437", "single_byte");
125
+ rb_declare_transcoder("IBM775", "UTF-8", "single_byte");
126
+ rb_declare_transcoder("UTF-8", "IBM775", "single_byte");
127
+ rb_declare_transcoder("IBM737", "UTF-8", "single_byte");
128
+ rb_declare_transcoder("UTF-8", "IBM737", "single_byte");
129
+ rb_declare_transcoder("IBM852", "UTF-8", "single_byte");
130
+ rb_declare_transcoder("UTF-8", "IBM852", "single_byte");
131
+ rb_declare_transcoder("IBM855", "UTF-8", "single_byte");
132
+ rb_declare_transcoder("UTF-8", "IBM855", "single_byte");
133
+ rb_declare_transcoder("IBM857", "UTF-8", "single_byte");
134
+ rb_declare_transcoder("UTF-8", "IBM857", "single_byte");
135
+ rb_declare_transcoder("IBM860", "UTF-8", "single_byte");
136
+ rb_declare_transcoder("UTF-8", "IBM860", "single_byte");
137
+ rb_declare_transcoder("IBM861", "UTF-8", "single_byte");
138
+ rb_declare_transcoder("UTF-8", "IBM861", "single_byte");
139
+ rb_declare_transcoder("IBM862", "UTF-8", "single_byte");
140
+ rb_declare_transcoder("UTF-8", "IBM862", "single_byte");
141
+ rb_declare_transcoder("IBM863", "UTF-8", "single_byte");
142
+ rb_declare_transcoder("UTF-8", "IBM863", "single_byte");
143
+ rb_declare_transcoder("IBM865", "UTF-8", "single_byte");
144
+ rb_declare_transcoder("UTF-8", "IBM865", "single_byte");
145
+ rb_declare_transcoder("IBM866", "UTF-8", "single_byte");
146
+ rb_declare_transcoder("UTF-8", "IBM866", "single_byte");
147
+ rb_declare_transcoder("IBM869", "UTF-8", "single_byte");
148
+ rb_declare_transcoder("UTF-8", "IBM869", "single_byte");
149
+ rb_declare_transcoder("MACCROATIAN", "UTF-8", "single_byte");
150
+ rb_declare_transcoder("UTF-8", "MACCROATIAN", "single_byte");
151
+ rb_declare_transcoder("MACCYRILLIC", "UTF-8", "single_byte");
152
+ rb_declare_transcoder("UTF-8", "MACCYRILLIC", "single_byte");
153
+ rb_declare_transcoder("MACGREEK", "UTF-8", "single_byte");
154
+ rb_declare_transcoder("UTF-8", "MACGREEK", "single_byte");
155
+ rb_declare_transcoder("MACICELAND", "UTF-8", "single_byte");
156
+ rb_declare_transcoder("UTF-8", "MACICELAND", "single_byte");
157
+ rb_declare_transcoder("MACROMAN", "UTF-8", "single_byte");
158
+ rb_declare_transcoder("UTF-8", "MACROMAN", "single_byte");
159
+ rb_declare_transcoder("MACROMANIA", "UTF-8", "single_byte");
160
+ rb_declare_transcoder("UTF-8", "MACROMANIA", "single_byte");
161
+ rb_declare_transcoder("MACTURKISH", "UTF-8", "single_byte");
162
+ rb_declare_transcoder("UTF-8", "MACTURKISH", "single_byte");
163
+ rb_declare_transcoder("MACUKRAINE", "UTF-8", "single_byte");
164
+ rb_declare_transcoder("UTF-8", "MACUKRAINE", "single_byte");
165
+ rb_declare_transcoder("KOI8-U", "UTF-8", "single_byte");
166
+ rb_declare_transcoder("UTF-8", "KOI8-U", "single_byte");
167
+ rb_declare_transcoder("KOI8-R", "UTF-8", "single_byte");
168
+ rb_declare_transcoder("UTF-8", "KOI8-R", "single_byte");
169
+ rb_declare_transcoder("TIS-620", "UTF-8", "single_byte");
170
+ rb_declare_transcoder("UTF-8", "TIS-620", "single_byte");
171
+ rb_declare_transcoder("CP850", "UTF-8", "single_byte");
172
+ rb_declare_transcoder("UTF-8", "CP850", "single_byte");
173
+ rb_declare_transcoder("CP852", "UTF-8", "single_byte");
174
+ rb_declare_transcoder("UTF-8", "CP852", "single_byte");
175
+ rb_declare_transcoder("CP855", "UTF-8", "single_byte");
176
+ rb_declare_transcoder("UTF-8", "CP855", "single_byte");
177
+ rb_declare_transcoder("UTF-8", "UTF8-MAC", "utf8_mac");
178
+ rb_declare_transcoder("UTF8-MAC", "UTF-8", "utf8_mac");
179
+ rb_declare_transcoder("UTF-16BE", "UTF-8", "utf_16_32");
180
+ rb_declare_transcoder("UTF-8", "UTF-16BE", "utf_16_32");
181
+ rb_declare_transcoder("UTF-16LE", "UTF-8", "utf_16_32");
182
+ rb_declare_transcoder("UTF-8", "UTF-16LE", "utf_16_32");
183
+ rb_declare_transcoder("UTF-32BE", "UTF-8", "utf_16_32");
184
+ rb_declare_transcoder("UTF-8", "UTF-32BE", "utf_16_32");
185
+ rb_declare_transcoder("UTF-32LE", "UTF-8", "utf_16_32");
186
+ rb_declare_transcoder("UTF-8", "UTF-32LE", "utf_16_32");
187
+ rb_declare_transcoder("UTF-16", "UTF-8", "utf_16_32");
188
+ rb_declare_transcoder("UTF-32", "UTF-8", "utf_16_32");
189
+ rb_declare_transcoder("UTF-8", "UTF-16", "utf_16_32");
190
+ rb_declare_transcoder("UTF-8", "UTF-32", "utf_16_32");