jruby-prism-parser 0.23.0.pre.SNAPSHOT-java
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/CHANGELOG.md +401 -0
- data/CODE_OF_CONDUCT.md +76 -0
- data/CONTRIBUTING.md +62 -0
- data/LICENSE.md +7 -0
- data/Makefile +101 -0
- data/README.md +98 -0
- data/config.yml +2902 -0
- data/docs/build_system.md +91 -0
- data/docs/configuration.md +64 -0
- data/docs/cruby_compilation.md +27 -0
- data/docs/design.md +53 -0
- data/docs/encoding.md +121 -0
- data/docs/fuzzing.md +88 -0
- data/docs/heredocs.md +36 -0
- data/docs/javascript.md +118 -0
- data/docs/local_variable_depth.md +229 -0
- data/docs/mapping.md +117 -0
- data/docs/parser_translation.md +34 -0
- data/docs/parsing_rules.md +19 -0
- data/docs/releasing.md +98 -0
- data/docs/ripper.md +36 -0
- data/docs/ruby_api.md +43 -0
- data/docs/ruby_parser_translation.md +19 -0
- data/docs/serialization.md +209 -0
- data/docs/testing.md +55 -0
- data/ext/prism/api_node.c +5098 -0
- data/ext/prism/api_pack.c +267 -0
- data/ext/prism/extconf.rb +110 -0
- data/ext/prism/extension.c +1155 -0
- data/ext/prism/extension.h +18 -0
- data/include/prism/ast.h +5807 -0
- data/include/prism/defines.h +102 -0
- data/include/prism/diagnostic.h +339 -0
- data/include/prism/encoding.h +265 -0
- data/include/prism/node.h +57 -0
- data/include/prism/options.h +230 -0
- data/include/prism/pack.h +152 -0
- data/include/prism/parser.h +732 -0
- data/include/prism/prettyprint.h +26 -0
- data/include/prism/regexp.h +33 -0
- data/include/prism/util/pm_buffer.h +155 -0
- data/include/prism/util/pm_char.h +205 -0
- data/include/prism/util/pm_constant_pool.h +209 -0
- data/include/prism/util/pm_list.h +97 -0
- data/include/prism/util/pm_memchr.h +29 -0
- data/include/prism/util/pm_newline_list.h +93 -0
- data/include/prism/util/pm_state_stack.h +42 -0
- data/include/prism/util/pm_string.h +150 -0
- data/include/prism/util/pm_string_list.h +44 -0
- data/include/prism/util/pm_strncasecmp.h +32 -0
- data/include/prism/util/pm_strpbrk.h +46 -0
- data/include/prism/version.h +29 -0
- data/include/prism.h +289 -0
- data/jruby-prism.jar +0 -0
- data/lib/prism/compiler.rb +486 -0
- data/lib/prism/debug.rb +206 -0
- data/lib/prism/desugar_compiler.rb +207 -0
- data/lib/prism/dispatcher.rb +2150 -0
- data/lib/prism/dot_visitor.rb +4634 -0
- data/lib/prism/dsl.rb +785 -0
- data/lib/prism/ffi.rb +346 -0
- data/lib/prism/lex_compat.rb +908 -0
- data/lib/prism/mutation_compiler.rb +753 -0
- data/lib/prism/node.rb +17864 -0
- data/lib/prism/node_ext.rb +212 -0
- data/lib/prism/node_inspector.rb +68 -0
- data/lib/prism/pack.rb +224 -0
- data/lib/prism/parse_result/comments.rb +177 -0
- data/lib/prism/parse_result/newlines.rb +64 -0
- data/lib/prism/parse_result.rb +498 -0
- data/lib/prism/pattern.rb +250 -0
- data/lib/prism/serialize.rb +1354 -0
- data/lib/prism/translation/parser/compiler.rb +1838 -0
- data/lib/prism/translation/parser/lexer.rb +335 -0
- data/lib/prism/translation/parser/rubocop.rb +37 -0
- data/lib/prism/translation/parser.rb +178 -0
- data/lib/prism/translation/ripper.rb +577 -0
- data/lib/prism/translation/ruby_parser.rb +1521 -0
- data/lib/prism/translation.rb +11 -0
- data/lib/prism/version.rb +3 -0
- data/lib/prism/visitor.rb +495 -0
- data/lib/prism.rb +99 -0
- data/prism.gemspec +135 -0
- data/rbi/prism.rbi +7767 -0
- data/rbi/prism_static.rbi +207 -0
- data/sig/prism.rbs +4773 -0
- data/sig/prism_static.rbs +201 -0
- data/src/diagnostic.c +400 -0
- data/src/encoding.c +5132 -0
- data/src/node.c +2786 -0
- data/src/options.c +213 -0
- data/src/pack.c +493 -0
- data/src/prettyprint.c +8881 -0
- data/src/prism.c +18406 -0
- data/src/regexp.c +638 -0
- data/src/serialize.c +1554 -0
- data/src/token_type.c +700 -0
- data/src/util/pm_buffer.c +190 -0
- data/src/util/pm_char.c +318 -0
- data/src/util/pm_constant_pool.c +322 -0
- data/src/util/pm_list.c +49 -0
- data/src/util/pm_memchr.c +35 -0
- data/src/util/pm_newline_list.c +84 -0
- data/src/util/pm_state_stack.c +25 -0
- data/src/util/pm_string.c +203 -0
- data/src/util/pm_string_list.c +28 -0
- data/src/util/pm_strncasecmp.c +24 -0
- data/src/util/pm_strpbrk.c +180 -0
- metadata +156 -0
@@ -0,0 +1,97 @@
|
|
1
|
+
/**
|
2
|
+
* @file pm_list.h
|
3
|
+
*
|
4
|
+
* An abstract linked list.
|
5
|
+
*/
|
6
|
+
#ifndef PRISM_LIST_H
|
7
|
+
#define PRISM_LIST_H
|
8
|
+
|
9
|
+
#include "prism/defines.h"
|
10
|
+
|
11
|
+
#include <stdbool.h>
|
12
|
+
#include <stddef.h>
|
13
|
+
#include <stdint.h>
|
14
|
+
#include <stdlib.h>
|
15
|
+
|
16
|
+
/**
 * This struct represents a node in an abstract linked list that provides
 * common functionality. It is meant to be used any time a linked list is
 * necessary to store data.
 *
 * The linked list itself operates off a set of pointers. Because the nodes are
 * reached through pointers rather than stored contiguously, they can be of any
 * size. We use this fact to allow the consumer of this linked list to extend
 * the node struct to include any data they want. This is done by using the
 * pm_list_node_t as the first member of the struct.
 *
 * For example, if we want to store a list of integers, we can do the following:
 *
 * ```c
 * typedef struct {
 *     pm_list_node_t node;
 *     int value;
 * } pm_int_node_t;
 *
 * pm_list_t list = { 0 };
 *
 * // calloc (rather than malloc) so that node->node.next starts out as NULL
 * // instead of holding an indeterminate value.
 * pm_int_node_t *node = calloc(1, sizeof(*node));
 * if (node == NULL) abort();
 * node->value = 5;
 *
 * pm_list_append(&list, &node->node);
 * ```
 *
 * The pm_list_t struct is used to represent the overall linked list. It
 * contains a pointer to the head and tail of the list. This allows for easy
 * iteration and appending of new nodes.
 */
typedef struct pm_list_node {
    /** A pointer to the next node in the list. */
    struct pm_list_node *next;
} pm_list_node_t;
|
50
|
+
|
51
|
+
/**
|
52
|
+
* This represents the overall linked list. It keeps a pointer to the head and
|
53
|
+
* tail so that iteration is easy and pushing new nodes is easy.
|
54
|
+
*/
|
55
|
+
typedef struct {
|
56
|
+
/** The size of the list. */
|
57
|
+
size_t size;
|
58
|
+
|
59
|
+
/** A pointer to the head of the list. */
|
60
|
+
pm_list_node_t *head;
|
61
|
+
|
62
|
+
/** A pointer to the tail of the list. */
|
63
|
+
pm_list_node_t *tail;
|
64
|
+
} pm_list_t;
|
65
|
+
|
66
|
+
/**
|
67
|
+
* Returns true if the given list is empty.
|
68
|
+
*
|
69
|
+
* @param list The list to check.
|
70
|
+
* @return True if the given list is empty, otherwise false.
|
71
|
+
*/
|
72
|
+
PRISM_EXPORTED_FUNCTION bool pm_list_empty_p(pm_list_t *list);
|
73
|
+
|
74
|
+
/**
|
75
|
+
* Returns the size of the list.
|
76
|
+
*
|
77
|
+
* @param list The list to check.
|
78
|
+
* @return The size of the list.
|
79
|
+
*/
|
80
|
+
PRISM_EXPORTED_FUNCTION size_t pm_list_size(pm_list_t *list);
|
81
|
+
|
82
|
+
/**
|
83
|
+
* Append a node to the given list.
|
84
|
+
*
|
85
|
+
* @param list The list to append to.
|
86
|
+
* @param node The node to append.
|
87
|
+
*/
|
88
|
+
void pm_list_append(pm_list_t *list, pm_list_node_t *node);
|
89
|
+
|
90
|
+
/**
|
91
|
+
* Deallocate the internal state of the given list.
|
92
|
+
*
|
93
|
+
* @param list The list to free.
|
94
|
+
*/
|
95
|
+
PRISM_EXPORTED_FUNCTION void pm_list_free(pm_list_t *list);
|
96
|
+
|
97
|
+
#endif
|
@@ -0,0 +1,29 @@
|
|
1
|
+
/**
|
2
|
+
* @file pm_memchr.h
|
3
|
+
*
|
4
|
+
* A custom memchr implementation.
|
5
|
+
*/
|
6
|
+
#ifndef PRISM_MEMCHR_H
|
7
|
+
#define PRISM_MEMCHR_H
|
8
|
+
|
9
|
+
#include "prism/defines.h"
|
10
|
+
#include "prism/encoding.h"
|
11
|
+
|
12
|
+
#include <stddef.h>
|
13
|
+
|
14
|
+
/**
|
15
|
+
* We need to roll our own memchr to handle cases where the encoding changes and
|
16
|
+
* we need to search for a character in a buffer that could be the trailing byte
|
17
|
+
* of a multibyte character.
|
18
|
+
*
|
19
|
+
* @param source The source string.
|
20
|
+
* @param character The character to search for.
|
21
|
+
* @param number The maximum number of bytes to search.
|
22
|
+
* @param encoding_changed Whether the encoding changed.
|
23
|
+
* @param encoding A pointer to the encoding.
|
24
|
+
* @return A pointer to the first occurrence of the character in the source
|
25
|
+
* string, or NULL if no such character exists.
|
26
|
+
*/
|
27
|
+
void * pm_memchr(const void *source, int character, size_t number, bool encoding_changed, const pm_encoding_t *encoding);
|
28
|
+
|
29
|
+
#endif
|
@@ -0,0 +1,93 @@
|
|
1
|
+
/**
|
2
|
+
* @file pm_newline_list.h
|
3
|
+
*
|
4
|
+
* A list of byte offsets of newlines in a string.
|
5
|
+
*
|
6
|
+
* When compiling the syntax tree, it's necessary to know the line and column
|
7
|
+
* of many nodes. This is necessary to support things like error messages,
|
8
|
+
* tracepoints, etc.
|
9
|
+
*
|
10
|
+
* It's possible that we could store the start line, start column, end line, and
|
11
|
+
* end column on every node in addition to the offsets that we already store,
|
12
|
+
* but that would be quite a lot of memory overhead.
|
13
|
+
*/
|
14
|
+
#ifndef PRISM_NEWLINE_LIST_H
|
15
|
+
#define PRISM_NEWLINE_LIST_H
|
16
|
+
|
17
|
+
#include "prism/defines.h"
|
18
|
+
|
19
|
+
#include <assert.h>
|
20
|
+
#include <stdbool.h>
|
21
|
+
#include <stddef.h>
|
22
|
+
#include <stdlib.h>
|
23
|
+
|
24
|
+
/**
 * A list of offsets of newlines in a string. The offsets are assumed to be
 * sorted/inserted in ascending order.
 */
typedef struct {
    /** A pointer to the start of the source string. */
    const uint8_t *start;

    /** The number of offsets currently stored in the list. */
    size_t size;

    /** The number of offsets that the allocated storage can hold. */
    size_t capacity;

    /** The list of offsets. */
    size_t *offsets;
} pm_newline_list_t;
|
41
|
+
|
42
|
+
/**
 * A line and column in a string. This is the value type returned by
 * pm_newline_list_line_column.
 */
typedef struct {
    /** The line number. */
    size_t line;

    /** The column number. */
    size_t column;
} pm_line_column_t;
|
52
|
+
|
53
|
+
/**
|
54
|
+
* Initialize a new newline list with the given capacity. Returns true if the
|
55
|
+
* allocation of the offsets succeeds, otherwise returns false.
|
56
|
+
*
|
57
|
+
* @param list The list to initialize.
|
58
|
+
* @param start A pointer to the start of the source string.
|
59
|
+
* @param capacity The initial capacity of the list.
|
60
|
+
* @return True if the allocation of the offsets succeeds, otherwise false.
|
61
|
+
*/
|
62
|
+
bool pm_newline_list_init(pm_newline_list_t *list, const uint8_t *start, size_t capacity);
|
63
|
+
|
64
|
+
/**
|
65
|
+
* Append a new offset to the newline list. Returns true if the reallocation of
|
66
|
+
* the offsets succeeds (if one was necessary), otherwise returns false.
|
67
|
+
*
|
68
|
+
* @param list The list to append to.
|
69
|
+
* @param cursor A pointer to the offset to append.
|
70
|
+
* @return True if the reallocation of the offsets succeeds (if one was
|
71
|
+
* necessary), otherwise false.
|
72
|
+
*/
|
73
|
+
bool pm_newline_list_append(pm_newline_list_t *list, const uint8_t *cursor);
|
74
|
+
|
75
|
+
/**
|
76
|
+
* Returns the line and column of the given offset. If the offset is not in the
|
77
|
+
* list, the line and column of the closest offset less than the given offset
|
78
|
+
* are returned.
|
79
|
+
*
|
80
|
+
* @param list The list to search.
|
81
|
+
* @param cursor A pointer to the offset to search for.
|
82
|
+
* @return The line and column of the given offset.
|
83
|
+
*/
|
84
|
+
pm_line_column_t pm_newline_list_line_column(const pm_newline_list_t *list, const uint8_t *cursor);
|
85
|
+
|
86
|
+
/**
|
87
|
+
* Free the internal memory allocated for the newline list.
|
88
|
+
*
|
89
|
+
* @param list The list to free.
|
90
|
+
*/
|
91
|
+
void pm_newline_list_free(pm_newline_list_t *list);
|
92
|
+
|
93
|
+
#endif
|
@@ -0,0 +1,42 @@
|
|
1
|
+
/**
|
2
|
+
* @file pm_state_stack.h
|
3
|
+
*
|
4
|
+
* A stack of boolean values.
|
5
|
+
*/
|
6
|
+
#ifndef PRISM_STATE_STACK_H
|
7
|
+
#define PRISM_STATE_STACK_H
|
8
|
+
|
9
|
+
#include "prism/defines.h"
|
10
|
+
|
11
|
+
#include <stdbool.h>
|
12
|
+
#include <stdint.h>
|
13
|
+
|
14
|
+
/**
 * A stack of boolean values, stored in a single 32-bit unsigned integer rather
 * than in a struct.
 *
 * NOTE(review): presumably each pushed value occupies one bit, which would cap
 * the usable depth at 32 entries -- confirm against pm_state_stack.c.
 */
typedef uint32_t pm_state_stack_t;
|
18
|
+
|
19
|
+
/**
|
20
|
+
* Pushes a value onto the stack.
|
21
|
+
*
|
22
|
+
* @param stack The stack to push the value onto.
|
23
|
+
* @param value The value to push onto the stack.
|
24
|
+
*/
|
25
|
+
void pm_state_stack_push(pm_state_stack_t *stack, bool value);
|
26
|
+
|
27
|
+
/**
|
28
|
+
* Pops a value off the stack.
|
29
|
+
*
|
30
|
+
* @param stack The stack to pop the value off of.
|
31
|
+
*/
|
32
|
+
void pm_state_stack_pop(pm_state_stack_t *stack);
|
33
|
+
|
34
|
+
/**
|
35
|
+
* Returns the value at the top of the stack.
|
36
|
+
*
|
37
|
+
* @param stack The stack to get the value from.
|
38
|
+
* @return The value at the top of the stack.
|
39
|
+
*/
|
40
|
+
bool pm_state_stack_p(pm_state_stack_t *stack);
|
41
|
+
|
42
|
+
#endif
|
@@ -0,0 +1,150 @@
|
|
1
|
+
/**
|
2
|
+
* @file pm_string.h
|
3
|
+
*
|
4
|
+
* A generic string type that can have various ownership semantics.
|
5
|
+
*/
|
6
|
+
#ifndef PRISM_STRING_H
|
7
|
+
#define PRISM_STRING_H
|
8
|
+
|
9
|
+
#include "prism/defines.h"
|
10
|
+
|
11
|
+
#include <assert.h>
|
12
|
+
#include <stdbool.h>
|
13
|
+
#include <stddef.h>
|
14
|
+
#include <stdlib.h>
|
15
|
+
#include <string.h>
|
16
|
+
|
17
|
+
// The following headers are necessary to read files using demand paging.
|
18
|
+
#ifdef _WIN32
|
19
|
+
#include <windows.h>
|
20
|
+
#else
|
21
|
+
#include <fcntl.h>
|
22
|
+
#include <sys/mman.h>
|
23
|
+
#include <sys/stat.h>
|
24
|
+
#include <unistd.h>
|
25
|
+
#endif
|
26
|
+
|
27
|
+
/**
 * A generic string type that can have various ownership semantics. The `type`
 * field records which semantics apply to a given string.
 */
typedef struct {
    /** A pointer to the start of the string. */
    const uint8_t *source;

    /** The length of the string in bytes of memory. */
    size_t length;

    /** The type of the string. This field determines how the string should be freed. */
    enum {
        /** This string is a constant string, and should not be freed. */
        PM_STRING_CONSTANT,

        /** This is a slice of another string, and should not be freed. */
        PM_STRING_SHARED,

        /** This string owns its memory, and should be freed using `pm_string_free`. */
        PM_STRING_OWNED,

        /** This string is a memory-mapped file, and should be freed using `pm_string_free`. */
        PM_STRING_MAPPED
    } type;
} pm_string_t;
|
52
|
+
|
53
|
+
/**
|
54
|
+
* Returns the size of the pm_string_t struct. This is necessary to allocate the
|
55
|
+
* correct amount of memory in the FFI backend.
|
56
|
+
*
|
57
|
+
* @return The size of the pm_string_t struct.
|
58
|
+
*/
|
59
|
+
PRISM_EXPORTED_FUNCTION size_t pm_string_sizeof(void);
|
60
|
+
|
61
|
+
/**
|
62
|
+
* Defines an empty string. This is useful for initializing a string that will
|
63
|
+
* be filled in later.
|
64
|
+
*/
|
65
|
+
#define PM_STRING_EMPTY ((pm_string_t) { .type = PM_STRING_CONSTANT, .source = NULL, .length = 0 })
|
66
|
+
|
67
|
+
/**
|
68
|
+
* Initialize a shared string that is based on initial input.
|
69
|
+
*
|
70
|
+
* @param string The string to initialize.
|
71
|
+
* @param start The start of the string.
|
72
|
+
* @param end The end of the string.
|
73
|
+
*/
|
74
|
+
void pm_string_shared_init(pm_string_t *string, const uint8_t *start, const uint8_t *end);
|
75
|
+
|
76
|
+
/**
|
77
|
+
* Initialize an owned string that is responsible for freeing allocated memory.
|
78
|
+
*
|
79
|
+
* @param string The string to initialize.
|
80
|
+
* @param source The source of the string.
|
81
|
+
* @param length The length of the string.
|
82
|
+
*/
|
83
|
+
void pm_string_owned_init(pm_string_t *string, uint8_t *source, size_t length);
|
84
|
+
|
85
|
+
/**
|
86
|
+
* Initialize a constant string that doesn't own its memory source.
|
87
|
+
*
|
88
|
+
* @param string The string to initialize.
|
89
|
+
* @param source The source of the string.
|
90
|
+
* @param length The length of the string.
|
91
|
+
*/
|
92
|
+
void pm_string_constant_init(pm_string_t *string, const char *source, size_t length);
|
93
|
+
|
94
|
+
/**
|
95
|
+
* Read the file indicated by the filepath parameter into source and load its
|
96
|
+
* contents and size into the given `pm_string_t`. The given `pm_string_t`
|
97
|
+
* should be freed using `pm_string_free` when it is no longer used.
|
98
|
+
*
|
99
|
+
* We want to use demand paging as much as possible in order to avoid having to
|
100
|
+
* read the entire file into memory (which could be detrimental to performance
|
101
|
+
* for large files). This means that if we're on Windows we'll use
|
102
|
+
* `MapViewOfFile`, on POSIX systems that have access to `mmap` we'll use
|
103
|
+
* `mmap`, and on other POSIX systems we'll use `read`.
|
104
|
+
*
|
105
|
+
* @param string The string to initialize.
|
106
|
+
* @param filepath The filepath to read.
|
107
|
+
* @return Whether or not the file was successfully mapped.
|
108
|
+
*/
|
109
|
+
PRISM_EXPORTED_FUNCTION bool pm_string_mapped_init(pm_string_t *string, const char *filepath);
|
110
|
+
|
111
|
+
/**
|
112
|
+
* Returns the memory size associated with the string.
|
113
|
+
*
|
114
|
+
* @param string The string to get the memory size of.
|
115
|
+
* @return The size of the memory associated with the string.
|
116
|
+
*/
|
117
|
+
size_t pm_string_memsize(const pm_string_t *string);
|
118
|
+
|
119
|
+
/**
|
120
|
+
* Ensure the string is owned. If it is not, then reinitialize it as owned and
|
121
|
+
* copy over the previous source.
|
122
|
+
*
|
123
|
+
* @param string The string to ensure is owned.
|
124
|
+
*/
|
125
|
+
void pm_string_ensure_owned(pm_string_t *string);
|
126
|
+
|
127
|
+
/**
|
128
|
+
* Returns the length associated with the string.
|
129
|
+
*
|
130
|
+
* @param string The string to get the length of.
|
131
|
+
* @return The length of the string.
|
132
|
+
*/
|
133
|
+
PRISM_EXPORTED_FUNCTION size_t pm_string_length(const pm_string_t *string);
|
134
|
+
|
135
|
+
/**
|
136
|
+
* Returns the start pointer associated with the string.
|
137
|
+
*
|
138
|
+
* @param string The string to get the start pointer of.
|
139
|
+
* @return The start pointer of the string.
|
140
|
+
*/
|
141
|
+
PRISM_EXPORTED_FUNCTION const uint8_t * pm_string_source(const pm_string_t *string);
|
142
|
+
|
143
|
+
/**
|
144
|
+
* Free the associated memory of the given string.
|
145
|
+
*
|
146
|
+
* @param string The string to free.
|
147
|
+
*/
|
148
|
+
PRISM_EXPORTED_FUNCTION void pm_string_free(pm_string_t *string);
|
149
|
+
|
150
|
+
#endif
|
@@ -0,0 +1,44 @@
|
|
1
|
+
/**
|
2
|
+
* @file pm_string_list.h
|
3
|
+
*
|
4
|
+
* A list of strings.
|
5
|
+
*/
|
6
|
+
#ifndef PRISM_STRING_LIST_H
|
7
|
+
#define PRISM_STRING_LIST_H
|
8
|
+
|
9
|
+
#include "prism/defines.h"
|
10
|
+
#include "prism/util/pm_string.h"
|
11
|
+
|
12
|
+
#include <stddef.h>
|
13
|
+
#include <stdlib.h>
|
14
|
+
|
15
|
+
/**
|
16
|
+
* A list of strings.
|
17
|
+
*/
|
18
|
+
typedef struct {
|
19
|
+
/** The length of the string list. */
|
20
|
+
size_t length;
|
21
|
+
|
22
|
+
/** The capacity of the string list that has been allocated. */
|
23
|
+
size_t capacity;
|
24
|
+
|
25
|
+
/** A pointer to the start of the string list. */
|
26
|
+
pm_string_t *strings;
|
27
|
+
} pm_string_list_t;
|
28
|
+
|
29
|
+
/**
|
30
|
+
* Append a pm_string_t to the given string list.
|
31
|
+
*
|
32
|
+
* @param string_list The string list to append to.
|
33
|
+
* @param string The string to append.
|
34
|
+
*/
|
35
|
+
void pm_string_list_append(pm_string_list_t *string_list, pm_string_t *string);
|
36
|
+
|
37
|
+
/**
|
38
|
+
* Free the memory associated with the string list.
|
39
|
+
*
|
40
|
+
* @param string_list The string list to free.
|
41
|
+
*/
|
42
|
+
PRISM_EXPORTED_FUNCTION void pm_string_list_free(pm_string_list_t *string_list);
|
43
|
+
|
44
|
+
#endif
|
@@ -0,0 +1,32 @@
|
|
1
|
+
/**
|
2
|
+
* @file pm_strncasecmp.h
|
3
|
+
*
|
4
|
+
* A custom strncasecmp implementation.
|
5
|
+
*/
|
6
|
+
#ifndef PRISM_STRNCASECMP_H
|
7
|
+
#define PRISM_STRNCASECMP_H
|
8
|
+
|
9
|
+
#include "prism/defines.h"
|
10
|
+
|
11
|
+
#include <ctype.h>
|
12
|
+
#include <stddef.h>
|
13
|
+
#include <stdint.h>
|
14
|
+
|
15
|
+
/**
|
16
|
+
* Compare two strings, ignoring case, up to the given length. Returns 0 if the
|
17
|
+
* strings are equal, a negative number if string1 is less than string2, or a
|
18
|
+
* positive number if string1 is greater than string2.
|
19
|
+
*
|
20
|
+
* Note that this is effectively our own implementation of strncasecmp. The
|
21
|
+
* standard function is not available on all of the platforms we want to
|
22
|
+
* support, so we're rolling our own here.
|
23
|
+
*
|
24
|
+
* @param string1 The first string to compare.
|
25
|
+
* @param string2 The second string to compare.
|
26
|
+
* @param length The maximum number of characters to compare.
|
27
|
+
* @return 0 if the strings are equal, a negative number if string1 is less than
|
28
|
+
* string2, or a positive number if string1 is greater than string2.
|
29
|
+
*/
|
30
|
+
int pm_strncasecmp(const uint8_t *string1, const uint8_t *string2, size_t length);
|
31
|
+
|
32
|
+
#endif
|
@@ -0,0 +1,46 @@
|
|
1
|
+
/**
|
2
|
+
* @file pm_strpbrk.h
|
3
|
+
*
|
4
|
+
* A custom strpbrk implementation.
|
5
|
+
*/
|
6
|
+
#ifndef PRISM_STRPBRK_H
|
7
|
+
#define PRISM_STRPBRK_H
|
8
|
+
|
9
|
+
#include "prism/defines.h"
|
10
|
+
#include "prism/diagnostic.h"
|
11
|
+
#include "prism/parser.h"
|
12
|
+
|
13
|
+
#include <stddef.h>
|
14
|
+
#include <string.h>
|
15
|
+
|
16
|
+
/**
|
17
|
+
* Here we have rolled our own version of strpbrk. The standard library strpbrk
|
18
|
+
* has undefined behavior when the source string is not null-terminated. We want
|
19
|
+
* to support strings that are not null-terminated because pm_parse does not
|
20
|
+
* have the contract that the string is null-terminated. (This is desirable
|
21
|
+
* because it means the extension can call pm_parse with the result of a call to
|
22
|
+
* mmap).
|
23
|
+
*
|
24
|
+
* The standard library strpbrk also does not support passing a maximum length
|
25
|
+
* to search. We want to support this for the reason mentioned above, but we
|
26
|
+
* also don't want it to stop on null bytes. Ruby actually allows null bytes
|
27
|
+
* within strings, comments, regular expressions, etc. So we need to be able to
|
28
|
+
* skip past them.
|
29
|
+
*
|
30
|
+
* Finally, we want to support encodings wherein the charset could contain
|
31
|
+
* characters that are trailing bytes of multi-byte characters. For example, in
|
32
|
+
* Shift-JIS, the backslash character can be a trailing byte. In that case we
|
33
|
+
* need to take a slower path and iterate one multi-byte character at a time.
|
34
|
+
*
|
35
|
+
* @param parser The parser.
|
36
|
+
* @param source The source to search.
|
37
|
+
* @param charset The charset to search for.
|
38
|
+
* @param length The maximum number of bytes to search.
|
39
|
+
* @param validate Whether to validate that the source string is valid in the
|
40
|
+
* current encoding of the parser.
|
41
|
+
* @return A pointer to the first character in the source string that is in the
|
42
|
+
* charset, or NULL if no such character exists.
|
43
|
+
*/
|
44
|
+
const uint8_t * pm_strpbrk(pm_parser_t *parser, const uint8_t *source, const uint8_t *charset, ptrdiff_t length, bool validate);
|
45
|
+
|
46
|
+
#endif
|
@@ -0,0 +1,29 @@
|
|
1
|
+
/**
|
2
|
+
* @file version.h
|
3
|
+
*
|
4
|
+
* The version of the Prism library.
|
5
|
+
*/
|
6
|
+
#ifndef PRISM_VERSION_H
|
7
|
+
#define PRISM_VERSION_H
|
8
|
+
|
9
|
+
/**
|
10
|
+
* The major version of the Prism library as an int.
|
11
|
+
*/
|
12
|
+
#define PRISM_VERSION_MAJOR 0
|
13
|
+
|
14
|
+
/**
|
15
|
+
* The minor version of the Prism library as an int.
|
16
|
+
*/
|
17
|
+
#define PRISM_VERSION_MINOR 23
|
18
|
+
|
19
|
+
/**
|
20
|
+
* The patch version of the Prism library as an int.
|
21
|
+
*/
|
22
|
+
#define PRISM_VERSION_PATCH 0
|
23
|
+
|
24
|
+
/**
|
25
|
+
* The version of the Prism library as a constant string.
|
26
|
+
*/
|
27
|
+
#define PRISM_VERSION "0.23.0"
|
28
|
+
|
29
|
+
#endif
|