Compare commits

...

24 Commits

Author SHA1 Message Date
b59c59e7e1 Refactor the lexer to use the state transitions table 2023-07-30 22:44:11 +01:00
574f771444 Update the state transitions table 2023-07-30 22:43:53 +01:00
1d118c8568 Remove notes 2023-07-30 22:43:37 +01:00
896a9ff085 Update run_tests.py 2023-07-30 22:29:06 +01:00
eece52600b Update run_tests.py 2023-07-30 21:46:28 +01:00
7cb4b28da8 Store the current character and add more handlers after the state
transition
2023-07-30 19:18:10 +01:00
bf958056bd Add basic test suite to validate that the parser works 2023-07-30 12:43:08 +01:00
ec6df32839 Start implementing using the state transition table in the lexer 2023-07-30 11:47:26 +01:00
de57d9f14b Add enum value for newline 2023-07-30 00:37:39 +01:00
f1f90cf56b Specify the length of the strings tables explicitly 2023-07-29 22:10:28 +01:00
41d7cf2717 Reformat 2023-07-29 22:09:09 +01:00
002a8e7064 Get the input and state strings from tables instead of switch cases 2023-07-29 22:07:03 +01:00
fc80095d1f Remove clear_file and update write_table to accept a file pointer 2023-07-29 21:46:59 +01:00
642d000ebd Fix keyword handling so the final keyword states don't consume input 2023-07-29 21:42:20 +01:00
b4a4865870 Regenerate the state table 2023-07-27 00:54:53 +01:00
1b4d6a6156 Update column width and write row state as a comment 2023-07-27 00:53:39 +01:00
26fabd91b9 Ensure build scripts fail if attempting to run them from different
directory
2023-07-25 09:00:11 +01:00
adde1db0f4 Finalise generating the state table 2023-07-25 08:56:42 +01:00
7eec0e0730 Add generating the table to the main build script 2023-07-25 08:56:18 +01:00
6c454fbb8e Add char_type function to lexer.c but exclude it from build 2023-07-25 08:55:46 +01:00
fd8231b02d Pull states and inputs enums to a separate header 2023-07-23 22:49:23 +01:00
09f2315b66 Test generating a state transition table 2023-07-23 22:49:09 +01:00
91162654b3 Initial work on converting the state machine to a state table 2023-07-23 22:48:28 +01:00
6e93d3ecd1 Update .gitignore 2023-07-23 22:48:05 +01:00
11 changed files with 1234 additions and 788 deletions

1
.gitignore vendored
View File

@ -3,3 +3,4 @@
src/ignore/**/* src/ignore/**/*
main main
compile_commands.json compile_commands.json
gentable

28
compile
View File

@ -1,24 +1,28 @@
#!/bin/bash #!/bin/bash
CC=clang CC=clang
CFLAGS="-g -Wall -Werror -pedantic -Iinclude" CFLAGS="-g -Wall -Werror -pedantic -I./include"
SRC="src/main.c" SRC="./src/main.c"
OUT=main OUT=./main
# STATE_TABLE
(set -x;$CC $CFLAGS -I./include/lexer ./generate_state_table.c -o ./gentable)
./gentable
# DSTRING # DSTRING
CFLAGS+=" -Iinclude/dstring" CFLAGS+=" -I./include/dstring"
SRC+=" src/dstring/*.c" SRC+=" ./src/dstring/*.c"
# JSON_ENTITIES # JSON_ENTITIES
CFLAGS+=" -Iinclude/json_entities" CFLAGS+=" -I./include/json_entities"
SRC+=" src/json_entities/*.c" SRC+=" ./src/json_entities/*.c"
# LEXER # LEXER
CFLAGS+=" -Iinclude/lexer" CFLAGS+=" -I./include/lexer"
SRC+=" src/lexer/*.c" SRC+=" ./src/lexer/*.c"
# PARSER # PARSER
CFLAGS+=" -Iinclude/parser" CFLAGS+=" -I./include/parser"
SRC+=" src/parser/*.c" SRC+=" ./src/parser/*.c"
$CC $CFLAGS $SRC -o $OUT (set -x;$CC $CFLAGS $SRC -o $OUT)

673
generate_state_table.c Normal file
View File

@ -0,0 +1,673 @@
#include "aliases.h"
#include "lexer_data.h"
#include <ctype.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#define STRING_BUF_LENGTH 100
INTERNAL void fill_table(void);
INTERNAL void write_table(FILE *fp);
INTERNAL void set_column_width(lexer_state_t state);
INTERNAL const char *get_input_string(lexer_input_t input);
INTERNAL const char *get_state_string(lexer_state_t state);
INTERNAL lexer_state_t lexer_state_machine(lexer_state_t state,
lexer_input_t input);
INTERNAL lexer_state_t handle_lexer_start(lexer_input_t input);
INTERNAL lexer_state_t handle_last_collection(char input);
INTERNAL lexer_state_t handle_object(lexer_input_t input);
INTERNAL lexer_state_t handle_object_end(lexer_input_t input);
INTERNAL lexer_state_t handle_array(lexer_input_t input);
INTERNAL lexer_state_t handle_array_end(lexer_input_t input);
INTERNAL lexer_state_t handle_key(lexer_input_t input);
INTERNAL lexer_state_t handle_value(lexer_input_t input);
INTERNAL lexer_state_t handle_string(lexer_input_t input);
INTERNAL lexer_state_t handle_string_end(lexer_input_t input);
INTERNAL lexer_state_t handle_escape_sequence(lexer_input_t input);
INTERNAL lexer_state_t handle_unicode_hex(lexer_input_t input,
lexer_state_t return_state);
INTERNAL lexer_state_t handle_decimal(lexer_input_t input);
INTERNAL lexer_state_t handle_number(lexer_input_t input);
INTERNAL lexer_state_t handle_fraction(lexer_input_t input);
INTERNAL lexer_state_t handle_exponent(lexer_input_t input);
INTERNAL lexer_state_t handle_exp_sign(lexer_input_t input);
INTERNAL lexer_state_t handle_power(lexer_input_t input);
INTERNAL lexer_state_t handle_number_end(lexer_input_t input);
INTERNAL lexer_state_t handle_true(lexer_input_t input,
lexer_state_t start_state);
INTERNAL lexer_state_t handle_false(lexer_input_t input,
lexer_state_t start_state);
INTERNAL lexer_state_t handle_null(lexer_input_t input,
lexer_state_t start_state);
INTERNAL lexer_state_t handle_keyword_end(lexer_input_t input);
INTERNAL i32 column_width = 0;
INTERNAL lexer_state_t state_table[COUNT_LEXER_STATES][COUNT_LEXER_INPUTS] = {
0};
INTERNAL const char *input_strings[COUNT_LEXER_STATES] = {
[LEXER_INPUT_NEWLINE] = "NEWLINE",
[LEXER_INPUT_WHITE_SPACE] = "WHITE_SPACE",
[LEXER_INPUT_OPEN_BRACE] = "OPEN_BRACE",
[LEXER_INPUT_CLOSE_BRACE] = "CLOSE_BRACE",
[LEXER_INPUT_OPEN_BRACKET] = "OPEN_BRACKET",
[LEXER_INPUT_CLOSE_BRACKET] = "CLOSE_BRACKET",
[LEXER_INPUT_COMMA] = "COMMA",
[LEXER_INPUT_COLON] = "COLON",
[LEXER_INPUT_DOUBLE_QUOTE] = "DOUBLE_QUOTE",
[LEXER_INPUT_BACK_SLASH] = "BACK_SLASH",
[LEXER_INPUT_FORWARD_SLASH] = "FORWARD_SLASH",
[LEXER_INPUT_LOWER_A] = "LOWER_A",
[LEXER_INPUT_LOWER_B] = "LOWER_B",
[LEXER_INPUT_LOWER_C] = "LOWER_C",
[LEXER_INPUT_LOWER_D] = "LOWER_D",
[LEXER_INPUT_LOWER_E] = "LOWER_E",
[LEXER_INPUT_LOWER_F] = "LOWER_F",
[LEXER_INPUT_LOWER_L] = "LOWER_L",
[LEXER_INPUT_LOWER_N] = "LOWER_N",
[LEXER_INPUT_LOWER_R] = "LOWER_R",
[LEXER_INPUT_LOWER_S] = "LOWER_S",
[LEXER_INPUT_LOWER_T] = "LOWER_T",
[LEXER_INPUT_LOWER_U] = "LOWER_U",
[LEXER_INPUT_UPPER_A] = "UPPER_A",
[LEXER_INPUT_UPPER_B] = "UPPER_B",
[LEXER_INPUT_UPPER_C] = "UPPER_C",
[LEXER_INPUT_UPPER_D] = "UPPER_D",
[LEXER_INPUT_UPPER_E] = "UPPER_E",
[LEXER_INPUT_UPPER_F] = "UPPER_F",
[LEXER_INPUT_MINUS] = "MINUS",
[LEXER_INPUT_PLUS] = "PLUS",
[LEXER_INPUT_DECIMAL] = "DECIMAL",
[LEXER_INPUT_ZERO] = "ZERO",
[LEXER_INPUT_NON_ZERO] = "NON_ZERO",
[LEXER_INPUT_OTHER] = "OTHER",
};
INTERNAL const char *state_strings[COUNT_LEXER_STATES] = {
[LEXER_STATE_ERROR] = "LEXER_STATE_ERROR",
[LEXER_STATE_START] = "LEXER_STATE_START",
[LEXER_STATE_VALUE] = "LEXER_STATE_VALUE",
[LEXER_STATE_VALUE_END] = "LEXER_STATE_VALUE_END",
[LEXER_STATE_OBJECT_START] = "LEXER_STATE_OBJECT_START",
[LEXER_STATE_OBJECT] = "LEXER_STATE_OBJECT",
[LEXER_STATE_OBJECT_END] = "LEXER_STATE_OBJECT_END",
[LEXER_STATE_ARRAY_START] = "LEXER_STATE_ARRAY_START",
[LEXER_STATE_ARRAY] = "LEXER_STATE_ARRAY",
[LEXER_STATE_ARRAY_END] = "LEXER_STATE_ARRAY_END",
[LEXER_STATE_LAST_COLLECTION] = "LEXER_STATE_LAST_COLLECTION",
[LEXER_STATE_KEY] = "LEXER_STATE_KEY",
[LEXER_STATE_KEY_END] = "LEXER_STATE_KEY_END",
[LEXER_STATE_DECIMAL] = "LEXER_STATE_DECIMAL",
[LEXER_STATE_NUMBER] = "LEXER_STATE_NUMBER",
[LEXER_STATE_FRACTION] = "LEXER_STATE_FRACTION",
[LEXER_STATE_EXPONENT] = "LEXER_STATE_EXPONENT",
[LEXER_STATE_EXP_SIGN] = "LEXER_STATE_EXP_SIGN",
[LEXER_STATE_POWER] = "LEXER_STATE_POWER",
[LEXER_STATE_NUMBER_END] = "LEXER_STATE_NUMBER_END",
[LEXER_STATE_STRING] = "LEXER_STATE_STRING",
[LEXER_STATE_STRING_END] = "LEXER_STATE_STRING_END",
[LEXER_STATE_ESCAPE_SEQUENCE] = "LEXER_STATE_ESCAPE_SEQUENCE",
[LEXER_STATE_UNICODE_HEX1] = "LEXER_STATE_UNICODE_HEX1",
[LEXER_STATE_UNICODE_HEX2] = "LEXER_STATE_UNICODE_HEX2",
[LEXER_STATE_UNICODE_HEX3] = "LEXER_STATE_UNICODE_HEX3",
[LEXER_STATE_UNICODE_HEX4] = "LEXER_STATE_UNICODE_HEX4",
[LEXER_STATE_T] = "LEXER_STATE_T",
[LEXER_STATE_TR] = "LEXER_STATE_TR",
[LEXER_STATE_TRU] = "LEXER_STATE_TRU",
[LEXER_STATE_TRUE] = "LEXER_STATE_TRUE",
[LEXER_STATE_F] = "LEXER_STATE_F",
[LEXER_STATE_FA] = "LEXER_STATE_FA",
[LEXER_STATE_FAL] = "LEXER_STATE_FAL",
[LEXER_STATE_FALS] = "LEXER_STATE_FALS",
[LEXER_STATE_FALSE] = "LEXER_STATE_FALSE",
[LEXER_STATE_N] = "LEXER_STATE_N",
[LEXER_STATE_NU] = "LEXER_STATE_NU",
[LEXER_STATE_NUL] = "LEXER_STATE_NUL",
[LEXER_STATE_NULL] = "LEXER_STATE_NULL",
[LEXER_STATE_KEYWORD_END] = "LEXER_STATE_KEYWORD_END",
};
INTERNAL const char *filename = "./include/lexer/lexer_state_transitions.table";
int main(void) {
FILE *fp = fopen(filename, "w");
if (!fp) {
printf("Failed to open file\n");
return EXIT_FAILURE;
}
fill_table();
write_table(fp);
fclose(fp);
return EXIT_SUCCESS;
}
INTERNAL void fill_table(void) {
lexer_state_t state;
lexer_input_t input;
for (u64 i = 0; i < COUNT_LEXER_STATES; ++i) {
state = (lexer_state_t)i;
for (u64 j = 0; j < COUNT_LEXER_INPUTS; ++j) {
input = (lexer_input_t)j;
state_table[i][j] = (lexer_state_t)lexer_state_machine(state, input);
}
}
}
void write_table(FILE *fp) {
const char *array_open = "{ ";
const u64 array_open_length = strlen(array_open);
const char *array_close = "},";
const u64 array_close_length = strlen(array_close);
const char *comment = "//";
const u64 comment_length = strlen(comment);
const char *table_header_end = " \n";
const u64 table_header_end_length = strlen(table_header_end);
char output[STRING_BUF_LENGTH] = {0};
u64 length = 0;
for (u64 i = 0; i < COUNT_LEXER_STATES; ++i) {
set_column_width((lexer_state_t)i);
}
fwrite(comment, sizeof(char), comment_length, fp);
i32 column_white_space = 0;
for (u64 i = 0; i < COUNT_LEXER_INPUTS; ++i) {
const char *input_str = get_input_string((lexer_input_t)i);
column_white_space = (column_width - strlen(input_str)) / 2;
sprintf(output, "%*s%*s| ", column_width - column_white_space, input_str,
column_white_space, " ");
length = strlen(output);
fwrite(output, sizeof(char), length, fp);
}
fwrite(table_header_end, sizeof(char), table_header_end_length, fp);
for (u64 i = 0; i < COUNT_LEXER_STATES; ++i) {
fwrite(array_open, sizeof(char), array_open_length, fp);
for (u64 j = 0; j < COUNT_LEXER_INPUTS; ++j) {
sprintf(output, "%*s, ", column_width,
get_state_string((lexer_state_t)state_table[i][j]));
length = strlen(output);
fwrite(output, sizeof(char), length, fp);
}
fwrite(array_close, sizeof(char), array_close_length, fp);
sprintf(output, " // %s\n", get_state_string((lexer_state_t)i));
length = strlen(output);
fwrite(output, sizeof(char), length, fp);
memset(output, 0, STRING_BUF_LENGTH);
}
}
INTERNAL void set_column_width(lexer_state_t state) {
if (state >= COUNT_LEXER_STATES) {
return;
}
const char *output = state_strings[state];
i32 length = strlen(output);
column_width = length > column_width ? length : column_width;
}
INTERNAL const char *get_input_string(lexer_input_t input) {
if (input >= COUNT_LEXER_INPUTS) {
return "";
}
return input_strings[input];
}
INTERNAL const char *get_state_string(lexer_state_t state) {
if (state >= COUNT_LEXER_STATES) {
return "";
}
return state_strings[state];
}
lexer_state_t lexer_state_machine(lexer_state_t state, lexer_input_t input) {
switch (state) {
case LEXER_STATE_START:
return handle_lexer_start(input);
case LEXER_STATE_VALUE:
return handle_value(input);
case LEXER_STATE_OBJECT:
return handle_object(input);
case LEXER_STATE_OBJECT_END:
return handle_object_end(input);
case LEXER_STATE_ARRAY:
return handle_array(input);
case LEXER_STATE_ARRAY_END:
return handle_array_end(input);
case LEXER_STATE_KEY:
return handle_key(input);
case LEXER_STATE_DECIMAL:
return handle_decimal(input);
case LEXER_STATE_NUMBER:
return handle_number(input);
case LEXER_STATE_FRACTION:
return handle_fraction(input);
case LEXER_STATE_EXPONENT:
return handle_exponent(input);
case LEXER_STATE_EXP_SIGN:
return handle_exp_sign(input);
case LEXER_STATE_POWER:
return handle_power(input);
case LEXER_STATE_NUMBER_END:
return handle_number_end(input);
case LEXER_STATE_STRING:
return handle_string(input);
case LEXER_STATE_STRING_END:
return handle_string_end(input);
case LEXER_STATE_ESCAPE_SEQUENCE:
return handle_escape_sequence(input);
case LEXER_STATE_UNICODE_HEX1:
return handle_unicode_hex(input, LEXER_STATE_UNICODE_HEX2);
case LEXER_STATE_UNICODE_HEX2:
return handle_unicode_hex(input, LEXER_STATE_UNICODE_HEX3);
case LEXER_STATE_UNICODE_HEX3:
return handle_unicode_hex(input, LEXER_STATE_UNICODE_HEX4);
case LEXER_STATE_UNICODE_HEX4:
return handle_unicode_hex(input, LEXER_STATE_STRING);
case LEXER_STATE_T:
return handle_true(input, LEXER_STATE_T);
case LEXER_STATE_TR:
return handle_true(input, LEXER_STATE_TR);
case LEXER_STATE_TRU:
return handle_true(input, LEXER_STATE_TRU);
case LEXER_STATE_F:
return handle_false(input, LEXER_STATE_F);
case LEXER_STATE_FA:
return handle_false(input, LEXER_STATE_FA);
case LEXER_STATE_FAL:
return handle_false(input, LEXER_STATE_FAL);
case LEXER_STATE_FALS:
return handle_false(input, LEXER_STATE_FALS);
case LEXER_STATE_N:
return handle_null(input, LEXER_STATE_N);
case LEXER_STATE_NU:
return handle_null(input, LEXER_STATE_NU);
case LEXER_STATE_NUL:
return handle_null(input, LEXER_STATE_NUL);
case LEXER_STATE_KEYWORD_END:
return handle_keyword_end(input);
case LEXER_STATE_LAST_COLLECTION:
return handle_last_collection(input);
case LEXER_STATE_TRUE:
case LEXER_STATE_FALSE:
case LEXER_STATE_NULL:
case LEXER_STATE_OBJECT_START:
case LEXER_STATE_ARRAY_START:
case LEXER_STATE_KEY_END:
case LEXER_STATE_VALUE_END:
case LEXER_STATE_ERROR:
case COUNT_LEXER_STATES:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_lexer_start(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_START;
case LEXER_INPUT_OPEN_BRACE:
return LEXER_STATE_OBJECT_START;
case LEXER_INPUT_OPEN_BRACKET:
return LEXER_STATE_ARRAY_START;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_last_collection(char input) {
if (input == LEXER_INPUT_NEWLINE || input == LEXER_INPUT_WHITE_SPACE) {
return LEXER_STATE_LAST_COLLECTION;
}
return LEXER_STATE_ERROR;
}
lexer_state_t handle_object(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_OBJECT;
case LEXER_INPUT_DOUBLE_QUOTE:
return LEXER_STATE_KEY;
case LEXER_INPUT_CLOSE_BRACE:
return LEXER_STATE_OBJECT_END;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_object_end(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
case LEXER_INPUT_CLOSE_BRACE:
return LEXER_STATE_OBJECT_END;
case LEXER_INPUT_CLOSE_BRACKET:
return LEXER_STATE_ARRAY_END;
case LEXER_INPUT_COMMA:
return LEXER_STATE_VALUE_END;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_array(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_ARRAY;
case LEXER_INPUT_CLOSE_BRACKET:
return LEXER_STATE_ARRAY_END;
default:
return handle_value(input);
}
}
lexer_state_t handle_array_end(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
case LEXER_INPUT_CLOSE_BRACKET:
return LEXER_STATE_ARRAY_END;
case LEXER_INPUT_CLOSE_BRACE:
return LEXER_STATE_OBJECT_END;
case LEXER_INPUT_COMMA:
return LEXER_STATE_VALUE_END;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_key(lexer_input_t input) { return LEXER_STATE_STRING; }
lexer_state_t handle_value(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_VALUE;
case LEXER_INPUT_NON_ZERO:
case LEXER_INPUT_MINUS:
return LEXER_STATE_NUMBER;
case LEXER_INPUT_ZERO:
return LEXER_STATE_DECIMAL;
case LEXER_INPUT_DOUBLE_QUOTE:
return LEXER_STATE_STRING;
case LEXER_INPUT_OPEN_BRACE:
return LEXER_STATE_OBJECT_START;
case LEXER_INPUT_OPEN_BRACKET:
return LEXER_STATE_ARRAY_START;
case LEXER_INPUT_LOWER_T:
return LEXER_STATE_T;
case LEXER_INPUT_LOWER_F:
return LEXER_STATE_F;
case LEXER_INPUT_LOWER_N:
return LEXER_STATE_N;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_string(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_BACK_SLASH:
return LEXER_STATE_ESCAPE_SEQUENCE;
case LEXER_INPUT_DOUBLE_QUOTE:
return LEXER_STATE_STRING_END;
default:
return LEXER_STATE_STRING;
}
}
lexer_state_t handle_string_end(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_STRING_END;
case LEXER_INPUT_COLON:
return LEXER_STATE_KEY_END;
case LEXER_INPUT_COMMA:
return LEXER_STATE_VALUE_END;
case LEXER_INPUT_CLOSE_BRACE:
return LEXER_STATE_OBJECT_END;
case LEXER_INPUT_CLOSE_BRACKET:
return LEXER_STATE_ARRAY_END;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_escape_sequence(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_DOUBLE_QUOTE:
case LEXER_INPUT_FORWARD_SLASH:
case LEXER_INPUT_BACK_SLASH:
case LEXER_INPUT_LOWER_B:
case LEXER_INPUT_LOWER_F:
case LEXER_INPUT_LOWER_N:
case LEXER_INPUT_LOWER_R:
case LEXER_INPUT_LOWER_T:
return LEXER_STATE_STRING;
case LEXER_INPUT_LOWER_U:
return LEXER_STATE_UNICODE_HEX1;
default:
return LEXER_STATE_ERROR;
}
}
INTERNAL lexer_state_t handle_unicode_hex(lexer_input_t input,
lexer_state_t return_state) {
switch (input) {
case LEXER_INPUT_LOWER_A:
case LEXER_INPUT_LOWER_B:
case LEXER_INPUT_LOWER_C:
case LEXER_INPUT_LOWER_D:
case LEXER_INPUT_LOWER_E:
case LEXER_INPUT_LOWER_F:
case LEXER_INPUT_UPPER_A:
case LEXER_INPUT_UPPER_B:
case LEXER_INPUT_UPPER_C:
case LEXER_INPUT_UPPER_D:
case LEXER_INPUT_UPPER_E:
case LEXER_INPUT_UPPER_F:
case LEXER_INPUT_ZERO:
case LEXER_INPUT_NON_ZERO:
return return_state;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_decimal(lexer_input_t input) {
if (input == LEXER_INPUT_DECIMAL) {
return LEXER_STATE_FRACTION;
}
return LEXER_STATE_ERROR;
}
lexer_state_t handle_number(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_ZERO:
case LEXER_INPUT_NON_ZERO:
return LEXER_STATE_NUMBER;
case LEXER_INPUT_DECIMAL:
return LEXER_STATE_FRACTION;
case LEXER_INPUT_CLOSE_BRACE:
return LEXER_STATE_OBJECT_END;
case LEXER_INPUT_CLOSE_BRACKET:
return LEXER_STATE_ARRAY_END;
case LEXER_INPUT_COMMA:
return LEXER_STATE_VALUE_END;
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_NUMBER_END;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_fraction(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_ZERO:
case LEXER_INPUT_NON_ZERO:
return LEXER_STATE_FRACTION;
case LEXER_INPUT_CLOSE_BRACE:
return LEXER_STATE_OBJECT_END;
case LEXER_INPUT_CLOSE_BRACKET:
return LEXER_STATE_ARRAY_END;
case LEXER_INPUT_LOWER_E:
case LEXER_INPUT_UPPER_E:
return LEXER_STATE_EXPONENT;
case LEXER_INPUT_COMMA:
return LEXER_STATE_VALUE_END;
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_NUMBER_END;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_exponent(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_ZERO:
case LEXER_INPUT_NON_ZERO:
return LEXER_STATE_POWER;
case LEXER_INPUT_PLUS:
case LEXER_INPUT_MINUS:
return LEXER_STATE_EXP_SIGN;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_exp_sign(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_ZERO:
case LEXER_INPUT_NON_ZERO:
return LEXER_STATE_POWER;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_power(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_ZERO:
case LEXER_INPUT_NON_ZERO:
return LEXER_STATE_POWER;
case LEXER_INPUT_CLOSE_BRACE:
return LEXER_STATE_OBJECT_END;
case LEXER_INPUT_CLOSE_BRACKET:
return LEXER_STATE_ARRAY_END;
case LEXER_INPUT_COMMA:
return LEXER_STATE_VALUE_END;
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_NUMBER_END;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_number_end(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_NUMBER_END;
case LEXER_INPUT_CLOSE_BRACE:
return LEXER_STATE_OBJECT_END;
case LEXER_INPUT_CLOSE_BRACKET:
return LEXER_STATE_ARRAY_END;
case LEXER_INPUT_COMMA:
return LEXER_STATE_VALUE_END;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_true(lexer_input_t input, lexer_state_t start_state) {
switch (start_state) {
case LEXER_STATE_T:
return input == LEXER_INPUT_LOWER_R ? LEXER_STATE_TR : LEXER_STATE_ERROR;
case LEXER_STATE_TR:
return input == LEXER_INPUT_LOWER_U ? LEXER_STATE_TRU : LEXER_STATE_ERROR;
case LEXER_STATE_TRU:
return input == LEXER_INPUT_LOWER_E ? LEXER_STATE_TRUE : LEXER_STATE_ERROR;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_false(lexer_input_t input, lexer_state_t start_state) {
switch (start_state) {
case LEXER_STATE_F:
return input == LEXER_INPUT_LOWER_A ? LEXER_STATE_FA : LEXER_STATE_ERROR;
case LEXER_STATE_FA:
return input == LEXER_INPUT_LOWER_L ? LEXER_STATE_FAL : LEXER_STATE_ERROR;
case LEXER_STATE_FAL:
return input == LEXER_INPUT_LOWER_S ? LEXER_STATE_FALS : LEXER_STATE_ERROR;
case LEXER_STATE_FALS:
return input == LEXER_INPUT_LOWER_E ? LEXER_STATE_FALSE : LEXER_STATE_ERROR;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_null(lexer_input_t input, lexer_state_t start_state) {
switch (start_state) {
case LEXER_STATE_N:
return input == LEXER_INPUT_LOWER_U ? LEXER_STATE_NU : LEXER_STATE_ERROR;
case LEXER_STATE_NU:
return input == LEXER_INPUT_LOWER_L ? LEXER_STATE_NUL : LEXER_STATE_ERROR;
case LEXER_STATE_NUL:
return input == LEXER_INPUT_LOWER_L ? LEXER_STATE_NULL : LEXER_STATE_ERROR;
default:
return LEXER_STATE_ERROR;
}
}
lexer_state_t handle_keyword_end(lexer_input_t input) {
switch (input) {
case LEXER_INPUT_NEWLINE:
case LEXER_INPUT_WHITE_SPACE:
return LEXER_STATE_KEYWORD_END;
case LEXER_INPUT_CLOSE_BRACE:
return LEXER_STATE_OBJECT_END;
case LEXER_INPUT_CLOSE_BRACKET:
return LEXER_STATE_ARRAY_END;
case LEXER_INPUT_COMMA:
return LEXER_STATE_VALUE_END;
default:
return LEXER_STATE_ERROR;
}
}

View File

@ -4,9 +4,6 @@
#include "aliases.h" #include "aliases.h"
#include <stdbool.h> #include <stdbool.h>
#define VALID_JSON true
#define INVALID_JSON false
typedef const char *str_view_t; typedef const char *str_view_t;
typedef enum { typedef enum {

View File

@ -0,0 +1,96 @@
#ifndef LEXER_DATA_H
#define LEXER_DATA_H
typedef enum {
// GENERAL STATES
LEXER_STATE_ERROR,
LEXER_STATE_START,
LEXER_STATE_VALUE,
LEXER_STATE_VALUE_END,
// COLLECTION STATES
LEXER_STATE_OBJECT_START,
LEXER_STATE_OBJECT,
LEXER_STATE_OBJECT_END,
LEXER_STATE_ARRAY_START,
LEXER_STATE_ARRAY,
LEXER_STATE_ARRAY_END,
LEXER_STATE_LAST_COLLECTION,
// OBJECT STATES
LEXER_STATE_KEY,
LEXER_STATE_KEY_END,
// NUMBER STATES
LEXER_STATE_DECIMAL,
LEXER_STATE_NUMBER,
LEXER_STATE_FRACTION,
LEXER_STATE_EXPONENT,
LEXER_STATE_EXP_SIGN,
LEXER_STATE_POWER,
LEXER_STATE_NUMBER_END,
// STRING STATES
LEXER_STATE_STRING,
LEXER_STATE_STRING_END,
LEXER_STATE_ESCAPE_SEQUENCE,
LEXER_STATE_UNICODE_HEX1,
LEXER_STATE_UNICODE_HEX2,
LEXER_STATE_UNICODE_HEX3,
LEXER_STATE_UNICODE_HEX4,
// KEYWORD STATES
LEXER_STATE_T,
LEXER_STATE_TR,
LEXER_STATE_TRU,
LEXER_STATE_TRUE,
LEXER_STATE_F,
LEXER_STATE_FA,
LEXER_STATE_FAL,
LEXER_STATE_FALS,
LEXER_STATE_FALSE,
LEXER_STATE_N,
LEXER_STATE_NU,
LEXER_STATE_NUL,
LEXER_STATE_NULL,
LEXER_STATE_KEYWORD_END,
COUNT_LEXER_STATES,
} lexer_state_t;
typedef enum {
LEXER_INPUT_NEWLINE,
LEXER_INPUT_WHITE_SPACE,
LEXER_INPUT_OPEN_BRACE,
LEXER_INPUT_CLOSE_BRACE,
LEXER_INPUT_OPEN_BRACKET,
LEXER_INPUT_CLOSE_BRACKET,
LEXER_INPUT_COMMA,
LEXER_INPUT_COLON,
LEXER_INPUT_DOUBLE_QUOTE,
LEXER_INPUT_BACK_SLASH,
LEXER_INPUT_FORWARD_SLASH,
LEXER_INPUT_LOWER_A,
LEXER_INPUT_LOWER_B,
LEXER_INPUT_LOWER_C,
LEXER_INPUT_LOWER_D,
LEXER_INPUT_LOWER_E,
LEXER_INPUT_LOWER_F,
LEXER_INPUT_LOWER_L,
LEXER_INPUT_LOWER_N,
LEXER_INPUT_LOWER_R,
LEXER_INPUT_LOWER_S,
LEXER_INPUT_LOWER_T,
LEXER_INPUT_LOWER_U,
LEXER_INPUT_UPPER_A,
LEXER_INPUT_UPPER_B,
LEXER_INPUT_UPPER_C,
LEXER_INPUT_UPPER_D,
LEXER_INPUT_UPPER_E,
LEXER_INPUT_UPPER_F,
LEXER_INPUT_MINUS,
LEXER_INPUT_PLUS,
LEXER_INPUT_DECIMAL,
LEXER_INPUT_ZERO,
LEXER_INPUT_NON_ZERO,
LEXER_INPUT_OTHER,
COUNT_LEXER_INPUTS,
} lexer_input_t;
#endif // !LEXER_DATA_H

View File

@ -0,0 +1,42 @@
// NEWLINE | WHITE_SPACE | OPEN_BRACE | CLOSE_BRACE | OPEN_BRACKET | CLOSE_BRACKET | COMMA | COLON | DOUBLE_QUOTE | BACK_SLASH | FORWARD_SLASH | LOWER_A | LOWER_B | LOWER_C | LOWER_D | LOWER_E | LOWER_F | LOWER_L | LOWER_N | LOWER_R | LOWER_S | LOWER_T | LOWER_U | UPPER_A | UPPER_B | UPPER_C | UPPER_D | UPPER_E | UPPER_F | MINUS | PLUS | DECIMAL | ZERO | NON_ZERO | OTHER |
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_ERROR
{ LEXER_STATE_START, LEXER_STATE_START, LEXER_STATE_OBJECT_START, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_START, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_START
{ LEXER_STATE_VALUE, LEXER_STATE_VALUE, LEXER_STATE_OBJECT_START, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_START, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_F, LEXER_STATE_ERROR, LEXER_STATE_N, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_T, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_NUMBER, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_DECIMAL, LEXER_STATE_NUMBER, LEXER_STATE_ERROR, }, // LEXER_STATE_VALUE
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_VALUE_END
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_OBJECT_START
{ LEXER_STATE_OBJECT, LEXER_STATE_OBJECT, LEXER_STATE_ERROR, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_KEY, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_OBJECT
{ LEXER_STATE_OBJECT_END, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_END, LEXER_STATE_VALUE_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_OBJECT_END
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_ARRAY_START
{ LEXER_STATE_ARRAY, LEXER_STATE_ARRAY, LEXER_STATE_OBJECT_START, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_START, LEXER_STATE_ARRAY_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_F, LEXER_STATE_ERROR, LEXER_STATE_N, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_T, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_NUMBER, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_DECIMAL, LEXER_STATE_NUMBER, LEXER_STATE_ERROR, }, // LEXER_STATE_ARRAY
{ LEXER_STATE_ARRAY_END, LEXER_STATE_ARRAY_END, LEXER_STATE_ERROR, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_END, LEXER_STATE_VALUE_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_ARRAY_END
{ LEXER_STATE_LAST_COLLECTION, LEXER_STATE_LAST_COLLECTION, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_LAST_COLLECTION
{ LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, }, // LEXER_STATE_KEY
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_KEY_END
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_FRACTION, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_DECIMAL
{ LEXER_STATE_NUMBER_END, LEXER_STATE_NUMBER_END, LEXER_STATE_ERROR, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_END, LEXER_STATE_VALUE_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_FRACTION, LEXER_STATE_NUMBER, LEXER_STATE_NUMBER, LEXER_STATE_ERROR, }, // LEXER_STATE_NUMBER
{ LEXER_STATE_NUMBER_END, LEXER_STATE_NUMBER_END, LEXER_STATE_ERROR, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_END, LEXER_STATE_VALUE_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_EXPONENT, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_EXPONENT, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_FRACTION, LEXER_STATE_FRACTION, LEXER_STATE_ERROR, }, // LEXER_STATE_FRACTION
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_EXP_SIGN, LEXER_STATE_EXP_SIGN, LEXER_STATE_ERROR, LEXER_STATE_POWER, LEXER_STATE_POWER, LEXER_STATE_ERROR, }, // LEXER_STATE_EXPONENT
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_POWER, LEXER_STATE_POWER, LEXER_STATE_ERROR, }, // LEXER_STATE_EXP_SIGN
{ LEXER_STATE_NUMBER_END, LEXER_STATE_NUMBER_END, LEXER_STATE_ERROR, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_END, LEXER_STATE_VALUE_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_POWER, LEXER_STATE_POWER, LEXER_STATE_ERROR, }, // LEXER_STATE_POWER
{ LEXER_STATE_NUMBER_END, LEXER_STATE_NUMBER_END, LEXER_STATE_ERROR, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_END, LEXER_STATE_VALUE_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_NUMBER_END
{ LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING_END, LEXER_STATE_ESCAPE_SEQUENCE, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, }, // LEXER_STATE_STRING
{ LEXER_STATE_STRING_END, LEXER_STATE_STRING_END, LEXER_STATE_ERROR, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_END, LEXER_STATE_VALUE_END, LEXER_STATE_KEY_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_STRING_END
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_UNICODE_HEX1, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_ESCAPE_SEQUENCE
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_UNICODE_HEX2, LEXER_STATE_ERROR, }, // LEXER_STATE_UNICODE_HEX1
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_UNICODE_HEX3, LEXER_STATE_ERROR, }, // LEXER_STATE_UNICODE_HEX2
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_UNICODE_HEX4, LEXER_STATE_ERROR, }, // LEXER_STATE_UNICODE_HEX3
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_STRING, LEXER_STATE_STRING, LEXER_STATE_ERROR, }, // LEXER_STATE_UNICODE_HEX4
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_TR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_T
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_TRU, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_TR
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_TRUE, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_TRU
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_TRUE
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_FA, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_F
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_FAL, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_FA
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_FALS, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_FAL
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_FALSE, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_FALS
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_FALSE
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_NU, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_N
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_NUL, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_NU
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_NULL, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_NUL
{ LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_NULL
{ LEXER_STATE_KEYWORD_END, LEXER_STATE_KEYWORD_END, LEXER_STATE_ERROR, LEXER_STATE_OBJECT_END, LEXER_STATE_ERROR, LEXER_STATE_ARRAY_END, LEXER_STATE_VALUE_END, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, LEXER_STATE_ERROR, }, // LEXER_STATE_KEYWORD_END

41
notes
View File

@ -1,41 +0,0 @@
TOKENS
Symbols
Array notation
[
]
Object notation
{
}
:
Separator
,
String
"
\ (for escape sequences)
Numerical
-
.
eE (exponents only)
+ (exponents only)
Keywords
true
false
null
Key
strings only
Implement stack data structure for pushing and pulling states when necessary
LEXER STATES
START
ERROR
END
VALUE
OBJECT_KEY
---------
OBJECT |
ARRAY |
PRIMITIVES |------> Can be values
STRING--------|------> Only one that can be an object key
NUMBER |
---------

View File

@ -1,5 +0,0 @@
#!/bin/bash
for JSON in $(find test_files -iregex .*json); do
./main $JSON
done

71
run_tests.py Executable file
View File

@ -0,0 +1,71 @@
#!/bin/env python3
import json
import subprocess
from pathlib import Path
class TermFormat:
OKGREEN = "\033[92m"
FAIL = "\033[91m"
ENDC = "\033[0m"
BOLD = "\033[1m"
def print_header(header, width, padding):
print(
f"{TermFormat.BOLD}{'=' * (int(width / 3) + padding)}{header}{'=' * (int(width / 3) + padding)}{TermFormat.ENDC}"
)
test_dir = Path(__file__).parent / "test_files"
hj_exec = Path(__file__).parent / "main"
valid_files = [
json_file
for json_file in test_dir.iterdir()
if json_file.is_file()
and "json" in json_file.suffix
and "invalid" not in json_file.stem
]
name_width = 0
for vf in valid_files:
if len(str(vf)) > name_width:
name_width = len(str(vf))
print_header("helloJSON TEST SUITE", name_width, 9)
print()
print_header("VALID FILES", name_width, 13)
for vf in valid_files:
with open(vf, "r") as infile:
try:
original = json.load(infile)
except json.JSONDecodeError as e:
print(
f"\n{TermFormat.BOLD}{TermFormat.FAIL}ERROR:{TermFormat.ENDC} Failed to decode {str(vf)}\n{e.msg}"
)
continue
cmd = [hj_exec, vf]
proc = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.STDOUT)
proc.wait()
stdout, _ = proc.communicate()
try:
parsed = json.loads(stdout)
except:
parsed = None
pass
match = original == parsed
print(
f"\n{str(vf):{name_width + 3}} {TermFormat.BOLD}{TermFormat.OKGREEN if match else TermFormat.FAIL}{'PASSED' if match else 'FAILED'}{TermFormat.ENDC}"
)

File diff suppressed because it is too large Load Diff

View File

@ -5,7 +5,7 @@
"position": [ "position": [
25.1212, 25.1212,
55.1535 55.1535
], ]
}, },
{ {
"name": "Shangri-La Hotel", "name": "Shangri-La Hotel",