#line 1 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" #include #include #if defined(_WIN32) #include #endif #ifdef HAVE_RUBY_RE_H #include #else #include #endif #ifdef HAVE_RUBY_ENCODING_H #include #define ENCODED_STR_NEW(ptr, len) \ rb_enc_str_new(ptr, len, rb_utf8_encoding()) #else #define ENCODED_STR_NEW(ptr, len) \ rb_str_new(ptr, len) #endif #define LF_FLAG 0 #define CRLF_FLAG 1 #define LF "\n" #define CRLF "\r\n" #ifndef RSTRING_PTR #define RSTRING_PTR(s) (RSTRING(s)->ptr) #endif #ifndef RSTRING_LEN #define RSTRING_LEN(s) (RSTRING(s)->len) #endif #define DATA_GET(FROM, TYPE, NAME) \ Data_Get_Struct(FROM, TYPE, NAME); \ if (NAME == NULL) { \ rb_raise(rb_eArgError, "NULL found for " # NAME " when it shouldn't be."); \ } typedef struct lexer_state { int content_len; int line_number; int current_line; int start_col; int eol; size_t mark; size_t keyword_start; size_t keyword_end; size_t next_keyword_start; size_t content_start; size_t content_end; size_t query_start; size_t last_newline; size_t final_newline; } lexer_state; static VALUE mGherkin; static VALUE mCLexer; static VALUE cI18nLexer; static VALUE rb_eGherkinLexingError; #define LEN(AT, P) (P - data - lexer->AT) #define MARK(M, P) (lexer->M = (P) - data) #define PTR_TO(P) (data + lexer->P) #define STORE_KW_END_CON(EVENT) \ store_kw_con(listener, # EVENT, \ PTR_TO(keyword_start), LEN(keyword_start, PTR_TO(keyword_end - 1)), \ PTR_TO(content_start), LEN(content_start, PTR_TO(content_end)), \ lexer->current_line, lexer->eol); \ if (lexer->content_end != 0) { \ p = PTR_TO(content_end - 1); \ } \ lexer->content_end = 0 #define STORE_ATTR(ATTR) \ store_attr(listener, # ATTR, \ PTR_TO(content_start), LEN(content_start, p), \ lexer->line_number) #line 235 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" /** Data **/ #line 92 "ext/gherkin_lexer_enlol/gherkin_lexer_enlol.c" static const char _lexer_actions[] = { 0, 1, 0, 1, 1, 1, 2, 1, 3, 1, 4, 1, 5, 1, 6, 1, 7, 1, 9, 1, 10, 1, 11, 1, 14, 1, 15, 1, 16, 1, 17, 1, 18, 1, 19, 1, 20, 1, 21, 2, 1, 16, 2, 12, 13, 2, 15, 0, 2, 15, 2, 2, 15, 14, 2, 15, 17, 2, 16, 4, 2, 16, 5, 2, 16, 6, 2, 16, 7, 2, 16, 8, 2, 16, 14, 2, 18, 19, 2, 20, 0, 2, 20, 2, 2, 20, 14, 2, 20, 17, 3, 3, 12, 13, 3, 9, 12, 13, 3, 10, 12, 13, 3, 11, 12, 13, 3, 12, 13, 16, 3, 15, 12, 13, 4, 1, 12, 13, 16, 4, 15, 0, 12, 13 }; static const short _lexer_key_offsets[] = { 0, 0, 18, 19, 20, 24, 29, 34, 39, 44, 48, 52, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 73, 78, 85, 90, 91, 93, 94, 95, 96, 110, 112, 114, 116, 118, 120, 122, 124, 126, 128, 130, 132, 134, 136, 138, 140, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 188, 189, 190, 191, 192, 193, 194, 195, 196, 210, 212, 214, 216, 218, 220, 222, 224, 226, 228, 230, 232, 234, 236, 238, 240, 242, 244, 246, 248, 250, 252, 254, 256, 258, 260, 262, 264, 266, 268, 270, 272, 274, 276, 277, 278, 292, 294, 296, 298, 300, 302, 304, 306, 308, 310, 312, 314, 316, 318, 320, 322, 324, 326, 328, 330, 332, 334, 336, 338, 340, 342, 344, 346, 348, 350, 352, 354, 356, 359, 361, 363, 365, 367, 369, 371, 372, 373, 374, 375, 376, 377, 378, 379, 388, 390, 392, 394, 396, 398, 400, 402, 404, 406, 408, 410, 412, 414, 416, 418, 420, 422, 424, 426, 428, 430, 433, 435, 437, 439, 441, 443, 447, 452, 453, 458, 476, 478, 480, 482, 484, 486, 488, 490, 492, 494, 496, 498, 500, 502, 504, 506, 508, 510, 513, 515, 517, 519, 521, 523, 525, 526 }; static const char _lexer_trans_keys[] = { 10, 32, 34, 35, 37, 42, 64, 65, 66, 68, 69, 73, 77, 79, 87, 124, 9, 13, 34, 34, 10, 32, 9, 13, 10, 32, 34, 9, 13, 10, 32, 34, 9, 13, 10, 32, 34, 9, 13, 10, 32, 34, 9, 13, 10, 32, 9, 13, 10, 32, 9, 13, 10, 13, 10, 95, 70, 69, 65, 84, 85, 82, 69, 95, 69, 78, 68, 95, 37, 32, 10, 10, 13, 13, 32, 64, 9, 10, 9, 10, 13, 32, 64, 11, 12, 10, 32, 64, 9, 13, 78, 52, 85, 58, 10, 10, 10, 32, 35, 37, 42, 64, 65, 66, 68, 73, 77, 87, 9, 13, 10, 95, 10, 70, 10, 69, 10, 65, 10, 84, 10, 85, 10, 82, 10, 69, 10, 95, 10, 69, 10, 78, 10, 68, 10, 95, 10, 37, 10, 32, 10, 32, 34, 35, 37, 42, 64, 65, 66, 68, 69, 73, 77, 79, 87, 124, 9, 13, 69, 88, 65, 77, 80, 76, 90, 58, 10, 10, 10, 32, 124, 9, 13, 32, 67, 65, 78, 32, 72, 65, 90, 73, 83, 72, 85, 78, 32, 58, 83, 82, 83, 76, 89, 58, 10, 10, 10, 32, 35, 37, 42, 64, 65, 66, 68, 73, 77, 87, 9, 13, 10, 95, 10, 70, 10, 69, 10, 65, 10, 84, 10, 85, 10, 82, 10, 69, 10, 95, 10, 69, 10, 78, 10, 68, 10, 95, 10, 37, 10, 32, 10, 78, 10, 85, 10, 84, 10, 69, 10, 32, 10, 67, 10, 65, 10, 78, 10, 32, 10, 72, 10, 65, 10, 90, 10, 73, 10, 83, 10, 72, 10, 85, 10, 78, 10, 58, 10, 10, 10, 32, 35, 37, 42, 64, 65, 66, 68, 73, 77, 87, 9, 13, 10, 95, 10, 70, 10, 69, 10, 65, 10, 84, 10, 85, 10, 82, 10, 69, 10, 95, 10, 69, 10, 78, 10, 68, 10, 95, 10, 37, 10, 32, 10, 78, 10, 85, 10, 84, 10, 69, 10, 32, 10, 67, 10, 65, 10, 78, 10, 32, 10, 72, 10, 65, 10, 90, 10, 73, 10, 83, 10, 72, 10, 85, 10, 78, 10, 32, 58, 10, 83, 10, 82, 10, 83, 10, 76, 10, 89, 10, 58, 72, 32, 72, 65, 73, 58, 10, 10, 10, 32, 35, 37, 64, 66, 77, 9, 13, 10, 95, 10, 70, 10, 69, 10, 65, 10, 84, 10, 85, 10, 82, 10, 69, 10, 95, 10, 69, 10, 78, 10, 68, 10, 95, 10, 37, 10, 52, 10, 58, 10, 73, 10, 83, 10, 72, 10, 85, 10, 78, 10, 32, 58, 10, 83, 10, 82, 10, 83, 10, 76, 10, 89, 32, 124, 9, 13, 10, 32, 124, 9, 13, 124, 10, 32, 124, 9, 13, 10, 32, 34, 35, 37, 42, 64, 65, 66, 68, 69, 73, 77, 79, 87, 124, 9, 13, 10, 78, 10, 85, 10, 84, 10, 69, 10, 32, 10, 67, 10, 65, 10, 78, 10, 32, 10, 72, 10, 65, 10, 90, 10, 73, 10, 83, 10, 72, 10, 85, 10, 78, 10, 32, 58, 10, 83, 10, 82, 10, 83, 10, 76, 10, 89, 10, 58, 84, 0 }; static const char _lexer_single_lengths[] = { 0, 16, 1, 1, 2, 3, 3, 3, 3, 2, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 3, 5, 3, 1, 2, 1, 1, 1, 12, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 16, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 3, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 1, 1, 1, 1, 1, 1, 1, 1, 12, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 1, 1, 12, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 2, 2, 2, 2, 2, 2, 1, 1, 1, 1, 1, 1, 1, 1, 7, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 2, 2, 2, 2, 2, 2, 3, 1, 3, 16, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 3, 2, 2, 2, 2, 2, 2, 1, 0 }; static const char _lexer_range_lengths[] = { 0, 1, 0, 0, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 1, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0 }; static const short _lexer_index_offsets[] = { 0, 0, 18, 20, 22, 26, 31, 36, 41, 46, 50, 54, 57, 59, 61, 63, 65, 67, 69, 71, 73, 75, 77, 79, 81, 83, 85, 87, 89, 91, 94, 99, 106, 111, 113, 116, 118, 120, 122, 136, 139, 142, 145, 148, 151, 154, 157, 160, 163, 166, 169, 172, 175, 178, 181, 199, 201, 203, 205, 207, 209, 211, 213, 215, 217, 219, 224, 226, 228, 230, 232, 234, 236, 238, 240, 242, 244, 246, 248, 250, 253, 255, 257, 259, 261, 263, 265, 267, 269, 283, 286, 289, 292, 295, 298, 301, 304, 307, 310, 313, 316, 319, 322, 325, 328, 331, 334, 337, 340, 343, 346, 349, 352, 355, 358, 361, 364, 367, 370, 373, 376, 379, 382, 384, 386, 400, 403, 406, 409, 412, 415, 418, 421, 424, 427, 430, 433, 436, 439, 442, 445, 448, 451, 454, 457, 460, 463, 466, 469, 472, 475, 478, 481, 484, 487, 490, 493, 496, 500, 503, 506, 509, 512, 515, 518, 520, 522, 524, 526, 528, 530, 532, 534, 543, 546, 549, 552, 555, 558, 561, 564, 567, 570, 573, 576, 579, 582, 585, 588, 591, 594, 597, 600, 603, 606, 610, 613, 616, 619, 622, 625, 629, 634, 636, 641, 659, 662, 665, 668, 671, 674, 677, 680, 683, 686, 689, 692, 695, 698, 701, 704, 707, 710, 714, 717, 720, 723, 726, 729, 732, 734 }; static const unsigned char _lexer_trans_targs[] = { 1, 1, 2, 11, 13, 27, 30, 33, 34, 55, 56, 66, 74, 164, 55, 200, 1, 0, 3, 0, 4, 0, 5, 4, 4, 0, 6, 6, 7, 6, 6, 6, 6, 7, 6, 6, 6, 6, 8, 6, 6, 6, 6, 9, 6, 6, 1, 10, 10, 0, 1, 10, 10, 0, 1, 12, 11, 1, 0, 14, 0, 15, 0, 16, 0, 17, 0, 18, 0, 19, 0, 20, 0, 21, 0, 22, 0, 23, 0, 24, 0, 25, 0, 26, 0, 230, 0, 28, 0, 0, 29, 1, 12, 29, 0, 0, 0, 0, 31, 32, 1, 32, 32, 30, 31, 31, 1, 32, 30, 32, 0, 27, 0, 35, 229, 0, 36, 0, 38, 37, 38, 37, 38, 38, 1, 39, 53, 1, 205, 206, 208, 209, 217, 208, 38, 37, 38, 40, 37, 38, 41, 37, 38, 42, 37, 38, 43, 37, 38, 44, 37, 38, 45, 37, 38, 46, 37, 38, 47, 37, 38, 48, 37, 38, 49, 37, 38, 50, 37, 38, 51, 37, 38, 52, 37, 38, 1, 37, 38, 54, 37, 1, 1, 2, 11, 13, 27, 30, 33, 34, 55, 56, 66, 74, 164, 55, 200, 1, 0, 33, 0, 57, 0, 58, 0, 59, 0, 60, 0, 61, 0, 62, 0, 63, 0, 65, 64, 65, 64, 65, 65, 1, 65, 64, 67, 0, 68, 0, 69, 0, 70, 0, 71, 0, 72, 0, 73, 0, 27, 0, 75, 0, 76, 0, 77, 0, 78, 0, 79, 0, 80, 122, 0, 81, 0, 82, 0, 83, 0, 84, 0, 85, 0, 86, 0, 88, 87, 88, 87, 88, 88, 1, 89, 103, 1, 104, 105, 107, 108, 116, 107, 88, 87, 88, 90, 87, 88, 91, 87, 88, 92, 87, 88, 93, 87, 88, 94, 87, 88, 95, 87, 88, 96, 87, 88, 97, 87, 88, 98, 87, 88, 99, 87, 88, 100, 87, 88, 101, 87, 88, 102, 87, 88, 1, 87, 88, 54, 87, 88, 103, 87, 88, 106, 87, 88, 103, 87, 88, 104, 87, 88, 109, 87, 88, 110, 87, 88, 111, 87, 88, 112, 87, 88, 113, 87, 88, 114, 87, 88, 115, 87, 88, 103, 87, 88, 117, 87, 88, 118, 87, 88, 119, 87, 88, 120, 87, 88, 121, 87, 88, 54, 87, 124, 123, 124, 123, 124, 124, 1, 125, 139, 1, 140, 141, 143, 144, 152, 143, 124, 123, 124, 126, 123, 124, 127, 123, 124, 128, 123, 124, 129, 123, 124, 130, 123, 124, 131, 123, 124, 132, 123, 124, 133, 123, 124, 134, 123, 124, 135, 123, 124, 136, 123, 124, 137, 123, 124, 138, 123, 124, 1, 123, 124, 54, 123, 124, 139, 123, 124, 142, 123, 124, 139, 123, 124, 140, 123, 124, 145, 123, 124, 146, 123, 124, 147, 123, 124, 148, 123, 124, 149, 123, 124, 150, 123, 124, 151, 123, 124, 139, 123, 124, 153, 123, 124, 154, 123, 124, 155, 123, 124, 156, 123, 124, 157, 123, 124, 158, 54, 123, 124, 159, 123, 124, 160, 123, 124, 161, 123, 124, 162, 123, 124, 163, 123, 124, 54, 123, 165, 0, 166, 0, 167, 0, 168, 0, 169, 0, 170, 0, 172, 171, 172, 171, 172, 172, 1, 173, 1, 187, 189, 172, 171, 172, 174, 171, 172, 175, 171, 172, 176, 171, 172, 177, 171, 172, 178, 171, 172, 179, 171, 172, 180, 171, 172, 181, 171, 172, 182, 171, 172, 183, 171, 172, 184, 171, 172, 185, 171, 172, 186, 171, 172, 1, 171, 172, 188, 171, 172, 54, 171, 172, 190, 171, 172, 191, 171, 172, 192, 171, 172, 193, 171, 172, 194, 171, 172, 195, 54, 171, 172, 196, 171, 172, 197, 171, 172, 198, 171, 172, 199, 171, 172, 188, 171, 200, 201, 200, 0, 204, 203, 201, 203, 202, 201, 202, 204, 203, 201, 203, 202, 204, 204, 2, 11, 13, 27, 30, 33, 34, 55, 56, 66, 74, 164, 55, 200, 204, 0, 38, 53, 37, 38, 207, 37, 38, 53, 37, 38, 205, 37, 38, 210, 37, 38, 211, 37, 38, 212, 37, 38, 213, 37, 38, 214, 37, 38, 215, 37, 38, 216, 37, 38, 53, 37, 38, 218, 37, 38, 219, 37, 38, 220, 37, 38, 221, 37, 38, 222, 37, 38, 223, 54, 37, 38, 224, 37, 38, 225, 37, 38, 226, 37, 38, 227, 37, 38, 228, 37, 38, 54, 37, 27, 0, 0, 0 }; static const char _lexer_trans_actions[] = { 42, 0, 5, 1, 0, 23, 0, 23, 23, 23, 23, 23, 23, 23, 23, 29, 0, 37, 0, 37, 0, 37, 42, 0, 0, 37, 114, 39, 39, 39, 3, 106, 27, 27, 27, 0, 106, 27, 27, 27, 0, 106, 27, 0, 27, 0, 90, 7, 7, 37, 42, 0, 0, 37, 98, 19, 0, 42, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 37, 45, 94, 17, 0, 37, 37, 37, 37, 1, 21, 102, 21, 21, 21, 21, 0, 42, 0, 0, 0, 37, 0, 37, 0, 0, 37, 0, 37, 119, 45, 42, 0, 42, 0, 60, 27, 72, 60, 72, 72, 72, 72, 72, 72, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 11, 0, 42, 11, 0, 110, 25, 48, 45, 25, 51, 25, 51, 51, 51, 51, 51, 51, 51, 51, 54, 25, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 119, 45, 42, 0, 42, 0, 69, 0, 0, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 119, 45, 42, 0, 42, 0, 66, 27, 72, 66, 72, 72, 72, 72, 72, 72, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 15, 0, 42, 15, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 15, 0, 119, 45, 42, 0, 42, 0, 63, 27, 72, 63, 72, 72, 72, 72, 72, 72, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 13, 0, 42, 13, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 13, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 13, 0, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 0, 37, 119, 45, 42, 0, 42, 0, 57, 27, 57, 72, 72, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 9, 0, 42, 0, 0, 42, 9, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 9, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 0, 0, 0, 37, 42, 31, 75, 31, 31, 33, 0, 42, 0, 33, 0, 0, 42, 0, 81, 78, 35, 84, 35, 84, 84, 84, 84, 84, 84, 84, 84, 87, 0, 37, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 11, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 0, 0, 42, 11, 0, 0, 37, 0, 0 }; static const char _lexer_eof_actions[] = { 0, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37, 37 }; static const int lexer_start = 1; static const int lexer_first_final = 230; static const int lexer_error = 0; static const int lexer_en_main = 1; #line 239 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" static VALUE strip_i(VALUE str, VALUE ary) { rb_funcall(str, rb_intern("strip!"), 0); rb_ary_push(ary, str); return Qnil; } static VALUE multiline_strip(VALUE text, int eol) { VALUE map = rb_ary_new(); VALUE split = rb_str_split(text, "\n"); rb_iterate(rb_each, split, strip_i, map); return rb_ary_join(split, rb_str_new2( \ eol == CRLF_FLAG ? CRLF : LF )); } static void store_kw_con(VALUE listener, const char * event_name, const char * keyword_at, size_t keyword_length, const char * at, size_t length, int current_line, int eol) { VALUE con = Qnil, kw = Qnil; kw = ENCODED_STR_NEW(keyword_at, keyword_length); con = ENCODED_STR_NEW(at, length); con = multiline_strip(con, eol); rb_funcall(con, rb_intern("strip!"), 0); rb_funcall(listener, rb_intern(event_name), 3, kw, con, INT2FIX(current_line)); } static void store_attr(VALUE listener, const char * attr_type, const char * at, size_t length, int line) { VALUE val = ENCODED_STR_NEW(at, length); rb_funcall(listener, rb_intern(attr_type), 2, val, INT2FIX(line)); } static void store_pystring_content(VALUE listener, int start_col, const char *at, size_t length, int current_line) { VALUE con = ENCODED_STR_NEW(at, length); // Gherkin will crash gracefully if the string representation of start_col pushes the pattern past 32 characters char pat[32]; snprintf(pat, 32, "^ {0,%d}", start_col); VALUE re = rb_reg_regcomp(rb_str_new2(pat)); VALUE re2 = rb_reg_regcomp(rb_str_new2("\r\\Z")); rb_funcall(con, rb_intern("gsub!"), 2, re, rb_str_new2("")); rb_funcall(con, rb_intern("sub!"), 2, re2, rb_str_new2("")); rb_funcall(listener, rb_intern("py_string"), 2, con, INT2FIX(current_line)); } static void raise_lexer_error(const char * at, int line) { rb_raise(rb_eGherkinLexingError, "Lexing error on line %d: '%s'.", line, at); } static int count_char(char char_to_count, char *str) { int count = 0; int i = 0; while(str[i] != '\0') { if(str[i] == char_to_count) { count++; } i++; } return count; } static void lexer_init(lexer_state *lexer) { lexer->content_start = 0; lexer->content_end = 0; lexer->content_len = 0; lexer->mark = 0; lexer->keyword_start = 0; lexer->keyword_end = 0; lexer->next_keyword_start = 0; lexer->line_number = 1; lexer->last_newline = 0; lexer->final_newline = 0; lexer->start_col = 0; lexer->eol = LF_FLAG; } static VALUE CLexer_alloc(VALUE klass) { VALUE obj; lexer_state *lxr = ALLOC(lexer_state); lexer_init(lxr); obj = Data_Wrap_Struct(klass, NULL, -1, lxr); return obj; } static VALUE CLexer_init(VALUE self, VALUE listener) { rb_iv_set(self, "@listener", listener); lexer_state *lxr = NULL; DATA_GET(self, lexer_state, lxr); lexer_init(lxr); return self; } static VALUE CLexer_scan(VALUE self, VALUE input) { lexer_state *lexer = NULL; DATA_GET(self, lexer_state, lexer); VALUE input_copy = rb_str_dup(input); rb_str_append(input_copy, rb_str_new2("\n%_FEATURE_END_%")); char *data = RSTRING_PTR(input_copy); size_t len = RSTRING_LEN(input_copy); if (count_char('\r', data) > (count_char('\n', data) / 2)) { lexer->eol = CRLF_FLAG; } if (len == 0) { rb_raise(rb_eGherkinLexingError, "No content to lex."); } else { const char *p, *pe, *eof; int cs = 0; VALUE listener = rb_iv_get(self, "@listener"); VALUE current_row = Qnil; p = data; pe = data + len; eof = pe; assert(*pe == '\0' && "pointer does not end on NULL"); #line 691 "ext/gherkin_lexer_enlol/gherkin_lexer_enlol.c" { cs = lexer_start; } #line 391 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" #line 698 "ext/gherkin_lexer_enlol/gherkin_lexer_enlol.c" { int _klen; unsigned int _trans; const char *_acts; unsigned int _nacts; const char *_keys; if ( p == pe ) goto _test_eof; if ( cs == 0 ) goto _out; _resume: _keys = _lexer_trans_keys + _lexer_key_offsets[cs]; _trans = _lexer_index_offsets[cs]; _klen = _lexer_single_lengths[cs]; if ( _klen > 0 ) { const char *_lower = _keys; const char *_mid; const char *_upper = _keys + _klen - 1; while (1) { if ( _upper < _lower ) break; _mid = _lower + ((_upper-_lower) >> 1); if ( (*p) < *_mid ) _upper = _mid - 1; else if ( (*p) > *_mid ) _lower = _mid + 1; else { _trans += (_mid - _keys); goto _match; } } _keys += _klen; _trans += _klen; } _klen = _lexer_range_lengths[cs]; if ( _klen > 0 ) { const char *_lower = _keys; const char *_mid; const char *_upper = _keys + (_klen<<1) - 2; while (1) { if ( _upper < _lower ) break; _mid = _lower + (((_upper-_lower) >> 1) & ~1); if ( (*p) < _mid[0] ) _upper = _mid - 2; else if ( (*p) > _mid[1] ) _lower = _mid + 2; else { _trans += ((_mid - _keys)>>1); goto _match; } } _trans += _klen; } _match: cs = _lexer_trans_targs[_trans]; if ( _lexer_trans_actions[_trans] == 0 ) goto _again; _acts = _lexer_actions + _lexer_trans_actions[_trans]; _nacts = (unsigned int) *_acts++; while ( _nacts-- > 0 ) { switch ( *_acts++ ) { case 0: #line 86 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { MARK(content_start, p); lexer->current_line = lexer->line_number; } break; case 1: #line 91 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { MARK(content_start, p); } break; case 2: #line 95 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { lexer->current_line = lexer->line_number; lexer->start_col = p - data - lexer->last_newline; } break; case 3: #line 100 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { int len = LEN(content_start, PTR_TO(final_newline)); if (len < 0) len = 0; store_pystring_content(listener, lexer->start_col, PTR_TO(content_start), len, lexer->current_line); } break; case 4: #line 108 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { STORE_KW_END_CON(feature); } break; case 5: #line 112 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { STORE_KW_END_CON(background); } break; case 6: #line 116 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { STORE_KW_END_CON(scenario); } break; case 7: #line 120 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { STORE_KW_END_CON(scenario_outline); } break; case 8: #line 124 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { STORE_KW_END_CON(examples); } break; case 9: #line 128 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { store_kw_con(listener, "step", PTR_TO(keyword_start), LEN(keyword_start, PTR_TO(keyword_end)), PTR_TO(content_start), LEN(content_start, p), lexer->current_line, lexer->eol); } break; case 10: #line 135 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { STORE_ATTR(comment); lexer->mark = 0; } break; case 11: #line 140 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { STORE_ATTR(tag); lexer->mark = 0; } break; case 12: #line 145 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { lexer->line_number += 1; MARK(final_newline, p); } break; case 13: #line 150 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { MARK(last_newline, p + 1); } break; case 14: #line 154 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { if (lexer->mark == 0) { MARK(mark, p); } } break; case 15: #line 160 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { MARK(keyword_end, p); MARK(keyword_start, PTR_TO(mark)); MARK(content_start, p + 1); lexer->mark = 0; } break; case 16: #line 167 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { MARK(content_end, p); } break; case 17: #line 171 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { p = p - 1; lexer->current_line = lexer->line_number; current_row = rb_ary_new(); } break; case 18: #line 177 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { MARK(content_start, p); } break; case 19: #line 181 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { VALUE con = ENCODED_STR_NEW(PTR_TO(content_start), LEN(content_start, p)); rb_funcall(con, rb_intern("strip!"), 0); rb_ary_push(current_row, con); } break; case 20: #line 188 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { rb_funcall(listener, rb_intern("row"), 2, current_row, INT2FIX(lexer->current_line)); } break; case 21: #line 192 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { if (cs < lexer_first_final) { if (raise_lexer_error != NULL) { size_t count = 0; int newstr_count = 0; size_t len; const char *buff; if (lexer->last_newline != 0) { len = LEN(last_newline, eof); buff = PTR_TO(last_newline); } else { len = strlen(data); buff = data; } char newstr[len]; for (count = 0; count < len; count++) { if(buff[count] == 10) { newstr[newstr_count] = '\0'; // terminate new string at first newline found break; } else { if (buff[count] == '%') { newstr[newstr_count++] = buff[count]; newstr[newstr_count] = buff[count]; } else { newstr[newstr_count] = buff[count]; } } newstr_count++; } int line = lexer->line_number; lexer_init(lexer); // Re-initialize so we can scan again with the same lexer raise_lexer_error(newstr, line); } } else { rb_funcall(listener, rb_intern("eof"), 0); } } break; #line 962 "ext/gherkin_lexer_enlol/gherkin_lexer_enlol.c" } } _again: if ( cs == 0 ) goto _out; if ( ++p != pe ) goto _resume; _test_eof: {} if ( p == eof ) { const char *__acts = _lexer_actions + _lexer_eof_actions[cs]; unsigned int __nacts = (unsigned int) *__acts++; while ( __nacts-- > 0 ) { switch ( *__acts++ ) { case 21: #line 192 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" { if (cs < lexer_first_final) { if (raise_lexer_error != NULL) { size_t count = 0; int newstr_count = 0; size_t len; const char *buff; if (lexer->last_newline != 0) { len = LEN(last_newline, eof); buff = PTR_TO(last_newline); } else { len = strlen(data); buff = data; } char newstr[len]; for (count = 0; count < len; count++) { if(buff[count] == 10) { newstr[newstr_count] = '\0'; // terminate new string at first newline found break; } else { if (buff[count] == '%') { newstr[newstr_count++] = buff[count]; newstr[newstr_count] = buff[count]; } else { newstr[newstr_count] = buff[count]; } } newstr_count++; } int line = lexer->line_number; lexer_init(lexer); // Re-initialize so we can scan again with the same lexer raise_lexer_error(newstr, line); } } else { rb_funcall(listener, rb_intern("eof"), 0); } } break; #line 1021 "ext/gherkin_lexer_enlol/gherkin_lexer_enlol.c" } } } _out: {} } #line 392 "/Users/aslakhellesoy/scm/gherkin/tasks/../ragel/i18n/enlol.c.rl" assert(p <= pe && "data overflow after parsing execute"); assert(lexer->content_start <= len && "content starts after data end"); assert(lexer->mark < len && "mark is after data end"); // Reset lexer by re-initializing the whole thing lexer_init(lexer); if (cs == lexer_error) { rb_raise(rb_eGherkinLexingError, "Invalid format, lexing fails."); } else { return Qtrue; } } } void Init_gherkin_lexer_enlol() { mGherkin = rb_define_module("Gherkin"); rb_eGherkinLexingError = rb_const_get(mGherkin, rb_intern("LexingError")); mCLexer = rb_define_module_under(mGherkin, "CLexer"); cI18nLexer = rb_define_class_under(mCLexer, "Enlol", rb_cObject); rb_define_alloc_func(cI18nLexer, CLexer_alloc); rb_define_method(cI18nLexer, "initialize", CLexer_init, 1); rb_define_method(cI18nLexer, "scan", CLexer_scan, 1); }