// line 1 "ext/hpricot_scan/hpricot_scan.java.rl" import java.io.IOException; import org.jruby.Ruby; import org.jruby.RubyClass; import org.jruby.RubyHash; import org.jruby.RubyModule; import org.jruby.RubyNumeric; import org.jruby.RubyObjectAdapter; import org.jruby.RubyString; import org.jruby.javasupport.JavaEmbedUtils; import org.jruby.runtime.Block; import org.jruby.runtime.CallbackFactory; import org.jruby.runtime.builtin.IRubyObject; import org.jruby.exceptions.RaiseException; import org.jruby.runtime.load.BasicLibraryService; public class HpricotScanService implements BasicLibraryService { public static String NO_WAY_SERIOUSLY="*** This should not happen, please send a bug report with the HTML you're parsing to why@whytheluckystiff.net. So sorry!"; private static RubyObjectAdapter rubyApi; public void ELE(IRubyObject N) { if (te > ts || text) { IRubyObject raw_string = runtime.getNil(); ele_open = false; text = false; if (ts != -1 && N != cdata && N != sym_text && N != procins && N != comment) { raw_string = runtime.newString(new String(buf,ts,te-ts)); } rb_yield_tokens(N, tag[0], attr, raw_string, taint); } } public void SET(IRubyObject[] N, int E) { int mark = 0; if(N == tag) { if(mark_tag == -1 || E == mark_tag) { tag[0] = runtime.newString(""); } else if(E > mark_tag) { tag[0] = runtime.newString(new String(buf,mark_tag, E-mark_tag)); } } else if(N == akey) { if(mark_akey == -1 || E == mark_akey) { akey[0] = runtime.newString(""); } else if(E > mark_akey) { akey[0] = runtime.newString(new String(buf,mark_akey, E-mark_akey)); } } else if(N == aval) { if(mark_aval == -1 || E == mark_aval) { aval[0] = runtime.newString(""); } else if(E > mark_aval) { aval[0] = runtime.newString(new String(buf,mark_aval, E-mark_aval)); } } } public void CAT(IRubyObject[] N, int E) { if(N[0].isNil()) { SET(N,E); } else { int mark = 0; if(N == tag) { mark = mark_tag; } else if(N == akey) { mark = mark_akey; } else if(N == aval) { mark = mark_aval; } ((RubyString)(N[0])).append(runtime.newString(new String(buf, mark, E-mark))); } } public void SLIDE(Object N) { int mark = 0; if(N == tag) { mark = mark_tag; } else if(N == akey) { mark = mark_akey; } else if(N == aval) { mark = mark_aval; } if(mark > ts) { if(N == tag) { mark_tag -= ts; } else if(N == akey) { mark_akey -= ts; } else if(N == aval) { mark_aval -= ts; } } } public void ATTR(IRubyObject K, IRubyObject V) { if(!K.isNil()) { if(attr.isNil()) { attr = RubyHash.newHash(runtime); } ((RubyHash)attr).op_aset(runtime.getCurrentContext(),K,V); // ((RubyHash)attr).aset(K,V); } } public void ATTR(IRubyObject[] K, IRubyObject V) { ATTR(K[0],V); } public void ATTR(IRubyObject K, IRubyObject[] V) { ATTR(K,V[0]); } public void ATTR(IRubyObject[] K, IRubyObject[] V) { ATTR(K[0],V[0]); } public void TEXT_PASS() { if(!text) { if(ele_open) { ele_open = false; if(ts > -1) { mark_tag = ts; } } else { mark_tag = p; } attr = runtime.getNil(); tag[0] = runtime.getNil(); text = true; } } public void EBLK(IRubyObject N, int T) { CAT(tag, p - T + 1); ELE(N); } public void rb_raise(RubyClass error, String message) { throw new RaiseException(runtime, error, message, true); } public IRubyObject rb_str_new2(String s) { return runtime.newString(s); } // line 189 "ext/hpricot_scan/hpricot_scan.java.rl" // line 150 "ext/hpricot_scan/HpricotScanService.java" private static byte[] init__hpricot_scan_actions_0() { return new byte [] { 0, 1, 1, 1, 2, 1, 4, 1, 5, 1, 6, 1, 7, 1, 8, 1, 9, 1, 10, 1, 11, 1, 12, 1, 14, 1, 16, 1, 20, 1, 21, 1, 22, 1, 24, 1, 25, 1, 26, 1, 28, 1, 29, 1, 30, 1, 32, 1, 33, 1, 38, 1, 39, 1, 40, 1, 41, 1, 42, 1, 43, 1, 44, 1, 45, 1, 46, 1, 47, 1, 48, 1, 49, 1, 50, 1, 51, 2, 2, 5, 2, 2, 6, 2, 2, 11, 2, 2, 12, 2, 2, 14, 2, 4, 39, 2, 4, 40, 2, 4, 41, 2, 5, 2, 2, 6, 14, 2, 7, 6, 2, 7, 14, 2, 11, 12, 2, 13, 3, 2, 14, 6, 2, 14, 40, 2, 15, 24, 2, 15, 28, 2, 15, 32, 2, 15, 45, 2, 17, 23, 2, 18, 27, 2, 19, 31, 2, 22, 34, 2, 22, 36, 3, 2, 6, 14, 3, 2, 14, 6, 3, 6, 7, 14, 3, 6, 14, 40, 3, 7, 14, 40, 3, 11, 2, 12, 3, 14, 6, 40, 3, 14, 13, 3, 3, 22, 0, 37, 3, 22, 2, 34, 3, 22, 14, 35, 4, 2, 14, 13, 3, 4, 6, 7, 14, 40, 4, 22, 2, 14, 35, 4, 22, 6, 14, 35, 4, 22, 7, 14, 35, 4, 22, 14, 6, 35, 5, 22, 2, 6, 14, 35, 5, 22, 2, 14, 6, 35, 5, 22, 6, 7, 14, 35 }; } private static final byte _hpricot_scan_actions[] = init__hpricot_scan_actions_0(); private static short[] init__hpricot_scan_key_offsets_0() { return new short [] { 0, 3, 4, 5, 6, 7, 8, 9, 10, 13, 22, 37, 44, 45, 46, 47, 48, 49, 52, 57, 69, 81, 86, 93, 94, 95, 100, 101, 105, 106, 107, 121, 135, 152, 169, 186, 203, 210, 212, 214, 220, 222, 227, 232, 238, 240, 245, 251, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 282, 296, 300, 313, 326, 340, 354, 355, 366, 375, 388, 405, 423, 441, 450, 461, 480, 499, 510, 521, 536, 538, 540, 556, 572, 575, 587, 599, 619, 639, 658, 677, 697, 717, 728, 739, 751, 763, 775, 791, 794, 809, 811, 813, 829, 845, 848, 860, 871, 890, 910, 930, 941, 952, 964, 984, 1004, 1016, 1036, 1057, 1074, 1091, 1095, 1098, 1110, 1122, 1142, 1162, 1182, 1194, 1206, 1226, 1242, 1258, 1270, 1291, 1310, 1313, 1328, 1340, 1355, 1358, 1369, 1371, 1373, 1384, 1391, 1404, 1418, 1432, 1445, 1446, 1447, 1448, 1449, 1450, 1451, 1455, 1460, 1469, 1479, 1484, 1491, 1492, 1493, 1494, 1495, 1496, 1497, 1498, 1499, 1503, 1508, 1512, 1522, 1527, 1533, 1534, 1535, 1536, 1537, 1538, 1539, 1540, 1541, 1542, 1546, 1551, 1553, 1554, 1555, 1560, 1561, 1562, 1564, 1565, 1566, 1567, 1568, 1572, 1582, 1591, 1601, 1602, 1603, 1605, 1614, 1615, 1616, 1617, 1619, 1621, 1624, 1627, 1631, 1633, 1634, 1636, 1637, 1640 }; } private static final short _hpricot_scan_key_offsets[] = init__hpricot_scan_key_offsets_0(); private static char[] init__hpricot_scan_trans_keys_0() { return new char [] { 45, 68, 91, 45, 79, 67, 84, 89, 80, 69, 32, 9, 13, 32, 58, 95, 9, 13, 65, 90, 97, 122, 32, 62, 63, 91, 95, 9, 13, 45, 46, 48, 58, 65, 90, 97, 122, 32, 62, 80, 83, 91, 9, 13, 85, 66, 76, 73, 67, 32, 9, 13, 32, 34, 39, 9, 13, 9, 34, 61, 95, 32, 37, 39, 59, 63, 90, 97, 122, 9, 34, 61, 95, 32, 37, 39, 59, 63, 90, 97, 122, 32, 62, 91, 9, 13, 32, 34, 39, 62, 91, 9, 13, 34, 34, 32, 62, 91, 9, 13, 93, 32, 62, 9, 13, 39, 39, 9, 39, 61, 95, 32, 33, 35, 37, 40, 59, 63, 90, 97, 122, 9, 39, 61, 95, 32, 33, 35, 37, 40, 59, 63, 90, 97, 122, 9, 32, 33, 39, 62, 91, 95, 10, 13, 35, 37, 40, 59, 61, 90, 97, 122, 9, 32, 34, 39, 62, 91, 95, 10, 13, 33, 37, 40, 59, 61, 90, 97, 122, 9, 32, 33, 39, 62, 91, 95, 10, 13, 35, 37, 40, 59, 61, 90, 97, 122, 9, 32, 34, 39, 62, 91, 95, 10, 13, 33, 37, 40, 59, 61, 90, 97, 122, 32, 34, 39, 62, 91, 9, 13, 34, 39, 34, 39, 32, 39, 62, 91, 9, 13, 39, 93, 32, 62, 93, 9, 13, 32, 39, 62, 9, 13, 32, 34, 62, 91, 9, 13, 34, 93, 32, 34, 62, 9, 13, 32, 39, 62, 91, 9, 13, 9, 39, 61, 95, 32, 33, 35, 37, 40, 59, 63, 90, 97, 122, 89, 83, 84, 69, 77, 67, 68, 65, 84, 65, 91, 58, 95, 65, 90, 97, 122, 32, 62, 63, 95, 9, 13, 45, 46, 48, 58, 65, 90, 97, 122, 32, 62, 9, 13, 32, 47, 62, 63, 95, 9, 13, 45, 58, 65, 90, 97, 122, 32, 47, 62, 63, 95, 9, 13, 45, 58, 65, 90, 97, 122, 32, 47, 61, 62, 63, 95, 9, 13, 45, 58, 65, 90, 97, 122, 32, 47, 61, 62, 63, 95, 9, 13, 45, 58, 65, 90, 97, 122, 62, 13, 32, 34, 39, 47, 60, 62, 9, 10, 11, 12, 13, 32, 47, 60, 62, 9, 10, 11, 12, 32, 47, 62, 63, 95, 9, 13, 45, 58, 65, 90, 97, 122, 13, 32, 47, 60, 62, 63, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 47, 60, 61, 62, 63, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 47, 60, 61, 62, 63, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 47, 60, 62, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 63, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 62, 63, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 47, 60, 62, 92, 9, 10, 11, 12, 32, 34, 47, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 34, 92, 34, 92, 32, 34, 47, 61, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 32, 34, 47, 61, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 34, 62, 92, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 47, 60, 61, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 47, 60, 61, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 32, 34, 39, 47, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 34, 39, 92, 32, 39, 47, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 39, 92, 39, 92, 32, 39, 47, 61, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 32, 39, 47, 61, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 39, 62, 92, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 39, 47, 60, 61, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 39, 47, 60, 61, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 61, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 32, 34, 39, 47, 61, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 32, 34, 39, 47, 61, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 34, 39, 62, 92, 34, 39, 92, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 32, 34, 39, 47, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 32, 34, 39, 47, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 13, 32, 34, 39, 47, 60, 61, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 13, 32, 39, 47, 60, 62, 63, 92, 95, 9, 10, 11, 12, 45, 58, 65, 90, 97, 122, 34, 39, 92, 32, 39, 47, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 13, 32, 34, 39, 47, 60, 62, 92, 9, 10, 11, 12, 32, 34, 47, 62, 63, 92, 95, 9, 13, 45, 58, 65, 90, 97, 122, 34, 39, 92, 13, 32, 39, 47, 60, 62, 92, 9, 10, 11, 12, 34, 92, 39, 92, 13, 32, 34, 39, 47, 60, 62, 9, 10, 11, 12, 58, 95, 120, 65, 90, 97, 122, 32, 63, 95, 9, 13, 45, 46, 48, 58, 65, 90, 97, 122, 32, 63, 95, 109, 9, 13, 45, 46, 48, 58, 65, 90, 97, 122, 32, 63, 95, 108, 9, 13, 45, 46, 48, 58, 65, 90, 97, 122, 32, 63, 95, 9, 13, 45, 46, 48, 58, 65, 90, 97, 122, 101, 114, 115, 105, 111, 110, 32, 61, 9, 13, 32, 34, 39, 9, 13, 95, 45, 46, 48, 58, 65, 90, 97, 122, 34, 95, 45, 46, 48, 58, 65, 90, 97, 122, 32, 62, 63, 9, 13, 32, 62, 63, 101, 115, 9, 13, 62, 110, 99, 111, 100, 105, 110, 103, 32, 61, 9, 13, 32, 34, 39, 9, 13, 65, 90, 97, 122, 34, 95, 45, 46, 48, 57, 65, 90, 97, 122, 32, 62, 63, 9, 13, 32, 62, 63, 115, 9, 13, 116, 97, 110, 100, 97, 108, 111, 110, 101, 32, 61, 9, 13, 32, 34, 39, 9, 13, 110, 121, 111, 34, 32, 62, 63, 9, 13, 101, 115, 110, 121, 111, 39, 101, 115, 65, 90, 97, 122, 39, 95, 45, 46, 48, 57, 65, 90, 97, 122, 95, 45, 46, 48, 58, 65, 90, 97, 122, 39, 95, 45, 46, 48, 58, 65, 90, 97, 122, 62, 62, 10, 60, 33, 47, 58, 63, 95, 65, 90, 97, 122, 39, 93, 34, 34, 92, 39, 92, 34, 39, 92, 32, 9, 13, 32, 118, 9, 13, 10, 45, 45, 10, 93, 93, 10, 62, 63, 62, 0 }; } private static final char _hpricot_scan_trans_keys[] = init__hpricot_scan_trans_keys_0(); private static byte[] init__hpricot_scan_single_lengths_0() { return new byte [] { 3, 1, 1, 1, 1, 1, 1, 1, 1, 3, 5, 5, 1, 1, 1, 1, 1, 1, 3, 4, 4, 3, 5, 1, 1, 3, 1, 2, 1, 1, 4, 4, 7, 7, 7, 7, 5, 2, 2, 4, 2, 3, 3, 4, 2, 3, 4, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 4, 2, 5, 5, 6, 6, 1, 7, 5, 5, 7, 8, 8, 5, 7, 9, 9, 7, 7, 7, 2, 2, 8, 8, 3, 8, 8, 10, 10, 9, 9, 10, 10, 7, 7, 8, 8, 8, 8, 3, 7, 2, 2, 8, 8, 3, 8, 7, 9, 10, 10, 7, 7, 8, 10, 10, 8, 10, 11, 9, 9, 4, 3, 8, 8, 10, 10, 10, 8, 8, 10, 8, 8, 8, 11, 9, 3, 7, 8, 7, 3, 7, 2, 2, 7, 3, 3, 4, 4, 3, 1, 1, 1, 1, 1, 1, 2, 3, 1, 2, 3, 5, 1, 1, 1, 1, 1, 1, 1, 1, 2, 3, 0, 2, 3, 4, 1, 1, 1, 1, 1, 1, 1, 1, 1, 2, 3, 2, 1, 1, 3, 1, 1, 2, 1, 1, 1, 1, 0, 2, 1, 2, 1, 1, 2, 5, 1, 1, 1, 2, 2, 3, 1, 2, 2, 1, 2, 1, 3, 1 }; } private static final byte _hpricot_scan_single_lengths[] = init__hpricot_scan_single_lengths_0(); private static byte[] init__hpricot_scan_range_lengths_0() { return new byte [] { 0, 0, 0, 0, 0, 0, 0, 0, 1, 3, 5, 1, 0, 0, 0, 0, 0, 1, 1, 4, 4, 1, 1, 0, 0, 1, 0, 1, 0, 0, 5, 5, 5, 5, 5, 5, 1, 0, 0, 1, 0, 1, 1, 1, 0, 1, 1, 5, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 5, 1, 4, 4, 4, 4, 0, 2, 2, 4, 5, 5, 5, 2, 2, 5, 5, 2, 2, 4, 0, 0, 4, 4, 0, 2, 2, 5, 5, 5, 5, 5, 5, 2, 2, 2, 2, 2, 4, 0, 4, 0, 0, 4, 4, 0, 2, 2, 5, 5, 5, 2, 2, 2, 5, 5, 2, 5, 5, 4, 4, 0, 0, 2, 2, 5, 5, 5, 2, 2, 5, 4, 4, 2, 5, 5, 0, 4, 2, 4, 0, 2, 0, 0, 2, 2, 5, 5, 5, 5, 0, 0, 0, 0, 0, 0, 1, 1, 4, 4, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 2, 4, 1, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 2, 4, 4, 4, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 1, 1, 0, 0, 0, 0, 0, 0 }; } private static final byte _hpricot_scan_range_lengths[] = init__hpricot_scan_range_lengths_0(); private static short[] init__hpricot_scan_index_offsets_0() { return new short [] { 0, 4, 6, 8, 10, 12, 14, 16, 18, 21, 28, 39, 46, 48, 50, 52, 54, 56, 59, 64, 73, 82, 87, 94, 96, 98, 103, 105, 109, 111, 113, 123, 133, 146, 159, 172, 185, 192, 195, 198, 204, 207, 212, 217, 223, 226, 231, 237, 247, 249, 251, 253, 255, 257, 259, 261, 263, 265, 267, 269, 274, 284, 288, 298, 308, 319, 330, 332, 342, 350, 360, 373, 387, 401, 409, 419, 434, 449, 459, 469, 481, 484, 487, 500, 513, 517, 528, 539, 555, 571, 586, 601, 617, 633, 643, 653, 664, 675, 686, 699, 703, 715, 718, 721, 734, 747, 751, 762, 772, 787, 803, 819, 829, 839, 850, 866, 882, 893, 909, 926, 940, 954, 959, 963, 974, 985, 1001, 1017, 1033, 1044, 1055, 1071, 1084, 1097, 1108, 1125, 1140, 1144, 1156, 1167, 1179, 1183, 1193, 1196, 1199, 1209, 1215, 1224, 1234, 1244, 1253, 1255, 1257, 1259, 1261, 1263, 1265, 1269, 1274, 1280, 1287, 1292, 1299, 1301, 1303, 1305, 1307, 1309, 1311, 1313, 1315, 1319, 1324, 1327, 1334, 1339, 1345, 1347, 1349, 1351, 1353, 1355, 1357, 1359, 1361, 1363, 1367, 1372, 1375, 1377, 1379, 1384, 1386, 1388, 1391, 1393, 1395, 1397, 1399, 1402, 1409, 1415, 1422, 1424, 1426, 1429, 1437, 1439, 1441, 1443, 1446, 1449, 1453, 1456, 1460, 1463, 1465, 1468, 1470, 1474 }; } private static final short _hpricot_scan_index_offsets[] = init__hpricot_scan_index_offsets_0(); private static short[] init__hpricot_scan_indicies_0() { return new short [] { 1, 2, 3, 0, 4, 0, 5, 0, 6, 0, 7, 0, 8, 0, 9, 0, 10, 0, 11, 11, 0, 11, 12, 12, 11, 12, 12, 0, 13, 15, 14, 16, 14, 13, 14, 14, 14, 14, 0, 17, 18, 19, 20, 21, 17, 0, 22, 0, 23, 0, 24, 0, 25, 0, 26, 0, 27, 27, 0, 27, 28, 29, 27, 0, 30, 31, 30, 30, 30, 30, 30, 30, 0, 32, 33, 32, 32, 32, 32, 32, 32, 0, 34, 18, 21, 34, 0, 34, 35, 36, 18, 21, 34, 0, 38, 37, 41, 40, 42, 18, 21, 42, 39, 43, 21, 43, 18, 43, 39, 38, 44, 41, 45, 46, 47, 46, 46, 46, 46, 46, 46, 46, 0, 48, 49, 48, 48, 48, 48, 48, 48, 48, 0, 50, 50, 48, 49, 18, 21, 48, 34, 48, 48, 48, 48, 0, 50, 50, 35, 51, 18, 21, 48, 34, 48, 48, 48, 48, 0, 52, 52, 54, 55, 56, 57, 54, 53, 54, 54, 54, 54, 44, 58, 58, 61, 62, 63, 64, 60, 59, 60, 60, 60, 60, 45, 59, 61, 65, 63, 64, 59, 45, 67, 68, 66, 70, 71, 69, 72, 41, 63, 64, 72, 45, 73, 74, 64, 75, 76, 43, 75, 21, 74, 41, 63, 74, 45, 77, 41, 78, 79, 77, 40, 73, 80, 79, 80, 41, 78, 80, 40, 81, 38, 56, 57, 81, 44, 60, 82, 60, 60, 60, 60, 60, 60, 60, 45, 83, 0, 84, 0, 85, 0, 86, 0, 87, 0, 88, 0, 89, 0, 90, 0, 91, 0, 92, 0, 93, 0, 94, 94, 94, 94, 0, 95, 97, 96, 96, 95, 96, 96, 96, 96, 0, 98, 99, 98, 0, 100, 102, 103, 101, 101, 100, 101, 101, 101, 0, 104, 106, 107, 105, 105, 104, 105, 105, 105, 0, 108, 110, 111, 112, 109, 109, 108, 109, 109, 109, 39, 113, 115, 116, 117, 114, 114, 113, 114, 114, 114, 39, 118, 39, 120, 120, 122, 123, 124, 39, 117, 120, 121, 119, 126, 126, 128, 39, 129, 126, 127, 125, 130, 115, 117, 114, 114, 130, 114, 114, 114, 39, 126, 126, 132, 39, 133, 131, 131, 126, 127, 131, 131, 131, 125, 134, 134, 137, 39, 138, 139, 136, 136, 134, 135, 136, 136, 136, 125, 140, 140, 132, 39, 142, 133, 131, 131, 140, 141, 131, 131, 131, 125, 126, 126, 128, 39, 129, 126, 127, 125, 143, 143, 145, 146, 147, 39, 129, 143, 144, 119, 148, 148, 122, 123, 124, 39, 117, 150, 150, 148, 149, 150, 150, 150, 119, 143, 143, 145, 146, 151, 39, 133, 150, 150, 143, 144, 150, 150, 150, 119, 153, 153, 155, 156, 157, 158, 159, 153, 154, 152, 161, 161, 163, 164, 165, 166, 167, 161, 162, 160, 168, 169, 171, 172, 170, 173, 170, 168, 170, 170, 170, 165, 169, 173, 165, 174, 173, 165, 175, 169, 177, 178, 179, 176, 173, 176, 175, 176, 176, 176, 165, 180, 169, 171, 181, 172, 170, 173, 170, 180, 170, 170, 170, 165, 169, 182, 173, 165, 183, 183, 185, 186, 187, 165, 172, 159, 183, 184, 152, 188, 188, 185, 186, 187, 165, 172, 159, 188, 189, 152, 188, 188, 185, 186, 187, 165, 172, 190, 159, 190, 188, 189, 190, 190, 190, 152, 191, 191, 193, 194, 195, 165, 196, 190, 159, 190, 191, 192, 190, 190, 190, 152, 153, 153, 155, 195, 157, 197, 190, 159, 190, 153, 154, 190, 190, 190, 152, 161, 161, 163, 199, 165, 196, 198, 167, 198, 161, 162, 198, 198, 198, 160, 200, 200, 163, 203, 165, 204, 205, 202, 167, 202, 200, 201, 202, 202, 202, 160, 206, 206, 163, 199, 165, 208, 196, 198, 167, 198, 206, 207, 198, 198, 198, 160, 161, 161, 163, 164, 165, 166, 167, 161, 162, 160, 161, 161, 209, 164, 165, 166, 167, 161, 162, 160, 191, 191, 193, 194, 156, 165, 166, 159, 191, 192, 152, 211, 211, 213, 214, 215, 216, 217, 218, 211, 212, 210, 220, 220, 222, 209, 223, 224, 225, 226, 220, 221, 219, 227, 228, 174, 230, 231, 229, 232, 229, 227, 229, 229, 229, 224, 228, 174, 232, 224, 234, 169, 236, 237, 235, 238, 235, 234, 235, 235, 235, 233, 169, 238, 233, 228, 238, 233, 239, 169, 241, 242, 243, 240, 238, 240, 239, 240, 240, 240, 233, 244, 169, 236, 245, 237, 235, 238, 235, 244, 235, 235, 235, 233, 169, 246, 238, 233, 248, 248, 250, 251, 252, 233, 237, 253, 248, 249, 247, 255, 255, 163, 257, 233, 258, 259, 255, 256, 254, 255, 255, 163, 261, 233, 262, 260, 259, 260, 255, 256, 260, 260, 260, 254, 263, 263, 163, 266, 233, 267, 268, 265, 259, 265, 263, 264, 265, 265, 265, 254, 269, 269, 163, 261, 233, 271, 262, 260, 259, 260, 269, 270, 260, 260, 260, 254, 255, 255, 163, 257, 233, 258, 259, 255, 256, 254, 255, 255, 222, 257, 233, 258, 259, 255, 256, 254, 272, 272, 274, 275, 276, 233, 258, 253, 272, 273, 247, 277, 277, 250, 251, 252, 233, 237, 279, 253, 279, 277, 278, 279, 279, 279, 247, 272, 272, 274, 275, 280, 233, 262, 279, 253, 279, 272, 273, 279, 279, 279, 247, 211, 211, 281, 214, 215, 216, 217, 218, 211, 212, 210, 220, 220, 222, 209, 283, 224, 284, 282, 226, 282, 220, 221, 282, 282, 282, 219, 285, 285, 222, 209, 288, 224, 289, 290, 287, 226, 287, 285, 286, 287, 287, 287, 219, 291, 228, 174, 230, 292, 231, 229, 232, 229, 291, 229, 229, 229, 224, 293, 228, 174, 295, 296, 297, 294, 232, 294, 293, 294, 294, 294, 224, 228, 174, 298, 232, 224, 299, 299, 232, 224, 300, 300, 302, 303, 304, 224, 231, 218, 300, 301, 210, 305, 305, 302, 303, 304, 224, 231, 218, 305, 306, 210, 305, 305, 302, 303, 304, 224, 231, 307, 218, 307, 305, 306, 307, 307, 307, 210, 308, 308, 310, 311, 312, 224, 284, 307, 218, 307, 308, 309, 307, 307, 307, 210, 211, 211, 281, 214, 312, 216, 313, 307, 218, 307, 211, 212, 307, 307, 307, 210, 220, 220, 222, 209, 223, 224, 225, 226, 220, 221, 219, 220, 220, 314, 314, 223, 224, 225, 226, 220, 221, 219, 211, 211, 213, 214, 312, 216, 313, 307, 218, 307, 211, 212, 307, 307, 307, 210, 315, 316, 317, 319, 320, 318, 321, 318, 315, 318, 318, 318, 216, 315, 322, 317, 319, 320, 318, 321, 318, 315, 318, 318, 318, 216, 308, 308, 310, 311, 215, 224, 225, 218, 308, 309, 210, 323, 323, 222, 209, 283, 224, 325, 284, 282, 226, 282, 323, 324, 282, 282, 282, 219, 326, 326, 155, 280, 328, 329, 279, 253, 279, 326, 327, 279, 279, 279, 247, 316, 317, 321, 216, 330, 331, 333, 334, 332, 335, 332, 330, 332, 332, 332, 328, 277, 277, 250, 251, 252, 233, 237, 253, 277, 278, 247, 336, 331, 338, 339, 337, 340, 337, 336, 337, 337, 337, 157, 322, 317, 321, 216, 326, 326, 155, 276, 328, 341, 253, 326, 327, 247, 331, 340, 157, 331, 335, 328, 148, 148, 122, 123, 124, 39, 117, 148, 149, 119, 342, 342, 343, 342, 342, 0, 344, 345, 345, 344, 345, 345, 345, 345, 0, 344, 345, 345, 346, 344, 345, 345, 345, 345, 0, 344, 345, 345, 347, 344, 345, 345, 345, 345, 0, 348, 345, 345, 348, 345, 345, 345, 345, 0, 350, 349, 351, 349, 352, 349, 353, 349, 354, 349, 355, 349, 355, 356, 355, 349, 356, 357, 358, 356, 349, 359, 359, 359, 359, 359, 349, 360, 361, 361, 361, 361, 361, 349, 362, 363, 364, 362, 349, 362, 363, 364, 365, 366, 362, 349, 363, 349, 367, 349, 368, 349, 369, 349, 370, 349, 371, 349, 372, 349, 373, 349, 373, 374, 373, 349, 374, 375, 376, 374, 349, 377, 377, 349, 378, 379, 379, 379, 379, 379, 349, 380, 363, 364, 380, 349, 380, 363, 364, 366, 380, 349, 381, 349, 382, 349, 383, 349, 384, 349, 385, 349, 386, 349, 387, 349, 388, 349, 389, 349, 389, 390, 389, 349, 390, 391, 392, 390, 349, 393, 394, 349, 395, 349, 396, 349, 397, 363, 364, 397, 349, 398, 349, 395, 349, 399, 400, 349, 401, 349, 396, 349, 402, 349, 401, 349, 403, 403, 349, 378, 404, 404, 404, 404, 404, 349, 405, 405, 405, 405, 405, 349, 360, 406, 406, 406, 406, 406, 349, 408, 407, 410, 409, 412, 413, 411, 415, 416, 417, 418, 417, 417, 417, 414, 41, 45, 43, 21, 41, 40, 169, 173, 165, 169, 238, 233, 228, 174, 232, 224, 344, 344, 420, 348, 421, 348, 420, 423, 424, 422, 426, 425, 428, 429, 427, 431, 430, 433, 434, 435, 432, 434, 436, 0 }; } private static final short _hpricot_scan_indicies[] = init__hpricot_scan_indicies_0(); private static short[] init__hpricot_scan_trans_targs_0() { return new short [] { 204, 1, 2, 53, 204, 3, 4, 5, 6, 7, 8, 9, 10, 11, 10, 204, 26, 11, 204, 12, 48, 26, 13, 14, 15, 16, 17, 18, 19, 30, 20, 21, 20, 21, 22, 23, 28, 24, 25, 204, 24, 25, 25, 27, 29, 29, 31, 32, 31, 32, 33, 34, 35, 36, 47, 32, 206, 40, 35, 36, 47, 37, 34, 206, 40, 46, 38, 39, 43, 38, 39, 43, 39, 41, 42, 41, 207, 43, 208, 44, 45, 39, 32, 49, 50, 51, 52, 21, 54, 55, 56, 57, 58, 204, 60, 61, 60, 204, 61, 204, 63, 62, 66, 204, 63, 64, 66, 204, 65, 64, 66, 67, 204, 65, 64, 66, 67, 204, 204, 68, 144, 74, 142, 143, 73, 68, 69, 70, 73, 204, 69, 71, 73, 204, 65, 72, 71, 73, 74, 204, 65, 72, 74, 75, 76, 77, 141, 73, 75, 76, 71, 73, 78, 79, 90, 70, 93, 80, 209, 94, 78, 79, 90, 70, 93, 80, 209, 94, 79, 69, 82, 84, 209, 81, 79, 83, 82, 84, 85, 209, 83, 85, 209, 86, 95, 139, 140, 93, 87, 88, 91, 87, 88, 89, 96, 93, 209, 209, 91, 93, 83, 92, 91, 93, 95, 209, 83, 92, 95, 90, 97, 98, 117, 108, 90, 128, 99, 211, 129, 97, 98, 117, 108, 128, 99, 211, 129, 98, 100, 120, 121, 211, 122, 101, 100, 103, 105, 210, 102, 104, 103, 105, 106, 210, 104, 106, 210, 107, 138, 113, 136, 137, 111, 112, 107, 100, 108, 111, 210, 112, 109, 111, 210, 104, 110, 109, 111, 113, 210, 104, 110, 113, 114, 115, 116, 135, 111, 114, 115, 109, 111, 108, 118, 128, 211, 119, 134, 118, 128, 133, 211, 119, 123, 119, 120, 121, 123, 211, 211, 98, 124, 133, 131, 132, 128, 125, 126, 118, 125, 126, 127, 130, 128, 211, 117, 98, 100, 79, 120, 121, 211, 122, 100, 119, 134, 133, 100, 108, 101, 210, 100, 69, 103, 105, 210, 102, 79, 82, 84, 209, 81, 210, 146, 147, 212, 146, 148, 149, 213, 204, 151, 152, 153, 154, 155, 156, 157, 158, 200, 159, 160, 159, 161, 204, 162, 163, 176, 164, 165, 166, 167, 168, 169, 170, 171, 172, 198, 173, 174, 173, 175, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 193, 188, 191, 189, 190, 190, 192, 194, 196, 195, 197, 199, 199, 201, 201, 214, 214, 216, 216, 204, 204, 205, 204, 0, 59, 62, 145, 204, 204, 150, 214, 214, 215, 214, 202, 216, 216, 217, 216, 203, 218, 218, 218, 219, 218 }; } private static final short _hpricot_scan_trans_targs[] = init__hpricot_scan_trans_targs_0(); private static short[] init__hpricot_scan_trans_actions_0() { return new short [] { 73, 0, 0, 0, 59, 0, 0, 0, 0, 0, 0, 0, 1, 5, 0, 92, 5, 0, 51, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 83, 0, 19, 0, 0, 0, 3, 86, 75, 0, 21, 0, 0, 3, 0, 3, 83, 0, 19, 0, 19, 3, 3, 3, 172, 188, 3, 0, 0, 0, 0, 113, 146, 0, 21, 3, 86, 86, 0, 21, 21, 0, 21, 0, 0, 146, 0, 146, 0, 0, 3, 113, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 61, 1, 5, 0, 98, 0, 55, 5, 0, 5, 95, 0, 116, 0, 53, 11, 0, 110, 11, 168, 0, 180, 23, 0, 122, 57, 3, 3, 3, 0, 0, 89, 0, 9, 9, 104, 164, 0, 180, 119, 176, 107, 107, 0, 160, 11, 201, 9, 9, 0, 80, 80, 0, 0, 152, 3, 3, 196, 156, 3, 80, 80, 77, 152, 3, 226, 3, 0, 9, 9, 7, 104, 0, 211, 0, 0, 7, 180, 23, 192, 0, 7, 11, 0, 110, 11, 216, 0, 0, 149, 3, 3, 7, 0, 89, 3, 3, 196, 80, 80, 7, 0, 156, 221, 232, 180, 119, 107, 107, 0, 160, 11, 238, 9, 9, 0, 7, 3, 80, 80, 101, 77, 152, 3, 226, 3, 0, 9, 9, 7, 104, 0, 211, 0, 0, 7, 180, 23, 192, 0, 0, 0, 180, 23, 192, 0, 11, 0, 110, 11, 216, 0, 0, 149, 3, 3, 3, 0, 7, 89, 3, 0, 9, 9, 104, 211, 0, 180, 119, 221, 107, 107, 0, 160, 11, 238, 9, 9, 0, 80, 80, 0, 7, 152, 3, 3, 196, 156, 77, 180, 119, 221, 107, 107, 0, 160, 11, 238, 0, 0, 11, 0, 110, 11, 216, 149, 7, 3, 3, 7, 7, 89, 3, 3, 196, 80, 80, 7, 7, 156, 232, 7, 3, 77, 77, 196, 89, 206, 3, 101, 9, 9, 0, 80, 80, 3, 232, 3, 77, 196, 89, 206, 3, 3, 196, 89, 206, 3, 226, 25, 25, 0, 0, 0, 0, 31, 71, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 13, 0, 0, 49, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 15, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 3, 0, 17, 0, 0, 3, 3, 0, 0, 3, 0, 3, 0, 37, 137, 43, 140, 63, 134, 184, 69, 0, 0, 1, 0, 65, 67, 0, 33, 125, 31, 35, 0, 39, 128, 31, 41, 0, 45, 131, 143, 0, 47 }; } private static final short _hpricot_scan_trans_actions[] = init__hpricot_scan_trans_actions_0(); private static short[] init__hpricot_scan_to_state_actions_0() { return new short [] { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 27, 0, 0, 0, 0, 0, 0, 0, 0, 0, 27, 0, 27, 0, 27, 0 }; } private static final short _hpricot_scan_to_state_actions[] = init__hpricot_scan_to_state_actions_0(); private static short[] init__hpricot_scan_from_state_actions_0() { return new short [] { 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 29, 0, 0, 0, 0, 0, 0, 0, 0, 0, 29, 0, 29, 0, 29, 0 }; } private static final short _hpricot_scan_from_state_actions[] = init__hpricot_scan_from_state_actions_0(); private static short[] init__hpricot_scan_eof_trans_0() { return new short [] { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 40, 40, 40, 40, 1, 40, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 1, 1, 1, 1, 1, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 350, 408, 410, 0, 415, 420, 420, 420, 40, 40, 40, 421, 421, 0, 426, 0, 431, 0, 437 }; } private static final short _hpricot_scan_eof_trans[] = init__hpricot_scan_eof_trans_0(); static final int hpricot_scan_start = 204; static final int hpricot_scan_error = -1; static final int hpricot_scan_en_html_comment = 214; static final int hpricot_scan_en_html_cdata = 216; static final int hpricot_scan_en_html_procins = 218; static final int hpricot_scan_en_main = 204; // line 192 "ext/hpricot_scan/hpricot_scan.java.rl" public final static int BUFSIZE=16384; private void rb_yield_tokens(IRubyObject sym, IRubyObject tag, IRubyObject attr, IRubyObject raw, boolean taint) { IRubyObject ary; if (sym == runtime.newSymbol("text")) { raw = tag; } ary = runtime.newArray(new IRubyObject[]{sym, tag, attr, raw}); if (taint) { ary.setTaint(true); tag.setTaint(true); attr.setTaint(true); raw.setTaint(true); } block.yield(runtime.getCurrentContext(), ary, null, null, false); } int cs, act, have = 0, nread = 0, curline = 1, p=-1; boolean text = false; int ts=-1, te; int eof=-1; char[] buf; Ruby runtime; IRubyObject attr, bufsize; IRubyObject[] tag, akey, aval; int mark_tag, mark_akey, mark_aval; boolean done = false, ele_open = false; int buffer_size = 0; boolean taint = false; Block block = null; IRubyObject xmldecl, doctype, procins, stag, etag, emptytag, comment, cdata, sym_text; IRubyObject hpricot_scan(IRubyObject recv, IRubyObject port) { attr = bufsize = runtime.getNil(); tag = new IRubyObject[]{runtime.getNil()}; akey = new IRubyObject[]{runtime.getNil()}; aval = new IRubyObject[]{runtime.getNil()}; RubyClass rb_eHpricotParseError = runtime.getModule("Hpricot").getClass("ParseError"); taint = port.isTaint(); if ( !port.respondsTo("read")) { if ( port.respondsTo("to_str")) { port = port.callMethod(runtime.getCurrentContext(),"to_str"); } else { throw runtime.newArgumentError("bad Hpricot argument, String or IO only please."); } } buffer_size = BUFSIZE; if (rubyApi.getInstanceVariable(recv, "@buffer_size") != null) { bufsize = rubyApi.getInstanceVariable(recv, "@buffer_size"); if (!bufsize.isNil()) { buffer_size = RubyNumeric.fix2int(bufsize); } } buf = new char[buffer_size]; // line 821 "ext/hpricot_scan/HpricotScanService.java" { cs = hpricot_scan_start; ts = -1; te = -1; act = 0; } // line 256 "ext/hpricot_scan/hpricot_scan.java.rl" while( !done ) { IRubyObject str; p = have; int pe; int len, space = buffer_size - have; if ( space == 0 ) { /* We've used up the entire buffer storing an already-parsed token * prefix that must be preserved. Likely caused by super-long attributes. * See ticket #13. */ buffer_size += BUFSIZE; char[] new_buf = new char[buffer_size]; System.arraycopy(buf, 0, new_buf, 0, buf.length); buf = new_buf; space = buffer_size - have; } if (port.respondsTo("read")) { str = port.callMethod(runtime.getCurrentContext(),"read",runtime.newFixnum(space)); } else { str = ((RubyString)port).substr(nread,space); } str = str.convertToString(); String sss = str.toString(); char[] chars = sss.toCharArray(); System.arraycopy(chars,0,buf,p,chars.length); len = sss.length(); nread += len; if ( len < space ) { len++; done = true; } pe = p + len; char[] data = buf; // line 870 "ext/hpricot_scan/HpricotScanService.java" { int _klen; int _trans = 0; int _acts; int _nacts; int _keys; int _goto_targ = 0; _goto: while (true) { switch ( _goto_targ ) { case 0: if ( p == pe ) { _goto_targ = 4; continue _goto; } case 1: _acts = _hpricot_scan_from_state_actions[cs]; _nacts = (int) _hpricot_scan_actions[_acts++]; while ( _nacts-- > 0 ) { switch ( _hpricot_scan_actions[_acts++] ) { case 21: // line 1 "ext/hpricot_scan/hpricot_scan.java.rl" {ts = p;} break; // line 895 "ext/hpricot_scan/HpricotScanService.java" } } _match: do { _keys = _hpricot_scan_key_offsets[cs]; _trans = _hpricot_scan_index_offsets[cs]; _klen = _hpricot_scan_single_lengths[cs]; if ( _klen > 0 ) { int _lower = _keys; int _mid; int _upper = _keys + _klen - 1; while (true) { if ( _upper < _lower ) break; _mid = _lower + ((_upper-_lower) >> 1); if ( data[p] < _hpricot_scan_trans_keys[_mid] ) _upper = _mid - 1; else if ( data[p] > _hpricot_scan_trans_keys[_mid] ) _lower = _mid + 1; else { _trans += (_mid - _keys); break _match; } } _keys += _klen; _trans += _klen; } _klen = _hpricot_scan_range_lengths[cs]; if ( _klen > 0 ) { int _lower = _keys; int _mid; int _upper = _keys + (_klen<<1) - 2; while (true) { if ( _upper < _lower ) break; _mid = _lower + (((_upper-_lower) >> 1) & ~1); if ( data[p] < _hpricot_scan_trans_keys[_mid] ) _upper = _mid - 2; else if ( data[p] > _hpricot_scan_trans_keys[_mid+1] ) _lower = _mid + 2; else { _trans += ((_mid - _keys)>>1); break _match; } } _trans += _klen; } } while (false); _trans = _hpricot_scan_indicies[_trans]; case 3: cs = _hpricot_scan_trans_targs[_trans]; if ( _hpricot_scan_trans_actions[_trans] != 0 ) { _acts = _hpricot_scan_trans_actions[_trans]; _nacts = (int) _hpricot_scan_actions[_acts++]; while ( _nacts-- > 0 ) { switch ( _hpricot_scan_actions[_acts++] ) { case 0: // line 147 "ext/hpricot_scan/hpricot_scan.java.rl" { if (text) { CAT(tag, p); ELE(sym_text); text = false; } attr = runtime.getNil(); tag[0] = runtime.getNil(); mark_tag = -1; ele_open = true; } break; case 1: // line 159 "ext/hpricot_scan/hpricot_scan.java.rl" { mark_tag = p; } break; case 2: // line 160 "ext/hpricot_scan/hpricot_scan.java.rl" { mark_aval = p; } break; case 3: // line 161 "ext/hpricot_scan/hpricot_scan.java.rl" { mark_akey = p; } break; case 4: // line 162 "ext/hpricot_scan/hpricot_scan.java.rl" { SET(tag, p); } break; case 5: // line 164 "ext/hpricot_scan/hpricot_scan.java.rl" { SET(aval, p); } break; case 6: // line 165 "ext/hpricot_scan/hpricot_scan.java.rl" { if (buf[p-1] == '"' || buf[p-1] == '\'') { SET(aval, p-1); } else { SET(aval, p); } } break; case 7: // line 169 "ext/hpricot_scan/hpricot_scan.java.rl" { SET(akey, p); } break; case 8: // line 170 "ext/hpricot_scan/hpricot_scan.java.rl" { SET(aval, p); ATTR(rb_str_new2("version"), aval); } break; case 9: // line 171 "ext/hpricot_scan/hpricot_scan.java.rl" { SET(aval, p); ATTR(rb_str_new2("encoding"), aval); } break; case 10: // line 172 "ext/hpricot_scan/hpricot_scan.java.rl" { SET(aval, p); ATTR(rb_str_new2("standalone"), aval); } break; case 11: // line 173 "ext/hpricot_scan/hpricot_scan.java.rl" { SET(aval, p); ATTR(rb_str_new2("public_id"), aval); } break; case 12: // line 174 "ext/hpricot_scan/hpricot_scan.java.rl" { SET(aval, p); ATTR(rb_str_new2("system_id"), aval); } break; case 13: // line 176 "ext/hpricot_scan/hpricot_scan.java.rl" { akey[0] = runtime.getNil(); aval[0] = runtime.getNil(); mark_akey = -1; mark_aval = -1; } break; case 14: // line 183 "ext/hpricot_scan/hpricot_scan.java.rl" { ATTR(akey, aval); } break; case 15: // line 9 "ext/hpricot_scan/hpricot_scan.java.rl" {curline += 1;} break; case 16: // line 46 "ext/hpricot_scan/hpricot_scan.java.rl" { TEXT_PASS(); } break; case 17: // line 50 "ext/hpricot_scan/hpricot_scan.java.rl" { EBLK(comment, 3); {cs = 204; _goto_targ = 2; if (true) continue _goto;} } break; case 18: // line 55 "ext/hpricot_scan/hpricot_scan.java.rl" { EBLK(cdata, 3); {cs = 204; _goto_targ = 2; if (true) continue _goto;} } break; case 19: // line 60 "ext/hpricot_scan/hpricot_scan.java.rl" { EBLK(procins, 2); {cs = 204; _goto_targ = 2; if (true) continue _goto;} } break; case 22: // line 1 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;} break; case 23: // line 50 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;} break; case 24: // line 51 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ TEXT_PASS(); }} break; case 25: // line 51 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p;p--;{ TEXT_PASS(); }} break; case 26: // line 51 "ext/hpricot_scan/hpricot_scan.java.rl" {{p = ((te))-1;}{ TEXT_PASS(); }} break; case 27: // line 55 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;} break; case 28: // line 56 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ TEXT_PASS(); }} break; case 29: // line 56 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p;p--;{ TEXT_PASS(); }} break; case 30: // line 56 "ext/hpricot_scan/hpricot_scan.java.rl" {{p = ((te))-1;}{ TEXT_PASS(); }} break; case 31: // line 60 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;} break; case 32: // line 61 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ TEXT_PASS(); }} break; case 33: // line 61 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p;p--;{ TEXT_PASS(); }} break; case 34: // line 66 "ext/hpricot_scan/hpricot_scan.java.rl" {act = 8;} break; case 35: // line 68 "ext/hpricot_scan/hpricot_scan.java.rl" {act = 10;} break; case 36: // line 70 "ext/hpricot_scan/hpricot_scan.java.rl" {act = 12;} break; case 37: // line 73 "ext/hpricot_scan/hpricot_scan.java.rl" {act = 15;} break; case 38: // line 65 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ ELE(xmldecl); }} break; case 39: // line 66 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ ELE(doctype); }} break; case 40: // line 68 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ ELE(stag); }} break; case 41: // line 69 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ ELE(etag); }} break; case 42: // line 70 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ ELE(emptytag); }} break; case 43: // line 71 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ {cs = 214; _goto_targ = 2; if (true) continue _goto;} }} break; case 44: // line 72 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ {cs = 216; _goto_targ = 2; if (true) continue _goto;} }} break; case 45: // line 73 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p+1;{ TEXT_PASS(); }} break; case 46: // line 66 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p;p--;{ ELE(doctype); }} break; case 47: // line 67 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p;p--;{ {cs = 218; _goto_targ = 2; if (true) continue _goto;} }} break; case 48: // line 73 "ext/hpricot_scan/hpricot_scan.java.rl" {te = p;p--;{ TEXT_PASS(); }} break; case 49: // line 67 "ext/hpricot_scan/hpricot_scan.java.rl" {{p = ((te))-1;}{ {cs = 218; _goto_targ = 2; if (true) continue _goto;} }} break; case 50: // line 73 "ext/hpricot_scan/hpricot_scan.java.rl" {{p = ((te))-1;}{ TEXT_PASS(); }} break; case 51: // line 1 "ext/hpricot_scan/hpricot_scan.java.rl" { switch( act ) { case 8: {{p = ((te))-1;} ELE(doctype); } break; case 10: {{p = ((te))-1;} ELE(stag); } break; case 12: {{p = ((te))-1;} ELE(emptytag); } break; case 15: {{p = ((te))-1;} TEXT_PASS(); } break; } } break; // line 1193 "ext/hpricot_scan/HpricotScanService.java" } } } case 2: _acts = _hpricot_scan_to_state_actions[cs]; _nacts = (int) _hpricot_scan_actions[_acts++]; while ( _nacts-- > 0 ) { switch ( _hpricot_scan_actions[_acts++] ) { case 20: // line 1 "ext/hpricot_scan/hpricot_scan.java.rl" {ts = -1;} break; // line 1207 "ext/hpricot_scan/HpricotScanService.java" } } if ( ++p != pe ) { _goto_targ = 1; continue _goto; } case 4: if ( p == eof ) { if ( _hpricot_scan_eof_trans[cs] > 0 ) { _trans = _hpricot_scan_eof_trans[cs] - 1; _goto_targ = 3; continue _goto; } } case 5: } break; } } // line 297 "ext/hpricot_scan/hpricot_scan.java.rl" if ( cs == hpricot_scan_error ) { if(!tag[0].isNil()) { rb_raise(rb_eHpricotParseError, "parse error on element <"+tag.toString()+">, starting on line "+curline+".\n" + NO_WAY_SERIOUSLY); } else { rb_raise(rb_eHpricotParseError, "parse error on line "+curline+".\n" + NO_WAY_SERIOUSLY); } } if ( done && ele_open ) { ele_open = false; if(ts > -1) { mark_tag = ts; ts = -1; text = true; } } if(ts == -1) { have = 0; /* text nodes have no ts because each byte is parsed alone */ if(mark_tag != -1 && text) { if (done) { if(mark_tag < p-1) { CAT(tag, p-1); ELE(sym_text); } } else { CAT(tag, p); } } mark_tag = 0; } else { have = pe - ts; System.arraycopy(buf,ts,buf,0,have); SLIDE(tag); SLIDE(akey); SLIDE(aval); te = (te - ts); ts = 0; } } return runtime.getNil(); } public static IRubyObject __hpricot_scan(IRubyObject recv, IRubyObject port, Block block) { Ruby runtime = recv.getRuntime(); HpricotScanService service = new HpricotScanService(); service.runtime = runtime; service.xmldecl = runtime.newSymbol("xmldecl"); service.doctype = runtime.newSymbol("doctype"); service.procins = runtime.newSymbol("procins"); service.stag = runtime.newSymbol("stag"); service.etag = runtime.newSymbol("etag"); service.emptytag = runtime.newSymbol("emptytag"); service.comment = runtime.newSymbol("comment"); service.cdata = runtime.newSymbol("cdata"); service.sym_text = runtime.newSymbol("text"); service.block = block; return service.hpricot_scan(recv, port); } public boolean basicLoad(final Ruby runtime) throws IOException { Init_hpricot_scan(runtime); return true; } public static void Init_hpricot_scan(Ruby runtime) { RubyModule mHpricot = runtime.defineModule("Hpricot"); mHpricot.getMetaClass().attr_accessor(runtime.getCurrentContext(),new IRubyObject[]{runtime.newSymbol("buffer_size")}); CallbackFactory fact = runtime.callbackFactory(HpricotScanService.class); mHpricot.getMetaClass().defineMethod("scan",fact.getSingletonMethod("__hpricot_scan",IRubyObject.class)); mHpricot.defineClassUnder("ParseError",runtime.getClass("StandardError"),runtime.getClass("StandardError").getAllocator()); rubyApi = JavaEmbedUtils.newObjectAdapter(); } }