.gitignore | 100644 | 0 | 0 | | | 87 Bytes | 5ea197fbb6ea6c4ea4a087b18ec8391a9e95f8d94d381ea2eac6a0a74ecc49c1 |
.rspec | 100644 | 0 | 0 | | | 31 Bytes | 04ea314ec27821b7e7cf198c2b3f1dc643fbc27429e3d8eb5f6253c2104d51ca |
.rubocop.yml | 100644 | 0 | 0 | | | 5.17 KB | d3d0ce4195c328d8fc9498ab86b05774924f49e5cd1e545017221623a5f8aacf |
.rubocop_todo.yml | 100644 | 0 | 0 | | | 3.73 KB | 05b1bf5d8cb42ecc7f89bf26f59cf8a640e0fe7f4f64f4f5387b2386a61a74bf |
.travis.yml | 100644 | 0 | 0 | | | 29 Bytes | 9874863f071f592de2e5788ddf9c4597f540361221c63bfbf5ce0f36333ce180 |
Gemfile | 100644 | 0 | 0 | | | 104 Bytes | f8c777c0b43d2fabdfb566f165dfcb831e41a6c62cbbb0e4f0605a04a14e7052 |
LICENSE.txt | 100644 | 0 | 0 | | | 1.05 KB | 6036efd35750b360d78923735e5fd3eefba3d931c26b2baebac57ea129fad5cd |
README.md | 100644 | 0 | 0 | | | 11 KB | f609c7849214389299c32c5cea90141c4964071d21663f53dc7b0567781cddc7 |
Rakefile | 100644 | 0 | 0 | | | 113 Bytes | 04def30df0ea5bdfa483398fcdd3ff18f5ce971e23072d37170ca88686bc6696 |
lib/pragmatic_tokenizer.rb | 100644 | 0 | 0 | | | 78 Bytes | cc1b0e257c76a87686a88257b908e7b397f5fe380da9118af1d59261e8f8aa54 |
lib/pragmatic_tokenizer/ending_punctuation_separator.rb | 100644 | 0 | 0 | | | 796 Bytes | 2a5de0483760c02ef404d78dbbbc39418c8ccffe361c2270bddda79e0abc7d60 |
lib/pragmatic_tokenizer/full_stop_separator.rb | 100644 | 0 | 0 | | | 1.48 KB | 1983cb3d8654185c424c8b62285ad3a19be7785bcdd6eefd0103c7a40bfcff3f |
lib/pragmatic_tokenizer/languages.rb | 100644 | 0 | 0 | | | 2 KB | 06fa7f83c9329dbdb8a891d960a1fc18aa696858421519e9aedd5705e6c6716e |
lib/pragmatic_tokenizer/languages/arabic.rb | 100644 | 0 | 0 | | | 2.18 KB | 7e1f95dac58f0c7f0fd013ffbde2829a5cf397d337fedcc8be895f39491f8832 |
lib/pragmatic_tokenizer/languages/bulgarian.rb | 100644 | 0 | 0 | | | 3.96 KB | 133d105a44d8c370f8c8e17c21365adff49239e449739e15609cfe210697065f |
lib/pragmatic_tokenizer/languages/catalan.rb | 100644 | 0 | 0 | | | 1.25 KB | ea5db12ea610f3f0bfdb36d97bc668c283ffad8401b5cc0d24021d856512b3c0 |
lib/pragmatic_tokenizer/languages/common.rb | 100644 | 0 | 0 | | | 4.26 KB | 0aaafd19151c776706a956fe92664de0883686bc64a0a862c90cfe0c5761288a |
lib/pragmatic_tokenizer/languages/czech.rb | 100644 | 0 | 0 | | | 3.64 KB | e8b5da3f20ce23c1fdd70524d5c4ee22f9bf44b0cfc439463b7b5d96f3aa97a3 |
lib/pragmatic_tokenizer/languages/danish.rb | 100644 | 0 | 0 | | | 547 Bytes | 0e9ca9d96392c5ef2fee88d67e80c45ecd922697871dbe7201f2065dbf3fdfe5 |
lib/pragmatic_tokenizer/languages/deutsch.rb | 100644 | 0 | 0 | | | 9.55 KB | bb3ded50eff7a30237b5f8a113d6f1bcfa84ae55c5f10df3421a5ea4803bcc57 |
lib/pragmatic_tokenizer/languages/dutch.rb | 100644 | 0 | 0 | | | 1.94 KB | f61fdc0ffad47a66e7569ab78d2ba9f9d8a6e7049d669af0d5366ae773424278 |
lib/pragmatic_tokenizer/languages/english.rb | 100644 | 0 | 0 | | | 14.6 KB | 02022315d71b0707998e3077e5bf3fa12dd6017612a83b0200574033f496510d |
lib/pragmatic_tokenizer/languages/finnish.rb | 100644 | 0 | 0 | | | 5.8 KB | afa13c23d6d1db333cf741ae6feb4d3151592164673f8632558fdfae7592c799 |
lib/pragmatic_tokenizer/languages/french.rb | 100644 | 0 | 0 | | | 5.87 KB | 4051b4eccd12797cec2ad371f861111a87a2005d04bead3c54e34fd5a82e3894 |
lib/pragmatic_tokenizer/languages/greek.rb | 100644 | 0 | 0 | | | 1.9 KB | 99704bb88466cd8f41f00da81ddf4cd069eb9baade39715e20881f5f358f33b5 |
lib/pragmatic_tokenizer/languages/indonesian.rb | 100644 | 0 | 0 | | | 2.84 KB | 4efce38831ca5a044d91ed5bf6f7d5cab91e264b872c9a0dd4f8a945a38930a1 |
lib/pragmatic_tokenizer/languages/italian.rb | 100644 | 0 | 0 | | | 21.2 KB | 5ee1b3eb468a1e373fe734394ab12043f14f59e3e0b6769a6564a35b5017c974 |
lib/pragmatic_tokenizer/languages/latvian.rb | 100644 | 0 | 0 | | | 1.66 KB | 7b324aa0c981e2d58739669f03d5eaa2c4414ce29009f3104f0f230f6646fbb2 |
lib/pragmatic_tokenizer/languages/norwegian.rb | 100644 | 0 | 0 | | | 879 Bytes | ced15fd4e11540741ff378e47963fdf1d13cfe158fddd59df72bf666b6ae56c0 |
lib/pragmatic_tokenizer/languages/persian.rb | 100644 | 0 | 0 | | | 3.09 KB | 9a1854773ad5ec4bdb340f735b5933b9fd70ac75973393f8f26fa37e7fab58e8 |
lib/pragmatic_tokenizer/languages/polish.rb | 100644 | 0 | 0 | | | 2.86 KB | 19dd35af9d10ae5085d2ce73a20428f14cf2f3f14634baef3bd5db8a6db33a17 |
lib/pragmatic_tokenizer/languages/portuguese.rb | 100644 | 0 | 0 | | | 2.88 KB | ea939e616f833c3e352b4ea9a15f5034d6f6cb9db7833e2dae489f4de0c8c0eb |
lib/pragmatic_tokenizer/languages/romanian.rb | 100644 | 0 | 0 | | | 2.64 KB | 2096fe809b3c2e2165fac7c04aa5b05209d7344eab30aeb776a72b607ddaab64 |
lib/pragmatic_tokenizer/languages/russian.rb | 100644 | 0 | 0 | | | 5.28 KB | 992f175d5b00baa126fab4757d6c10163a667ce972bbecc685bf05c60be8fec3 |
lib/pragmatic_tokenizer/languages/slovak.rb | 100644 | 0 | 0 | | | 1.09 KB | 7463d002ac4ecbb204bae75a6ee268c5e1a540f500a6990cdc92aa74489fcae5 |
lib/pragmatic_tokenizer/languages/spanish.rb | 100644 | 0 | 0 | | | 6.29 KB | 7fe6c3c6e11a48e83974ac54c0c7dfed6ce36cbe088d4524de38f4c5f49c7e0e |
lib/pragmatic_tokenizer/languages/swedish.rb | 100644 | 0 | 0 | | | 2.66 KB | c894ae1756c0b7ed00b370abb97ef4f81d8cb69362684fa497b9dbc10cdfa0ce |
lib/pragmatic_tokenizer/languages/turkish.rb | 100644 | 0 | 0 | | | 1.7 KB | ac2fef3682d7c4314d1456b99c325c5500ce60cfd15085a628c6a9092aa08d1d |
lib/pragmatic_tokenizer/post_processor.rb | 100644 | 0 | 0 | | | 3.95 KB | 27ff79809b4e831e4d8277ad97a9c3a329b7dc3f08cebb78dff59efc51190692 |
lib/pragmatic_tokenizer/pre_processor.rb | 100644 | 0 | 0 | | | 4.78 KB | be4d632591150861138417c096d7a4881ad0f0c7a10c6f90b30c012fcf2761b0 |
lib/pragmatic_tokenizer/tokenizer.rb | 100644 | 0 | 0 | | | 14.5 KB | b800f88fcda22d5b935066b1f1170f4b26acd444bd2ea46207959d7c36773e81 |
lib/pragmatic_tokenizer/version.rb | 100644 | 0 | 0 | | | 57 Bytes | a3fd325a6b5635a6f7927c07676207ed14f0af3440536423e50ac90586a35c87 |
pragmatic_tokenizer.gemspec | 100644 | 0 | 0 | | | 1.06 KB | ef3d4c4e259cfc2d0ebd6d8f3fcd60283cac8db87a9dcdc699cef4975c4b32b6 |
spec/languages/bulgarian_spec.rb | 100644 | 0 | 0 | | | 2.05 KB | ff2f649f9897a3a190bb1a2173e257b1b176fc2d82fe4ee5cd20fa28582f408e |
spec/languages/deutsch_spec.rb | 100644 | 0 | 0 | | | 8.8 KB | 3491240e7e895ff98727e872e5252f2c56701227d4414ba334c9080c0e15c50f |
spec/languages/english_spec.rb | 100644 | 0 | 0 | | | 72.8 KB | 0bf50a2bc1b2e29add6fe146bea49bae12879567f0082211b2584bdaaa1021ac |
spec/languages/french_spec.rb | 100644 | 0 | 0 | | | 375 Bytes | 236484526f73cb3d4b1c9cf147f622e732e80bed5701e62b0a0db108a828de6e |
spec/performance_spec.rb | 100644 | 0 | 0 | | | 9 KB | 608e6e16534353bcd1fd0bf6448aaf18f53c1c8d01f948a4a9d8d1c15ca1029e |
spec/pragmatic_tokenizer_spec.rb | 100644 | 0 | 0 | | | 1.66 KB | 1ed4df55af8ea23a58831aa2330bcf3067aa94be5fdbf75b06081426b6a22a89 |
spec/spec_helper.rb | 100644 | 0 | 0 | | | 89 Bytes | 9e5b2005435dca8e36fc6fd6759158319dfa2f13bc54967bdb1dcc73dd0109b3 |