require 'boilerpipe/version' require_relative 'boilerpipe-common-2.0-SNAPSHOT-jar-with-dependencies.jar' module Boilerpipe java_import 'com.kohlschutter.boilerpipe.extractors.ArticleExtractor' java_import 'com.kohlschutter.boilerpipe.util.UnicodeTokenizer' java_import java.net.URL class ArticleExtractor def self.get_text(s) url = nil begin url = Java::JavaNet::URL.new(s) rescue Java::JavaNet::MalformedURLException => e # not a URL end input = url ? url : s ArticleExtractor::INSTANCE.get_text(input) end class <