Sha256: 0df6e97b68ad687e9a34cb495c4b80c2c437b0037b795fb702092197dde23bf7
Contents?: true
Size: 1.83 KB
Versions: 2
Compression:
Stored size: 1.83 KB
Contents
require File.dirname(__FILE__) + '/../spec_helper'

# Specs for the plain-text extractors.
#
# One example is generated per (extractor, file extension) pair. Each example
# searches the index for the sample content an extractor declares and checks
# that the sample file shows up among the matching documents. Two further
# examples cover language guessing on Document.
describe "PlainTextExtractors" do
  # Runs once before the whole group.
  # NOTE(review): presumably creates the index when it is missing -- confirm
  # against IndexReader.
  before(:all) do
    IndexReader.ensure_existence
  end

  PlainTextExtractor.each do |extractor|
    extractor.exts.each do |ext|
      example_name = "should be able to extract content from #{extractor.description} (.#{ext})"

      # Keep only the (content, file) samples whose file carries this extension.
      examples_for_ext = extractor.content_and_file_examples.select do |_content, file|
        File.ext_as_sym(file) == ext
      end

      if examples_for_ext.empty?
        # No sample is declared for this extension, so the example is registered
        # without a body and shows up as "Not yet implemented".
        # To implement it, add a line like the following to the corresponding
        # extractor in lib/extractors:
        #   which_should_for_example_extract 'some content', :from => 'a file you could add in spec/test_dirs/indexed/'
        it example_name
      else
        it example_name do
          examples_for_ext.each do |expected_content, expected_file|
            finder = Finder.new(expected_content)
            finder.execute!
            found_filenames = finder.matching_documents.map { |document| document.filename }
            found_filenames.should include(expected_file)
          end
        end
      end
    end
  end

  it "should guess language when enough content is available" do
    Document.new("spec/test_dirs/indexed/lang/goethe").lang.should == "de"
    Document.new("spec/test_dirs/indexed/lang/shakespeare").lang.should == "en"
    Document.new("spec/test_dirs/indexed/lang/lorca").lang.should == "es"
    Document.new("spec/test_dirs/indexed/lang/hugo").lang.should == "fr"
  end

  it "should not try to guess language when file is too small" do
    Document.new("spec/test_dirs/indexed/basic/hello.rb").lang.should be_empty
    Document.new("spec/test_dirs/indexed/README").lang.should be_empty
  end
end
Version data entries
2 entries across 2 versions & 1 rubygem
Version | Path |
---|---|
picolena-0.1.2 | lib/picolena/templates/spec/models/plain_text_extractor_spec.rb |
picolena-0.1.3 | lib/picolena/templates/spec/models/plain_text_extractor_spec.rb |