Sha256: f1ba4e2df113de02d02645e3abdc0f9d66ebfdb2f93b75a8f178c0c482d7ca24
Contents?: true
Size: 1.41 KB
Versions: 6
Compression:
Stored size: 1.41 KB
Contents
#Powerpoint 97-2003 PlainTextExtractor.new { every :ppt, :pps as "application/powerpoint" aka "Microsoft Office Powerpoint document" with "catppt SOURCE" => :on_linux_and_mac_os, "some other command" => :on_windows which_should_for_example_extract 'unofficial written by OOo Impress', :from => 'one_page.ppt' #FIXME: it seems that catppt cannot open .pps files. #or_extract 'a lightweight ferret-powered search engine written in Ruby on rails.', :from => 'picolena.pps' } #Powerpoint 2007 require 'zip/zip' PlainTextExtractor.new { every :pptx as 'application/vnd.openxmlformats-officedocument.presentationml.presentation' #could that mime BE any longer? aka "Microsoft Office 2007 Powerpoint document" with {|source| Zip::ZipFile.open(source){|zipfile| slides=zipfile.entries.select{|l| l.name=~/^ppt\/slides\/slide\d+.xml/} slides.collect{|entry| zipfile.read(entry).split(/</).grep(/^a:t/).collect{|l| l.sub(/^[^>]+>/,'') } }.join("\n") } } which_should_for_example_extract 'Welcome to Picolena (one more time!)', :from => 'office2007-powerpoint.pptx' } ## Microsoft Powerpoint to text conversion: ## Program: catppt ## Version tested: Catdoc Version 0.94.2 ## Installation: Ubuntu catdoc package ## Home page: http://www.wagner.pp.ru/~vitus/software/catdoc/ ## MS OOXML powerpoint to text conversion: ## Ruby code written by Eric DUMINIL
Version data entries
6 entries across 6 versions & 1 rubygems