# lib/treat/workers/formatters/readers/doc.rb
# A wrapper for the 'antiword' command-line utility.
class Treat::Workers::Formatters::Readers::DOC
  # Extract the readable text from a DOC file
  # using the antiword command-line utility.
  #
  # The output of antiword is reflowed: each pair of consecutive
  # newlines is kept as-is, and every remaining single newline is
  # replaced by a space.
  #
  # Options: none.
  #
  # @param document an object responding to #file, #value= and #set
  # @param options [Hash] accepted for interface compatibility; unused
  # @return the same document, with its value set to the extracted
  #   text and its :format set to 'doc'
  def self.read(document, options = {})
    # Pass the path as a separate argv entry instead of interpolating
    # it into a shell command line, so spaces and shell metacharacters
    # in the file name are handled literally and cannot inject commands.
    raw = IO.popen(['antiword', document.file.to_s], &:read)

    # Single left-to-right pass: the regexp prefers a pair of newlines
    # and falls back to a lone one. Pairs are preserved, lone newlines
    # become spaces. No placeholder token is used, so text that happens
    # to contain a sentinel-like string is left untouched.
    text = raw.gsub(/\n\n?/) { |newlines| newlines.length == 2 ? newlines : ' ' }

    document.value = text
    document.set :format, 'doc'
    document
  end
end