lib/attachment_to_html/adapters/rtf.rb
module AttachmentToHTML
module Adapters
# Convert application/rtf documents in to HTML
class RTF < Adapter
attr_reader :tmpdir
# Public: Initialize a RTF converter
#
# attachment - the FoiAttachment to convert to HTML
# opts - a Hash of options (default: {}):
# :tmpdir - String name of directory to store the
# converted document
def initialize(attachment, opts = {})
super
@tmpdir = opts.fetch(:tmpdir, ::Rails.root.join('tmp'))
end
# Public: Was the document conversion successful?
#
# Returns a Boolean
def success?
has_content? || contains_images?
end
private
def parse_body
match = convert.match(/<body[^>]*>(.*?)<\/body>/mi)
match ? match[1] : ''
end
def convert
# Get the attachment body outside of the chdir call as getting
# the body may require opening files too
text = attachment_body
@converted ||= Dir.chdir(tmpdir) do
tempfile = create_tempfile(text)
html = AlaveteliExternalCommand.run("unrtf", "--html",
tempfile.path, timeout: 120
)
cleanup_tempfile(tempfile)
sanitize_converted(html)
end
end
# Works around http://savannah.gnu.org/bugs/?42015 in unrtf ~> 0.21
def sanitize_converted(html)
html.nil? ? html = '' : html
invalid = %Q(<!DOCTYPE html PUBLIC -//W3C//DTD HTML 4.01 Transitional//EN>)
valid = %Q(<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN>")
html.sub!(invalid, valid) if html.include?(invalid)
html
end
end
end
end