sul-dlss/was_robot_suite

View on GitHub
lib/robots/dor_repo/was_crawl_dissemination/warc_extractor.rb

Summary

Maintainability
A
0 mins
Test Coverage
A
100%
# frozen_string_literal: true

module Robots
  module DorRepo
    module WasCrawlDissemination
      # Extracts WARC files from a WACZ file.
      class WarcExtractor < Base
        def initialize
          super('wasCrawlDisseminationWF', 'warc-extractor')
        end

        def perform_work
          Dor::WasCrawl::Dissemination::Utilities.wacz_file_location_info(druid) => {item_path:, file_list:}

          file_list.each { |filename| Dor::WasCrawl::WarcExtractorService.extract(item_path, filename) }
        end
      end
    end
  end
end