genome/dgi-db

View on GitHub
lib/genome/importers/cancer_commons/cancer_commons_tsv_importer.rb

Summary

Maintainability
A
20 mins
Test Coverage
module Genome
  module Importers
    module CancerCommons

      def self.source_info
        {
          base_url: 'http://www.cancercommons.org/researchers-clinicians/',
          site_url: 'http://www.cancercommons.org/',
          citation: 'Cancer Commons: Biomedicine in the Internet Age. Shrager J, Tenenbaum JM, and Travers M. Collaborative Computational Technologies for Biomedical Research, (Sean Elkins, Maggie Hupcey, and Antony Williams Eds). Wiley, 2010.',
          source_db_version: '25-Jul-2013',
          source_type_id: DataModel::SourceType.INTERACTION,
          source_trust_level_id: DataModel::SourceTrustLevel.EXPERT_CURATED,
          source_db_name: 'CancerCommons',
          full_name: 'Cancer Commons',
          license: 'Custom non-commercial',
          license_link: 'https://www.cancercommons.org/terms-of-use/',
        }
      end

      def self.run(tsv_path)
        TSVImporter.import tsv_path, CancerCommonsRow, source_info do
          interaction known_action_type: 'unknown' do
            gene :primary_gene_name, nomenclature: 'Gene Target Symbol', transform: ->(x) { x.upcase } do
              name :entrez_gene_id, nomenclature: 'Entrez Gene ID'
              attribute :reported_gene_names, name: 'CancerCommons Reported Gene Name'
            end

            drug :primary_drug_name, nomenclature: 'Primary Drug Name', primary_name: :primary_drug_name do
              attribute :drug_class, name: 'Drug Class' 
              name :pubchem_drug_name, nomenclature: 'PubChem Drug Name'
              name :pubchem_drug_id, nomenclature: 'PubChem Drug ID'
              attribute :source_reported_drug_name, name: 'Source Reported Drug Name(s)'
              name :drug_trade_name, nomenclature: 'Drug Trade Name'
              name :drug_development_name, nomenclature: 'Drug Development Name'
              attribute :pharmaceutical_developer, name: 'Pharmaceutical Developer'
            end

            attribute :interaction_type, name: 'Interaction Type'
            attribute :cancer_type, name: 'Reported Cancer Type'
          end
        end.save!
        s = DataModel::Source.find_by(source_db_name: source_info['source_db_name'])
        s.interaction_claims.each do |ic|
          Genome::OnlineUpdater.new.create_interaction_claim_link(ic, 'Source TSV', File.join('data', 'source_tsvs', 'CancerCommons_INTERACTIONS.tsv'))
        end
      end
    end
  end
end