genome/dgi-db

View on GitHub
lib/genome/importers/chembl/chembl_tsv_importer.rb

Summary

Maintainability
A
1 hr
Test Coverage
module Genome
  module Importers
    module Chembl

      def self.source_info
        {
          site_url: 'https://www.ebi.ac.uk/chembl',
          base_url: 'https://www.ebi.ac.uk/chembldb/index.php/target/inspect/',
          citation: "Mendez,D., Gaulton,A., Bento,A.P., Chambers,J., De Veij,M., Félix,E., Magariños,M.P., Mosquera,J.F., Mutowo,P., Nowotka,M., et al. (2019) ChEMBL: towards direct deposition of bioassay data. Nucleic Acids Res., 47, D930–D940. PMID: 30398643",
          source_db_version: 'chembl_20',
          source_type_id: DataModel::SourceType.INTERACTION,
          source_db_name: 'ChEMBL',
          full_name: 'The ChEMBL Bioactivity Database',
          source_trust_level_id: DataModel::SourceTrustLevel.EXPERT_CURATED,
          license: 'Creative Commons Attribution-Share Alike 3.0 Unported License',
          license_link: 'https://chembl.gitbook.io/chembl-interface-documentation/about',
        }
      end

      def self.run(tsv_path)
        blank_filter = ->(x) { x.blank? || x == "''" || x == '""' }
        upcase = ->(x) {x.upcase}
        downcase = ->(x) {x.downcase}
        known = ->() {if :action_type.blank?
                        'unknown'
                      else
                        'known'
                      end
        }
        TSVImporter.import tsv_path, ChemblRow, source_info do
          interaction known_action_type: known, transform: downcase do
            drug :drug_chembl_id, nomenclature: 'ChEMBL Drug Identifier', primary_name: :drug_name, transform: upcase do
              name :drug_name, nomenclature: 'ChEMBL Drug Name', transform: upcase
            end
            gene :gene_chembl_id, nomenclature: 'ChEMBL Gene Identifier' do
              names :gene_symbol, nomenclature: 'ChEMBL Gene Symbol', unless: blank_filter
              names :uniprot_id, nomenclature: 'UniProt Accession', unless: blank_filter
              names :uniprot_name, nomenclature: 'UniProt Name', unless: blank_filter
              # target_ligand fields are ignored for now.
            end
            attribute :mechanism_of_action, name: 'Mechanism of Interaction', transform: downcase, unless: blank_filter
            attribute :direct_interaction, name: 'Direct Interaction', unless: blank_filter
            attributes :fda, name: 'FDA ID', unless: blank_filter
            attributes :pmid, name: 'PMID', unless: blank_filter
            attribute :action_type, name: 'Interaction Type', transform: downcase, unless: blank_filter
          end
        end.save!
        s = DataModel::Source.where(source_db_name: source_info['source_db_name'])
        s.interaction_claims.each do |ic|
          Genome::OnlineUpdater.new.create_interaction_claim_link(ic, 'Drug Mechanisms', "https://www.ebi.ac.uk/chembl/compound_report_card/#{ic.drug_claim.name}/#MechanismOfAction")
        end
      end
    end
  end
end