summaryrefslogtreecommitdiff
path: root/lib/feature.rb
blob: 9deb199db1d628bf13ddbedb6204af1822d6c31e (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
module OpenTox

  # Basic feature class
  class Feature
    field :name, as: :title, type: String
    field :nominal, type: Boolean
    field :numeric, type: Boolean
    field :measured, type: Boolean
  end

  # Feature for categorical variables
  class NominalFeature < Feature
    # TODO check if accept_values are still needed 
    field :accept_values, type: Array
    def initialize params
      super params
      nominal = true
    end
  end

  # Feature for quantitative variables
  class NumericFeature < Feature
    def initialize params
      super params
      numeric = true
    end
  end

  # Feature for SMARTS fragments
  class Smarts < NominalFeature
    field :smarts, type: String 
  end

  # Feature for supervised fragments from Fminer algorithm
  class FminerSmarts < Smarts
    field :p_value, type: Float
    # TODO check if effect is used
    field :effect, type: String
    field :dataset_id 
  end

  # Feature for database fingerprints
  # needs count for efficient retrieval (see compound.rb)
  class FingerprintSmarts < Smarts
    field :count, type: Integer
    def self.fingerprint
      @@fp4 ||= OpenTox::FingerprintSmarts.all
      unless @@fp4.size == 306
        @@fp4 = []
        # OpenBabel FP4 fingerprints
        # OpenBabel http://open-babel.readthedocs.org/en/latest/Fingerprints/intro.html
        # TODO investigate other types of fingerprints (MACCS)
        # OpenBabel http://open-babel.readthedocs.org/en/latest/Fingerprints/intro.html
        # http://www.dalkescientific.com/writings/diary/archive/2008/06/26/fingerprint_background.html
        # OpenBabel MNA http://openbabel.org/docs/dev/FileFormats/Multilevel_Neighborhoods_of_Atoms_(MNA).html#multilevel-neighborhoods-of-atoms-mna
        # Morgan ECFP, FCFP
        # http://cdk.github.io/cdk/1.5/docs/api/org/openscience/cdk/fingerprint/CircularFingerprinter.html
        # http://www.rdkit.org/docs/GettingStartedInPython.html
        # Chemfp
        # https://chemfp.readthedocs.org/en/latest/using-tools.html
        # CACTVS/PubChem

        File.open(File.join(File.dirname(__FILE__),"SMARTS_InteLigand.txt")).each do |l| 
          l.strip!
          unless l.empty? or l.match /^#/
            name,smarts = l.split(': ')
            @@fp4 << OpenTox::FingerprintSmarts.find_or_create_by(:name => name, :smarts => smarts) unless smarts.nil?
          end
        end
      end
      @@fp4
    end
  end

  # Feature for physico-chemical descriptors
  class PhysChemDescriptor < NumericFeature
    field :algorithm, type: String, default: "OpenTox::Algorithm::Descriptor.physchem"
    field :parameters, type: Hash
    field :creator, type: String
  end

  # Feature for categorical bioassay results
  class NominalBioAssay < NominalFeature
    # TODO: needed? move to dataset?
    field :description, type: String
  end

  # Feature for quantitative bioassay results
  class NumericBioAssay < NumericFeature
    # TODO: needed? move to dataset?
    field :description, type: String
  end

end