summaryrefslogtreecommitdiff
path: root/test/fminer.rb
blob: 16e1f9e1e2f87f6fe7660d8222a1789fc02112d7 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
require_relative "setup.rb"

# Tests for the OpenTox::Algorithm::Fminer feature miners, driven by the
# hamster_carcinogenicity.csv fixture found in DATA_DIR.
#
# Every test removes the datasets it created from an `ensure` clause, so a
# failing assertion does not leave them behind for later runs.
class FminerTest < MiniTest::Test

  # Mines features with Fminer.bbrc and checks that
  # * the feature dataset has as many compounds as the input dataset,
  # * every mined feature has a p_value that, rounded to two decimals, is
  #   at least 0.95,
  # * each row of data_entries equals the row Descriptor.smarts_match
  #   computes for the same compounds and features.
  def test_fminer_bbrc
    dataset = OpenTox::Dataset.from_csv_file File.join(DATA_DIR, "hamster_carcinogenicity.csv")
    refute_nil dataset.id
    feature_dataset = OpenTox::Algorithm::Fminer.bbrc dataset
    # Look the result up again by id so the assertions below run against
    # whatever `find` returns rather than the object handed back by bbrc.
    feature_dataset = OpenTox::Dataset.find feature_dataset.id
    assert_equal dataset.compounds.size, feature_dataset.compounds.size
    # TODO: fminer calculates 62 instead of 54 features.
    # It is unclear which commit changed the numbers (this also occurs with
    # the old libraries/mongodb branch). Modifying Compound to use smiles
    # instead of inchis seems to have no effect.
    #assert_equal 54, feature_dataset.features.size
    #assert_equal "C-C-C=C", feature_dataset.features.first.smarts
    compounds = feature_dataset.compounds
    smarts = feature_dataset.features
    smarts.each do |smart|
      # assert_operator reports both operands when the check fails.
      assert_operator smart.p_value.round(2), :>=, 0.95
    end
    match = OpenTox::Algorithm::Descriptor.smarts_match compounds, smarts
    feature_dataset.data_entries.each_with_index do |fingerprint, i|
      assert_equal match[i], fingerprint
    end
  ensure
    # Either local is still nil if the test failed before assigning it.
    dataset.delete if dataset
    feature_dataset.delete if feature_dataset
  end

  # Currently skipped ("last features have to be activated"). When enabled,
  # it mines features with Fminer.last and checks the compound count, the
  # expected 21 features, the first feature's SMARTS string, and that every
  # data_entries cell (converted with to_i) equals the corresponding
  # Descriptor.smarts_match cell.
  def test_fminer_last
    skip "last features have to be activated"
    dataset = OpenTox::Dataset.new
    dataset.upload File.join(DATA_DIR, "hamster_carcinogenicity.csv")
    feature_dataset = OpenTox::Algorithm::Fminer.last :dataset => dataset
    assert_equal dataset.compounds.size, feature_dataset.compounds.size
    assert_equal 21, feature_dataset.features.size
    assert_equal '[#6&A]-[#6&a]:[#6&a]:[#6&a]:[#6&a]:[#6&a]', feature_dataset.features.first.smarts

    compounds = feature_dataset.compounds
    smarts = feature_dataset.features.map(&:smarts)
    match = OpenTox::Algorithm::Descriptor.smarts_match compounds, smarts
    compounds.each_with_index do |_compound, i|
      smarts.each_with_index do |_smart, j|
        assert_equal match[i][j], feature_dataset.data_entries[i][j].to_i
      end
    end
  ensure
    # While the test is skipped both locals are nil and nothing is deleted.
    dataset.delete if dataset
    feature_dataset.delete if feature_dataset
  end

end