summaryrefslogtreecommitdiff
path: root/test/experiment.rb
blob: 4b54768318867e08ba3b50e5d63b88f93c03185b (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
require_relative "setup.rb"

# Integration tests for Experiment.
#
# Each test imports one or more CSV files from DATA_DIR as datasets, creates an
# Experiment from the dataset ids plus a list of model settings, and prints the
# experiment report. Two of the tests additionally verify the shape of
# `experiment.results`.
class ExperimentTest < Minitest::Test

  # One default LazarRegression model setting on two datasets: expects one
  # results entry per dataset, each holding exactly one result.
  def test_regression_experiment
    datasets = [
      "EPAFHM.medi.csv",
      #"EPAFHM.csv",
      #"FDA_v3b_Maximum_Recommended_Daily_Dose_mmol.csv",
      "LOAEL_mmol_corrected_smiles.csv"
    ]
    experiment = Experiment.create(
      :name => "Default regression for datasets #{datasets}.",
      :dataset_ids => dataset_ids(datasets),
      :model_settings => [
        {
          :algorithm => "OpenTox::Model::LazarRegression",
        }
      ]
    )
    # NOTE(review): the explicit run is disabled; presumably `report` executes
    # or collects the experiment itself -- confirm against Experiment#report.
    #experiment.run
    puts experiment.report.to_yaml
    assert_equal datasets.size, experiment.results.size
    assert_result_ids experiment.results, 1
  end

  # Two LazarClassification model settings (default, and with :min_sim => 0.3)
  # on one dataset: expects two results for the dataset.
  def test_classification_experiment
    datasets = [ "hamster_carcinogenicity.csv" ]
    experiment = Experiment.create(
      :name => "Fminer vs fingerprint classification for datasets #{datasets}.",
      :dataset_ids => dataset_ids(datasets),
      :model_settings => [
        {
          :algorithm => "OpenTox::Model::LazarClassification",
        },{
          :algorithm => "OpenTox::Model::LazarClassification",
          :neighbor_algorithm_parameter => {:min_sim => 0.3}
        },
        #{
          #:algorithm => "OpenTox::Model::LazarFminerClassification",
        #}
      ]
    )
    #experiment.run
    # To inspect a previously stored experiment instead of creating a new one:
    # experiment = Experiment.find "55f944a22b72ed7de2000000"
    puts experiment.report.to_yaml
    # Without this check an empty result set would pass vacuously, because the
    # remaining assertions only run inside the per-dataset loop.
    assert_equal datasets.size, experiment.results.size
    assert_result_ids experiment.results, 2
  end

  # Builds one LazarRegression model setting for every combination of
  # fingerprint type and minimum similarity, then runs the experiment.
  #
  # Smoke test only: it contains no assertions, so it fails only if creating,
  # running or reporting the experiment raises.
  def test_regression_fingerprints
    datasets = [
      "LOAEL_mmol_corrected_smiles.csv"
    ]
    min_sims = [0.3,0.7]
    types = ["FP2","FP3","FP4","MACCS"]
    experiment = Experiment.create(
      # The original name was copied from the classification test; this
      # experiment compares fingerprint settings for regression models.
      :name => "Fingerprint regression for datasets #{datasets}.",
      :dataset_ids => dataset_ids(datasets),
    )
    types.each do |type|
      min_sims.each do |min_sim|
        experiment.model_settings << {
          :algorithm => "OpenTox::Model::LazarRegression",
          :neighbor_algorithm => "fingerprint_neighbors",
          :neighbor_algorithm_parameter => {
            :type => type,
            :min_sim => min_sim,
          }
        }
      end
    end
    experiment.run
    p experiment.report
  end

  private

  # Imports each named CSV file from DATA_DIR and returns the ids of the
  # resulting datasets, in the same order as +files+.
  def dataset_ids(files)
    files.map { |file| Dataset.from_csv_file(File.join(DATA_DIR, file)).id }
  end

  # Asserts that every per-dataset entry in +results+ holds exactly
  # +expected_per_dataset+ results, and that each result carries BSON object
  # ids under :model_id and :repeated_crossvalidation_id.
  def assert_result_ids(results, expected_per_dataset)
    results.each do |_dataset_id, result|
      assert_equal expected_per_dataset, result.size
      result.each do |r|
        assert_kind_of BSON::ObjectId, r[:model_id]
        assert_kind_of BSON::ObjectId, r[:repeated_crossvalidation_id]
      end
    end
  end
end