summaryrefslogtreecommitdiff
path: root/lib/experiment.rb
blob: 985a491820a29f8ef5d86346b97ae7bcb68b27b3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
module OpenTox

  class Experiment
    field :dataset_ids, type: Array
    field :model_settings, type: Array, default: []
    field :results, type: Hash, default: {}
  end

  def run 
    dataset_ids.each do |dataset_id|
      dataset = Dataset.find(dataset_id)
      results[dataset_id.to_s] = []
      model_settings.each do |setting|
        model = Object.const_get(setting[:algorithm]).create dataset
        model.prediction_algorithm = setting[:prediction_algorithm] if setting[:prediction_algorithm]
        model.neighbor_algorithm = setting[:neighbor_algorithm] if setting[:neighbor_algorithm]
        model.neighbor_algorithm_parameters = setting[:neighbor_algorithm_parameter] if setting[:neighbor_algorithm_parameter]
        model.save
        repeated_crossvalidation = RepeatedCrossValidation.create model
        results[dataset_id.to_s] << {:model_id => model.id, :repeated_crossvalidation_id => repeated_crossvalidation.id}
      end
    end
    save
  end

  def self.create params
    experiment = self.new
    $logge.debug "Experiment started ..."
    #experiment.run params
    experiment
  end

  def report
    # TODO significances
    report = {}
    report[:name] = name
    report[:experiment_id] = self.id.to_s
    dataset_ids.each do |dataset_id|
      dataset_name = Dataset.find(dataset_id).name
      report[dataset_name] = []
      results[dataset_id.to_s].each do |result|
        model = Model::Lazar.find(result[:model_id])
        repeated_cv = RepeatedCrossValidation.find(result[:repeated_crossvalidation_id])
        crossvalidations = repeated_cv.crossvalidations
        summary = {}
        [:neighbor_algorithm, :neighbor_algorithm_parameters, :prediction_algorithm].each do |key|
          summary[key] = model[key]
        end
        summary[:nr_instances] = crossvalidations.first.nr_instances
        summary[:nr_unpredicted] = crossvalidations.collect{|cv| cv.nr_unpredicted}
        summary[:time] = crossvalidations.collect{|cv| cv.time}
        if crossvalidations.first.is_a? ClassificationCrossValidation
          summary[:accuracies] = crossvalidations.collect{|cv| cv.accuracy}
        elsif crossvalidations.first.is_a? RegressionCrossValidation
          summary[:r_squared] = crossvalidations.collect{|cv| cv.r_squared}
        end
        report[dataset_name] << summary
        #p repeated_cv.crossvalidations.collect{|cv| cv.accuracy}
        #file = "/tmp/#{id}.svg"
        #File.open(file,"w+"){|f| f.puts cv.correlation_plot}
        #`inkview '#{file}'`
      end
    end
    report
  end

end