summary refs log tree commit diff
path: root/lib/fminer.rb
diff options
context:
space:
mode:
Diffstat (limited to 'lib/fminer.rb')
-rw-r--r-- lib/fminer.rb 12
1 files changed, 2 insertions, 10 deletions
diff --git a/lib/fminer.rb b/lib/fminer.rb
index 666cefa..37be183 100644
--- a/lib/fminer.rb
+++ b/lib/fminer.rb
@@ -186,16 +186,8 @@ module OpenTox
# @param [Integer] per-mil value
# return [Integer] min-frequency
def min_frequency(training_dataset,prediction_feature,per_mil)
- nr_labeled_cmpds = DataEntry.where(dataset_id: training_dataset.id, feature_id: prediction_feature.id).in(compound_id: training_dataset.compound_ids).count
- #nr_labeled_cmpds=0
- #f_idx=training_dataset.features.index prediction_feature
- #training_dataset.compounds.each_with_index { |cmpd, c_idx|
- #if ( training_dataset.data_entries[c_idx] )
- #unless training_dataset.data_entries[c_idx][f_idx].nil?
- #nr_labeled_cmpds += 1
- #end
- #end
- #}
+ i = training_dataset.feature_ids.index prediction_feature.id
+ nr_labeled_cmpds = training_dataset.data_entries.select{|de| !de[i].nil?}.size
minfreq = per_mil * nr_labeled_cmpds.to_f / 1000.0 # AM sugg. 8-10 per mil for BBRC, 50 per mil for LAST
minfreq = 2 unless minfreq > 2
Integer (minfreq)