From a29eb3e38414cd252850c9c4fb356f8b2bef6fb4 Mon Sep 17 00:00:00 2001 From: Christoph Helma Date: Fri, 12 Feb 2021 19:54:07 +0100 Subject: model.rb refactored, mp2d models updated --- lib/dataset.rb | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) (limited to 'lib/dataset.rb') diff --git a/lib/dataset.rb b/lib/dataset.rb index e30f000..f40f054 100644 --- a/lib/dataset.rb +++ b/lib/dataset.rb @@ -12,7 +12,7 @@ class Dataset @independent_variable_type = File.read(File.join(@dir,"independent_variable_type")).chomp @lines = File.readlines(file) @header = @lines.shift.split(",") - @header.first.match(/ID/i) ? @has_id = true : @has_id = false + @header.first.match(/ID|SMILES/i) ? @has_id = true : @has_id = false @dependent_variable_name = @header.pop @ids = [] @dependent_variables = [] @@ -43,6 +43,13 @@ class Dataset end @independent_variables = Matrix[ *@independent_variables ] columns = @independent_variables.column_vectors + stdev = columns.collect{|c| c.to_a.standard_deviation} + stdev.each_index.reverse_each do |i| + if stdev[i] == 0 + @independent_variable_names.delete_at(i) + columns.delete_at(i) + end + end @independent_variable_means = columns.collect{|c| c.to_a.mean} @independent_variable_standard_deviations = columns.collect{|c| c.to_a.standard_deviation} scaled_columns = [] -- cgit v1.2.3