From 455da06aa6459da0d25b286ca6cb866ff64c4c34 Mon Sep 17 00:00:00 2001
From: Christoph Helma
Date: Thu, 20 Jun 2019 22:01:50 +0200
Subject: separate csv serialisations for batch predictions and training data, repeated measurements in mutagenicity dataset fixed, daphnia import fixed, CENTRAL_MONGO_IP removed

---
 lib/download.rb | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

(limited to 'lib/download.rb')

diff --git a/lib/download.rb b/lib/download.rb
index f17d060..2546dc4 100644
--- a/lib/download.rb
+++ b/lib/download.rb
@@ -122,7 +122,6 @@ module OpenTox
     # Combine mutagenicity data from Kazius, Hansen and EFSA and download into the data folder
     def self.mutagenicity
       $logger.debug "Mutagenicity"
-      # TODO add download/conversion programs to lazar dependencies
       hansen_url = "http://doc.ml.tu-berlin.de/toxbenchmark/Mutagenicity_N6512.csv"
       kazius_url = "http://cheminformatics.org/datasets/bursi/cas_4337.zip"
       efsa_url = "https://data.europa.eu/euodp/data/storage/f/2017-07-19T142131/GENOTOX data and dictionary.xls"
@@ -185,7 +184,7 @@ module OpenTox
       map = {"mutagen" => "mutagenic", "nonmutagen" => "non-mutagenic"}
       dataset = Dataset.merge datasets: datasets, features: datasets.collect{|d| d.bioactivity_features.first}, value_maps: [nil,nil,map], keep_original_features: false, remove_duplicates: true
       dataset.merged_features.first.name = "Mutagenicity"
-      File.open(File.join(DATA,"Mutagenicity-Salmonella_typhimurium.csv"),"w+"){|f| f.puts dataset.to_csv}
+      File.open(File.join(DATA,"Mutagenicity-Salmonella_typhimurium.csv"),"w+"){|f| f.puts dataset.to_training_csv}
       meta = {
         :species => "Salmonella typhimurium",
         :endpoint => "Mutagenicity",
-- 
cgit v1.2.3