1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
|
require_relative 'include.rb'
# Merge the first-feature values of the mazzatorta and swiss datasets into
# combined.csv, tagging every value with the dataset(s) it was found in.
mazzatorta = Dataset.from_csv_file(File.join(DATA, "mazzatorta.csv"))
swiss = Dataset.from_csv_file(File.join(DATA, "swiss.csv"))

# Union (not intersection) of the compound ids of both datasets.
all_compound_ids = (mazzatorta.compound_ids + swiss.compound_ids).uniq

rows = []
all_compound_ids.each do |compound_id|
  compound = Compound.find(compound_id)
  mazzatorta_values = mazzatorta.values(compound, mazzatorta.features.first)
  swiss_values = swiss.values(compound, swiss.features.first)

  # Values present in both datasets are emitted once, labelled with both
  # sources; whatever remains is labelled with its single source.
  shared = mazzatorta_values & swiss_values
  labelled_values = {
    "mazzatorta, swiss" => shared,
    "mazzatorta" => mazzatorta_values - shared,
    "swiss" => swiss_values - shared
  }

  labelled_values.each do |label, values|
    values.each { |value| rows << [compound.smiles, value, label] }
  end
end

# Order the rows by the value column (index 1).
rows.sort! { |left, right| left[1] <=> right[1] }

# Write the header followed by one line per [smiles, value, dataset label] row.
CSV.open(File.join(DATA, "combined.csv"), "w+") do |csv|
  [["SMILES", "LOAEL", "Dataset"], *rows].each { |row| csv << row }
end
|