summaryrefslogtreecommitdiff
path: root/scripts/pa-fingerprints.rb
blob: 344ba864ca374c6d7a23936d84041c86fd9cb590 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
#!/usr/bin/env ruby
require_relative "../../lazar/lib/lazar.rb"
# Prints a CSV fingerprint matrix on stdout: first a header row taken from the
# training fingerprint file, then one row per compound listed in pa-smiles.csv
# holding the compound's SMILES followed by a 1/0 flag per training fragment.

# Only the first line (the header) of the training file is needed. It is read
# with plain Ruby instead of shelling out to `sed`, so the script needs no
# external tool and raises when the file is missing rather than silently
# continuing with an empty header. `to_s` keeps an empty file from failing.
header = File.open("data/mutagenicity-fingerprints.csv", &:gets).to_s.chomp.split(",")
header.pop # drop the last column (presumably the activity label -- TODO confirm)
puts header.join(",")
# Every header column after the first is treated as a fragment to look up.
training_fingerprints = header.drop(1)

pa_smiles_file = File.join("pyrrolizidine-alkaloids","lazar","pa-smiles.csv")
# drop(1) skips the first line of the input (assumed to be a header row).
File.readlines(pa_smiles_file).drop(1).each do |line|
  # The first field is not used; only the second (SMILES) field is.
  _id, smiles = line.chomp.split(",")
  c = Compound.new(smiles)
  row_label = c.smiles # the SMILES as reported by Compound, not the raw input field
  fp = c.fingerprint
  flags = training_fingerprints.map { |frag| fp.include?(frag) ? 1 : 0 }
  puts [row_label, *flags].join(",")
end