1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
|
require_relative "setup.rb"
class LazarExtendedTest < MiniTest::Test
def test_lazar_bbrc_ham_minfreq
skip
dataset = OpenTox::Dataset.from_csv_file File.join(DATA_DIR,"hamster_carcinogenicity.csv")
model = Model::LazarFminerClassification.create(dataset, :min_frequency => 5)
feature_dataset = Dataset.find model.neighbor_algorithm_parameters[:feature_dataset_id]
assert_equal dataset.compounds.size, feature_dataset.compounds.size
assert_equal model.feature_calculation_parameters, {"min_frequency"=>5}
#TODO check frequencies, features and confidence
#assert_equal 41, feature_dataset.features.size
#assert_equal 'N-C=N', feature_dataset.features.first.smarts
compound = OpenTox::Compound.from_inchi("InChI=1S/C6H6/c1-2-4-6-5-3-1/h1-6H")
prediction = model.predict compound
assert_equal "false", prediction[:value]
#assert_equal 0.12380952380952381, prediction[:confidence]
dataset.delete
model.delete
feature_dataset.delete
end
def test_lazar_bbrc_large_ds
skip
dataset = OpenTox::Dataset.from_csv_file File.join(DATA_DIR,"multi_cell_call_no_dup.csv")
model = Model::LazarFminerClassification.create dataset
feature_dataset = Dataset.find model.neighbor_algorithm_parameters[:feature_dataset_id]
model.save
p model.id
assert_equal dataset.compounds.size, feature_dataset.compounds.size
#assert_equal 52, feature_dataset.features.size
#assert_equal '[#17&A]-[#6&A]', feature_dataset.features.first.name
compound = OpenTox::Compound.from_inchi("InChI=1S/C10H9NO2S/c1-8-2-4-9(5-3-8)13-6-10(12)11-7-14/h2-5H,6H2,1H3")
prediction = model.predict compound
assert_equal "1", prediction[:value]
#p prediction
#prediction = prediction_dataset.data_entries.first
#assert_in_delta 0.025, prediction[:confidence], 0.001
#assert_equal 0.025885845574483608, prediction[:confidence]
# with compound change in training_dataset see:
# https://github.com/opentox/opentox-test/commit/0e78c9c59d087adbd4cc58bab60fb29cbe0c1da0
#assert_equal 0.02422364949075546, prediction[:confidence]
dataset.delete
model.delete
feature_dataset.delete
end
def test_lazar_fminer_kazius
skip
t = Time.now
dataset = Dataset.from_csv_file File.join(DATA_DIR,"kazius.csv")
p "Dataset upload: #{Time.now-t}"
t = Time.now
model = Model::LazarFminerClassification.create(dataset, :min_frequency => 100)
p "Feature mining: #{Time.now-t}"
t = Time.now
feature_dataset = Dataset.find model.neighbor_algorithm_parameters[:feature_dataset_id]
assert_equal feature_dataset.compounds.size, dataset.compounds.size
#model = Model::Lazar.find('55bcf5bf7a7838381200017e')
#p model.id
#prediction_times = []
2.times do
compound = Compound.from_smiles("Clc1ccccc1NN")
prediction = model.predict compound
p prediction
#assert_equal "1", prediction[:value]
#assert_in_delta 0.019858401199860445, prediction[:confidence], 0.001
end
#dataset.delete
#feature_dataset.delete
end
def test_lazar_kazius
t = Time.now
dataset = Dataset.from_csv_file File.join(DATA_DIR,"kazius.csv")
p "Dataset upload: #{Time.now-t}"
t = Time.now
model = Model::LazarClassification.create(dataset.features.first,dataset)
p "Feature mining: #{Time.now-t}"
t = Time.now
2.times do
compound = Compound.from_smiles("Clc1ccccc1NN")
prediction = model.predict compound
#p prediction
assert_equal "1", prediction[:value]
#assert_in_delta 0.019858401199860445, prediction[:confidence], 0.001
end
dataset.delete
end
end
|