summary | refs | log | tree | commit | diff
path: root/Makefile
diff options
context:
space:
mode:
Diffstat (limited to 'Makefile')
-rw-r--r-- Makefile 12
1 file changed, 4 insertions, 8 deletions
diff --git a/Makefile b/Makefile
index a73e178..7f1ec93 100644
--- a/Makefile
+++ b/Makefile
@@ -1,8 +1,4 @@
# TODO
-# efsa smiles errors (encodings?)
-# efsa script via csv
-# remove headers from csv files
-# add header at merged csv
# remove \u003e/00
# remove log messages in result
@@ -62,7 +58,7 @@ data/mutagenicity-merged.id: data/mutagenicity-merged.csv
scripts/import-csv.rb $< > $@
data/mutagenicity-merged.csv: $(data)
- echo "SMILES,Activity" > $@ && cat $(data) | sort -u | sed '/SMILES/d' >> $@
+ scripts/merge-mutagenicity.rb $(data) > $@
data/carcinogenicity.csv: data/aid1205.csv
scripts/carcinogenicity2csv.rb $< > $@
@@ -85,11 +81,11 @@ data/cas_4337.zip:
# efsa
-data/efsa.csv: data/GENOTOX_data_and_dictionary.csv
+data/efsa.csv: data/GENOTOX_data_and_dictionary.tsv
scripts/efsa2csv.rb $< > $@
-data/GENOTOX_data_and_dictionary.csv: data/GENOTOX_data_and_dictionary.xls
- xls2csv $< > $@
+data/GENOTOX_data_and_dictionary.tsv: data/GENOTOX_data_and_dictionary.xls
+ xls2csv -s cp1252 -d utf-8 -x -c " " $< > $@
data/GENOTOX_data_and_dictionary.xls:
cd data && wget "https://data.europa.eu/euodp/data/storage/f/2017-07-19T142131/GENOTOX%20data%20and%20dictionary.xls" -o $@