summaryrefslogtreecommitdiff
path: root/paper/loael.html
diff options
context:
space:
mode:
Diffstat (limited to 'paper/loael.html')
-rw-r--r--paper/loael.html433
1 files changed, 52 insertions, 381 deletions
diff --git a/paper/loael.html b/paper/loael.html
index c8c0a2d..95932e1 100644
--- a/paper/loael.html
+++ b/paper/loael.html
@@ -1,384 +1,55 @@
-<?xml version="1.0" encoding="utf-8" ?>
-<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
-<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
-<head>
-<meta http-equiv="Content-Type" content="text/html; charset=utf-8" />
-<meta name="generator" content="Docutils 0.12: http://docutils.sourceforge.net/" />
-<title></title>
-<style type="text/css">
-
-/*
-:Author: David Goodger (goodger@python.org)
-:Id: $Id: html4css1.css 7614 2013-02-21 15:55:51Z milde $
-:Copyright: This stylesheet has been placed in the public domain.
-
-Default cascading style sheet for the HTML output of Docutils.
-
-See http://docutils.sf.net/docs/howto/html-stylesheets.html for how to
-customize this style sheet.
-*/
-
-/* used to remove borders from tables and images */
-.borderless, table.borderless td, table.borderless th {
- border: 0 }
-
-table.borderless td, table.borderless th {
- /* Override padding for "table.docutils td" with "! important".
- The right padding separates the table cells. */
- padding: 0 0.5em 0 0 ! important }
-
-.first {
- /* Override more specific margin styles with "! important". */
- margin-top: 0 ! important }
-
-.last, .with-subtitle {
- margin-bottom: 0 ! important }
-
-.hidden {
- display: none }
-
-a.toc-backref {
- text-decoration: none ;
- color: black }
-
-blockquote.epigraph {
- margin: 2em 5em ; }
-
-dl.docutils dd {
- margin-bottom: 0.5em }
-
-object[type="image/svg+xml"], object[type="application/x-shockwave-flash"] {
- overflow: hidden;
-}
-
-/* Uncomment (and remove this text!) to get bold-faced definition list terms
-dl.docutils dt {
- font-weight: bold }
-*/
-
-div.abstract {
- margin: 2em 5em }
-
-div.abstract p.topic-title {
- font-weight: bold ;
- text-align: center }
-
-div.admonition, div.attention, div.caution, div.danger, div.error,
-div.hint, div.important, div.note, div.tip, div.warning {
- margin: 2em ;
- border: medium outset ;
- padding: 1em }
-
-div.admonition p.admonition-title, div.hint p.admonition-title,
-div.important p.admonition-title, div.note p.admonition-title,
-div.tip p.admonition-title {
- font-weight: bold ;
- font-family: sans-serif }
-
-div.attention p.admonition-title, div.caution p.admonition-title,
-div.danger p.admonition-title, div.error p.admonition-title,
-div.warning p.admonition-title, .code .error {
- color: red ;
- font-weight: bold ;
- font-family: sans-serif }
-
-/* Uncomment (and remove this text!) to get reduced vertical space in
- compound paragraphs.
-div.compound .compound-first, div.compound .compound-middle {
- margin-bottom: 0.5em }
-
-div.compound .compound-last, div.compound .compound-middle {
- margin-top: 0.5em }
-*/
-
-div.dedication {
- margin: 2em 5em ;
- text-align: center ;
- font-style: italic }
-
-div.dedication p.topic-title {
- font-weight: bold ;
- font-style: normal }
-
-div.figure {
- margin-left: 2em ;
- margin-right: 2em }
-
-div.footer, div.header {
- clear: both;
- font-size: smaller }
-
-div.line-block {
- display: block ;
- margin-top: 1em ;
- margin-bottom: 1em }
-
-div.line-block div.line-block {
- margin-top: 0 ;
- margin-bottom: 0 ;
- margin-left: 1.5em }
-
-div.sidebar {
- margin: 0 0 0.5em 1em ;
- border: medium outset ;
- padding: 1em ;
- background-color: #ffffee ;
- width: 40% ;
- float: right ;
- clear: right }
-
-div.sidebar p.rubric {
- font-family: sans-serif ;
- font-size: medium }
-
-div.system-messages {
- margin: 5em }
-
-div.system-messages h1 {
- color: red }
-
-div.system-message {
- border: medium outset ;
- padding: 1em }
-
-div.system-message p.system-message-title {
- color: red ;
- font-weight: bold }
-
-div.topic {
- margin: 2em }
-
-h1.section-subtitle, h2.section-subtitle, h3.section-subtitle,
-h4.section-subtitle, h5.section-subtitle, h6.section-subtitle {
- margin-top: 0.4em }
-
-h1.title {
- text-align: center }
-
-h2.subtitle {
- text-align: center }
-
-hr.docutils {
- width: 75% }
-
-img.align-left, .figure.align-left, object.align-left {
- clear: left ;
- float: left ;
- margin-right: 1em }
-
-img.align-right, .figure.align-right, object.align-right {
- clear: right ;
- float: right ;
- margin-left: 1em }
-
-img.align-center, .figure.align-center, object.align-center {
- display: block;
- margin-left: auto;
- margin-right: auto;
-}
-
-.align-left {
- text-align: left }
-
-.align-center {
- clear: both ;
- text-align: center }
-
-.align-right {
- text-align: right }
-
-/* reset inner alignment in figures */
-div.align-right {
- text-align: inherit }
-
-/* div.align-center * { */
-/* text-align: left } */
-
-ol.simple, ul.simple {
- margin-bottom: 1em }
-
-ol.arabic {
- list-style: decimal }
-
-ol.loweralpha {
- list-style: lower-alpha }
-
-ol.upperalpha {
- list-style: upper-alpha }
-
-ol.lowerroman {
- list-style: lower-roman }
-
-ol.upperroman {
- list-style: upper-roman }
-
-p.attribution {
- text-align: right ;
- margin-left: 50% }
-
-p.caption {
- font-style: italic }
-
-p.credits {
- font-style: italic ;
- font-size: smaller }
-
-p.label {
- white-space: nowrap }
-
-p.rubric {
- font-weight: bold ;
- font-size: larger ;
- color: maroon ;
- text-align: center }
-
-p.sidebar-title {
- font-family: sans-serif ;
- font-weight: bold ;
- font-size: larger }
-
-p.sidebar-subtitle {
- font-family: sans-serif ;
- font-weight: bold }
-
-p.topic-title {
- font-weight: bold }
-
-pre.address {
- margin-bottom: 0 ;
- margin-top: 0 ;
- font: inherit }
-
-pre.literal-block, pre.doctest-block, pre.math, pre.code {
- margin-left: 2em ;
- margin-right: 2em }
-
-pre.code .ln { color: grey; } /* line numbers */
-pre.code, code { background-color: #eeeeee }
-pre.code .comment, code .comment { color: #5C6576 }
-pre.code .keyword, code .keyword { color: #3B0D06; font-weight: bold }
-pre.code .literal.string, code .literal.string { color: #0C5404 }
-pre.code .name.builtin, code .name.builtin { color: #352B84 }
-pre.code .deleted, code .deleted { background-color: #DEB0A1}
-pre.code .inserted, code .inserted { background-color: #A3D289}
-
-span.classifier {
- font-family: sans-serif ;
- font-style: oblique }
-
-span.classifier-delimiter {
- font-family: sans-serif ;
- font-weight: bold }
-
-span.interpreted {
- font-family: sans-serif }
-
-span.option {
- white-space: nowrap }
-
-span.pre {
- white-space: pre }
-
-span.problematic {
- color: red }
-
-span.section-subtitle {
- /* font-size relative to parent (h1..h6 element) */
- font-size: 80% }
-
-table.citation {
- border-left: solid 1px gray;
- margin-left: 1px }
-
-table.docinfo {
- margin: 2em 4em }
-
-table.docutils {
- margin-top: 0.5em ;
- margin-bottom: 0.5em }
-
-table.footnote {
- border-left: solid 1px black;
- margin-left: 1px }
-
-table.docutils td, table.docutils th,
-table.docinfo td, table.docinfo th {
- padding-left: 0.5em ;
- padding-right: 0.5em ;
- vertical-align: top }
-
-table.docutils th.field-name, table.docinfo th.docinfo-name {
- font-weight: bold ;
- text-align: left ;
- white-space: nowrap ;
- padding-left: 0 }
-
-/* "booktabs" style (no vertical lines) */
-table.docutils.booktabs {
- border: 0px;
- border-top: 2px solid;
- border-bottom: 2px solid;
- border-collapse: collapse;
-}
-table.docutils.booktabs * {
- border: 0px;
-}
-table.docutils.booktabs th {
- border-bottom: thin solid;
- text-align: left;
-}
-
-h1 tt.docutils, h2 tt.docutils, h3 tt.docutils,
-h4 tt.docutils, h5 tt.docutils, h6 tt.docutils {
- font-size: 100% }
-
-ul.auto-toc {
- list-style-type: none }
-
-</style>
-</head>
-<body>
-<div class="document">
-
-
-<div class="section" id="introduction">
-<h1>Introduction</h1>
-</div>
-<div class="section" id="data">
-<h1>Data</h1>
-<div class="section" id="loael-values">
-<h2>LOAEL Values</h2>
-<div class="section" id="comparison-of-variances-in-datasets">
-<h3>Comparison of variances in datasets</h3>
+<p>================================================================================================================================ lazar read across models for lowest adverse effect levels: A comparison of experimental variability with read across predictions ================================================================================================================================</p>
+<p>Christoph Helma, David Vorgrimmler, Martin Guetlein, Denis Gebele, Elena Lo Piparo</p>
+<p>in silico toxicology gmbh, Rastatterstrasse 41, 4051 Basel, Switzerland</p>
+<h1 id="introduction">Introduction</h1>
+<p>The main objectives of this study are</p>
+<ul>
+<li>to investigate the experimental variability of LOAEL data</li>
+<li>to develop predictive models for lowest observed adverse effect levels</li>
+<li>to compare the performance of model predictions with experimental variability</li>
+</ul>
+<h1 id="methods">Methods</h1>
+<h2 id="data">Data</h2>
+<h3 id="mazzatorta-dataset">Mazzatorta dataset</h3>
+<h3 id="swiss-dataset">Swiss dataset</h3>
+<h3 id="preprocessing">Preprocessing</h3>
+<p>Missing and invalid SMILES: Unfortunately no identifier is complete across all compounds, therefore we focused on SMILES. Missing SMILES were generated from other identifiers when available.</p>
+<p>study type/ table rat_chron mouse_chron multigen missing SMILES 35 27 31 invalid SMILES 9 6 9 corrected SMILES 44 33 40 Detailed tables: https://docs.google.com/spreadsheets/d/14P8F-3iX5gr5FbN7oSeuwabUOr_xdDhhr5KwiUX6LXY/edit?usp=sharing</p>
+<h2 id="algorithms">Algorithms</h2>
+<p>For this study we are using the modular lazar (<em>la</em>zy <em>s</em>tructure <em>a</em>ctivity <em>r</em>elationships) framework (helma..) for model development and validation.</p>
+<p>lazar follows the following basic workflow: For a given chemical structure it searches in a database for similar structures (neighbors) with experimental data, builds a local (Q)SAR model with these neighbors and uses this model to predict the unknown activity of the query compound. This procedure resembles an automated version of <em>read across</em> predictions in toxicology; in machine learning terms it would be classified as a <em>k-nearest-neighbor</em> algorithm.</p>
+<p>Apart from this basic workflow lazar is completely modular and allows the researcher to use any algorithm for neighbor identification and local (Q)SAR modelling. Within this study we are using the following algorithms:</p>
+<h3 id="neighbor-identification">Neighbor identification</h3>
+<p>Similarity calculations are based on TODO fingerprints (Bender 2003) from the OpenBabel chemoinformatics library (TODO). The TODO fingerprint uses atom environments as molecular representation, which basically resemble the chemical concept of functional groups. For each atom in a molecule the atom types of connected atoms are recorded. The same procedure is repeated for connected atoms up to a given distance of chemical bonds. From this data a vector with atom type counts at a given distance from the central atom is constructed. These vectors are used to calculate chemical similarities.</p>
+<p>TODO: example???</p>
+<p>Similarities are expressed as Tanimoto index</p>
+<p>TODO: Jaccard index? TODO: formula TODO: similarity threshold</p>
+<p>Such a In machine learning</p>
+<p>The main advantage of TODO fingerprints in comparison to fingerprints with predefined substructures such as MACCS fingerprints (TODO) is that</p>
+<p>TODO; toxicological relevance</p>
+<p>Preliminary experiments have shown that predictions with TODO fingerprints are more accurate than predictions with fingerprints with predefined substructures (OpenBabel FP TODO), which is in agreement with findings in the literature (TODO cite).</p>
+<h3 id="local-qsar-models">Local (Q)SAR models</h3>
+<p>As soon as neighbors for a query compound have been identified, we can use their experimental LOAEL values to predict the activity of the untested compound. In this case we are using the weighted mean (TODO median?) of the neighbors' LOAEL values, where the contribution of each neighbor is weighted by its similarity to the query compound.</p>
+<h3 id="validation">Validation</h3>
+<h2 id="results">Results</h2>
+<h3 id="dataset-comparison">Dataset comparison</h3>
+<h4 id="structural-composition">Structural composition</h4>
+<h5 id="ches-mapper-analysis">Ches-Mapper analysis</h5>
+<h5 id="distribution-of-functional-groups">Distribution of functional groups</h5>
+<h4 id="loael-values">LOAEL values</h4>
+<h5 id="intra-dataset-variability">Intra dataset variability</h5>
<p>p-value: 0.4750771581019402</p>
-<object data="loael-variance.svg" type="image/svg+xml">
-loael-variance.svg</object>
-</div>
-<div class="section" id="comparison-of-compounds-in-both-datasets">
-<h3>Comparison of compounds in both datasets</h3>
-<object data="loael-dataset-comparison-mmol_kg_day.svg" type="image/svg+xml">
-loael-dataset-comparison-mmol_kg_day.svg</object>
-</div>
-<div class="section" id="correlation-between-datasets">
-<h3>Correlation between datasets</h3>
+<p>.. image:: loael-dataset-comparison-all-compounds.pdf</p>
+<h5 id="inter-dataset-variability">Inter dataset variability</h5>
+<p>.. image:: loael-dataset-comparison-common-compounds.pdf</p>
+<h5 id="loael-correlation-between-datasets">LOAEL correlation between datasets</h5>
<p>using means</p>
-<object data="loael-dataset-correlation.svg" type="image/svg+xml">
-loael-dataset-correlation.svg</object>
+<p>.. image:: loael-dataset-correlation.pdf</p>
<p>with &quot;identical&quot; values</p>
-<blockquote>
-r^2: 0.6106457754533314
-RMSE: 1.2228212261024438
-MAE: 0.801626064534318</blockquote>
-</div>
-</div>
-</div>
-<div class="section" id="models">
-<h1>Models</h1>
-</div>
-<div class="section" id="validation">
-<h1>Validation</h1>
-<p>Discussion</p>
-</div>
-</div>
-</body>
-</html>
+<p>r^2: 0.6106457754533314 RMSE: 1.2228212261024438 MAE: 0.801626064534318</p>
+<h3 id="read-across-predictions">Read across predictions</h3>
+<h2 id="discussion">Discussion</h2>
+<h3 id="chemical-similarity">Chemical similarity</h3>
+<h3 id="loael-variability">LOAEL variability</h3>
+<h3 id="predictive-performance">Predictive performance</h3>
+<h3 id="section"></h3>