<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE QMRF SYSTEM "/WEB-INF/xslt/qmrf.dtd">
<QMRF author="Joint Research Centre, European Commission" contact="Joint Research Centre, European Commission" date="July 2007" email="qsardb@jrc.it" name="(Q)SAR Model Reporting Format" schema_version="0.9" url="http://ecb.jrc.ec.europa.eu/qsar/" version="1.2">
<QMRF_chapters>
<QSAR_identifier chapter="1" help="" name="QSAR identifier">
<QSAR_title chapter="1.1" help="" name="QSAR identifier (title)">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Nonlinear QSAR: artificial neural network for dermal irritation&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</QSAR_title>
<QSAR_models chapter="1.2" help="" name="Other related models">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    http://reachqsar.com/&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</QSAR_models>
<QSAR_software chapter="1.3" help="" name="Software coding the model">
			
      









<software_ref idref="firstsoftware" catalog="software_catalog"/>
<software_ref idref="software_catalog_4" catalog="software_catalog"/>
</QSAR_software>
</QSAR_identifier>
<QSAR_General_information chapter="2" help="" name="General information">
<qmrf_date chapter="2.1" help="" name="Date of QMRF">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      10.10.2010&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</qmrf_date>
<qmrf_authors chapter="2.2" help="" name="QMRF author(s) and contact details">
		
      

























































<author_ref idref="firstauthor" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_3" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_4" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_5" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_6" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_7" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_8" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_9" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_10" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_11" catalog="authors_catalog"/>
<author_ref idref="authors_catalog_12" catalog="authors_catalog"/>
</qmrf_authors>
<qmrf_date_revision chapter="2.3" help="" name="Date of QMRF update(s)">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</qmrf_date_revision>
<qmrf_revision chapter="2.4" help="" name="QMRF update(s)">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
&#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      &#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</qmrf_revision>
<model_authors chapter="2.5" help="" name="Model developer(s) and contact details">
		
      







<author_ref idref="modelauthor" catalog="authors_catalog"/>
</model_authors>
<model_date chapter="2.6" help="" name="Date of model development and/or publication">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      12.04.2010&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</model_date>
<references chapter="2.7" help="" name="Reference(s) to main scientific papers and/or software package">

      


























<publication_ref idref="publications_catalog_2" number="" catalog="publications_catalog"/>
<publication_ref idref="publications_catalog_3" number="" catalog="publications_catalog"/>
<publication_ref idref="publications_catalog_4" number="" catalog="publications_catalog"/>
</references>
<info_availability chapter="2.8" help="" name="Availability of information about the model">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Selection, training and test sets are available. Model algorithm is &#13;
      available (snn file).&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</info_availability>
<related_models chapter="2.9" help="" name="Availability of another QMRF for exactly the same model">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      None to date.&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</related_models>
</QSAR_General_information>
<QSAR_Endpoint chapter="3" help="" name="Defining the endpoint - OECD Principle 1">
<model_species chapter="3.1" help="" name="Species">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Rabbit&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</model_species>
<model_endpoint chapter="3.2" help="" name="Endpoint">

      







<endpoint_ref idref="endpoints_catalog_4" catalog="endpoints_catalog"/>
</model_endpoint>
<endpoint_comments chapter="3.3" help="" name="Comment on endpoint">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Dermal irritation is the production of reversible inflammatory changes &#13;
      in irritation skin following the application of a substance. The skin &#13;
      irritation potential is described by the Primary Irritation Index (PII), &#13;
      calculated from erythema and oedema grades based on experimental &#13;
      rabbits. The maximum PII is 8 and the minimum is 0. The grading scale &#13;
      for irritant effects on rabbit skin were originally proposed by Draize &#13;
      and adopted by the OECD (Test Guideline 404) and the US and EU &#13;
      regulatory agencies [ref 1, sect 9.2].&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      The PII can be calculated as:&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      PII = [SUM(Erythema 24/48/72 h)+SUM(Oedema24/48/72 h)] (3 x no. animals) &#13;
      where Erythema is redness of skin produced by vascular congestion or &#13;
      increased perfusion And Oedema is the presence of abnormally large &#13;
      amounts of fluid in the intercellular tissue spaces of the epidermis, &#13;
      dermis or subcutaneous tissues.&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</endpoint_comments>
<endpoint_units chapter="3.4" help="" name="Endpoint units">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</endpoint_units>
<endpoint_variable chapter="3.5" help="" name="Dependent variable">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Primary Irritation Index (PII)&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</endpoint_variable>
<endpoint_protocol chapter="3.6" help="" name="Experimental protocol">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      All 286 data used in this report were obtained from in vivo rabbit skin &#13;
      irritation test that were used to assess the potential of materials to &#13;
      cause skin irritancy or corrosion in man, and to meet regulatory &#13;
      requirements which require classification and appropriate labeling of a &#13;
      material if it is believed to be potential irritant or corrosive. All &#13;
      chemicals were tested applying a volume or weight of 0.5ml or 0.5g &#13;
      undiluted, except where an alternative weight or concentration was &#13;
      needed. Exposure time for each test was 4 hours [ref 1, sect 9.2].&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</endpoint_protocol>
<endpoint_data_quality chapter="3.7" help="" name="Endpoint data quality and variability">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      The 286 chemicals selected were readily available at high and consistent &#13;
      purity and are expected to be stable on storage. They have been tested &#13;
      undiluted in in vivo studies, excepting those chemical where high &#13;
      concentrations of the substance could be expected to cause sever &#13;
      effects. The invivo data were generated in 1981 in studies carried out &#13;
      according to OECD Test Guideline 404 and following the principles of &#13;
      Good Laboratory Practice. The data presented were obtained from tests &#13;
      normally using at least three rabbits involving application of 0.5 ml &#13;
      (or 0.5g) to the flank under semi-occlusive patches and in which &#13;
      observations were made at least 24, 48 and 72 hours [ref 1, sect 9.2].&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</endpoint_data_quality>
</QSAR_Endpoint>
<QSAR_Algorithm chapter="4" help="" name="Defining the algorithm - OECD Principle 2">
<algorithm_type chapter="4.1" help="" name="Type of model">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Neural network&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</algorithm_type>
<algorithm_explicit chapter="4.2" help="" name="Explicit algorithm">
<algorithm_ref idref="algorithms_catalog_6" catalog="algorithms_catalog"/>
<equation>&lt;html&gt;&#13;
  &lt;head&gt;&#13;
&#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      The algorithm is based on regression neural network predictor with &#13;
      structure 9-8-6-1.&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</equation>
</algorithm_explicit>
<algorithms_descriptors chapter="4.3" help="" name="Descriptors in the model">
      
      









































































<descriptor_ref idref="descriptors_catalog_35" catalog="descriptors_catalog"/>
<descriptor_ref idref="descriptors_catalog_36" catalog="descriptors_catalog"/>
<descriptor_ref idref="descriptors_catalog_37" catalog="descriptors_catalog"/>
<descriptor_ref idref="descriptors_catalog_38" catalog="descriptors_catalog"/>
<descriptor_ref idref="descriptors_catalog_39" catalog="descriptors_catalog"/>
<descriptor_ref idref="descriptors_catalog_40" catalog="descriptors_catalog"/>
<descriptor_ref idref="descriptors_catalog_41" catalog="descriptors_catalog"/>
<descriptor_ref idref="descriptors_catalog_42" catalog="descriptors_catalog"/>
<descriptor_ref idref="descriptors_catalog_43" catalog="descriptors_catalog"/>
</algorithms_descriptors>
<descriptors_selection chapter="4.4" help="" name="Descriptor selection">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Initial pool of ~1000 descriptors. Stepwise descriptor selection based &#13;
      on a set of statistical selection rules as F statistic and p. The first &#13;
      highest F (low p) descriptors (9) were selected from the whole set of &#13;
      descriptors. These 9 descriptors were used as inputs to the network. 29 &#13;
      networks with different structures were tested in order to find the best &#13;
      ANN with lowest RMS (root-mean-squared error) and highest correct &#13;
      predictions (for training, selection and test sets). Then 245 epochs &#13;
      were used to train the final network with architecture depicted in 4.2. &#13;
      Optimization of the weights was performed with Levenberg-Marquardt &#13;
      algorithm encoded in the backpropagation scheme using linear and &#13;
      hyperbolic activation functions.&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</descriptors_selection>
<descriptors_generation chapter="4.5" help="" name="Algorithm and descriptor generation">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      All descriptors were generated using QSARModel on structure optimized by &#13;
      AM1 semiempirical quantum mechanical model. The final structure were &#13;
      optimized by mopac6 implemented in QSARModel. Keywords used for &#13;
      opyimizations were: AM1 EF GNORM=0.05 BONDS PI POLAR ENPART NOINTER &#13;
      PRECISE. The final descriptors were selected as denoted in 4.4 as well &#13;
      as descriptors with small variances less than 10 e-&lt;sup&gt;5&lt;/sup&gt; were &#13;
      discarded from the total pool.&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</descriptors_generation>
<descriptors_generation_software chapter="4.6" help="" name="Software name and version for descriptor generation" options="">
				
      







<software_ref idref="software_catalog_2" catalog="software_catalog"/>
</descriptors_generation_software>
<descriptors_chemicals_ratio chapter="4.7" help="" name="Chemicals/Descriptors ratio">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      16.2 ( 146 chemicals / 9 descriptors)&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</descriptors_chemicals_ratio>
</QSAR_Algorithm>
<QSAR_Applicability_domain chapter="5" help="" name="Defining the applicability domain - OECD Principle 3">
<app_domain_description chapter="5.1" help="" name="Description of the applicability domain of the model">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Applicability domain based on training set:&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      By descriptor value range (between min and max values): The model is &#13;
      suitable for compounds that have the descriptors in the following range &#13;
      augmented with the confidence in 5.2:&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Desc ID&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      See 4.3: 1 2 3 4 5 6 7 8 9&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Min: 0.000 0.000 0.000 4.588 0.000 0.000 0.000 -243.84 1.705&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Max: 4.000 92.304 0.209 27.639 4.000 6.156 6.000 952.967 140.451&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</app_domain_description>
<app_domain_method chapter="5.2" help="" name="Method used to assess the applicability domain">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Presence of functional groups in structures (ethers, esters, amides, &#13;
      halides, aromatic, aliphatic functional groups etc)&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Range of descriptor values in training set with &amp;#177;30% confidence&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Descriptor values must fall between maximal and minimal descriptor &#13;
      values (see5.1) of training set &amp;#177;30%.&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</app_domain_method>
<app_domain_software chapter="5.3" help="" name="Software name and version for applicability domain assessment">

      







<software_ref idref="software_catalog_3" catalog="software_catalog"/>
</app_domain_software>
<applicability_limits chapter="5.4" help="" name="Limits of applicability">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      See 5.1, 5.2&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</applicability_limits>
</QSAR_Applicability_domain>
<QSAR_Robustness chapter="6" help="" name="Internal validation - OECD Principle 4">
<training_set_availability answer="Yes" chapter="6.1" help="" name="Availability of the training set"/>
<training_set_data cas="Yes" chapter="6.2" chemname="Yes" formula="No" help="" inchi="No" mol="Yes" name="Available information for the training set" smiles="No"/>
<training_set_descriptors answer="All" chapter="6.3" help="" name="Data for each descriptor variable for the training set"/>
<dependent_var_availability answer="All" chapter="6.4" help="" name="Data for the dependent variable for the training set"/>
<other_info chapter="6.5" help="" name="Other information about the training set">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Data points: 146&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</other_info>
<preprocessing chapter="6.6" help="" name="Pre-processing of data before modelling">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Standardization and normalization of the inputs by taking into account &#13;
      the mean and standard deviation&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</preprocessing>
<goodness_of_fit chapter="6.7" help="" name="Statistics for goodness-of-fit">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Training PII; Selection PII; Test PII&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Data Mean: 2.348; 3.129; 2.417&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Data SD: 2.040; 2.512; 1.610&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Error Mean: -0.019; -0.009; -0.222&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Error SD: 1.185; 2.781; 1.390&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Abs E. Mean: 0.845; 1.903; 1.112&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      S.D. Ratio: 0.581; 1.107; 0.864&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Correlation: 0.814; 0.628; 0.590&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</goodness_of_fit>
<loo chapter="6.8" help="" name="Robustness - Statistics obtained by leave-one-out cross-validation">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    See 6.7&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</loo>
<lmo chapter="6.9" help="" name="Robustness - Statistics obtained by leave-many-out cross-validation">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
&#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      &#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</lmo>
<yscrambling chapter="6.10" help="" name="Robustness - Statistics obtained by Y-scrambling"/>
<bootstrap chapter="6.11" help="" name="Robustness - Statistics obtained by bootstrap">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
&#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      &#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</bootstrap>
<other_statistics chapter="6.12" help="" name="Robustness - Statistics obtained by other methods">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      RMS(Training)=0.14814; RMS (Selection)=0.347624; RMS(Test)=0.176003&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      In this ANN 2 sets of randomly chosen (20) data to test the network &amp;#8211; &#13;
      selection set and test set, See also 6.7&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</other_statistics>
</QSAR_Robustness>
<QSAR_Predictivity chapter="7" help="" name="External validation - OECD Principle 4">
<validation_set_availability answer="Yes" chapter="7.1" help="" name="Availability of the external validation set"/>
<validation_set_data cas="Yes" chapter="7.2" chemname="Yes" formula="No" help="" inchi="No" mol="Yes" name="Available information for the external validation set" smiles="No"/>
<validation_set_descriptors answer="All" chapter="7.3" help="" name="Data for each descriptor variable for the external validation set"/>
<validation_dependent_var_availability answer="All" chapter="7.4" help="" name="Data for the dependent variable for the external validation set"/>
<validation_other_info chapter="7.5" help="" name="Other information about the external validation set">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      The method used two validation sets: selection (20) and test (20)&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</validation_other_info>
<experimental_design chapter="7.6" help="" name="Experimental design of test set">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Randomly selected 20 selection and 20 test data points&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</experimental_design>
<validation_predictivity chapter="7.7" help="" name="Predictivity - Statistics obtained by external validation">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      See 6.7 and 6.12&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</validation_predictivity>
<validation_assessment chapter="7.8" help="" name="Predictivity - Assessment of the external validation set">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      The descriptors for the test set are in the limit of applicability, see &#13;
      6.7 and 6.12. We have limited ourselves to select two auxiliary sets to &#13;
      train the network and to test it externally on the test set. Thus more &#13;
      than 1.5 of the datapoints were selected for these two sets divided by &#13;
      2. One of the main purposes of the ANN model also to be applicable for &#13;
      diverse compounds for future predictions, thus we wtried to keep the &#13;
      training set as large as possible and to select the validation and test &#13;
      sets with significant data points.&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</validation_assessment>
<validation_comments chapter="7.9" help="" name="Comments on the external validation of the model">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Overall predictions for the selection set (used to stop the ANN training &#13;
      and not to overfit it) and the test set (used to test the external &#13;
      prediction of the net after training) are significant according to the &#13;
      RMS error and the standard deviation ratio (S.D.Ratio); see 6.7 and 6.12.&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</validation_comments>
</QSAR_Predictivity>
<QSAR_Interpretation chapter="8" help="" name="Providing a mechanistic interpretation - OECD Principle 5">
<mechanistic_basis chapter="8.1" help="" name="Mechanistic basis of the model">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      The complex nature of the ANN model does not allow direct interpretation &#13;
      of the descriptors in relation to the modelled property. However, it can &#13;
      be noted that descriptors related to the hydrogen bonding ability and &#13;
      the charged surface areas of the molecules are mainly present. The &#13;
      reactivity of the compounds with the epidermis depends also on charged &#13;
      surface areas of the compounds (which are the most reactive sides). &#13;
      Several authors have confirmed the reactivity related with the charged &#13;
      surfaces and also the LUMO and HOMO descriptors [ref 2,3; sect 9.2]. It &#13;
      can be roughly estimated that the PII increases with increasing (slight &#13;
      negative correlation between the descriptors) count of H-acceptor sites &#13;
      (AM1), HBCA H-bonding charged surface area (AM1), and FHACA Fractional &#13;
      HACA (HACA/TMSA) (AM1).&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</mechanistic_basis>
<mechanistic_basis_comments chapter="8.2" help="" name="A priori or a posteriori mechanistic interpretation">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</mechanistic_basis_comments>
<mechanistic_basis_info chapter="8.3" help="" name="Other information about the mechanistic interpretation">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
&#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      &#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</mechanistic_basis_info>
</QSAR_Interpretation>
<QSAR_Miscelaneous chapter="9" help="" name="Miscellaneous information">
<comments chapter="9.1" help="" name="Comments">&lt;html&gt;&#13;
  &lt;head&gt;&#13;
    &#13;
  &lt;/head&gt;&#13;
  &lt;body&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      Supporting information for: training set(s), selection set(s), test &#13;
      set(s).&#13;
    &lt;/p&gt;&#13;
    &lt;p style="margin-top: 0"&gt;&#13;
      The 9-8-6-1.snn file includes the ANN model;  the user must have &#13;
      Statistica 7 or higher with ANN modules to make predictions.&#13;
    &lt;/p&gt;&#13;
  &lt;/body&gt;&#13;
&lt;/html&gt;&#13;
</comments>
<bibliography chapter="9.2" help="" name="Bibliography">
				
      
























<publication_ref idref="publications_catalog_14" number="" catalog="publications_catalog"/>
<publication_ref idref="publications_catalog_15" number="" catalog="publications_catalog"/>
<publication_ref idref="publications_catalog_16" number="" catalog="publications_catalog"/>
</bibliography>
<attachments chapter="9.3" name="Supporting information" help="">
<attachment_training_data>
<molecules description="Dermal_Irritation_PII_training_ 146.sdf" filetype="sdf" url="http://qsardb.jrc.it:80/qmrf/download_attachment.jsp?name=qmrf332_Dermal_Irritation_PII_training_ 146.sdf"/>
</attachment_training_data>
<attachment_validation_data>
<molecules description="Dermal_Irritation_PII_selection_20.sdf" filetype="sdf" url="http://qsardb.jrc.it:80/qmrf/download_attachment.jsp?name=qmrf332_Dermal_Irritation_PII_selection_20.sdf"/>
<molecules description="Dermal_Irritation_PII_test_20.sdf" filetype="sdf" url="http://qsardb.jrc.it:80/qmrf/download_attachment.jsp?name=qmrf332_Dermal_Irritation_PII_test_20.sdf"/>
</attachment_validation_data>
<attachment_documents>
<document description="9-8-6-1.snn" filetype="snn" url="http://qsardb.jrc.it:80/qmrf/download_attachment.jsp?name=qmrf332_9-8-6-1.snn"/>
</attachment_documents>
</attachments>
</QSAR_Miscelaneous>
<QMRF_Summary chapter="10" help="" name="Summary (JRC Inventory)">
<QMRF_number chapter="10.1" help="" name="QMRF number">Q17-22-1-332</QMRF_number>
<date_publication chapter="10.2" help="" name="Publication date">2011/12/19</date_publication>
<keywords chapter="10.3" name="Keywords" help="">skin irritation, PII, Draize, Molcode</keywords>
<summary_comments chapter="10.4" name="Comments" help="">To be entered by JRC</summary_comments>
</QMRF_Summary>
</QMRF_chapters>
<Catalogs>
<software_catalog>
<software contact="Turu 2, Tartu, 51014, Estonia" description="" id="firstsoftware" name="QSARModel 3.3.8" number="" url="http://www.molcode.com"/>
<software contact="" description="" id="software_catalog_2" name="QSARModel 3.3.8 " number="" url="http://www.molcode.com"/>
<software contact="" description="" id="software_catalog_3" name="QSARModel 3.3.8 " number="" url="http://www.molcode.com"/>
<software contact="StatSoft Ltd." description=" " id="software_catalog_4" name="Statistica 7" number="" url="http://www.statsoft.com/"/>
</software_catalog>
<algorithms_catalog>
<algorithm definition="Neural network" description="Nonlinear QSAR: backpropagation Neural Network (Multilayer Perceptron) regression" id="algorithms_catalog_6" publication_ref=""/>
</algorithms_catalog>
<descriptors_catalog>
<descriptor description="" id="descriptors_catalog_35" name="count of H-acceptor sites (AM1) " publication_ref="" units=""/>
<descriptor description="" id="descriptors_catalog_36" name="HBCA H-bonding charged surface area (AM1) " publication_ref="" units=""/>
<descriptor description="" id="descriptors_catalog_37" name="FHACA Fractional HACA (HACA/TMSA) (AM1) " publication_ref="" units=""/>
<descriptor description="" id="descriptors_catalog_38" name="Average atom weight " publication_ref="" units=""/>
<descriptor description="" id="descriptors_catalog_39" name="min(#HA, #HD) (AM1) " publication_ref="" units=""/>
<descriptor description="" id="descriptors_catalog_40" name="HACA-2 (AM1) " publication_ref="" units=""/>
<descriptor description="" id="descriptors_catalog_41" name="Number of O atoms " publication_ref="" units=""/>
<descriptor description="" id="descriptors_catalog_42" name="Difference (Pos - Neg) in Charged Surface Areas (Zefirov) " publication_ref="" units=""/>
<descriptor description="" id="descriptors_catalog_43" name="Negatively Charged Part of Charged Surface Area (AM1) " publication_ref="" units=""/>
</descriptors_catalog>
<endpoints_catalog>
<endpoint group="4.Human health effects" id="endpoints_catalog_4" name="4.4.Skin irritation /corrosion" subgroup=""/>
</endpoints_catalog>
<publications_catalog>
<publication id="publications_catalog_2" title="Katritzky A R, Dobchev DA, Fara DC, Hur E, Tämm K, Kuruncz L, Karelson M, Varnek A &amp; Solov'ev VP (2006). Skin Permeation Rate as a Function of Chemical Structure. Journal of Medicinal Chemistry 49, 3305-3314." url=""/>
<publication id="publications_catalog_3" title="Karelson M, Dobchev DA, Kulshyn OV &amp; Katritzky A (2006). Neural Networks Convergence Using Physicochemical Data. Journal of Chemical Information and Modeling 46, 1891- 1897. " url=""/>
<publication id="publications_catalog_4" title="Statistica 7 " url="www.statsoft.com"/>
<publication id="publications_catalog_14" title="ECETOC Technical Report No 66. Skin Irritation and Corrosion: Reference Chemicals Data Bank. March 1995" url=""/>
<publication id="publications_catalog_15" title="Kodithala K, Hopfinger AJ, Thompson ED &amp; Robinson MK (2002). Prediction of skin irritation from organic chemicals using membrane-interaction QSAR analysis. Toxicological Sciences 66, 336–346." url=""/>
<publication id="publications_catalog_16" title="Hayashi M, Nakamura Y, Higashi K, Kato H, Kishida F &amp; Kaneko H (1999). A quantitative structure-Activity relationship study of the skin irritation potential of phenols. Toxicology in Vitro 13, 915-922." url=""/>
</publications_catalog>
<authors_catalog>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="firstauthor" name="Dimitar Dobchev" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd" contact="Turu 2, Tartu, 51014, Estonia" email="models@molcode.com" id="modelauthor" name="Molcode model development team " number="" url="www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_3" name="Mati Karelson" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_4" name="Tarmo Tamm" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_5" name="Gunnar Karelson" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_6" name="Indrek Tulp" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_7" name="Dana Martin" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_8" name="Kaido Tämm" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_9" name="Deniss Savchenko" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_10" name="Jaak Jänes" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_11" name="Eneli Härk" number="" url="http://www.molcode.com"/>
<author affiliation="Molcode Ltd. " contact="Turu 2, Tartu, 51014, Estonia " email="models@molcode.com" id="authors_catalog_12" name="Andres Kreegipuu" number="" url="http://www.molcode.com"/>
</authors_catalog>
</Catalogs>
</QMRF>
<!--
	include_attachments
	Replaces <attachments/> in param.xml with attachments from database.
	expects:
	param.id - qmrf_documents.documents.idqmrf
	param.xml - the xml to be transformed
-->
<!--
	include_attachments
	Replaces <attachments/> in param.xml with attachments from database.
	expects:
	param.id - qmrf_documents.documents.idqmrf
	param.xml - the xml to be transformed
-->
<!--
	include_attachments
	Replaces <attachments/> in param.xml with attachments from database.
	expects:
	param.id - qmrf_documents.documents.idqmrf
	param.xml - the xml to be transformed
-->
<!--
	include_attachments
	Replaces <attachments/> in param.xml with attachments from database.
	expects:
	param.id - qmrf_documents.documents.idqmrf
	param.xml - the xml to be transformed
-->