<?xml version="1.0" encoding="US-ASCII"?><?xml-stylesheet href="/styles/xsl/ch.xsl" type="text/xsl" title="ch"?><?xml-stylesheet href="/styles/xsl/chfn.xsl" type="text/xsl" title="chfn" alternate="yes"?><?xml-stylesheet href="/styles/xsl/chfig.xsl" type="text/xsl" title="chfig" alternate="yes"?><?xml-stylesheet href="/styles/xsl/chtable.xsl" type="text/xsl" title="chtable" alternate="yes"?><?xml-stylesheet href="/styles/xsl/chsec.xsl" type="text/xsl" title="chsec" alternate="yes"?><?xml-stylesheet href="/styles/xsl/chreferences.xsl" type="text/xsl" title="chreferences" alternate="yes"?><?xml-stylesheet href="/styles/xsl/chsindex.xsl" type="text/xsl" title="chsindex" alternate="yes"?><?xml-stylesheet href="/styles/xsl/chrelated.xsl" type="text/xsl" title="chrelated" alternate="yes"?><?xml-stylesheet href="/styles/xsl/chconts.xsl" type="text/xsl" title="chconts" alternate="yes"?><?xml-stylesheet href="/styles/xsl/html-identity.xsl" type="text/xsl" title="identity" alternate="yes"?>
<!DOCTYPE wrap
  SYSTEM "../../xml/dtds/local/wrap/wrap.dtd">
<wrap>
  <variables>
    <partno>24</partno>
    <copyright>International Union of Crystallography</copyright>
    <chnumo>24o3</chnumo>
    <published_year>2006</published_year>
    <copyright_year>2006</copyright_year>
    <isbn>0-7923-6857-6</isbn>
    <doi_dep_url>http://xrpp.iucr.org/cgi-bin/itr?url_ver=Z39.88-2003&amp;rft_dat=what%3Dchapter%26volid%3DFa%26chnumo%3D24o3%26chvers%3Dv0001</doi_dep_url>
    <epubmo/>
    <chapter_dir>/Local/Ix86/Linux/ITGEN/httpd_axkit/htdocs/Fa/ch24o3v0001</chapter_dir>
    <doi>10.1107/97809553602060000720</doi>
    <partid>fapart24</partid>
    <shortpart_title>Crystallographic databases</shortpart_title>
    <chid>Fach24o3</chid>
    <ch_title>The Cambridge Structural Database (CSD)</ch_title>
    <epubyr/>
    <next_chapter_dir>/Local/Ix86/Linux/ITGEN/httpd_axkit/htdocs/Fa/ch24o4v0001/</next_chapter_dir>
    <doi_rfr_linking_iucr_html>http://dx.doi.org/openurl?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:iucr.org&amp;rft_id=doi:10.1107/97809553602060000720&amp;rfr_dat=cr%5FsetVer%3D01%26cr%5Fpub%3D10%2E1107%26cr%5Fwork%3DThe%20Cambridge%20Structural%20Database%20%28CSD%29%26cr%5Fsrc%3D10%2E1107%26cr%5FsrvTyp%3Dhtml</doi_rfr_linking_iucr_html>
    <doi_rfr_linking_iucr_pdf>http://dx.doi.org/openurl?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:iucr.org&amp;rft_id=doi:10.1107/97809553602060000720&amp;rfr_dat=cr%5FsetVer%3D01%26cr%5Fpub%3D10%2E1107%26cr%5Fwork%3DThe%20Cambridge%20Structural%20Database%20%28CSD%29%26cr%5Fsrc%3D10%2E1107%26cr%5FsrvTyp%3Dpdf</doi_rfr_linking_iucr_pdf>
    <xref_ch_title>The Cambridge Structural Database (CSD)</xref_ch_title>
    <doi_test_url>http://xrpp.iucr.org/cgi-bin/itr?url_ver=Z39.88-2003&amp;rft_dat=what%3Dchapter%26volid%3DFa%26chnumo%3D24o3%26chvers%3Dv0001&amp;rfr_id=ori:rid:iucr.org&amp;rft_id=doi:10.1107/97809553602060000720&amp;rfr_dat=cr%5FsetVer%3D01%26cr%5Fpub%3D10%2E1107%26cr%5Fwork%3DThe%20Cambridge%20Structural%20Database%20%28CSD%29%26cr%5Fsrc%3D10%2E1107%26cr%5FsrvTyp%3Dhtml</doi_test_url>
    <volid>Fa</volid>
    <fpage>663</fpage>
    <series_title>International Tables for Crystallography</series_title>
    <previous_chapter_dir>/Local/Ix86/Linux/ITGEN/httpd_axkit/htdocs/Fa/ch24o2v0001/</previous_chapter_dir>
    <volume_title>International Tables for Crystallography Volume F</volume_title>
    <doi_rfr_linking_springer_html>http://dx.doi.org/openurl?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:springer.com&amp;rft_id=doi:10.1107/97809553602060000720&amp;rfr_dat=cr%5FsetVer%3D01%26cr%5Fpub%3D10%2E1107%26cr%5Fwork%3DThe%20Cambridge%20Structural%20Database%20%28CSD%29%26cr%5Fsrc%3D10%2E1007%26cr%5FsrvTyp%3Dhtml</doi_rfr_linking_springer_html>
    <editor>M. G. Rossmann and E. Arnold</editor>
    <chnum>24.3</chnum>
    <previous_chapter_durl>/Fa/ch24o2v0001/</previous_chapter_durl>
    <lpage>668</lpage>
    <shortch_title>The Cambridge Structural Database (CSD)</shortch_title>
    <meta_kwds>ConQuest; Pluto; PreQuest; Quest3D; Vista; CSD-Use database; Cambridge Structural Database; databases; intermolecular interactions; IsoStar</meta_kwds>
    <volume>F</volume>
    <doi_rfr_linking_springer_pdf>http://dx.doi.org/openurl?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:springer.com&amp;rft_id=doi:10.1107/97809553602060000720&amp;rfr_dat=cr%5FsetVer%3D01%26cr%5Fpub%3D10%2E1107%26cr%5Fwork%3DThe%20Cambridge%20Structural%20Database%20%28CSD%29%26cr%5Fsrc%3D10%2E1007%26cr%5FsrvTyp%3Dpdf</doi_rfr_linking_springer_pdf>
    <volrevision>a</volrevision>
    <eisbn>1-4020-5416-5</eisbn>
    <next_chapter_durl>/Fa/ch24o4v0001/</next_chapter_durl>
    <epubday/>
    <chvers>v0001</chvers>
    <chapter_durl>/Fa/ch24o3v0001/</chapter_durl>
    <volume_subtitle>Crystallography of biological macromolecules</volume_subtitle>
<volumes>
<value subtitle="Space-group symmetry">A</value>
<value subtitle="Symmetry relations between space groups">A1</value>
<value subtitle="Reciprocal space">B</value>
<value subtitle="Mathematical, physical and chemical tables">C</value>
<value subtitle="Physical properties of crystals">D</value>
<value subtitle="Subperiodic group symmetry">E</value>
<value subtitle="Crystallography of biological macromolecules">F</value>
<value subtitle="Definition and exchange of crystallographic data">G</value>
</volumes>
  </variables>
<fm>

<aug><div class="aug">
<div class="au">
<b> <span class="au">F. H. Allen</span><a class="linkclass" href="#a"><sup>a</sup></a><a class="linkclass" href="#cor"><sup>*</sup></a> and&#160;<span class="au">V. J. Hoy</span><a class="linkclass" href="#a"><sup>a</sup></a></b>
</div>

<div class="aff">
<p><span class="small"><a class="linkclass" name="a"><sup><b>a</b></sup></a>Cambridge Crystallographic Data Centre, 12 Union Road, Cambridge CB2 1EZ, <span class="cny">England</span><br/><a name="cor">Correspondence e-mail:</a>&#160; <a class="linkclass" href="mailto:allen@ccdc.cam.ac.uk">allen@ccdc.cam.ac.uk</a></span></p>
</div>

</div>
</aug>

<authorlist>
<span class="au">F. H. Allen</span>
<span class="au">V. J. Hoy</span>
  <authorsearch>DC%2Ecreator%3D%22F%2E%22%20AND%20DC%2Ecreator%3D%22H%2E%22%20AND%20DC%2Ecreator%3D%22Allen%22</authorsearch>
  <authorsearch>DC%2Ecreator%3D%22V%2E%22%20AND%20DC%2Ecreator%3D%22J%2E%22%20AND%20DC%2Ecreator%3D%22Hoy%22</authorsearch>
</authorlist>
<contribaudata>
<aug>
<au snmindx="Allen, F. H."><span class="au">F. H. Allen</span></au>
<email>allen@ccdc.cam.ac.uk</email>
<aff id="a"><a class="linkclass" name="a"><sup><b>a</b></sup></a>Cambridge Crystallographic Data Centre, 12 Union Road, Cambridge CB2 1EZ, <span class="cny">England</span></aff>
</aug>
<aug>
<au snmindx="Hoy, V. J."><span class="au">V. J. Hoy</span></au>
<email/>
<aff id="a"><a class="linkclass" name="a"><sup><b>a</b></sup></a>Cambridge Crystallographic Data Centre, 12 Union Road, Cambridge CB2 1EZ, <span class="cny">England</span></aff>
</aug>
  <authorsearch>DC%2Ecreator%3D%22F%2E%22%20AND%20DC%2Ecreator%3D%22H%2E%22%20AND%20DC%2Ecreator%3D%22Allen%22</authorsearch>
  <authorsearch>DC%2Ecreator%3D%22V%2E%22%20AND%20DC%2Ecreator%3D%22J%2E%22%20AND%20DC%2Ecreator%3D%22Hoy%22</authorsearch>
</contribaudata>

<xrefauthorinfo>
<au>
<fnm>F. H.</fnm>
<snm>Allen</snm>
<nee/>
<jr/>
</au>
<au>
<fnm>V. J.</fnm>
<snm>Hoy</snm>
<nee/>
<jr/>
</au>
</xrefauthorinfo>

<abs><div id="abs"><p>The Cambridge Structural Database System (CSDS), comprising the Cambridge Structural Database (CSD) and its associated software, as available in mid-2000 is described. The validated information content, comprehensive literature coverage and statistical data for the CSD are summarized. CSDS software for search, retrieval, analysis and display of database content is also reviewed, and typical research applications of the CSDS in structural chemistry and biology are briefly indicated. A new software component of the CSDS, IsoStar (a knowledge base of intermolecular interactions derived from the CSD and the PDB) is also summarized.</p>
</div>
</abs>
</fm>
<bdy>
<subch>
<div id="divsec24o3o1" class="sec1" secnum="24.3.1" fpage="663" lpage="663">
<div class="sectionheaders">
<h3 class="sectionheaders"><a name="sec24o3o1"><tree level="1"/></a>24.3.1. Introduction and historical perspective<indexg><index id="fach24o3index00001" type="s" significance="standard">Cambridge Structural Database (CSD)</index><index id="fach24o3index00002" type="s" significance="standard">Databases<index id="fach24o3index00003" type="s" significance="standard">Cambridge Structural Database</index></index></indexg></h3>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o1.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o1" secnum="24.3.1">Introduction and historical perspective<indexg><index id="fach24o3index00001" type="s" significance="standard">Cambridge Structural Database (CSD)</index><index id="fach24o3index00002" type="s" significance="standard">Databases<index id="fach24o3index00003" type="s" significance="standard">Cambridge Structural Database</index></index></indexg></st>
<p>The Cambridge Structural Database (CSD: Allen <span class="it"><i>et al.</i></span>, 1991<bbr id="bb2"/>; Kennard &amp; Allen, 1993<bbr id="bb8"/>; <a class="linkclass" href="http://www.ccdc.cam.ac.uk">http://www.ccdc.cam.ac.uk</a>
) is a fully retrospective computerized archive of bibliographic, chemical and numerical data from X-ray and neutron diffraction studies of small organic and metallo-organic molecules. Here, `small' means an upper limit of about 500 non-H atoms. The CSD was established in 1965, when the number of small-molecule crystal structures published each year was just a few hundred and, for this reason, it was possible to rapidly assimilate the earlier literature. However, the advent of increasingly powerful computers and associated advances in data collection and structure solution techniques has led to an almost exponential increase in the number of crystal structures being reported (Fig. 24.3.1.1)<figr id="fig24o3o1o1" loc="float"/>.</p>
<figplace id="fig24o3o1o1"/>
<p>Since the mid-1980s, there has been an average year-on-year increase in the number of CSD entries of very close to 10%. In 1999, around 18&#160;000 structures were added to the database, and in mid-2000 the total archive contained over 220&#160;000 structure determinations. This makes the CSD one of the largest numerical data resources currently available in chemistry (Table 24.3.1.1).<tabler id="table24o3o1o1" loc="float"/> At present, about 48% of the CSD comprises metallo-organic structures, 42% are pure organics, and the remaining 10% are compounds of the main-group elements. The doubling period of the CSD is approximately 7.5 years and, if account is taken of recent advances in diffractometer technology, it is possible to project a total of at least 500&#160;000 database entries by the year 2010.</p>
<tableplace id="table24o3o1o1"/>
<p>In contrast with the Protein Data Bank (PDB: Bernstein <span class="it"><i>et al.</i></span>, 1972<bbr id="bb4"/>; Abola <span class="it"><i>et al.</i></span>, 1997<bbr id="bb1"/>; RCSB, 2000<bbr id="bb9"/>), which has always received its data through direct electronic depositions, the CSD reflects the published literature. Until recently, much of the raw input has been re-keyboarded from hard-copy documents. Thus, in the early years, Cambridge Crystallographic Data Centre (CCDC)<indexg><index id="fach24o3index00004" type="s" significance="standard">Cambridge Crystallographic Data Centre (CCDC)</index></indexg> software development concentrated on data-validation techniques designed to eliminate keyboarding, typographical and scientific errors so as to ensure the accuracy of the master archive. Validation software has recently been upgraded to take advantage of modern computing methods, particularly the rapid developments in high-resolution graphics systems.</p>
<p>Nevertheless, the massive growth of the database has meant that the development of fast and efficient applications software for database search, data retrieval, numerical analysis and visual display has always been a high priority. The first of these software systems became available towards the end of the 1970s and constant updates ensure that the code continues to develop in response to user needs. The CSD system (CSDS), comprising the database and its applications software, is now distributed to about 1000 academic and industrial institutions worldwide.</p>
<p>Users of the CSD span the scientific spectrum, reflecting the wide range of research applications of the data it contains. Over the past two decades, the CSDS has provided the essential basis for research projects in structural chemistry, structure correlation and the rational design of novel bioactive molecules of pharmaceutical or agrochemical interest. A variety of statistical, numerical and computational methodologies have been applied to the CSD, giving rise to the concept of knowledge acquisition, or data mining, from the ever-increasing reservoir of precise experimental results. To date, nearly 700 papers of this type exist in the literature. This activity has, in turn, raised the possibility of the generation of knowledge-based libraries of structural information from the CSD. IsoStar (Bruno <span class="it"><i>et al.</i></span>, 1997<bbr id="bb5"/>), a library of information on non-bonded interactions which was first released in 1997, is the CCDC's first knowledge-based product. A companion knowledge base of intramolecular geometry, Mogul, is now under development, and will contain bond-length, valence-angle and torsional-angle information.</p>
</div>

<div id="divsec24o3o2" class="sec1" secnum="24.3.2" fpage="663" lpage="665">
<div class="sectionheaders">
<h3 class="sectionheaders"><a name="sec24o3o2"><tree level="1"/></a>24.3.2. Information content of the CSD<indexg><index id="fach24o3index00005" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00006" type="s" significance="standard">content of</index></index></indexg></h3>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o2.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o2" secnum="24.3.2">Information content of the CSD<indexg><index id="fach24o3index00005" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00006" type="s" significance="standard">content of</index></index></indexg></st>

<div id="divsec24o3o2o1" class="sec2" secnum="24.3.2.1" fpage="663" lpage="663">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o2o1"><tree level="2"/></a>24.3.2.1. Acquisition of information</h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o2o1.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o2o1" secnum="24.3.2.1">Acquisition of information</st>
<p>Almost all of the information contained in the CSD has been abstracted from the published literature. Over 800 primary literature sources are cited and the earliest reference is from 1930. Much of the data has been re-keyboarded from the original literature and from hard-copy supplementary deposition documents. The CSD now acts as the official depository for some 40 major international journals. Today, an increasing proportion (around 75% in mid-2000) of the numerical information is received directly in electronic form. The switch from hard-copy input to electronic deposition has been catalysed by the development of the exchange format for crystallographic data, the crystallographic information file<indexg><index id="fach24o3index00007" type="s" significance="standard">Crystallographic information file (CIF)</index><index id="fach24o3index00008" type="s" significance="standard">CIF (crystallographic information file)</index></indexg> or CIF (Hall <span class="it"><i>et al.</i></span>, 1991<bbr id="bb6"/>). The CIF has been adopted as the standard for the subject by the International Union of Crystallography, and is now output by nearly all of the major software packages for structure determination and refinement. Development of the CIF has also led to an increase in direct private depositions of structural data to the CSD, data that, for various reasons, are unlikely to be published through formal mechanisms.</p>
</div>

<div id="divsec24o3o2o2" class="sec2" secnum="24.3.2.2" fpage="663" lpage="664">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o2o2"><tree level="2"/></a>24.3.2.2. Data organization</h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o2o2.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o2o2" secnum="24.3.2.2">Data organization</st>
<p>Each individual structure in the CSD is referred to as an <span class="it"><i>entry</i></span> and each entry is identified by a <span class="it"><i>reference code</i></span> (<span class="it"><i>refcode</i></span>) containing six alphabetic characters, which characterize a specific chemical compound, and a further two numeric characters which trace the publication history of the structure. The information content of a typical CSD entry is illustrated schematically in Fig. 24.3.2.1.<figr id="fig24o3o2o1" loc="float"/> Individual data items can be categorized into three different groupings which are most conveniently described in terms of their dimensionality.</p>
<figplace id="fig24o3o2o1"/>
</div>

<div id="divsec24o3o2o3" class="sec2" secnum="24.3.2.3" fpage="664" lpage="664">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o2o3"><tree level="2"/></a>24.3.2.3. 1D bibliographic and chemical data<indexg><index id="fach24o3index00009" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00010" type="s" significance="standard">bibliographic and chemical data</index></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o2o3.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o2o3" secnum="24.3.2.3">1D bibliographic and chemical data<indexg><index id="fach24o3index00009" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00010" type="s" significance="standard">bibliographic and chemical data</index></index></indexg></st>
<p>The one-dimensional data for each entry comprise chemical and bibliographic text strings, together with certain individual numerical items, <span class="it"><i>viz</i></span> chemical compound name and any common synonym(s), chemical formula, authors names, journal name and literature citation, text comment reflecting any special experimental details (non-room-temperature study, absolute configuration determined, neutron study <span class="it"><i>etc.</i></span>). The cell parameters, crystal data, space group and precision indicators also fall into this category.</p>
</div>

<div id="divsec24o3o2o4" class="sec2" secnum="24.3.2.4" fpage="664" lpage="664">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o2o4"><tree level="2"/></a>24.3.2.4. 2D chemical connectivity data<indexg><index id="fach24o3index00011" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00012" type="s" significance="standard">chemical connectivity data</index></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o2o4.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o2o4" secnum="24.3.2.4">2D chemical connectivity data<indexg><index id="fach24o3index00011" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00012" type="s" significance="standard">chemical connectivity data</index></index></indexg></st>
<p>The formal two-dimensional chemical structural diagram for each entry (Fig. 24.3.2.2)<figr id="fig24o3o2o2" loc="float"/> is encoded in the form of a compact connection table. Chemical connectivity is recorded in terms of a set of atom and bond properties. The atom properties recorded are: atom number, element type, number of connected non-H atoms, number of terminal H atoms and the formal atomic charge. Bond properties are encoded as a pair of atom numbers and the formal chemical bond type that connects those atoms. Bond types employed in the CSD connectivity descriptions are: single, double, triple, quadruple (metal&#8211;metal), aromatic, delocalized double and &#960; bonds. Bond types are (automatically) coded negative if the bond forms part of a cyclic system.</p>
<figplace id="fig24o3o2o2"/>
</div>

<div id="divsec24o3o2o5" class="sec2" secnum="24.3.2.5" fpage="664" lpage="664">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o2o5"><tree level="2"/></a>24.3.2.5. 3D crystal structure data<indexg><index id="fach24o3index00013" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00014" type="s" significance="standard">crystal structure data</index></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o2o5.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o2o5" secnum="24.3.2.5">3D crystal structure data<indexg><index id="fach24o3index00013" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00014" type="s" significance="standard">crystal structure data</index></index></indexg></st>
<p>The three-dimensional data consist of the fractional coordinates and symmetry operators for each entry. This information, together with the cell dimensions, is used to establish a crystallographic connectivity using standard covalent radii. The chemical and crystallographic connectivities are then mapped onto one another, using graph-theoretic algorithms, so that the chemical atom and bond properties are associated with the three-dimensional structure for search purposes. The CSD always records coordinates for complete molecules. Thus, if a molecule adopts a special position in the assigned space group, <span class="it"><i>i.e.</i></span> the asymmetric unit is some fraction of the total number of atoms in the molecule, then the CSD system also records those symmetry-generated atoms that complete the chemical entity. This speeds up the search process and also makes the data more accessible to non-crystallographers.</p>
</div>

<div id="divsec24o3o2o6" class="sec2" secnum="24.3.2.6" fpage="664" lpage="665">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o2o6"><tree level="2"/></a>24.3.2.6. Derived data and bit-encoded information</h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o2o6.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o2o6" secnum="24.3.2.6">Derived data and bit-encoded information</st>
<p>Derived data are calculated directly from the evaluated raw data and stored in the master archive for search purposes. Numerical items such as <span class="it"><i>Z</i></span>&#8242;, the number of chemical entities in the asymmetric unit, is a typical (real) numerical data item in this category. However, by far the most useful of the derived data items are a set of 682 individual pieces of yes/no information which are encoded as a bitmap, referred to as the <span class="it"><i>screen</i></span> record. The first 155 of these bits record information about (<span class="it"><i>a</i></span>) the elemental constitution of the compound, (<span class="it"><i>b</i></span>) results of the data-validation procedure and (<span class="it"><i>c</i></span>) summary information about the data content of the entry. These bits can be accessed directly by the user as search keys. The most important parts of the bitmap contain codified yes/no information about the presence/absence of specific features in the complete 2D or 3D structures held in the CSD. When a chemical substructure is entered as a query, its constitution is analysed in the same way to produce a bitmap for the query. Logical comparison of the query bitmap with the bitmap stored for each full CSD entry is computationally rapid, and quickly eliminates those entries that do not contain the requested features. Only those entries that pass this initial screening process need enter the detailed and computationally intensive atom-by-atom, bond-by-bond connectivity mapping that finally confirms (or not) the presence of the required query substructure.</p>
</div>

<div id="divsec24o3o2o7" class="sec2" secnum="24.3.2.7" fpage="665" lpage="665">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o2o7"><tree level="2"/></a>24.3.2.7. Data validation<indexg><index id="fach24o3index00015" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00016" type="s" significance="standard">data validation</index></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o2o7.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o2o7" secnum="24.3.2.7">Data validation<indexg><index id="fach24o3index00015" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00016" type="s" significance="standard">data validation</index></index></indexg></st>
<p>All data entering the CSD are subject to stringent check and evaluation procedures. Some of these are visual, but the majority are automated within the CSD program <span class="it"><i>PreQuest</i></span><indexg><index id="fach24o3index00017" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00018" type="s" significance="standard"><span class="it"><i>PreQuest</i></span></index></index><index id="fach24o3index00019" type="s" significance="standard"><span class="it"><i>PreQuest</i></span></index></indexg>. The checks ensure that the 1D and 2D information fields abstracted by CCDC staff are accurately encoded, and that the 3D crystallographic coordinates are consistent with both the chemical description of the structure and with the geometrical description supplied by the authors. Most typographical errors in original papers can be corrected by the CCDC but, in the case of serious discrepancies, the original authors are consulted.</p>
</div>

<div id="divsec24o3o2o8" class="sec2" secnum="24.3.2.8" fpage="665" lpage="665">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o2o8"><tree level="2"/></a>24.3.2.8. The CSD-Use database<indexg><index id="fach24o3index00020" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00021" type="s" significance="standard">CSD-Use database</index></index><index id="fach24o3index00022" type="s" significance="standard">CSD-Use database</index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o2o8.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o2o8" secnum="24.3.2.8">The CSD-Use database<indexg><index id="fach24o3index00020" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00021" type="s" significance="standard">CSD-Use database</index></index><index id="fach24o3index00022" type="s" significance="standard">CSD-Use database</index></indexg></st>
<p>CSD-Use is a database of scientific research papers in which the CSD was used as the principal or sole source of experimental information. The database comprises more than 700 literature citations classified according to the type of systematic study undertaken. Each CSD-Use entry also contains a short summary of the major findings of the research. The database is growing rapidly over time, and is expected to be a valuable resource in the future, since it contains a fully retrospective overview of the data-mining methods and research applications of the CSD.</p>
</div>
</div>

<div id="divsec24o3o3" class="sec1" secnum="24.3.3" fpage="665" lpage="666">
<div class="sectionheaders">
<h3 class="sectionheaders"><a name="sec24o3o3"><tree level="1"/></a>24.3.3. The CSD software system<indexg><index id="fach24o3index00023" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00024" type="s" significance="standard">software</index></index></indexg></h3>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o3.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o3" secnum="24.3.3">The CSD software system<indexg><index id="fach24o3index00023" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00024" type="s" significance="standard">software</index></index></indexg></st>

<div id="divsec24o3o3o1" class="sec2" secnum="24.3.3.1" fpage="665" lpage="665">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o3o1"><tree level="2"/></a>24.3.3.1. Overview</h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o3o1.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o3o1" secnum="24.3.3.1">Overview</st>
<p>The CSD is supplied with a suite of fully interactive graphical software modules which provides users with facilities to: (<span class="it"><i>a</i></span>) interrogate all of the 1D, 2D and 3D information fields; (<span class="it"><i>b</i></span>) display entries graphically in a variety of styles; (<span class="it"><i>c</i></span>) retrieve relevant data for search hits, including geometrical parameters derived from the stored coordinates; and (<span class="it"><i>d</i></span>) display the derived numerical information, <span class="it"><i>e.g.</i></span> as histograms, scattergrams <span class="it"><i>etc.</i></span>, generate descriptive statistics and perform more complex numerical analyses. More recently, software has been added that permits users to transform their own in-house structural data to CSD formats for inclusion in these processes. A summary of the overall CSD software system is given in Fig. 24.3.3.1<figr id="fig24o3o3o1" loc="float"/> which shows the functional relationships between the four major applications programs.</p>
<figplace id="fig24o3o3o1"/>
</div>

<div id="divsec24o3o3o2" class="sec2" secnum="24.3.3.2" fpage="665" lpage="665">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o3o2"><tree level="2"/></a>24.3.3.2. <span class="it"><i>PreQuest</i></span><indexg><index id="fach24o3index00025" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00026" type="s" significance="standard"><span class="it"><i>PreQuest</i></span></index></index><index id="fach24o3index00027" type="s" significance="standard"><span class="it"><i>PreQuest</i></span></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o3o2.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o3o2" secnum="24.3.3.2"><span class="it"><i>PreQuest</i></span><indexg><index id="fach24o3index00025" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00026" type="s" significance="standard"><span class="it"><i>PreQuest</i></span></index></index><index id="fach24o3index00027" type="s" significance="standard"><span class="it"><i>PreQuest</i></span></index></indexg></st>
<p><span class="it"><i>PreQuest</i></span> is a data-validation and data-conversion program which is used to create high-quality structural data files in CSD format from, <span class="it"><i>e.g.</i></span>, raw input data from a CIF. <span class="it"><i>PreQuest</i></span> is used routinely by CCDC's scientific editors to create and validate entries for inclusion in the master CSD archive, hence the program is constantly being maintained and upgraded. The released version enables users to build a private CSD-format database of their own structures which can then be searched independently of, or in conjunction with, the master CSD files using the database access programs described below.</p>
</div>

<div id="divsec24o3o3o3" class="sec2" secnum="24.3.3.3" fpage="665" lpage="665">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o3o3"><tree level="2"/></a>24.3.3.3. Searching the CSD: <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> and <span class="it"><i>ConQuest</i></span><indexg><index id="fach24o3index00028" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00029" type="s" significance="standard">searching the database</index></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o3o3.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o3o3" secnum="24.3.3.3">Searching the CSD: <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> and <span class="it"><i>ConQuest</i></span><indexg><index id="fach24o3index00028" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00029" type="s" significance="standard">searching the database</index></index></indexg></st>
<p><span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> has been the main search engine and information-retrieval program for the CSD since the late 1980s. Its main features are summarized below. However, since 1997, the CCDC has been developing its successor, the <span class="it"><i>ConQuest</i></span> program, which was first released as part of the CSD system in April 2000. During an interim period, perhaps two years, <span class="it"><i>ConQuest</i></span> and <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> will both form part of the released CSD system on certain computing platforms while the functionality of the new program is being fully developed. Further details of <span class="it"><i>ConQuest</i></span> are provided in Section 24.3.3.5<secr id="sec24o3o3o5"/>, indicating in particular how it differs from, and improves upon, the facilities available in <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span>.</p>
</div>

<div id="divsec24o3o3o4" class="sec2" secnum="24.3.3.4" fpage="665" lpage="666">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o3o4"><tree level="2"/></a>24.3.3.4. <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span><indexg><index id="fach24o3index00030" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00031" type="s" significance="standard"><span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span></index></index><index id="fach24o3index00032" type="s" significance="standard"><span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o3o4.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o3o4" secnum="24.3.3.4"><span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span><indexg><index id="fach24o3index00030" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00031" type="s" significance="standard"><span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span></index></index><index id="fach24o3index00032" type="s" significance="standard"><span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span></index></indexg></st>
<p><span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> is the main search engine and information-retrieval program for the CSD. It permits interrogation of all information fields: (<span class="it"><i>a</i></span>) 19 text fields, (<span class="it"><i>b</i></span>) 38 individual numerical fields, (<span class="it"><i>c</i></span>) element symbols and element counts, (<span class="it"><i>d</i></span>) full or partial molecular formulae, (<span class="it"><i>e</i></span>) direct access to over 150 bit screens, (<span class="it"><i>f</i></span>) extensive 2D chemical substructure search capabilities, and (<span class="it"><i>g</i></span>) 3D substructure searching at the molecular level or at the extended crystal-structure level. A search of a specific information field is termed a <span class="it"><i>test</i></span> of that field, and is constructed graphically <span class="it"><i>via</i></span> the menu system; menu components correspond to the categories of searches identified above. A complete <span class="it"><i>query</i></span> is then constructed by combining a number of separate <span class="it"><i>test</i></span> components using Boolean logic.</p>
<p>Substructure searching is the most important and frequently used facility. At the molecular level, the substructure (chemical fragment) query is entered graphically and is defined using the formal covalent bond types present in the 2D chemical connectivity tables of the CSD. The process can be extended to locate non-bonded contacts in the complete crystal structure. Here, the individual atoms or chemical groups involved in the contact must be specified, and a limiting non-bonded contact distance must be provided, along with any other geometrical criteria required to define the contact more precisely.</p>
<p>All substructure searches begin with the user drawing the required chemical unit(s) <span class="it"><i>via</i></span> the BUILD menu. Chemical variability and precision are controlled through (<span class="it"><i>a</i></span>) the PERIODIC TABLE sub-menu, which allows for specification of variable element types at specific atomic sites, (<span class="it"><i>b</i></span>) the 2D-CONSTRAIN menu, which allows further chemical restrictions to be specified, such as cyclicity/acyclicity of bonds, exact hydrogen-atom counts, total coordination numbers for atoms <span class="it"><i>etc.</i></span>, and (<span class="it"><i>c</i></span>) the 3D-CONSTRAIN menu, which permits the user to specify a list of geometrical parameters to be calculated by the program for each instance of the fragment located in the CSD; any of these geometrical parameters may be used as criteria to limit the scope of the search, especially at the intermolecular level. A file of calculated geometrical information is output by <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> and may be read by <span class="it"><i>Vista</i></span>, or by external data analysis software. Other <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> output files allow CSD search results to be communicated rapidly to proprietary modelling software.</p>
</div>

<div id="divsec24o3o3o5" class="sec2" secnum="24.3.3.5" fpage="666" lpage="666">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o3o5"><tree level="2"/></a>24.3.3.5. <span class="it"><i>ConQuest</i></span><indexg><index id="fach24o3index00033" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00034" type="s" significance="standard"><span class="it"><i>ConQuest</i></span></index></index><index id="fach24o3index00035" type="s" significance="standard"><span class="it"><i>ConQuest</i></span></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o3o5.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o3o5" secnum="24.3.3.5"><span class="it"><i>ConQuest</i></span><indexg><index id="fach24o3index00033" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00034" type="s" significance="standard"><span class="it"><i>ConQuest</i></span></index></index><index id="fach24o3index00035" type="s" significance="standard"><span class="it"><i>ConQuest</i></span></index></indexg></st>
<p>The overall aim of the <span class="it"><i>ConQuest</i></span> project is to replace <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> with graphical search software that makes best use of modern computing environments. The primary objective has been to create an interface that is both simple and intuitive to use, so as to encourage use of the CSD by a broader spectrum of scientists. Thus, <span class="it"><i>ConQuest</i></span> provides: (<span class="it"><i>a</i></span>) text and numeric searches <span class="it"><i>via</i></span> pop-up windows, (<span class="it"><i>b</i></span>) a new sketcher window within which to encode 2D and 3D substructure searches, pharmacophore searches, and searches for non-bonded contacts in crystal structures, and (<span class="it"><i>c</i></span>) the immediate viewing of hits with facilities for backward and forward scrolling within hit lists. <span class="it"><i>ConQuest</i></span> is provided with full documentation and tutorials, both online and in printed form, and with context-dependent help facilities. Version 1.0, released in April 2000, contains most of the functionality available within the <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> program, and it is expected that <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> capabilities will soon be exceeded by the new program.</p>
<p>A most important feature of <span class="it"><i>ConQuest</i></span> is its availability on PC-Windows platforms, as well as its implementation under Unix/Linux. Initially, <span class="it"><i>ConQuest</i></span> and the CSD will be the only parts of the full CSD system available under PC-Windows, but <span class="it"><i>Vista</i></span> (or <span class="it"><i>Vista</i></span>-like facilities, see Section 24.3.3.6<secr id="sec24o3o3o6"/>), a new visualizer and provision of the CCDC's knowledge bases (IsoStar and Mogul) will follow as planned developments in the PC area.</p>
</div>

<div id="divsec24o3o3o6" class="sec2" secnum="24.3.3.6" fpage="666" lpage="666">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o3o6"><tree level="2"/></a>24.3.3.6. <span class="it"><i>Vista</i></span><indexg><index id="fach24o3index00036" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00037" type="s" significance="standard"><span class="it"><i>Vista</i></span></index></index><index id="fach24o3index00038" type="s" significance="standard"><span class="it"><i>Vista</i></span></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o3o6.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o3o6" secnum="24.3.3.6"><span class="it"><i>Vista</i></span><indexg><index id="fach24o3index00036" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00037" type="s" significance="standard"><span class="it"><i>Vista</i></span></index></index><index id="fach24o3index00038" type="s" significance="standard"><span class="it"><i>Vista</i></span></index></indexg></st>
<p><span class="it"><i>Vista</i></span> reads geometrical table(s) generated by <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> and provides extensive facilities for the graphical representation and statistical analysis of the numerical data. Graphical facilities include histograms and scattergrams referred to Cartesian or polar axes, with a hyperlink back to the original CSD entries to permit immediate investigation of, <span class="it"><i>e.g.</i></span>, outlying observations. The contents of plots can be edited interactively, and all illustrations can be output in PostScript format for inclusion in reports and publications. Additionally, <span class="it"><i>Vista</i></span> will generate descriptive statistics for a distribution, carry out simple linear regressions and perform principal-component analyses.</p>
</div>

<div id="divsec24o3o3o7" class="sec2" secnum="24.3.3.7" fpage="666" lpage="666">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o3o7"><tree level="2"/></a>24.3.3.7. <span class="it"><i>Pluto</i></span><indexg><index id="fach24o3index00039" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00040" type="s" significance="standard"><span class="it"><i>Pluto</i></span></index></index><index id="fach24o3index00041" type="s" significance="standard"><span class="it"><i>Pluto</i></span></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o3o7.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o3o7" secnum="24.3.3.7"><span class="it"><i>Pluto</i></span><indexg><index id="fach24o3index00039" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00040" type="s" significance="standard"><span class="it"><i>Pluto</i></span></index></index><index id="fach24o3index00041" type="s" significance="standard"><span class="it"><i>Pluto</i></span></index></indexg></st>
<p><span class="it"><i>Pluto</i></span> is used to visualize crystal and molecular structures in a variety of styles, including stick diagrams and ball-and-spoke and space-filling representations of individual molecules or extended crystal structures.</p>
</div>

<div id="divsec24o3o3o8" class="sec2" secnum="24.3.3.8" fpage="666" lpage="666">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o3o8"><tree level="2"/></a>24.3.3.8. Use of the CSD software system: an example<indexg><index id="fach24o3index00042" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00043" type="s" significance="standard">software</index></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o3o8.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o3o8" secnum="24.3.3.8">Use of the CSD software system: an example<indexg><index id="fach24o3index00042" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00043" type="s" significance="standard">software</index></index></indexg></st>
<p>The preceding sections can only give a flavour of the extensive search, analysis and visualization capabilities of <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span>, <span class="it"><i>ConQuest</i></span>, <span class="it"><i>Vista</i></span> and <span class="it"><i>Pluto</i></span>, which are fully documented in manuals available online <span class="it"><i>via</i></span> the web address given below, or in printed form from the CCDC.</p>
<p>In this section, we illustrate the application of the CSD system to one specific example: a CSD-based analysis to examine the O&#8212;H&#183;&#183;&#183;O hydrogen-bonding ability of the keto oxygen of Fig. 24.3.3.2<figr id="fig24o3o3o2" loc="float"/>. This example illustrates a number of key features of the software system. The example is constructed in terms of <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> terminology, but identical facilities are available in the <span class="it"><i>ConQuest</i></span> program.</p>
<div id="l1" class="lORD">
<table>
<tbody>
<tr>
<td>
<ul class="none"><li><a name="l1li1"/><p>(1) Draw the two component substructures: the keto group and the O&#8212;H donor group. Constrain the <span class="it"><i>total coordination number</i></span> of C<span class="inf"><sub>1</sub></span>, C<span class="inf"><sub>3</sub></span> (Fig. 24.3.3.2)<figr id="fig24o3o3o2" loc="float"/> to be 4, thus defining them as C(<span class="it"><i>sp</i></span><span class="sup"><sup>3</sup></span>) atoms.</p>
<figplace id="fig24o3o3o2"/>
</li>
<li><a name="l1li2"/><p>(2) Define a non-bonded contact between keto O<span class="inf"><sub>1</sub></span> and hydroxy donor H<span class="inf"><sub>1</sub></span>. Require that this contact (DOH) is less than 2.62&#160;&#197;, the sum of van der Waals radii, after normalization of the H-atom position to correspond to a standard O&#8212;H bond length as determined by neutron diffraction [X-ray location of H atoms is imprecise &#8211; <span class="it"><i>X</i></span>&#8212;H distances are usually foreshortened &#8211; so the system will reposition H atoms along the <span class="it"><i>X</i></span>&#8212;H vector and at an <span class="it"><i>X</i></span>&#8212;H distance that corresponds to the mean value from neutron diffraction experiments (Allen <span class="it"><i>et al.</i></span>, 1987<bbr id="bb3"/>)].</p>
</li>
<li><a name="l1li3"/><p>(3) Define the geometrical parameters shown in Fig. 24.3.3.2,<figr id="fig24o3o3o2" loc="float"/> comprising the H&#183;&#183;&#183;O distance (DOH), the O&#8212;H&#183;&#183;&#183;O angle (AH), and the angles THETA and PHI that describe the angle of approach of H to the putative lone-pair plane of the keto oxygen atom. THETA is the angle of approach of the donor H atom to the plane of the keto group, PHI is the angle of rotation of the projection of the O&#183;&#183;&#183;H vector in that plane; THETA = 0&#176;, PHI = &#177;120&#176; would correspond to H-atom approach along an O-atom lone-pair direction. The search is further constrained so that hits are only accepted if AH &gt; 90&#176;.</p>
</li>
<li><a name="l1li4"/><p>(4) At this stage, the 3D-CONSTRAIN menu will show a graphic which closely resembles Fig. 24.3.3.2<figr id="fig24o3o3o2" loc="float"/>. Test 1 is now defined.</p>
</li>
<li><a name="l1li5"/><p>(5) Since there will be large numbers of examples of keto-O&#183;&#183;&#183;H&#8212;O hydrogen bonds in the CSD, a secondary constraint based on the crystallographic <span class="it"><i>R</i></span> factor is applied so that examples are only located in the more precise structure determinations. To do this, we access the NUMERIC search menu to define RFACT &lt; 0.075 as test 2.</p>
</li>
<li><a name="l1li6"/><p>(6) Enter the QUEST menu, which summarizes all current tests, select the <span class="it"><i>organic structures only</i></span> bit screen, and complete the full query by combining test 1 and test 2 <span class="it"><i>via</i></span> a Boolean .AND. operator.</p>
</li>
</ul></td>
</tr>
</tbody>
</table>
</div>
<p>
</p>
<p>Searches can be performed interactively or allowed to run to completion without further intervention from the user. In interactive mode, <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> presents each hit as it is located, as illustrated in Fig. 24.3.3.3,<figr id="fig24o3o3o3" loc="float"/> and can then display the 1D bibliographic information, a 2D structural diagram, the 3D molecular structure, or a 3D packing diagram by toggling between display options. For an intermolecular search, as exemplified here, the non-bonded contact that triggered the hit is clearly identified. For the example described above, a file of the four user-defined geometrical parameters (DOH, AH, THETA, PHI) for each hit is created for use by <span class="it"><i>Vista</i></span>.</p>
<figplace id="fig24o3o3o3"/>
<p><span class="it"><i>Vista</i></span> displays the geometrical parameters in the form of an interactive spreadsheet; the user may include or exclude specific substructures on the basis of numerical criteria during the data analysis, <span class="it"><i>e.g.</i></span> to focus on a specific range of DOH values, exclude outlying observations <span class="it"><i>etc</i></span>. Hyperlinking between <span class="it"><i>Vista</i></span> and the master CSD file means that all of the database information of Fig. 24.3.1.1<figr id="fig24o3o1o1" loc="float"/> is immediately available during a <span class="it"><i>Vista</i></span> session, either by clicking on a particular fragment in the spreadsheet or on a particular data point in a histogram or scattergram. Use of <span class="it"><i>Vista</i></span> is illustrated for the &gt;C=O&#183;&#183;&#183;H&#8212;O example in Figs. 24.3.3.4,<figr id="fig24o3o3o4" loc="float"/> 24.3.3.5<figr id="fig24o3o3o5" loc="float"/> and 24.3.3.6<figr id="fig24o3o3o6" loc="float"/>.</p>
<figplace id="fig24o3o3o4"/>
<figplace id="fig24o3o3o5"/>
<figplace id="fig24o3o3o6"/>
</div>
</div>

<div id="divsec24o3o4" class="sec1" secnum="24.3.4" fpage="667" lpage="668">
<div class="sectionheaders">
<h3 class="sectionheaders"><a name="sec24o3o4"><tree level="1"/></a>24.3.4. Knowledge engineering from the CSD<indexg><index id="fach24o3index00044" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00045" type="s" significance="standard">knowledge engineering</index></index></indexg></h3>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o4.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o4" secnum="24.3.4">Knowledge engineering from the CSD<indexg><index id="fach24o3index00044" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00045" type="s" significance="standard">knowledge engineering</index></index></indexg></st>

<div id="divsec24o3o4o1" class="sec2" secnum="24.3.4.1" fpage="667" lpage="668">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o4o1"><tree level="2"/></a>24.3.4.1. Databases <span class="it"><i>versus</i></span> knowledge bases</h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o4o1.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o4o1" secnum="24.3.4.1">Databases <span class="it"><i>versus</i></span> knowledge bases</st>
<p>As illustrated in earlier sections, the CSD represents a collection of primary <span class="it"><i>data</i></span> resulting from diffraction experiments on crystals of small molecules &#8211; in particular the fractional coordinates, space group and cell dimensions that define the 3D crystal and molecular structure. However, the user of the system is usually interested in structural <span class="it"><i>knowledge</i></span> &#8211; in the form of bond lengths, angles, intermolecular contact distances and other parameters &#8211; that can be synthesized from the raw data by the use of the CSD system software. Thus, each detailed analysis carried out using the CSD system represents an experiment in data mining, and considerable operational and intellectual effort is employed in performing such analyses.</p>
<p>At the present state of development of the field, three facts are apparent: (<span class="it"><i>a</i></span>) many data-mining activities centre around a set of standard geometrical data types that are essential for major applications, particularly in structural chemistry, molecular modelling and rational drug design; (<span class="it"><i>b</i></span>) the expertise required to carry out data-mining experiments is not inconsiderable and the time required can be lengthy; and (<span class="it"><i>c</i></span>) as the size of the CSD is increasing rapidly and any compilations of structural knowledge should be updated on a regular basis, the increasing database size makes this operation very time consuming for individual users.</p>
<p>These considerations indicate that access to CSD information should be at two levels, the raw-data level and the structural-knowledge level, and, since 1995, the CCDC has started to derive libraries of structural knowledge from the raw data content of the CSD. The first of these libraries &#8211; IsoStar<indexg><index id="fach24o3index00046" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00047" type="s" significance="standard">IsoStar</index></index><index id="fach24o3index00048" type="s" significance="standard">IsoStar</index></indexg>: a library of information on intermolecular interactions (Bruno <span class="it"><i>et al.</i></span>, 1997<bbr id="bb5"/>) &#8211; is briefly summarized below. A second library, Mogul<indexg><index id="fach24o3index00049" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00050" type="s" significance="standard">Mogul</index></index><index id="fach24o3index00051" type="s" significance="standard">Mogul</index></indexg>, containing bond lengths, valence angles and torsional distributions, is currently under development in mid-2000. Such a knowledge base has obvious applications in crystallography, structural chemistry and molecular biology, not least in providing precise geometrical parameters which can be used in 3D model building, structure refinement and reality checking of developing and refined structures. The scientific applications of non-bonded contact geometries and conformational (torsional) information are more fully discussed in Chapter <related volume="F" chnum="22.4" url="/Fa/ch22o4v0001/"><relchtitle>The relevance of the Cambridge Structural Database in protein crystallography</relchtitle><relau>F. H. Allen</relau><relau>J. C. Cole</relau><relau>M. L. Verdonk</relau></related>22.4<a href="/Fa/ch22o4v0001/"><img align="bottom" border="0" src="/graphics/greenarr.gif" alt="[link]"/></a>
.</p>
</div>

<div id="divsec24o3o4o2" class="sec2" secnum="24.3.4.2" fpage="668" lpage="668">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o4o2"><tree level="2"/></a>24.3.4.2. IsoStar: a library of knowledge about intermolecular interactions<indexg><index id="fach24o3index00052" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00053" type="s" significance="standard">IsoStar</index></index><index id="fach24o3index00054" type="s" significance="standard">IsoStar</index></indexg><indexg><index id="fach24o3index00055" type="s" significance="standard">Intermolecular interactions<index id="fach24o3index00056" type="s" significance="standard">data from the CSD</index></index><index id="fach24o3index00057" type="s" significance="standard">Intermolecular interactions<index id="fach24o3index00058" type="s" significance="standard">IsoStar</index></index></indexg></h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o4o2.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o4o2" secnum="24.3.4.2">IsoStar: a library of knowledge about intermolecular interactions<indexg><index id="fach24o3index00052" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00053" type="s" significance="standard">IsoStar</index></index><index id="fach24o3index00054" type="s" significance="standard">IsoStar</index></indexg><indexg><index id="fach24o3index00055" type="s" significance="standard">Intermolecular interactions<index id="fach24o3index00056" type="s" significance="standard">data from the CSD</index></index><index id="fach24o3index00057" type="s" significance="standard">Intermolecular interactions<index id="fach24o3index00058" type="s" significance="standard">IsoStar</index></index></indexg></st>
<p>IsoStar (Bruno <span class="it"><i>et al.</i></span>, 1997<bbr id="bb5"/>) is based on experimental data, not only from the CSD but also from the PDB, and contains some theoretical results calculated using the <span class="it"><i>ab initio</i></span> intermolecular perturbation theory<indexg><index id="fach24o3index00059" type="s" significance="standard">Intermolecular perturbation theory</index></indexg> (IMPT) method of Hayes &amp; Stone (1984<bbr id="bb7"/>). The experimental data in the CSD and the PDB have been used to display interaction geometries involving <span class="it"><i>central groups</i></span> (<span class="it"><i>A</i></span>) and <span class="it"><i>contact groups</i></span> (<span class="it"><i>B</i></span>). CSD search results of the type exemplified above are transformed into an easily visualized form by overlaying the <span class="it"><i>A</i></span> moieties. This results in a 3D distribution (scatterplot) showing the experimental distribution of <span class="it"><i>B</i></span> around <span class="it"><i>A</i></span>. A web-browser front end permits rapid access to these scatterplots, which can be viewed in <span class="it"><i>RasMol</i></span> (Sayle, 1996<bbr id="bb10"/>), interrogated interactively, converted into contoured surfaces <span class="it"><i>etc.</i></span></p>
<p>Version 1.1 of IsoStar, released in October 1998, contains information on non-bonded interactions formed between 310 central groups and 45 contact groups. Version 1.1 contains over 12&#160;000 scatterplots: 9&#160;000 from the CSD and 3&#160;000 from the PDB. IsoStar also reports results for 867 theoretical potential-energy minima calculated using the IMPT procedure. The library will be updated on a regular basis using automated software procedures developed at the CCDC.</p>
<p>Chapter <related volume="F" chnum="22.4" url="/Fa/ch22o4v0001/"><relchtitle>The relevance of the Cambridge Structural Database in protein crystallography</relchtitle><relau>F. H. Allen</relau><relau>J. C. Cole</relau><relau>M. L. Verdonk</relau></related>22.4<a href="/Fa/ch22o4v0001/"><img align="bottom" border="0" src="/graphics/greenarr.gif" alt="[link]"/></a>
 contains illustrative examples from IsoStar, together with a more complete description of the knowledge base and its applications.</p>
</div>
</div>

<div id="divsec24o3o5" class="sec1" secnum="24.3.5" fpage="668" lpage="668">
<div class="sectionheaders">
<h3 class="sectionheaders"><a name="sec24o3o5"><tree level="1"/></a>24.3.5. Accessing the CSD system and IsoStar<indexg><index id="fach24o3index00060" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00061" type="s" significance="standard">accessing the database</index></index><index id="fach24o3index00062" type="s" significance="standard">IsoStar<index id="fach24o3index00063" type="s" significance="standard">access to</index></index></indexg></h3>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o5.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o5" secnum="24.3.5">Accessing the CSD system and IsoStar<indexg><index id="fach24o3index00060" type="s" significance="standard">Cambridge Structural Database (CSD)<index id="fach24o3index00061" type="s" significance="standard">accessing the database</index></index><index id="fach24o3index00062" type="s" significance="standard">IsoStar<index id="fach24o3index00063" type="s" significance="standard">access to</index></index></indexg></st>

<div id="divsec24o3o5o1" class="sec2" secnum="24.3.5.1" fpage="668" lpage="668">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o5o1"><tree level="2"/></a>24.3.5.1. Release mechanisms</h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o5o1.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o5o1" secnum="24.3.5.1">Release mechanisms</st>
<p>The CSD system, comprising the CSD and CSD-Use databases, and all of the applications software described above, is available on CD-ROM for Unix and DEC-VMS platforms and for PCs operating under Linux. At the time of writing (mid-2000), <span class="it"><i>ConQuest</i></span> alone is available for PC-Windows platforms, but the full availability of other components of the CSD system is currently being addressed. The CSD is released twice yearly, in April and October, as an indexed sequential binary file, with full installation instructions contained within the CD. Versions of the CSD have been reformatted for use with proprietary software systems: the MACCS3D/Isis system from Molecular Design Limited, and the Sybyl-UNITY system from Tripos Associates.</p>
<p>Subscribers in academic and other not-for-profit institutions may obtain the CSD system through their local National Affiliated Centre (NAC). The names, addresses and other coordinates of these centres are contained in the CCDC's web pages (see below). Users in countries not covered by NAC arrangements, or users from for-profit companies and organizations, should contact the CCDC directly.</p>
<p>The IsoStar library, for Unix systems only, is released after each library update, currently planned to occur on an annual basis. IsoStar forms part of the distributed CSD system, and CDs are available through the same mechanisms as the main system.</p>
</div>

<div id="divsec24o3o5o2" class="sec2" secnum="24.3.5.2" fpage="668" lpage="668">
<div class="sectionheaders">
<h4 class="sectionheaders"><a name="sec24o3o5o2"><tree level="2"/></a>24.3.5.2. Information about the CCDC</h4>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o5o2.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o5o2" secnum="24.3.5.2">Information about the CCDC</st>
<p>The CCDC maintains an extensive set of information on the web site <a class="linkclass" href="http://www.ccdc.cam.ac.uk">http://www.ccdc.cam.ac.uk</a>
. The site describes the CSD system, IsoStar, and the associated research and development activities of the CCDC. These pages also provide access to CSD system documentation, provide lists of contact details for the National Affiliated Centres that service not-for-profit users worldwide, and give up-to-date information on how to contact the CCDC directly.</p>
</div>
</div>

<div id="divsec24o3o6" class="sec1" secnum="24.3.6" fpage="668" lpage="668">
<div class="sectionheaders">
<h3 class="sectionheaders"><a name="sec24o3o6"><tree level="1"/></a>24.3.6. Conclusion</h3>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/sec24o3o6.pdf">pdf</a> |</span>
</div>
<st secid="sec24o3o6" secnum="24.3.6">Conclusion</st>
<p>This chapter has provided an overview of the Cambridge Structural Database, its associated software system, other databases and IsoStar &#8211; the first library of structural knowledge to be derived from the CSD. This information is accurate at the time of writing (May 1998, but with some revision in mid-2000). However, the CSD itself, the knowledge bases derived from it and a wide variety of applications software are under continuous development and improvement, and articles such as this can only provide a snapshot of progress at any particular time. Readers of this article are therefore encouraged to visit the CCDC's website (<a class="linkclass" href="http://www.ccdc.cam.ac.uk">http://www.ccdc.cam.ac.uk</a>
) to obtain the latest information on available products and services.<figwrap id="fig24o3o1o1" fpage="663" lpage="663">
<div class="fig">
<table summary="Figure 24.3.1.1" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td align="center" width="20%" style="border:solid 1px #000;">
<a class="linkclass" href="/Fa/ch24o3v0001/fig24o3o1o1/"><img src="/figures/Fafig24o3o1o1thm.gif" align="middle" alt="[Figure 24.3.1.1]"/>
<br/></a>
</td>
<td style="border:solid 1px #000;">
<p><span class="size3"><b><a name="fig24o3o1o1">Figure 24.3.1.1</a></b></span>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/fig24o3o1o1.pdf">pdf</a> |</span></p><p>Growth of the CSD since 1970 expressed in terms of the number of structures published per annum.</p>
</td>
</tr>
</tbody>
</table>
</div>
<caption><p>Growth of the CSD since 1970 expressed in terms of the number of structures published per annum.</p></caption>
<short-figcaption><p>Growth of the CSD since 1970 expressed in terms of the number of structures published per annum</p></short-figcaption>
</figwrap>
 <figwrap id="fig24o3o2o1" fpage="664" lpage="664">
<div class="fig">
<table summary="Figure 24.3.2.1" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td align="center" width="20%" style="border:solid 1px #000;">
<a class="linkclass" href="/Fa/ch24o3v0001/fig24o3o2o1/"><img src="/figures/Fafig24o3o2o1thm.gif" align="middle" alt="[Figure 24.3.2.1]"/>
<br/></a>
</td>
<td style="border:solid 1px #000;">
<p><span class="size3"><b><a name="fig24o3o2o1">Figure 24.3.2.1</a></b></span>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/fig24o3o2o1.pdf">pdf</a> |</span></p><p>Information content of the Cambridge Structural Database (CSD).</p>
</td>
</tr>
</tbody>
</table>
</div>
<caption><p>Information content of the Cambridge Structural Database (CSD).</p></caption>
<short-figcaption><p>Information content of the Cambridge Structural Database (CSD)</p></short-figcaption>
</figwrap>
 <figwrap id="fig24o3o2o2" fpage="664" lpage="664">
<div class="fig">
<table summary="Figure 24.3.2.2" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td align="center" width="20%" style="border:solid 1px #000;">
<a class="linkclass" href="/Fa/ch24o3v0001/fig24o3o2o2/"><img src="/figures/Fafig24o3o2o2thm.gif" align="middle" alt="[Figure 24.3.2.2]"/>
<br/></a>
</td>
<td style="border:solid 1px #000;">
<p><span class="size3"><b><a name="fig24o3o2o2">Figure 24.3.2.2</a></b></span>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/fig24o3o2o2.pdf">pdf</a> |</span></p><p>2D chemical connectivity data for a simple organic molecule.</p>
</td>
</tr>
</tbody>
</table>
</div>
<caption><p>2D chemical connectivity data for a simple organic molecule.</p></caption>
<short-figcaption><p>2D chemical connectivity data for a simple organic molecule</p></short-figcaption>
</figwrap>
 <figwrap id="fig24o3o3o1" fpage="665" lpage="665">
<div class="fig">
<table summary="Figure 24.3.3.1" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td align="center" width="20%" style="border:solid 1px #000;">
<a class="linkclass" href="/Fa/ch24o3v0001/fig24o3o3o1/"><img src="/figures/Fafig24o3o3o1thm.gif" align="middle" alt="[Figure 24.3.3.1]"/>
<br/></a>
</td>
<td style="border:solid 1px #000;">
<p><span class="size3"><b><a name="fig24o3o3o1">Figure 24.3.3.1</a></b></span>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/fig24o3o3o1.pdf">pdf</a> |</span></p><p>Summary of the software components of the Cambridge Structural Database system (CSDS).</p>
</td>
</tr>
</tbody>
</table>
</div>
<caption><p>Summary of the software components of the Cambridge Structural Database system (CSDS).</p></caption>
<short-figcaption><p>Summary of the software components of the Cambridge Structural Database system (CSDS)</p></short-figcaption>
</figwrap>
 <figwrap id="fig24o3o3o2" fpage="666" lpage="666">
<div class="fig">
<table summary="Figure 24.3.3.2" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td align="center" width="20%" style="border:solid 1px #000;">
<a class="linkclass" href="/Fa/ch24o3v0001/fig24o3o3o2/"><img src="/figures/Fafig24o3o3o2thm.gif" align="middle" alt="[Figure 24.3.3.2]"/>
<br/></a>
</td>
<td style="border:solid 1px #000;">
<p><span class="size3"><b><a name="fig24o3o3o2">Figure 24.3.3.2</a></b></span>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/fig24o3o3o2.pdf">pdf</a> |</span></p><p>The keto&#183;&#183;&#183;hydroxyl fragment described in the example of CSDS usage (see Section 24.3.3.8<secr id="sec24o3o3o8"/>), illustrating the parameters DOH, AH, THETA and PHI used to describe the hydrogen-bonded system.</p>
</td>
</tr>
</tbody>
</table>
</div>
<caption><p>The keto&#183;&#183;&#183;hydroxyl fragment described in the example of CSDS usage (see Section 24.3.3.8<secr id="sec24o3o3o8"/>), illustrating the parameters DOH, AH, THETA and PHI used to describe the hydrogen-bonded system.</p></caption>
<short-figcaption><p>The keto&#183;&#183;&#183;hydroxyl fragment described in the example of CSDS usage</p></short-figcaption>
</figwrap>
 <figwrap id="fig24o3o3o3" fpage="667" lpage="667">
<div class="fig">
<table summary="Figure 24.3.3.3" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td align="center" width="20%" style="border:solid 1px #000;">
<a class="linkclass" href="/Fa/ch24o3v0001/fig24o3o3o3/"><img src="/figures/Fafig24o3o3o3thm.gif" align="middle" alt="[Figure 24.3.3.3]"/>
<br/></a>
</td>
<td style="border:solid 1px #000;">
<p><span class="size3"><b><a name="fig24o3o3o3">Figure 24.3.3.3</a></b></span>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/fig24o3o3o3.pdf">pdf</a> |</span></p><p>A typical <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> graphics screen showing how search hits are visualized and manipulated.</p>
</td>
</tr>
</tbody>
</table>
</div>
<caption><p>A typical <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> graphics screen showing how search hits are visualized and manipulated.</p></caption>
<short-figcaption><p>A typical <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> graphics screen showing how search hits are visualized and manipulated</p></short-figcaption>
</figwrap>
 <figwrap id="fig24o3o3o4" fpage="667" lpage="667">
<div class="fig">
<table summary="Figure 24.3.3.4" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td align="center" width="20%" style="border:solid 1px #000;">
<a class="linkclass" href="/Fa/ch24o3v0001/fig24o3o3o4/"><img src="/figures/Fafig24o3o3o4thm.gif" align="middle" alt="[Figure 24.3.3.4]"/>
<br/></a>
</td>
<td style="border:solid 1px #000;">
<p><span class="size3"><b><a name="fig24o3o3o4">Figure 24.3.3.4</a></b></span>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/fig24o3o3o4.pdf">pdf</a> |</span></p><p>A <span class="it"><i>Vista</i></span> histogram of the hydrogen-bond distance, DOH, showing a sharp peak in the range 1.8&#8211;2.2&#160;&#197;, well below the sum of van der Waals radii (2.62&#160;&#197;). This peak can be isolated in <span class="it"><i>Vista</i></span> to obtain an estimate of the mean O&#183;&#183;&#183;H separation in &gt;C=O&#183;&#183;&#183;H&#8212;O systems.</p>
</td>
</tr>
</tbody>
</table>
</div>
<caption><p>A <span class="it"><i>Vista</i></span> histogram of the hydrogen-bond distance, DOH, showing a sharp peak in the range 1.8&#8211;2.2&#160;&#197;, well below the sum of van der Waals radii (2.62&#160;&#197;). This peak can be isolated in <span class="it"><i>Vista</i></span> to obtain an estimate of the mean O&#183;&#183;&#183;H separation in &gt;C=O&#183;&#183;&#183;H&#8212;O systems.</p></caption>
<short-figcaption><p>A <span class="it"><i>Vista</i></span> histogram of the hydrogen-bond distance</p></short-figcaption>
</figwrap>
 <figwrap id="fig24o3o3o5" fpage="667" lpage="667">
<div class="fig">
<table summary="Figure 24.3.3.5" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td align="center" width="20%" style="border:solid 1px #000;">
<a class="linkclass" href="/Fa/ch24o3v0001/fig24o3o3o5/"><img src="/figures/Fafig24o3o3o5thm.gif" align="middle" alt="[Figure 24.3.3.5]"/>
<br/></a>
</td>
<td style="border:solid 1px #000;">
<p><span class="size3"><b><a name="fig24o3o3o5">Figure 24.3.3.5</a></b></span>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/fig24o3o3o5.pdf">pdf</a> |</span></p><p>A <span class="it"><i>Vista</i></span> scatterplot of the hydrogen-bond length (DOH) <span class="it"><i>versus</i></span> the O&#8212;H&#183;&#183;&#183;O angle (AH). The plot shows a major clustering of observations having short DOH values and hydrogen-bond linearity (AH = 180&#176;): stronger hydrogen bonds prefer to be linear.</p>
</td>
</tr>
</tbody>
</table>
</div>
<caption><p>A <span class="it"><i>Vista</i></span> scatterplot of the hydrogen-bond length (DOH) <span class="it"><i>versus</i></span> the O&#8212;H&#183;&#183;&#183;O angle (AH). The plot shows a major clustering of observations having short DOH values and hydrogen-bond linearity (AH = 180&#176;): stronger hydrogen bonds prefer to be linear.</p></caption>
<short-figcaption><p>A <span class="it"><i>Vista</i></span> scatterplot of the hydrogen-bond length (DOH) <span class="it"><i>versus</i></span> the O&#8212;H&#183;&#183;&#183;O angle (AH)</p></short-figcaption>
</figwrap>
 <figwrap id="fig24o3o3o6" fpage="668" lpage="668">
<div class="fig">
<table summary="Figure 24.3.3.6" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td align="center" width="20%" style="border:solid 1px #000;">
<a class="linkclass" href="/Fa/ch24o3v0001/fig24o3o3o6/"><img src="/figures/Fafig24o3o3o6thm.gif" align="middle" alt="[Figure 24.3.3.6]"/>
<br/></a>
</td>
<td style="border:solid 1px #000;">
<p><span class="size3"><b><a name="fig24o3o3o6">Figure 24.3.3.6</a></b></span>
<span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/fig24o3o3o6.pdf">pdf</a> |</span></p><p>A <span class="it"><i>Vista</i></span> polar scatterplot of THETA <span class="it"><i>versus</i></span> PHI, the angles that define the direction of approach of the donor H atom to the &gt;C=O plane. There are clear indications of lone-pair directionality: H prefers an in-plane approach to O (THETA = 0&#176;), with preferred PHI values in the range 120&#8211;135&#176;.</p>
</td>
</tr>
</tbody>
</table>
</div>
<caption><p>A <span class="it"><i>Vista</i></span> polar scatterplot of THETA <span class="it"><i>versus</i></span> PHI, the angles that define the direction of approach of the donor H atom to the &gt;C=O plane. There are clear indications of lone-pair directionality: H prefers an in-plane approach to O (THETA = 0&#176;), with preferred PHI values in the range 120&#8211;135&#176;.</p></caption>
<short-figcaption><p>A <span class="it"><i>Vista</i></span> polar scatterplot of THETA <span class="it"><i>versus</i></span> PHI</p></short-figcaption>
</figwrap>
 <tablewrap id="table24o3o1o1" tablenum="24.3.1.1" fpage="663" lpage="663">
<div class="table">
<table summary="CSD statistics (August 2000)" bgcolor="#CCFFCC" border="0" cellpadding="2" width="98%" style="margin-left: auto; margin-right: auto; border: 1px solid green;">
<tbody>
<tr>
<td>
<table summary="CSD statistics (August 2000)" bgcolor="#CCFFCC" class="tbheader" width="100%">
<tbody>
<tr>
<td align="left" bgcolor="#CCFFCC" valign="bottom">
<p><span class="size3"><b><a name="table24o3o1o1">Table 24.3.1.1</a></b></span><span class="navlinks"><span class="topnavlinks">| <a class="navlinks" href="#top">top</a></span> | <a class="navlinks" href="/Fa/ch24o3v0001/table24o3o1o1.pdf">pdf</a> |</span><br/>
<span class="size2">CSD statistics (August 2000)</span>
</p></td>
</tr>
</tbody>
</table>
<table summary="CSD statistics (August 2000)" bgcolor="#CCFFCC" class="tbheader" width="100%">
<tbody>
<tr>
<td align="left" bgcolor="#CCFFCC" valign="bottom">
<p/></td>
</tr>
</tbody>
</table>
<table summary="CSD statistics (August 2000)" width="98%" style="margin-left: auto; margin-right: auto; border:1px solid green;">
<tbody valign="top">
<tr>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="left" valign="top"><span class="size2">No. of entries</span></td>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="char" valign="top"><span class="size2">224&#160;945</span></td>
</tr>
<tr>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="left" valign="top"><span class="size2">No. of compounds</span></td>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="char" valign="top"><span class="size2">202&#160;669</span></td>
</tr>
<tr>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="left" valign="top"><span class="size2">No. of entries with 3D coordinates</span></td>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="char" valign="top"><span class="size2">198&#160;136</span></td>
</tr>
<tr>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="left" valign="top"><span class="size2">No. of entries with error-free coordinates</span></td>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="char" valign="top"><span class="size2">194&#160;784</span></td>
</tr>
<tr>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="left" valign="top"><span class="size2">No. of atoms having 3D coordinates in the CSD</span></td>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="char" valign="top"><span class="size2">12&#160;906&#160;283</span></td>
</tr>
<tr>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="left" valign="top"><span class="size2">No. of entries in the CSD-Use database</span></td>
<td bgcolor="#FFFFFF" style="" rowspan="1" colspan="1" align="char" valign="top"><span class="size2">792</span></td>
</tr>
</tbody>
</table>
</td>
</tr>
</tbody>
</table>
</div>
<caption><span class="size2">CSD statistics (August 2000)</span></caption>
<short-tbcaption><span class="size2">CSD statistics (August 2000)</span></short-tbcaption>
</tablewrap>
</p>
</div>
</subch></bdy>
<bm>
<bibl>
<bb id="bb1"><bbau index="Abola, E. E.">Abola, E. E.</bbau>, <bbau index="Sussman, J. L.">Sussman, J. L.</bbau>, <bbau index="Prilusky, J.">Prilusky, J.</bbau> &amp; <bbau index="Manning, N. O.">Manning, N. O.</bbau> (1997). <span class="it"><i>Protein Data Bank archives of three-dimensional macromolecular structures. Methods Enzymol.</i></span> <span class="b"><b>277</b></span>, 556&#8211;571.</bb><bb id="bb2"><bbau index="Allen, F. H.">Allen, F. H.</bbau>, <bbau index="Davies, J. E.">Davies, J. E.</bbau>, <bbau index="Galloy, J. J.">Galloy, J. J.</bbau>, <bbau index="Johnson, O.">Johnson, O.</bbau>, <bbau index="Kennard, O.">Kennard, O.</bbau>, <bbau index="Macrae, C. F.">Macrae, C. F.</bbau>, <bbau index="Mitchell, E. M.">Mitchell, E. M.</bbau>, <bbau index="Mitchell, G. F.">Mitchell, G. F.</bbau>, <bbau index="Smith, J. M.">Smith, J. M.</bbau> &amp; <bbau index="Watson, D. G.">Watson, D. G.</bbau> (1991). <span class="it"><i>The development of versions 3 and 4 of the Cambridge Structural Database system. J. Chem. Inf. Comput. Sci.</i></span> <span class="b"><b>31</b></span>, 187&#8211;204.</bb><bb id="bb3"><bbau index="Allen, F. H.">Allen, F. H.</bbau>, <bbau index="Kennard, O.">Kennard, O.</bbau>, <bbau index="Watson, D. G.">Watson, D. G.</bbau>, <bbau index="Brammer, L.">Brammer, L.</bbau>, <bbau index="Orpen, A. G.">Orpen, A. G.</bbau> &amp; <bbau index="Taylor, R.">Taylor, R.</bbau> (1987). <span class="it"><i>Tables of bond lengths determined by X-ray and neutron diffraction. Part 1. Bond lengths in organic compounds. J. Chem. Soc. Perkin Trans.</i></span> 2, pp. S1&#8211;S19.</bb><bb id="bb4"><bbau index="Bernstein, F. C.">Bernstein, F. C.</bbau>, <bbau index="Koetzle, T. F.">Koetzle, T. F.</bbau>, <bbau index="Williams, G. J. B.">Williams, G. J. B.</bbau>, <bbau index="Meyer, E. F.">Meyer, E. F.</bbau>, <bbau index="Brice, M. D.">Brice, M. D.</bbau>, <bbau index="Rodgers, J. R.">Rodgers, J. R.</bbau>, <bbau index="Kennard, O.">Kennard, O.</bbau>, <bbau index="Shimanouchi, T.">Shimanouchi, T.</bbau> &amp; <bbau index="Tasumi, M.">Tasumi, M.</bbau> (1972). <span class="it"><i>The Protein Data Bank: a computer-based archival file for macromolecular structures. J. Mol. Biol.</i></span> <span class="b"><b>112</b></span>, 535&#8211;547.</bb><bb id="bb5"><bbau index="Bruno, I. J.">Bruno, I. J.</bbau>, <bbau index="Cole, J. C.">Cole, J. C.</bbau>, <bbau index="Lommerse, J. P. M.">Lommerse, J. P. M.</bbau>, <bbau index="Rowland, R. S.">Rowland, R. S.</bbau>, <bbau index="Taylor, R.">Taylor, R.</bbau> &amp; <bbau index="Verdonk, M. L.">Verdonk, M. L.</bbau> (1997). <span class="it"><i>IsoStar: a library of information about nonbonded interactions. J. Comput.-Aided Mol. Des.</i></span> <span class="b"><b>11</b></span>, 525&#8211;537.</bb><bb id="bb6"><bbau index="Hall, S. R.">Hall, S. R.</bbau>, <bbau index="Allen, F. H.">Allen, F. H.</bbau> &amp; <bbau index="Brown, I. D.">Brown, I. D.</bbau> (1991). <span class="it"><i>The crystallographic information file (CIF): a new standard archive file for crystallography. Acta Cryst.</i></span> A<span class="b"><b>47</b></span>, 655&#8211;685.</bb><bb id="bb7"><bbau index="Hayes, I. C.">Hayes, I. C.</bbau> &amp; <bbau index="Stone, A. J.">Stone, A. J.</bbau> (1984). <span class="it"><i>An intermolecular perturbation theory for the region of moderate overlap. J. Mol. Phys.</i></span> <span class="b"><b>53</b></span>, 83&#8211;105.</bb><bb id="bb8"><bbau index="Kennard, O.">Kennard, O.</bbau> &amp; <bbau index="Allen, F. H.">Allen, F. H.</bbau> (1993). <span class="it"><i>3D search and research using the Cambridge Structural Database. Chem. Des. Autom. News</i></span>, <span class="b"><b>8</b></span>, 1, 31&#8211;37.</bb><bb id="bb9">RCSB (2000). The Protein Data Bank. Research Collaboratory for Structural Bioinformatics, Department of Chemistry, Rutgers University, Piscataway, NJ, USA (<a class="linkclass" href="http://www.rcsb.org">http://www.rcsb.org</a>
).</bb><bb id="bb10"><bbau index="Sayle, R. A.">Sayle, R.</bbau> (1996). <span class="it"><i>The RASMOL visualiser</i></span>. Glaxo Wellcome Research, Stevenage, Hertfordshire, England.</bb></bibl>
</bm>
<figsection>
<bigfig id="fig24o3o1o1" fignum="24.3.1.1">
<div class="chfigure"><table summary="Figure 24.3.1.1" border="1" bgcolor="#CCFFCC" width="100%">
<tbody>
<tr>
<td align="center">
<img src="/figures/Fafig24o3o1o1.gif" alt="[Figure 24.3.1.1]"/>
<br/>
</td>
</tr>
<tr>
<td>
<span class="size3"><b><a name="fig24o3o1o1">Figure 24.3.1.1</a></b></span>
<p>Growth of the CSD since 1970 expressed in terms of the number of structures published per annum.</p></td>
</tr>
</tbody>
</table>
<br/>
</div>
</bigfig>
<bigfig id="fig24o3o2o1" fignum="24.3.2.1">
<div class="chfigure"><table summary="Figure 24.3.2.1" border="1" bgcolor="#CCFFCC" width="100%">
<tbody>
<tr>
<td align="center">
<img src="/figures/Fafig24o3o2o1.gif" alt="[Figure 24.3.2.1]"/>
<br/>
</td>
</tr>
<tr>
<td>
<span class="size3"><b><a name="fig24o3o2o1">Figure 24.3.2.1</a></b></span>
<p>Information content of the Cambridge Structural Database (CSD).</p></td>
</tr>
</tbody>
</table>
<br/>
</div>
</bigfig>
<bigfig id="fig24o3o2o2" fignum="24.3.2.2">
<div class="chfigure"><table summary="Figure 24.3.2.2" border="1" bgcolor="#CCFFCC" width="100%">
<tbody>
<tr>
<td align="center">
<img src="/figures/Fafig24o3o2o2.gif" alt="[Figure 24.3.2.2]"/>
<br/>
</td>
</tr>
<tr>
<td>
<span class="size3"><b><a name="fig24o3o2o2">Figure 24.3.2.2</a></b></span>
<p>2D chemical connectivity data for a simple organic molecule.</p></td>
</tr>
</tbody>
</table>
<br/>
</div>
</bigfig>
<bigfig id="fig24o3o3o1" fignum="24.3.3.1">
<div class="chfigure"><table summary="Figure 24.3.3.1" border="1" bgcolor="#CCFFCC" width="100%">
<tbody>
<tr>
<td align="center">
<img src="/figures/Fafig24o3o3o1.gif" alt="[Figure 24.3.3.1]"/>
<br/>
</td>
</tr>
<tr>
<td>
<span class="size3"><b><a name="fig24o3o3o1">Figure 24.3.3.1</a></b></span>
<p>Summary of the software components of the Cambridge Structural Database system (CSDS).</p></td>
</tr>
</tbody>
</table>
<br/>
</div>
</bigfig>
<bigfig id="fig24o3o3o2" fignum="24.3.3.2">
<div class="chfigure"><table summary="Figure 24.3.3.2" border="1" bgcolor="#CCFFCC" width="100%">
<tbody>
<tr>
<td align="center">
<img src="/figures/Fafig24o3o3o2.gif" alt="[Figure 24.3.3.2]"/>
<br/>
</td>
</tr>
<tr>
<td>
<span class="size3"><b><a name="fig24o3o3o2">Figure 24.3.3.2</a></b></span>
<p>The keto&#183;&#183;&#183;hydroxyl fragment described in the example of CSDS usage (see Section 24.3.3.8<secr id="sec24o3o3o8"/>), illustrating the parameters DOH, AH, THETA and PHI used to describe the hydrogen-bonded system.</p></td>
</tr>
</tbody>
</table>
<br/>
</div>
</bigfig>
<bigfig id="fig24o3o3o3" fignum="24.3.3.3">
<div class="chfigure"><table summary="Figure 24.3.3.3" border="1" bgcolor="#CCFFCC" width="100%">
<tbody>
<tr>
<td align="center">
<img src="/figures/Fafig24o3o3o3.gif" alt="[Figure 24.3.3.3]"/>
<br/>
</td>
</tr>
<tr>
<td>
<span class="size3"><b><a name="fig24o3o3o3">Figure 24.3.3.3</a></b></span>
<p>A typical <span class="it"><i>Quest</i></span>3<span class="it"><i>D</i></span> graphics screen showing how search hits are visualized and manipulated.</p></td>
</tr>
</tbody>
</table>
<br/>
</div>
</bigfig>
<bigfig id="fig24o3o3o4" fignum="24.3.3.4">
<div class="chfigure"><table summary="Figure 24.3.3.4" border="1" bgcolor="#CCFFCC" width="100%">
<tbody>
<tr>
<td align="center">
<img src="/figures/Fafig24o3o3o4.gif" alt="[Figure 24.3.3.4]"/>
<br/>
</td>
</tr>
<tr>
<td>
<span class="size3"><b><a name="fig24o3o3o4">Figure 24.3.3.4</a></b></span>
<p>A <span class="it"><i>Vista</i></span> histogram of the hydrogen-bond distance, DOH, showing a sharp peak in the range 1.8&#8211;2.2&#160;&#197;, well below the sum of van der Waals radii (2.62&#160;&#197;). This peak can be isolated in <span class="it"><i>Vista</i></span> to obtain an estimate of the mean O&#183;&#183;&#183;H separation in &gt;C=O&#183;&#183;&#183;H&#8212;O systems.</p></td>
</tr>
</tbody>
</table>
<br/>
</div>
</bigfig>
<bigfig id="fig24o3o3o5" fignum="24.3.3.5">
<div class="chfigure"><table summary="Figure 24.3.3.5" border="1" bgcolor="#CCFFCC" width="100%">
<tbody>
<tr>
<td align="center">
<img src="/figures/Fafig24o3o3o5.gif" alt="[Figure 24.3.3.5]"/>
<br/>
</td>
</tr>
<tr>
<td>
<span class="size3"><b><a name="fig24o3o3o5">Figure 24.3.3.5</a></b></span>
<p>A <span class="it"><i>Vista</i></span> scatterplot of the hydrogen-bond length (DOH) <span class="it"><i>versus</i></span> the O&#8212;H&#183;&#183;&#183;O angle (AH). The plot shows a major clustering of observations having short DOH values and hydrogen-bond linearity (AH = 180&#176;): stronger hydrogen bonds prefer to be linear.</p></td>
</tr>
</tbody>
</table>
<br/>
</div>
</bigfig>
<bigfig id="fig24o3o3o6" fignum="24.3.3.6">
<div class="chfigure"><table summary="Figure 24.3.3.6" border="1" bgcolor="#CCFFCC" width="100%">
<tbody>
<tr>
<td align="center">
<img src="/figures/Fafig24o3o3o6.gif" alt="[Figure 24.3.3.6]"/>
<br/>
</td>
</tr>
<tr>
<td>
<span class="size3"><b><a name="fig24o3o3o6">Figure 24.3.3.6</a></b></span>
<p>A <span class="it"><i>Vista</i></span> polar scatterplot of THETA <span class="it"><i>versus</i></span> PHI, the angles that define the direction of approach of the donor H atom to the &gt;C=O plane. There are clear indications of lone-pair directionality: H prefers an in-plane approach to O (THETA = 0&#176;), with preferred PHI values in the range 120&#8211;135&#176;.</p></td>
</tr>
</tbody>
</table>
<br/>
</div>
</bigfig>
</figsection>
<fnsection>
</fnsection>
<indexes>
   <entry number="1">
      <term level="1">
         <level1>Cambridge Crystallographic Data Centre (CCDC)</level1>
         <link indexid="index00004" significance="standard" section="1" chnumo="24o3" id="fach24o3index00004" type="s" volid="Fa" secido="24o3o1" secid="24.3.1"/>
      </term>
   </entry>
   <entry number="21">
      <term level="1">
         <level1>Cambridge Structural Database (CSD)</level1>
         <link indexid="index00001" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00001" secido="24o3o1" volid="Fa" secid="24.3.1"/>
      </term>
      <term level="2">
         <index id="fach24o3index00061" significance="standard" type="s">accessing the database</index>
         <link indexid="index00061" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00061" secido="24o3o5" volid="Fa" secid="24.3.5"/>
      </term>
      <term level="2">
         <index id="fach24o3index00010" significance="standard" type="s">bibliographic and chemical data</index>
         <link indexid="index00010" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00010" secido="24o3o2o3" volid="Fa" secid="24.3.2.3"/>
      </term>
      <term level="2">
         <index id="fach24o3index00012" significance="standard" type="s">chemical connectivity data</index>
         <link indexid="index00012" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00012" secido="24o3o2o4" volid="Fa" secid="24.3.2.4"/>
      </term>
      <term level="2">
         <index id="fach24o3index00034" significance="standard" type="s">
            <span class="it">
               <i>ConQuest</i>
            </span>
         </index>
         <link indexid="index00034" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00034" secido="24o3o3o5" volid="Fa" secid="24.3.3.5"/>
      </term>
      <term level="2">
         <index id="fach24o3index00006" significance="standard" type="s">content of</index>
         <link indexid="index00006" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00006" secido="24o3o2" volid="Fa" secid="24.3.2"/>
      </term>
      <term level="2">
         <index id="fach24o3index00014" significance="standard" type="s">crystal structure data</index>
         <link indexid="index00014" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00014" secido="24o3o2o5" volid="Fa" secid="24.3.2.5"/>
      </term>
      <term level="2">
         <index id="fach24o3index00021" significance="standard" type="s">CSD-Use database</index>
         <link indexid="index00021" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00021" secido="24o3o2o8" volid="Fa" secid="24.3.2.8"/>
      </term>
      <term level="2">
         <index id="fach24o3index00016" significance="standard" type="s">data validation</index>
         <link indexid="index00016" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00016" secido="24o3o2o7" volid="Fa" secid="24.3.2.7"/>
      </term>
      <term level="2">
         <index id="fach24o3index00047" significance="standard" type="s">IsoStar</index>
         <link indexid="index00047" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00047" secido="24o3o4o1" volid="Fa" secid="24.3.4.1"/>
         <link indexid="index00053" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00053" secido="24o3o4o2" volid="Fa" secid="24.3.4.2"/>
      </term>
      <term level="2">
         <index id="fach24o3index00045" significance="standard" type="s">knowledge engineering</index>
         <link indexid="index00045" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00045" secido="24o3o4" volid="Fa" secid="24.3.4"/>
      </term>
      <term level="2">
         <index id="fach24o3index00050" significance="standard" type="s">Mogul</index>
         <link indexid="index00050" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00050" secido="24o3o4o1" volid="Fa" secid="24.3.4.1"/>
      </term>
      <term level="2">
         <index id="fach24o3index00040" significance="standard" type="s">
            <span class="it">
               <i>Pluto</i>
            </span>
         </index>
         <link indexid="index00040" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00040" secido="24o3o3o7" volid="Fa" secid="24.3.3.7"/>
      </term>
      <term level="2">
         <index id="fach24o3index00018" significance="standard" type="s">
            <span class="it">
               <i>PreQuest</i>
            </span>
         </index>
         <link indexid="index00018" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00018" secido="24o3o2o7" volid="Fa" secid="24.3.2.7"/>
         <link indexid="index00026" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00026" secido="24o3o3o2" volid="Fa" secid="24.3.3.2"/>
      </term>
      <term level="2">
         <index id="fach24o3index00031" significance="standard" type="s">
            <span class="it">
               <i>Quest</i>
            </span>3<span class="it">
               <i>D</i>
            </span>
         </index>
         <link indexid="index00031" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00031" secido="24o3o3o4" volid="Fa" secid="24.3.3.4"/>
      </term>
      <term level="2">
         <index id="fach24o3index00029" significance="standard" type="s">searching the database</index>
         <link indexid="index00029" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00029" secido="24o3o3o3" volid="Fa" secid="24.3.3.3"/>
      </term>
      <term level="2">
         <index id="fach24o3index00024" significance="standard" type="s">software</index>
         <link indexid="index00024" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00024" secido="24o3o3" volid="Fa" secid="24.3.3"/>
         <link indexid="index00043" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00043" secido="24o3o3o8" volid="Fa" secid="24.3.3.8"/>
      </term>
      <term level="2">
         <index id="fach24o3index00037" significance="standard" type="s">
            <span class="it">
               <i>Vista</i>
            </span>
         </index>
         <link indexid="index00037" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00037" secido="24o3o3o6" volid="Fa" secid="24.3.3.6"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>CIF (crystallographic information file)</level1>
         <link indexid="index00008" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00008" secido="24o3o2o1" volid="Fa" secid="24.3.2.1"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>
            <span class="it">
               <i>ConQuest</i>
            </span>
         </level1>
         <link indexid="index00035" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00035" secido="24o3o3o5" volid="Fa" secid="24.3.3.5"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>Crystallographic information file (CIF)</level1>
         <link indexid="index00007" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00007" secido="24o3o2o1" volid="Fa" secid="24.3.2.1"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>CSD-Use database</level1>
         <link indexid="index00022" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00022" secido="24o3o2o8" volid="Fa" secid="24.3.2.8"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>Databases</level1>
      </term>
      <term level="2">
         <index id="fach24o3index00003" significance="standard" type="s">Cambridge Structural Database</index>
         <link indexid="index00003" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00003" secido="24o3o1" volid="Fa" secid="24.3.1"/>
      </term>
   </entry>
   <entry number="2">
      <term level="1">
         <level1>Intermolecular interactions</level1>
      </term>
      <term level="2">
         <index id="fach24o3index00056" significance="standard" type="s">data from the CSD</index>
         <link indexid="index00056" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00056" secido="24o3o4o2" volid="Fa" secid="24.3.4.2"/>
      </term>
      <term level="2">
         <index id="fach24o3index00058" significance="standard" type="s">IsoStar</index>
         <link indexid="index00058" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00058" secido="24o3o4o2" volid="Fa" secid="24.3.4.2"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>Intermolecular perturbation theory</level1>
         <link indexid="index00059" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00059" secido="24o3o4o2" volid="Fa" secid="24.3.4.2"/>
      </term>
   </entry>
   <entry number="3">
      <term level="1">
         <level1>IsoStar</level1>
         <link indexid="index00048" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00048" secido="24o3o4o1" volid="Fa" secid="24.3.4.1"/>
         <link indexid="index00054" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00054" secido="24o3o4o2" volid="Fa" secid="24.3.4.2"/>
      </term>
      <term level="2">
         <index id="fach24o3index00063" significance="standard" type="s">access to</index>
         <link indexid="index00063" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00063" secido="24o3o5" volid="Fa" secid="24.3.5"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>Mogul</level1>
         <link indexid="index00051" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00051" secido="24o3o4o1" volid="Fa" secid="24.3.4.1"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>
            <span class="it">
               <i>Pluto</i>
            </span>
         </level1>
         <link indexid="index00041" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00041" secido="24o3o3o7" volid="Fa" secid="24.3.3.7"/>
      </term>
   </entry>
   <entry number="2">
      <term level="1">
         <level1>
            <span class="it">
               <i>PreQuest</i>
            </span>
         </level1>
         <link indexid="index00019" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00019" secido="24o3o2o7" volid="Fa" secid="24.3.2.7"/>
         <link indexid="index00027" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00027" secido="24o3o3o2" volid="Fa" secid="24.3.3.2"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>
            <span class="it">
               <i>Quest</i>
            </span>3<span class="it">
               <i>D</i>
            </span>
         </level1>
         <link indexid="index00032" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00032" secido="24o3o3o4" volid="Fa" secid="24.3.3.4"/>
      </term>
   </entry>
   <entry number="1">
      <term level="1">
         <level1>
            <span class="it">
               <i>Vista</i>
            </span>
         </level1>
         <link indexid="index00038" significance="standard" section="1" chnumo="24o3" type="s" id="fach24o3index00038" secido="24o3o3o6" volid="Fa" secid="24.3.3.6"/>
      </term>
   </entry>
</indexes>
</wrap>