<?xml version="1.0" encoding="ISO-8859-1"?>

<rdf:RDF
 xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
 xmlns="http://purl.org/rss/1.0/"
 xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/"
 xmlns:dc="http://purl.org/dc/elements/1.1/"
 xmlns:syn="http://purl.org/rss/1.0/modules/syndication/"
 xmlns:prism="http://purl.org/rss/1.0/modules/prism/"
 xmlns:admin="http://webns.net/mvcb/"
>

<channel rdf:about="http://bioinformatics.oxfordjournals.org">
<title>Bioinformatics - recent issues</title>
<link>http://bioinformatics.oxfordjournals.org</link>
<description>Bioinformatics - RSS feed of recent issues (covers the latest 3 issues, including the current issue) </description>
<prism:eIssn>1460-2059</prism:eIssn>
<prism:publicationName>Bioinformatics</prism:publicationName>
<prism:issn>1367-4803</prism:issn>
<items>
 <rdf:Seq>
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2891?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2897?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2906?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2913?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2921?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2929?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2937?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2945?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2955?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2962?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2969?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2975?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2983?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2992?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3001?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3005?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3012?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3020?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3026?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3028?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3031?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3033?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3035?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3038?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3040?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3043?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3045?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3047?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2735?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2744?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2751?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2757?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2764?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2772?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2780?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2787?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2795?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2802?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2809?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2816?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2824?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2831?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2839?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2841?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2843?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2845?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2848?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2850?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2853?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2855?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2857?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2860?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2863?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2865?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2872?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2878?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2882?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2625?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2632?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2639?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2646?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2655?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2663?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2670?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2677?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2685?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2692?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2700?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2708?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2715?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2723?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2730?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2732?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2734?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2737?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2739?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2741?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2743?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2745?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2747?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2750?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2753?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2755?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2758?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2760?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2762?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2764?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2768?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2770?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2772?rss=1" />
  <rdf:li rdf:resource="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2773?rss=1" />
 </rdf:Seq>
</items>
</channel>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2891?rss=1">
<title><![CDATA[Phenotypic categorization of genetic skin diseases reveals new relations between phenotypes, genes and pathways]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2891?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Systematic analysis of connection between proteins, their cellular function and phenotypic manifestations in disease is a central problem of biological and clinical research. The solution to this problem requires the development of new approaches to link the rapidly growing dataset of gene&ndash;disease associations with the many complex and overlapping phenotypes of human disease.</p>
<p><b>Results:</b> We analyze genetic skin disorders and suggest a manually designed set of elementary phenotypes whose combinations define diseases as points in a multidimensional space, providing a basis for phenotypic disease clustering. Placing the known gene&ndash;disease associations in the context of this space reveals new patterns that suggest previously unknown functional links between proteins, signaling pathways and disease phenotypes. For example, analysis of telangiectasias (spider vein diseases) reveals a previously unrecognized interplay between the TGF-&beta; signaling pathway and pentose phosphate pathway. This interaction may mediate glucose-dependent regulation of TGF-&beta; signaling, providing a clue to the known association between angiopathies and diabetes and implying new gene candidates for mutational analysis and drug targeting.</p>
<p><b>Contact:</b> <inter-ref locator="grishin@chop.swmed.edu" locator-type="email">grishin@chop.swmed.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp538/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Sadreyev, R. I., Feramisco, J. D., Tsao, H., Grishin, N. V.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp538</dc:identifier>
<dc:title><![CDATA[Phenotypic categorization of genetic skin diseases reveals new relations between phenotypes, genes and pathways]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2896</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2891</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2897?rss=1">
<title><![CDATA[De novo computational prediction of non-coding RNA genes in prokaryotic genomes]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2897?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The computational identification of non-coding RNA (ncRNA) genes represents one of the most important and challenging problems in computational biology. Existing methods for ncRNA gene prediction rely mostly on homology information, thus limiting their applications to ncRNA genes with known homologues.</p>
<p><b>Results:</b> We present a novel <I>de novo</I> prediction algorithm for ncRNA genes using features derived from the sequences and structures of known ncRNA genes in comparison to decoys. Using these features, we have trained a neural network-based classifier and have applied it to <I>Escherichia coli</I> and <I>Sulfolobus solfataricus</I> for genome-wide prediction of ncRNAs. Our method has an average prediction sensitivity and specificity of 68% and 70%, respectively, for identifying windows with potential for ncRNA genes in <I>E.coli</I>. By combining windows of different sizes and using positional filtering strategies, we predicted 601 candidate ncRNAs and recovered 41% of known ncRNAs in <I>E.coli</I>. We experimentally investigated six novel candidates using Northern blot analysis and found expression of three candidates: one represents a potential new ncRNA, one is associated with stable mRNA decay intermediates and one is a case of either a potential riboswitch or transcription attenuator involved in the regulation of cell division. In general, our approach enables the identification of both <I>cis</I>- and <I>trans</I>-acting ncRNAs in partially or completely sequenced microbial genomes without requiring homology or structural conservation.</p>
<p><b>Availability:</b> The source code and results are available at <inter-ref locator="http://csbl.bmb.uga.edu/publications/materials/tran/" locator-type="url">http://csbl.bmb.uga.edu/publications/materials/tran/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="xyn@bmb.uga.edu" locator-type="email">xyn@bmb.uga.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/537/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Tran, T. T., Zhou, F., Marshburn, S., Stead, M., Kushner, S. R., Xu, Y.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp537</dc:identifier>
<dc:title><![CDATA[De novo computational prediction of non-coding RNA genes in prokaryotic genomes]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2905</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2897</prism:startingPage>
<prism:section>GENOME ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2906?rss=1">
<title><![CDATA[Integrative clustering of multiple genomic data types using a joint latent variable model with application to breast and lung cancer subtype analysis]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2906?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The molecular complexity of a tumor manifests itself at the genomic, epigenomic, transcriptomic and proteomic levels. Genomic profiling at these multiple levels should allow an integrated characterization of tumor etiology. However, there is a shortage of effective statistical and bioinformatic tools for truly integrative data analysis. The standard approach to integrative clustering is separate clustering followed by manual integration. A more statistically powerful approach would incorporate all data types simultaneously and generate a single integrated cluster assignment.</p>
<p><b>Methods:</b> We developed a joint latent variable model for integrative clustering. We call the resulting methodology iCluster. iCluster incorporates flexible modeling of the associations between different data types and the variance&ndash;covariance structure within data types in a single framework, while simultaneously reducing the dimensionality of the datasets. Likelihood-based inference is obtained through the Expectation&ndash;Maximization algorithm.</p>
<p><b>Results:</b> We demonstrate the iCluster algorithm using two examples of joint analysis of copy number and gene expression data, one from breast cancer and one from lung cancer. In both cases, we identified subtypes characterized by concordant DNA copy number changes and gene expression as well as unique profiles specific to one or the other in a completely automated fashion. In addition, the algorithm discovers potentially novel subtypes by combining weak yet consistent alteration patterns across data types.</p>
<p><b>Availability:</b> R code to implement iCluster can be downloaded at <inter-ref locator="http://www.mskcc.org/mskcc/html/85130.cfm" locator-type="url">http://www.mskcc.org/mskcc/html/85130.cfm</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="shenr@mskcc.org" locator-type="email">shenr@mskcc.org</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/543/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Shen, R., Olshen, A. B., Ladanyi, M.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp543</dc:identifier>
<dc:title><![CDATA[Integrative clustering of multiple genomic data types using a joint latent variable model with application to breast and lung cancer subtype analysis]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2912</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2906</prism:startingPage>
<prism:section>GENOME ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2913?rss=1">
<title><![CDATA[Predicting homologous signaling pathways using machine learning]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2913?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> In general, each cell signaling pathway involves many proteins, each with one or more specific roles. As they are essential components of cell activity, it is important to understand how these proteins work&mdash;and in particular, to determine which of the species' proteins participate in each role. Experimentally determining this mapping of proteins to roles is difficult and time consuming. Fortunately, many pathways are similar across species, so we may be able to use known pathway information of one species to understand the corresponding pathway of another.</p>
<p><b>Results:</b> We present an automatic approach, Predict Signaling Pathway (PSP), which uses the signaling pathways in well-studied species to predict the roles of proteins in less-studied species. We use a machine learning approach to create a predictor that achieves a generalization <I>F</I>-measure of 78.2% when applied to 11 different pathways across 14 different species. We also show our approach is very effective in predicting the pathways that have not yet been experimentally studied completely.</p>
<p><b>Availability:</b> The list of predicted proteins for all pathways over all considered species is available at <inter-ref locator="http://www.cs.ualberta.ca/~bioinfo/signaling" locator-type="url">http://www.cs.ualberta.ca/~bioinfo/signaling</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="bioinfo@cs.ualberta.ca" locator-type="email">bioinfo@cs.ualberta.ca</inter-ref>; <inter-ref locator="duane@cs.ualberta.ca" locator-type="email">duane@cs.ualberta.ca</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Bostan, B., Greiner, R., Szafron, D., Lu, P.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp532</dc:identifier>
<dc:title><![CDATA[Predicting homologous signaling pathways using machine learning]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2920</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2913</prism:startingPage>
<prism:section>SEQUENCE ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2921?rss=1">
<title><![CDATA[Understanding hydrogen-bond patterns in proteins using network motifs]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2921?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> Protein structures can be viewed as networks of contacts (edges) between amino-acid residues (nodes). Here we dissect proteins into sub-graphs consisting of six nodes and their corresponding edges, with an edge being either a backbone hydrogen bond (H-bond) or a covalent interaction. Six thousand three hundred and twenty-two such sub-graphs were found in a large non-redundant dataset of high-resolution structures, from which 35 occur much more frequently than in a random model. Many of these significant sub-graphs (also called network motifs) correspond to sub-structures of  helices and &beta;-sheets, as expected. However, others correspond to more exotic sub-structures such as 3<SUB>10</SUB> helix, Schellman motif and motifs that were not defined previously. This topological characterization of patterns is very useful for producing a detailed differences map to compare protein structures. Here we analyzed in details the differences between NMR, molecular dynamics (MD) simulations and X-ray structures for Lysozyme, SH3 and the lambda repressor. In these cases, the same structures solved by NMR and simulated by MD showed small but consistent differences in their motif composition from the crystal structures, despite a very small root mean square deviation (RMSD) between them. This may be due to differences in the pair-wise energy functions used and the dynamic nature of these proteins.</p>
<p><b>Availability:</b> A web-based tool to calculate network motifs is available at <inter-ref locator="http://bioinfo.weizmann.ac.il/protmot/" locator-type="url">http://bioinfo.weizmann.ac.il/protmot/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="gideon.schreiber@weizmann.ac.il" locator-type="email">gideon.schreiber@weizmann.ac.il</inter-ref>; <inter-ref locator="koby.levy@weizmann.ac.il" locator-type="email">koby.levy@weizmann.ac.il</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/541/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Rahat, O., Alon, U., Levy, Y., Schreiber, G.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp541</dc:identifier>
<dc:title><![CDATA[Understanding hydrogen-bond patterns in proteins using network motifs]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2928</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2921</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2929?rss=1">
<title><![CDATA[A boosting approach to structure learning of graphs with and without prior knowledge]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2929?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Identifying the network structure through which genes and their products interact can help to elucidate normal cell physiology as well as the genetic architecture of pathological phenotypes. Recently, a number of gene network inference tools have appeared based on Gaussian graphical model representations. Following this, we introduce a novel Boosting approach to learn the structure of a high-dimensional Gaussian graphical model motivated by the applications in genomics. A particular emphasis is paid to the inclusion of partial prior knowledge on the structure of the graph. With the increasing availability of pathway information and large-scale gene expression datasets, we believe that conditioning on prior knowledge will be an important aspect in raising the statistical power of structural learning algorithms to infer true conditional dependencies.</p>
<p><b>Results:</b> Our Boosting approach, termed BoostiGraph, is conceptually and algorithmically simple. It complements recent work on the network inference problem based on Lasso-type approaches. BoostiGraph is computationally cheap and is applicable to very high-dimensional graphs. For example, on graphs of order 5000 nodes, it is able to map out paths for the conditional independence structure in few minutes. Using computer simulations, we investigate the ability of our method with and without prior information to infer Gaussian graphical models from artificial as well as actual microarray datasets. The experimental results demonstrate that, using our method, it is possible to recover the true network topology with relatively high accuracy.</p>
<p><b>Availability:</b> This method and all other associated files are freely available from <inter-ref locator="http://www.stats.ox.ac.uk/~anjum/" locator-type="url">http://www.stats.ox.ac.uk/~anjum/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="s.anjum@har.mrc.ac.uk" locator-type="email">s.anjum@har.mrc.ac.uk</inter-ref>; <inter-ref locator="cholmes@stats.ox.ac.uk" locator-type="email">cholmes@stats.ox.ac.uk</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/485/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinfomatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Anjum, S., Doucet, A., Holmes, C. C.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp485</dc:identifier>
<dc:title><![CDATA[A boosting approach to structure learning of graphs with and without prior knowledge]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2936</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2929</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2937?rss=1">
<title><![CDATA[Learning gene regulatory networks from gene expression measurements using non-parametric molecular kinetics]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2937?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Regulation of gene expression is fundamental to the operation of a cell. Revealing the structure and dynamics of a gene regulatory network (GRN) is of great interest and represents a considerably challenging computational problem. The GRN estimation problem is complicated by the fact that the number of gene expression measurements is typically extremely small when compared with the dimension of the biological system. Further, because the gene regulation process is intrinsically complex, commonly used parametric models can provide too simple description of the underlying phenomena and, thus, can be unreliable. In this article, we propose a novel methodology for the inference of GRNs from time-series and steady-state gene expression measurements. The presented framework is based on the use of Bayesian analysis with ordinary differential equations (ODEs) and non-parametric Gaussian process modeling for the transcriptional-level regulation.</p>
<p><b>Results:</b> The performance of the proposed structure inference method is evaluated using a recently published <I>in vivo</I> dataset. By comparing the obtained results with those of existing ODE- and Bayesian-based inference methods we demonstrate that the proposed method provides more accurate network structure learning. The predictive capabilities of the method are examined by splitting the dataset into a training set and a test set and by predicting the test set based on the training set.</p>
<p><b>Availability:</b> A MATLAB implementation of the method will be available from <inter-ref locator="http://www.cs.tut.fi/~aijo2/gp" locator-type="url">http://www.cs.tut.fi/~aijo2/gp</inter-ref> upon publication</p>
<p><b>Contact:</b> <inter-ref locator="harri.lahdesmaki@tut.fi" locator-type="email">harri.lahdesmaki@tut.fi</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/511/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Aijo, T., Lahdesmaki, H.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp511</dc:identifier>
<dc:title><![CDATA[Learning gene regulatory networks from gene expression measurements using non-parametric molecular kinetics]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2944</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2937</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2945?rss=1">
<title><![CDATA[Identification of genes involved in the same pathways using a Hidden Markov Model-based approach]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2945?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The sequencing of whole genomes from various species has provided us with a wealth of genetic information. To make use of the vast amounts of data available today it is necessary to devise computer-based analysis techniques.</p>
<p><b>Results:</b> We propose a Hidden Markov Model (HMM) based algorithm to detect groups of genes functionally similar to a set of input genes from microarray expression data. A subset of experiments from a microarray is selected based on a set of related input genes. HMMs are trained from the input genes and a group of random gene input sets to provide significance estimates. Every gene in the microarray is scored using all HMMs and significant matches with the input genes are retained. We ran this algorithm on the life cycle of Drosophila microarray data set with KEGG pathways for cell cycle and translation factors as input data sets. Results show high functional similarity in resulting gene sets, increasing our biological insight into gene pathways and KEGG annotations. The algorithm performed very well compared to the Signature Algorithm and a purely correlation-based approach.</p>
<p><b>Availability:</b> Java source codes and data sets are available at <inter-ref locator="http://www.ittc.ku.edu/~xwchen/software.htm" locator-type="url">http://www.ittc.ku.edu/~xwchen/software.htm</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="xwchen@ittc.ku.edu" locator-type="email">xwchen@ittc.ku.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/521/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Senf, A., Chen, X.-w.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp521</dc:identifier>
<dc:title><![CDATA[Identification of genes involved in the same pathways using a Hidden Markov Model-based approach]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2954</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2945</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2955?rss=1">
<title><![CDATA[Mining gene functional networks to improve mass-spectrometry-based protein identification]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2955?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> High-throughput protein identification experiments based on tandem mass spectrometry (MS/MS) often suffer from low sensitivity and low-confidence protein identifications. In a typical shotgun proteomics experiment, it is assumed that all proteins are equally likely to be present. However, there is often other evidence to suggest that a protein is present and confidence in individual protein identification can be updated accordingly.</p>
<p><b>Results:</b> We develop a method that analyzes MS/MS experiments in the larger context of the biological processes active in a cell. Our method, MSNet, improves protein identification in shotgun proteomics experiments by considering information on functional associations from a gene functional network. MSNet substantially increases the number of proteins identified in the sample at a given error rate. We identify 8&ndash;29% more proteins than the original MS experiment when applied to yeast grown in different experimental conditions analyzed on different MS/MS instruments, and 37% more proteins in a human sample. We validate up to 94% of our identifications in yeast by presence in ground-truth reference sets.</p>
<p><b>Availability and Implementation:</b> Software and datasets are available at <inter-ref locator="http://aug.csres.utexas.edu/msnet" locator-type="url">http://aug.csres.utexas.edu/msnet</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="miranker@cs.utexas.edu" locator-type="email">miranker@cs.utexas.edu</inter-ref>, <inter-ref locator="marcotte@icmb.utexas.edu" locator-type="email">marcotte@icmb.utexas.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/461/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Ramakrishnan, S. R., Vogel, C., Kwon, T., Penalva, L. O., Marcotte, E. M., Miranker, D. P.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp461</dc:identifier>
<dc:title><![CDATA[Mining gene functional networks to improve mass-spectrometry-based protein identification]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2961</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2955</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2962?rss=1">
<title><![CDATA[Simultaneous inference of biological networks of multiple species from genome-wide data and evolutionary information: a semi-supervised approach]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2962?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The existing supervised methods for biological network inference work on each of the networks individually based only on intra-species information such as gene expression data. We believe that it will be more effective to use genomic data and cross-species evolutionary information from different species simultaneously, rather than to use the genomic data alone.</p>
<p><b>Results:</b> We created a new semi-supervised learning method called <I>Link Propagation</I> for inferring biological networks of multiple species based on genome-wide data and evolutionary information. The new method was applied to simultaneous reconstruction of three metabolic networks of <I>Caenorhabditis elegans</I>, <I>Helicobacter pylori</I> and <I>Saccharomyces cerevisiae</I>, based on gene expression similarities and amino acid sequence similarities. The experimental results proved that the new simultaneous network inference method consistently improves the predictive performance over the individual network inferences, and it also outperforms in accuracy and speed other established methods such as the pairwise support vector machine.</p>
<p><b>Availability:</b> The software and data are available at <inter-ref locator="http://cbio.ensmp.fr/~yyamanishi/LinkPropagation/" locator-type="url">http://cbio.ensmp.fr/~yyamanishi/LinkPropagation/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="kashima@mist.i.u-tokyo.ac.jp" locator-type="email">kashima@mist.i.u-tokyo.ac.jp</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/494/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Kashima, H., Yamanishi, Y., Kato, T., Sugiyama, M., Tsuda, K.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp494</dc:identifier>
<dc:title><![CDATA[Simultaneous inference of biological networks of multiple species from genome-wide data and evolutionary information: a semi-supervised approach]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2968</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2962</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2969?rss=1">
<title><![CDATA[Improving peptide identification with single-stage mass spectrum peaks]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2969?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Database searching is the major peptide identification method in shotgun proteomics. It searches tandem mass spectrometry (MS/MS) spectra against a protein database to identify target peptides. The success of such a database searching method relies on a scoring algorithm that can evaluate the quality of peptide-spectrum matches (PSMs) accurately. However, current scoring algorithms frequently generate inaccurate assignments due to variations and noises in the MS/MS spectra. To address this issue, we like to improve peptide identification by using additional information from other data sources.</p>
<p><b>Results:</b> Single-stage MS data is complementary to MS/MS data in the sense that it provides broader mass coverage but less sequence information. In this article, we show that single-stage MS data can be used to re-rank PSMs. The proposed method explores a linear combination of scores between MS and MS/MS data to perform re-ranking. Experimental results on real data show that such a re-ranking strategy improves the identification performance significantly.</p>
<p><b>Availability:</b> <inter-ref locator="http://bioinformatics.ust.hk/ReRankPSMwMS1.rar" locator-type="url">http://bioinformatics.ust.hk/ReRankPSMwMS1.rar</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="eezyhe@ust.hk" locator-type="email">eezyhe@ust.hk</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/501/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[He, Z., Yu, W.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp501</dc:identifier>
<dc:title><![CDATA[Improving peptide identification with single-stage mass spectrum peaks]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2974</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2969</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2975?rss=1">
<title><![CDATA[Metabolite and reaction inference based on enzyme specificities]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2975?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Many enzymes are not absolutely specific, or even promiscuous: they can catalyze transformations of more compounds than the traditional ones as listed in, e.g. KEGG. This information is currently only available in databases, such as the BRENDA enzyme activity database. In this article, we propose to model enzyme aspecificity by predicting whether an input compound is likely to be transformed by a certain enzyme. Such a predictor has many applications, for example, to complete reconstructed metabolic networks, to aid in metabolic engineering or to help identify unknown peaks in mass spectra.</p>
<p><b>Results:</b> We have developed a system for metabolite and reaction inference based on enzyme specificities (<I>MaRIboES</I>). It employs structural and stereochemistry similarity measures and molecular fingerprints to generalize enzymatic reactions based on data available in BRENDA. Leave-one-out cross-validation shows that 80% of known reactions are predicted well. Application to the yeast glycolytic and pentose phosphate pathways predicts a large number of known and new reactions, often leading to the formation of novel compounds, as well as a number of interesting bypasses and cross-links.</p>
<p><b>Availability:</b> M<scp>atlab</scp> and C++ code is freely available at <inter-ref locator="https://gforge.nbic.nl/projects/mariboes/" locator-type="url">https://gforge.nbic.nl/projects/mariboes/</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="d.deridder@tudelft.nl" locator-type="email">d.deridder@tudelft.nl</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/507/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[de Groot, M. J. L., van Berlo, R. J. P., van Winden, W. A., Verheijen, P. J. T., Reinders, M. J. T., de Ridder, D.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp507</dc:identifier>
<dc:title><![CDATA[Metabolite and reaction inference based on enzyme specificities]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2982</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2975</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2983?rss=1">
<title><![CDATA[A dictionary to identify small molecules and drugs in free text]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2983?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> From the scientific community, a lot of effort has been spent on the correct identification of gene and protein names in text, while less effort has been spent on the correct identification of chemical names. Dictionary-based term identification has the power to recognize the diverse representation of chemical information in the literature and map the chemicals to their database identifiers.</p>
<p><b>Results:</b> We developed a dictionary for the identification of small molecules and drugs in text, combining information from UMLS, MeSH, ChEBI, DrugBank, KEGG, HMDB and ChemIDplus. Rule-based term filtering, manual check of highly frequent terms and disambiguation rules were applied. We tested the combined dictionary and the dictionaries derived from the individual resources on an annotated corpus, and conclude the following: (i) each of the different processing steps increase precision with a minor loss of recall; (ii) the overall performance of the combined dictionary is acceptable (precision 0.67, recall 0.40 (0.80 for trivial names); (iii) the combined dictionary performed better than the dictionary in the chemical recognizer OSCAR3; (iv) the performance of a dictionary based on ChemIDplus alone is comparable to the performance of the combined dictionary.</p>
<p><b>Availability:</b> The combined dictionary is freely available as an XML file in Simple Knowledge Organization System format on the web site <inter-ref locator="http://www.biosemantics.org/chemlist" locator-type="url">http://www.biosemantics.org/chemlist</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="k.hettne@erasmusmc.nl" locator-type="email">k.hettne@erasmusmc.nl</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/535/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Hettne, K. M., Stierum, R. H., Schuemie, M. J., Hendriksen, P. J. M., Schijvenaars, B. J. A., Mulligen, E. M. v., Kleinjans, J., Kors, J. A.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp535</dc:identifier>
<dc:title><![CDATA[A dictionary to identify small molecules and drugs in free text]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2991</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2983</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2992?rss=1">
<title><![CDATA[Characterization of 1H NMR spectroscopic data and the generation of synthetic validation sets]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/2992?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Common contemporary practice within the nuclear magnetic resonance (NMR) metabolomics community is to evaluate and validate novel algorithms on empirical data or simplified simulated data. Empirical data captures the complex characteristics of experimental data, but the optimal or most correct analysis is unknown <I>a priori</I>; therefore, researchers are forced to rely on indirect performance metrics, which are of limited value. In order to achieve fair and complete analysis of competing techniques more exacting metrics are required. Thus, metabolomics researchers often evaluate their algorithms on simplified simulated data with a known answer. Unfortunately, the conclusions obtained on simulated data are only of value if the data sets are complex enough for results to generalize to true experimental data. Ideally, synthetic data should be indistinguishable from empirical data, yet retain a known best analysis.</p>
<p><b>Results:</b> We have developed a technique for creating realistic synthetic metabolomics validation sets based on NMR spectroscopic data. The validation sets are developed by characterizing the salient distributions in sets of empirical spectroscopic data. Using this technique, several validation sets are constructed with a variety of characteristics present in &lsquo;real&rsquo; data. A case study is then presented to compare the relative accuracy of several alignment algorithms using the increased precision afforded by these synthetic data sets.</p>
<p><b>Availability:</b> These data sets are available for download at <inter-ref locator="http://birg.cs.wright.edu/nmr_synthetic_data_sets" locator-type="url">http://birg.cs.wright.edu/nmr_synthetic_data_sets</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="travis.doom@wright.edu" locator-type="email">travis.doom@wright.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/540/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Anderson, P. E., Raymer, M. L., Kelly, B. J., Reo, N. V., DelRaso, N. J., Doom, T. E.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp540</dc:identifier>
<dc:title><![CDATA[Characterization of 1H NMR spectroscopic data and the generation of synthetic validation sets]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3000</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>2992</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3001?rss=1">
<title><![CDATA[Flynet: a genomic resource for Drosophila melanogaster transcriptional regulatory networks]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3001?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The highly coordinated expression of thousands of genes in an organism is regulated by the concerted action of transcription factors, chromatin proteins and epigenetic mechanisms. High-throughput experimental data for genome wide <I>in vivo</I> protein&ndash;DNA interactions and epigenetic marks are becoming available from large projects, such as the model organism ENCyclopedia Of DNA Elements (modENCODE) and from individual labs. Dissemination and visualization of these datasets in an explorable form is an important challenge.</p>
<p><b>Results:</b> To support research on <I>Drosophila melanogaster</I> transcription regulation and make the genome wide <I>in vivo</I> protein&ndash;DNA interactions data available to the scientific community as a whole, we have developed a system called Flynet. Currently, Flynet contains 101 datasets for 38 transcription factors and chromatin regulator proteins in different experimental conditions. These factors exhibit different types of binding profiles ranging from sharp localized peaks to broad binding regions. The protein&ndash;DNA interaction data in Flynet was obtained from the analysis of chromatin immunoprecipitation experiments on one color and two color genomic tiling arrays as well as chromatin immunoprecipitation followed by massively parallel sequencing. A web-based interface, integrated with an AJAX based genome browser, has been built for queries and presenting analysis results. Flynet also makes available the <I>cis</I>-regulatory modules reported in literature, known and <I>de novo</I> identified sequence motifs across the genome, and other resources to study gene regulation.</p>
<p><b>Contact:</b> <inter-ref locator="grossman@uic.edu" locator-type="email">grossman@uic.edu</inter-ref></p>
<p><b>Availability:</b> Flynet is available at <inter-ref locator="https://www.cistrack.org/flynet/" locator-type="url">https://www.cistrack.org/flynet/</inter-ref>.</p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/469/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Tian, F., Shah, P. K., Liu, X., Negre, N., Chen, J., Karpenko, O., White, K. P., Grossman, R. L.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp469</dc:identifier>
<dc:title><![CDATA[Flynet: a genomic resource for Drosophila melanogaster transcriptional regulatory networks]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3004</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3001</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3005?rss=1">
<title><![CDATA[Mobyle: a new full web bioinformatics framework]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3005?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> For the biologist, running bioinformatics analyses involves a time-consuming management of data and tools. Users need support to organize their work, retrieve parameters and reproduce their analyses. They also need to be able to combine their analytic tools using a safe data flow software mechanism. Finally, given that scientific tools can be difficult to install, it is particularly helpful for biologists to be able to use these tools through a web user interface. However, providing a web interface for a set of tools raises the problem that a single web portal cannot offer all the existing and possible services: it is the user, again, who has to cope with data copy among a number of different services. A framework enabling portal administrators to build a network of cooperating services would therefore clearly be beneficial.</p>
<p><b>Results:</b> We have designed a system, Mobyle, to provide a flexible and usable Web environment for defining and running bioinformatics analyses. It embeds simple yet powerful data management features that allow the user to reproduce analyses and to combine tools using a hierarchical typing system. Mobyle offers invocation of services distributed over remote Mobyle servers, thus enabling a federated network of curated bioinformatics portals without the user having to learn complex concepts or to install sophisticated software. While being focused on the end user, the Mobyle system also addresses the need, for the bioinfomatician, to automate remote services execution: PlayMOBY is a companion tool that automates the publication of BioMOBY web services, using Mobyle program definitions.</p>
<p><b>Availability:</b> The Mobyle system is distributed under the terms of the GNU GPLv2 on the project web site (<inter-ref locator="http://bioweb2.pasteur.fr/projects/mobyle/" locator-type="url">http://bioweb2.pasteur.fr/projects/mobyle/</inter-ref>). It is already deployed on three servers: <inter-ref locator="http://mobyle.pasteur.fr" locator-type="url">http://mobyle.pasteur.fr</inter-ref>, <inter-ref locator="http://mobyle.rpbs.univ-paris-diderot.fr" locator-type="url">http://mobyle.rpbs.univ-paris-diderot.fr</inter-ref> and <inter-ref locator="http://lipm-bioinfo.toulouse.inra.fr/Mobyle" locator-type="url">http://lipm-bioinfo.toulouse.inra.fr/Mobyle</inter-ref>. The PlayMOBY companion is distributed under the terms of the CeCILL license, and is available at <inter-ref locator="http://lipm-bioinfo.toulouse.inra.fr/biomoby/PlayMOBY/" locator-type="url">http://lipm-bioinfo.toulouse.inra.fr/biomoby/PlayMOBY/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="mobyle-support@pasteur.fr" locator-type="email">mobyle-support@pasteur.fr</inter-ref>; <inter-ref locator="mobyle-support@rpbs.univ-paris-diderot.fr" locator-type="email">mobyle-support@rpbs.univ-paris-diderot.fr</inter-ref>; <inter-ref locator="letondal@pasteur.fr" locator-type="email">letondal@pasteur.fr</inter-ref></p>
<p><b>Supplementary information:</b><inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/493/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Neron, B., Menager, H., Maufrais, C., Joly, N., Maupetit, J., Letort, S., Carrere, S., Tuffery, P., Letondal, C.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp493</dc:identifier>
<dc:title><![CDATA[Mobyle: a new full web bioinformatics framework]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3011</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3005</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3012?rss=1">
<title><![CDATA[A method for visualizing CellML models]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3012?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The Physiome Project was established in 1997 to develop tools to facilitate international collaboration in the physiological sciences and the sharing of biological models and experimental data. The CellML language was developed to represent and exchange mathematical models of biological processes. CellML models can be very complicated, making it difficult to interpret the underlying physical and biological concepts and relationships captured/described in the mathematical model.</p>
<p><b>Results:</b> To address this issue a set of ontologies was developed to explicitly annotate the biophysical concepts represented in the CellML models. This article presents a framework that combines a visual language, together with CellML ontologies, to support the visualization of the underlying physical and biological concepts described by the mathematical model and also their relationships with the CellML model. Automated CellML model visualization assists in the interpretation of model concepts and facilitates model communication and exchange between different communities.</p>
<p><b>Contact:</b> <inter-ref locator="sarala.dissanayake@auckland.ac.nz" locator-type="email">sarala.dissanayake@auckland.ac.nz</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/495/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Wimalaratne, S. M., Halstead, M. D. B., Lloyd, C. M., Cooling, M. T., Crampin, E. J., Nielsen, P. F.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp495</dc:identifier>
<dc:title><![CDATA[A method for visualizing CellML models]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3019</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3012</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3020?rss=1">
<title><![CDATA[Comparative analysis and unification of domain-domain interaction networks]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3020?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Certain protein domains are known to preferentially interact with other domains. Several approaches have been proposed to predict domain&ndash;domain interactions, and over nine datasets are available. Our aim is to analyse the coverage and quality of the existing resources, as well as the extent of their overlap. With this knowledge, we have the opportunity to merge individual domain interaction networks to construct a comprehensive and reliable database.</p>
<p><b>Results:</b> In this article we introduce a new approach towards comparing domain&ndash;domain interaction networks. This approach is used to compare nine predicted domain and protein interaction networks. The networks were used to generate a database of unified domain interactions, UniDomInt. Each interaction in the dataset is scored according to the benchmarked reliability of the sources. The performance of UniDomInt is an improvement compared to the underlying source networks and to another composite resource, <I>Domine</I>.</p>
<p><b>Availability:</b> <inter-ref locator="http://sonnhammer.sbc.su.se/download/UniDomInt/" locator-type="url">http://sonnhammer.sbc.su.se/download/UniDomInt/</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="Erik.Sonnhammer@sbc.su.se" locator-type="email">Erik.Sonnhammer@sbc.su.se</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Bjorkholm, P., Sonnhammer, E. L. L.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp522</dc:identifier>
<dc:title><![CDATA[Comparative analysis and unification of domain-domain interaction networks]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3025</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3020</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3026?rss=1">
<title><![CDATA[Saint: a lightweight integration environment for model annotation]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3026?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> Saint is a web application which provides a lightweight annotation integration environment for quantitative biological models. The system enables modellers to rapidly mark up models with biological information derived from a range of data sources.</p>
<p><b>Availability and Implementation:</b> Saint is freely available for use on the web at <inter-ref locator="http://www.cisban.ac.uk/saint" locator-type="url">http://www.cisban.ac.uk/saint</inter-ref>. The web application is implemented in Google Web Toolkit and Tomcat, with all major browsers supported. The Java source code is freely available for download at <inter-ref locator="http://saint-annotate.sourceforge.net" locator-type="url">http://saint-annotate.sourceforge.net</inter-ref>. The Saint web server requires an installation of libSBML and has been tested on Linux (32-bit Ubuntu 8.10 and 9.04).</p>
<p><b>Contact:</b> <inter-ref locator="helpdesk@cisban.ac.uk" locator-type="email">helpdesk@cisban.ac.uk</inter-ref>; <inter-ref locator="a.l.lister@ncl.ac.uk" locator-type="email">a.l.lister@ncl.ac.uk</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/523/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Lister, A. L., Pocock, M., Taschuk, M., Wipat, A.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp523</dc:identifier>
<dc:title><![CDATA[Saint: a lightweight integration environment for model annotation]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3027</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3026</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3028?rss=1">
<title><![CDATA[CellClassifier: supervised learning of cellular phenotypes]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3028?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b>CellClassifier is a tool for classifying single-cell phenotypes in microscope images. It includes several unique and user-friendly features for classification using multiclass support vector machines</p>
<p><b>Availability:</b> Source code, user manual and SaveObjectSegmentation CellProfiler module available for download at <inter-ref locator="www.cellclassifier.ethz.ch" locator-type="url">www.cellclassifier.ethz.ch</inter-ref> under the GPL license (implemented in Matlab).</p>
<p><b>Contact:</b> <inter-ref locator="pelkmans@imsb.biol.ethz.ch" locator-type="email">pelkmans@imsb.biol.ethz.ch</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/524/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Ramo, P., Sacher, R., Snijder, B., Begemann, B., Pelkmans, L.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp524</dc:identifier>
<dc:title><![CDATA[CellClassifier: supervised learning of cellular phenotypes]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3030</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3028</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3031?rss=1">
<title><![CDATA[PubMed-EX: a web browser extension to enhance PubMed search with text mining features]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3031?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> PubMed-EX is a browser extension that marks up PubMed search results with additional text-mining information. PubMed-EX's page mark-up, which includes section categorization and gene/disease and relation mark-up, can help researchers to quickly focus on key terms and provide additional information on them. All text processing is performed server-side, freeing up user resources.</p>
<p><b>Availability:</b> PubMed-EX is freely available at <inter-ref locator="http://bws.iis.sinica.edu.tw/PubMed-EX" locator-type="url">http://bws.iis.sinica.edu.tw/PubMed-EX</inter-ref> and <inter-ref locator="http://iisr.cse.yzu.edu.tw:8000/PubMed-EX/" locator-type="url">http://iisr.cse.yzu.edu.tw:8000/PubMed-EX/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="thtsai@saturn.yzu.edu.tw" locator-type="email">thtsai@saturn.yzu.edu.tw</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/475/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Tsai, R. T.-H., Dai, H.-J., Lai, P.-T., Huang, C.-H.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp475</dc:identifier>
<dc:title><![CDATA[PubMed-EX: a web browser extension to enhance PubMed search with text mining features]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3032</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3031</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3033?rss=1">
<title><![CDATA[digeR: a graphical user interface R package for analyzing 2D-DIGE data]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3033?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> 2D Difference In-Gel Electrophoresis (2D-DIGE) or 2D gel technology is being used as a routine proteomics technique for biomarker discovery. Analyzing such high-dimensional data requires multivariate analysis techniques to be applied. In addition, protein post-translational modification (PTM) information from the 2D gel data is usually overlooked. We report on an R package, digeR, with an easy to use graphical user interface for analyzing 2D-DIGE (2D gel) data. It provides a tool for visually looking for potential PTM changes from different biological states and support biomarker discovery through multivariate analysis techniques.</p>
<p><b>Availability:</b> digeR package is freely available from the CRAN: <inter-ref locator="http://cran.r-project.org/web/packages/digeR/index.html" locator-type="url">http://cran.r-project.org/web/packages/digeR/index.html</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="yue.fan@ucd.ie" locator-type="email">yue.fan@ucd.ie</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/514/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Fan, Y., Murphy, T. B., Watson, R. W. G.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp514</dc:identifier>
<dc:title><![CDATA[digeR: a graphical user interface R package for analyzing 2D-DIGE data]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3034</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3033</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3035?rss=1">
<title><![CDATA[UniMaP: finding unique mass and peptide signatures in the human proteome]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3035?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> The uniqueness of a measured molecular mass or peptide sequence plays a very important role in the fields of protein identification and peptide/protein-biomarker investigation. We present a publicly available web application that offers information concerning the uniqueness of one or more molecular masses and one or more peptide sequences in the human proteome. When a sequence is found to be unique in humans, the application is able to search across all species querying whether this sequence is unique, not only in humans but also in other species found in the Swiss-Prot Database. The application is also able to search for unique protein fragments derived computationally from enzymatic digestion driven by certain enzymes. Furthermore, the application can list all the unique masses and peptides of a given protein. Through this application, researchers are able to find unique tags, either on a molecular mass level or on a sequence level. These unique tags are remarkably important in research related to protein identification or biomarker discovery and measurements.</p>
<p><b>Availability:</b> UniMaP web-application is available at <inter-ref locator="http://bioserver-1.bioacademy.gr/Bioserver/UniMaP/" locator-type="url">http://bioserver-1.bioacademy.gr/Bioserver/UniMaP/</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="gspyrou@bioacademy.gr" locator-type="email">gspyrou@bioacademy.gr</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/516/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Alexandridou, A., Tsangaris, G. Th., Vougas, K., Nikita, K., Spyrou, G.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp516</dc:identifier>
<dc:title><![CDATA[UniMaP: finding unique mass and peptide signatures in the human proteome]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3037</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3035</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3038?rss=1">
<title><![CDATA[Identifying related journals through log analysis]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3038?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> With the explosion of biomedical literature and the evolution of online and open access, scientists are reading more articles from a wider variety of journals. Thus, the list of core journals relevant to their research may be less obvious and may often change over time. To help researchers quickly identify appropriate journals to read and publish in, we developed a web application for finding related journals based on the analysis of PubMed log data.</p>
<p><b>Availability:</b> <inter-ref locator="http://www.ncbi.nlm.nih.gov/IRET/Journals" locator-type="url">http://www.ncbi.nlm.nih.gov/IRET/Journals</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="luzh@ncbi.nlm.nih.gov" locator-type="email">luzh@ncbi.nlm.nih.gov</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/529/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Lu, Z., Xie, N., Wilbur, W. J.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp529</dc:identifier>
<dc:title><![CDATA[Identifying related journals through log analysis]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3039</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3038</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3040?rss=1">
<title><![CDATA[CMap 1.01: a comparative mapping application for the Internet]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3040?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b>CMap is a web-based tool for displaying and comparing maps of any type and from any species. A user can compare an unlimited number of maps, view pair-wise comparisons of known correspondences, and search for maps or for features by name, species, type and accession. CMap is freely available, can run on a variety of database engines and uses only free and open software components.</p>
<p><b>Availability:</b> <inter-ref locator="http://www.gmod.org/cmap" locator-type="url">http://www.gmod.org/cmap</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="kclark@cshl.edu" locator-type="email">kclark@cshl.edu</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Youens-Clark, K., Faga, B., Yap, I. V., Stein, L., Ware, D.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:49 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp458</dc:identifier>
<dc:title><![CDATA[CMap 1.01: a comparative mapping application for the Internet]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3042</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3040</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3043?rss=1">
<title><![CDATA[Next generation software for functional trend analysis]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3043?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> FuncAssociate is a web application that discovers properties enriched in lists of genes or proteins that emerge from large-scale experimentation. Here we describe an updated application with a new interface and several new features. For example, enrichment analysis can now be performed within multiple gene- and protein-naming systems. This feature avoids potentially serious translation artifacts to which other enrichment analysis strategies are subject.</p>
<p><b>Availability:</b> The FuncAssociate web application is freely available to all users at <inter-ref locator="http://llama.med.harvard.edu/funcassociate" locator-type="url">http://llama.med.harvard.edu/funcassociate</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="fritz_roth@hms.harvard.edu" locator-type="email">fritz_roth@hms.harvard.edu</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Berriz, G. F., Beaver, J. E., Cenik, C., Tasan, M., Roth, F. P.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:50 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp498</dc:identifier>
<dc:title><![CDATA[Next generation software for functional trend analysis]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3044</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3043</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3045?rss=1">
<title><![CDATA[QuickGO: a web-based tool for Gene Ontology searching]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3045?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> QuickGO is a web-based tool that allows easy browsing of the Gene Ontology (GO) and all associated electronic and manual GO annotations provided by the GO Consortium annotation groups QuickGO has been a popular GO browser for many years, but after a recent redevelopment it is now able to offer a greater range of facilities including bulk downloads of GO annotation data which can be extensively filtered by a range of different parameters and GO slim set generation.</p>
<p><b>Availability and Implementation:</b> QuickGO has implemented in JavaScript, Ajax and HTML, with all major browsers supported. It can be queried online at <inter-ref locator="http://www.ebi.ac.uk/QuickGO" locator-type="url">http://www.ebi.ac.uk/QuickGO</inter-ref>. The software for QuickGO is freely available under the Apache 2 licence and can be downloaded from <inter-ref locator="http://www.ebi.ac.uk/QuickGO/installation.html" locator-type="url">http://www.ebi.ac.uk/QuickGO/installation.html</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="goa@ebi.ac.uk" locator-type="email">goa@ebi.ac.uk</inter-ref>; <inter-ref locator="dbinns@ebi.ac.uk" locator-type="email">dbinns@ebi.ac.uk</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Binns, D., Dimmer, E., Huntley, R., Barrell, D., O'Donovan, C., Apweiler, R.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:50 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp536</dc:identifier>
<dc:title><![CDATA[QuickGO: a web-based tool for Gene Ontology searching]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3046</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3045</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3047?rss=1">
<title><![CDATA[Rapid detection, classification and accurate alignment of up to a million or more related protein sequences]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/22/3047?rss=1</link>
<description><![CDATA[]]></description>
<dc:creator><![CDATA[Neuwald, A. F.]]></dc:creator>
<dc:date>Wed, 04 Nov 2009 05:45:50 PST</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp573</dc:identifier>
<dc:title><![CDATA[Rapid detection, classification and accurate alignment of up to a million or more related protein sequences]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>22</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>3047</prism:endingPage>
<prism:publicationDate>2009-11-15</prism:publicationDate>
<prism:startingPage>3047</prism:startingPage>
<prism:section>CORRIGENDUM</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2735?rss=1">
<title><![CDATA[Efficiently finding genome-wide three-way gene interactions from transcript- and genotype-data]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2735?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> We address the issue of finding a three-way gene interaction, i.e. two interacting genes in expression under the genotypes of another gene, given a dataset in which expressions and genotypes are measured at once for each individual. This issue can be a general, switching mechanism in expression of two genes, being controlled by categories of another gene, and finding this type of interaction can be a key to elucidating complex biological systems. The most suitable method for this issue is likelihood ratio test using logistic regressions, which we call <I>interaction test</I>, but a serious problem of this test is computational intractability at a genome-wide level.</p>
<p><b>Results:</b> We developed a fast method for this issue which improves the speed of interaction test by around 10 times for any size of datasets, keeping highly interacting genes with an accuracy of ~85%. We applied our method to ~3 <FONT FACE="arial,helvetica">x</FONT> 10<sup>8</sup> three-way combinations generated from a dataset on human brain samples and detected three-way gene interactions with small <I>P</I>-values. To check the reliability of our results, we first conducted permutations by which we can show that the obtained <I>P</I>-values are significantly smaller than those obtained from permuted null examples. We then used GEO (Gene Expression Omnibus) to generate gene expression datasets with binary classes to confirm the detected three-way interactions by using these datasets and interaction tests. The result showed us some datasets with significantly small <I>P</I>-values, strongly supporting the reliability of the detected three-way interactions.</p>
<p><b>Availability:</b> Software is available from <inter-ref locator="http://www.bic.kyoto-u.ac.jp/pathway/kayano/bioinfo_three-way.html" locator-type="url">http://www.bic.kyoto-u.ac.jp/pathway/kayano/bioinfo_three-way.html</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="kayano@kuicr.kyoto-u.ac.jp" locator-type="email">kayano@kuicr.kyoto-u.ac.jp</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp531/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Kayano, M., Takigawa, I., Shiga, M., Tsuda, K., Mamitsuka, H.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:19 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp531</dc:identifier>
<dc:title><![CDATA[Efficiently finding genome-wide three-way gene interactions from transcript- and genotype-data]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2743</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2735</prism:startingPage>
<prism:section>GENOME ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2744?rss=1">
<title><![CDATA[Automated inference of molecular mechanisms of disease from amino acid substitutions]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2744?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Advances in high-throughput genotyping and next generation sequencing have generated a vast amount of human genetic variation data. Single nucleotide substitutions within protein coding regions are of particular importance owing to their potential to give rise to amino acid substitutions that affect protein structure and function which may ultimately lead to a disease state. Over the last decade, a number of computational methods have been developed to predict whether such amino acid substitutions result in an altered phenotype. Although these methods are useful in practice, and accurate for their intended purpose, they are not well suited for providing probabilistic estimates of the underlying disease mechanism.</p>
<p><b>Results:</b> We have developed a new computational model, MutPred, that is based upon protein sequence, and which models changes of structural features and functional sites between wild-type and mutant sequences. These changes, expressed as probabilities of gain or loss of structure and function, can provide insight into the specific molecular mechanism responsible for the disease state. MutPred also builds on the established SIFT method but offers improved classification accuracy with respect to human disease mutations. Given conservative thresholds on the predicted disruption of molecular function, we propose that MutPred can generate accurate and reliable hypotheses on the molecular basis of disease for ~11% of known inherited disease-causing mutations. We also note that the proportion of changes of functionally relevant residues in the sets of cancer-associated somatic mutations is higher than for the inherited lesions in the Human Gene Mutation Database which are instead predicted to be characterized by disruptions of protein structure.</p>
<p><b>Availability:</b> <inter-ref locator="http://mutdb.org/mutpred" locator-type="url">http://mutdb.org/mutpred</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="predrag@indiana.edu" locator-type="email">predrag@indiana.edu</inter-ref>; <inter-ref locator="smooney@buckinstitute.org" locator-type="email">smooney@buckinstitute.org</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Li, B., Krishnan, V. G., Mort, M. E., Xin, F., Kamati, K. K., Cooper, D. N., Mooney, S. D., Radivojac, P.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp528</dc:identifier>
<dc:title><![CDATA[Automated inference of molecular mechanisms of disease from amino acid substitutions]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2750</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2744</prism:startingPage>
<prism:section>SEQUENCE ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2751?rss=1">
<title><![CDATA[Algorithms for optimal protein structure alignment]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2751?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Structural alignment is an important tool for understanding the evolutionary relationships between proteins. However, finding the best pairwise structural alignment is difficult, due to the infinite number of possible superpositions of two structures. Unlike the sequence alignment problem, which has a polynomial time solution, the structural alignment problem has not been even classified as solvable.</p>
<p><b>Results:</b> We study one of the most widely used measures of protein structural similarity, defined as the number of pairs of residues in two proteins that can be superimposed under a predefined distance cutoff. We prove that, for any two proteins, this measure can be optimized for all but finitely many distance cutoffs. Our method leads to a series of algorithms for optimizing other structure similarity measures, including the measures commonly used in protein structure prediction experiments. We also present a polynomial time algorithm for finding a near-optimal superposition of two proteins. Aside from having a relatively low cost, the algorithm for near-optimal solution returns a superposition of provable quality. In other words, the difference between the score of the returned superposition and the score of an optimal superposition can be explicitly computed and used to determine whether the returned superposition is, in fact, the best superposition.</p>
<p><b>Contact:</b> <inter-ref locator="poleksic@cs.uni.edu" locator-type="email">poleksic@cs.uni.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp530/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Poleksic, A.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp530</dc:identifier>
<dc:title><![CDATA[Algorithms for optimal protein structure alignment]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2756</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2751</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2757?rss=1">
<title><![CDATA[CCHMM_PROF: a HMM-based coiled-coil predictor with evolutionary information]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2757?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b>The widespread coiled-coil structural motif in proteins is known to mediate a variety of biological interactions. Recognizing a coiled-coil containing sequence and locating its coiled-coil domains are key steps towards the determination of the protein structure and function. Different tools are available for predicting coiled-coil domains in protein sequences, including those based on position-specific score matrices and machine learning methods.</p>
<p><b>Results:</b> In this article, we introduce a hidden Markov model (CCHMM_PROF) that exploits the information contained in multiple sequence alignments (profiles) to predict coiled-coil regions. The new method discriminates coiled-coil sequences with an accuracy of 97% and achieves a true positive rate of 79% with only 1% of false positives. Furthermore, when predicting the location of coiled-coil segments in protein sequences, the method reaches an accuracy of 80% at the residue level and a best per-segment and per-protein efficiency of 81% and 80%, respectively. The results indicate that CCHMM_PROF outperforms all the existing tools and can be adopted for large-scale genome annotation.</p>
<p><b>Availability:</b> The dataset is available at <inter-ref locator="http://www.biocomp.unibo.it/~lisa/coiled-coils" locator-type="url">http://www.biocomp.unibo.it/~lisa/coiled-coils</inter-ref>. The predictor is freely available at <inter-ref locator="http://gpcr.biocomp.unibo.it/cgi/predictors/cchmmprof/pred_cchmmprof.cgi" locator-type="url">http://gpcr.biocomp.unibo.it/cgi/predictors/cchmmprof/pred_cchmmprof.cgi</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="piero@biocomp.unibo.it" locator-type="email">piero@biocomp.unibo.it</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Bartoli, L., Fariselli, P., Krogh, A., Casadio, R.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp539</dc:identifier>
<dc:title><![CDATA[CCHMM_PROF: a HMM-based coiled-coil predictor with evolutionary information]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2763</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2757</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2764?rss=1">
<title><![CDATA[Correlating multiple SNPs and multiple disease phenotypes: penalized non-linear canonical correlation analysis]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2764?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Canonical correlation analysis (CCA) can be used to capture the underlying genetic background of a complex disease, by associating two datasets containing information about a patient's phenotypical and genetic details. Often the genetic information is measured on a qualitative scale, consequently ordinary CCA cannot be applied to such data. Moreover, the size of the data in genetic studies can be enormous, thereby making the results difficult to interpret.</p>
<p><b>Results:</b> We developed a penalized non-linear CCA approach that can deal with qualitative data by transforming each qualitative variable into a continuous variable through optimal scaling. Additionally, sparse results were obtained by adapting soft-thresholding to this non-linear version of the CCA. By means of simulation studies, we show that our method is capable of extracting relevant variables out of high-dimensional sets. We applied our method to a genetic dataset containing 144 patients with glial cancer.</p>
<p><b>Contact:</b> <inter-ref locator="s.waaijenborg@amc.uva.nl" locator-type="email">s.waaijenborg@amc.uva.nl</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Waaijenborg, S., Zwinderman, A. H.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp491</dc:identifier>
<dc:title><![CDATA[Correlating multiple SNPs and multiple disease phenotypes: penalized non-linear canonical correlation analysis]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2771</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2764</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2772?rss=1">
<title><![CDATA[The effects of probe binding affinity differences on gene expression measurements and how to deal with them]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2772?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> When comparing gene expression levels between species or strains using microarrays, sequence differences between the groups can cause false identification of expression differences. Our simulated dataset shows that a sequence divergence of only 1% between species can lead to falsely reported expression differences for &gt;50% of the transcripts&mdash;similar levels of effect have been reported previously in comparisons of human and chimpanzee expression. We propose a method for identifying probes that cause such false readings, using only the microarray data, so that problematic probes can be excluded from analysis. We then test the power of the method to detect sequence differences and to correct for falsely reported expression differences. Our method can detect 70% of the probes with sequence differences using human and chimpanzee data, while removing only 18% of probes with no sequence differences. Although only 70% of the probes with sequence differences are detected, the effect of removing probes on falsely reported expression differences is more dramatic: the method can remove 98% of the falsely reported expression differences from a simulated dataset. We argue that the method should be used even when sequence data are available.</p>
<p><b>Contact:</b> <inter-ref locator="lachmann@eva.mpg.de" locator-type="email">lachmann@eva.mpg.de</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp492/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Dannemann, M., Lorenc, A., Hellmann, I., Khaitovich, P., Lachmann, M.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp492</dc:identifier>
<dc:title><![CDATA[The effects of probe binding affinity differences on gene expression measurements and how to deal with them]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2779</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2772</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2780?rss=1">
<title><![CDATA[Statistical methods for gene set co-expression analysis]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2780?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The power of a microarray experiment derives from the identification of genes differentially regulated across biological conditions. To date, differential regulation is most often taken to mean differential expression, and a number of useful methods for identifying differentially expressed (DE) genes or gene sets are available. However, such methods are not able to identify many relevant classes of differentially regulated genes. One important example concerns differentially co-expressed (DC) genes.</p>
<p><b>Results:</b> We propose an approach, gene set co-expression analysis (GSCA), to identify DC gene sets. The GSCA approach provides a false discovery rate controlled list of interesting gene sets, does not require that genes be highly correlated in at least one biological condition and is readily applied to data from individual or multiple experiments, as we demonstrate using data from studies of lung cancer and diabetes.</p>
<p><b>Availability:</b> The GSCA approach is implemented in R and available at <inter-ref locator="www.biostat.wisc.edu/~kendzior/GSCA/" locator-type="url">www.biostat.wisc.edu/~kendzior/GSCA/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="kendzior@biostat.wisc.edu" locator-type="email">kendzior@biostat.wisc.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp502/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Choi, Y., Kendziorski, C.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp502</dc:identifier>
<dc:title><![CDATA[Statistical methods for gene set co-expression analysis]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2786</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2780</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2787?rss=1">
<title><![CDATA[A novel algorithm for detecting differentially regulated paths based on gene set enrichment analysis]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2787?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Deregulated signaling cascades are known to play a crucial role in many pathogenic processes, among them are tumor initiation and progression. In the recent past, modern experimental techniques that allow for measuring the amount of mRNA transcripts of almost all known human genes in a tissue or even in a single cell have opened new avenues for studying the activity of the signaling cascades and for understanding the information flow in the networks.</p>
<p><b>Results:</b> We present a novel dynamic programming algorithm for detecting deregulated signaling cascades. The so-called FiDePa (Finding Deregulated Paths) algorithm interprets differences in the expression profiles of tumor and normal tissues. It relies on the well-known gene set enrichment analysis (GSEA) and efficiently detects all paths in a given regulatory or signaling network that are significantly enriched with differentially expressed genes or proteins. Since our algorithm allows for comparing a single tumor expression profile with the control group, it facilitates the detection of specific regulatory features of a tumor that may help to optimize tumor therapy. To demonstrate the capabilities of our algorithm, we analyzed a glioma expression dataset with respect to a directed graph that combined the regulatory networks of the KEGG and TRANSPATH database. The resulting glioma consensus network that encompasses all detected deregulated paths contained many genes and pathways that are known to be key players in glioma or cancer-related pathogenic processes. Moreover, we were able to correlate clinically relevant features like necrosis or metastasis with the detected paths.</p>
<p><b>Availability:</b> C++ source code is freely available, BiNA can be downloaded from <inter-ref locator="http://www.bnplusplus.org/" locator-type="url">http://www.bnplusplus.org/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="ack@bioinf.uni-sb.de" locator-type="email">ack@bioinf.uni-sb.de</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp510/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Keller, A., Backes, C., Gerasch, A., Kaufmann, M., Kohlbacher, O., Meese, E., Lenhof, H.-P.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp510</dc:identifier>
<dc:title><![CDATA[A novel algorithm for detecting differentially regulated paths based on gene set enrichment analysis]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2794</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2787</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2795?rss=1">
<title><![CDATA[Bi-correlation clustering algorithm for determining a set of co-regulated genes]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2795?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Biclustering has been emerged as a powerful tool for identification of a group of co-expressed genes under a subset of experimental conditions (measurements) present in a gene expression dataset. Several biclustering algorithms have been proposed till date. In this article, we address some of the important shortcomings of these existing biclustering algorithms and propose a new correlation-based biclustering algorithm called bi-correlation clustering algorithm (BCCA).</p>
<p><b>Results:</b> BCCA has been able to produce a diverse set of biclusters of co-regulated genes over a subset of samples where all the genes in a bicluster have a similar change of expression pattern over the subset of samples. Moreover, the genes in a bicluster have common transcription factor binding sites in the corresponding promoter sequences. The presence of common transcription factors binding sites, in the corresponding promoter sequences, is an evidence that a group of genes in a bicluster are co-regulated. Biclusters determined by BCCA also show highly enriched functional categories. Using different gene expression datasets, we demonstrate strength and superiority of BCCA over some existing biclustering algorithms.</p>
<p><b>Availability:</b> The software for BCCA has been developed using C and Visual Basic languages, and can be executed on the Microsoft Windows platforms. The software may be downloaded as a zip file from <inter-ref locator="http://www.isical.ac.in/~rajat" locator-type="url">http://www.isical.ac.in/~rajat</inter-ref>. Then it needs to be installed. Two word files (included in the zip file) need to be consulted before installation and execution of the software.</p>
<p><b>Contact:</b> <inter-ref locator="rajat@isical.ac.in" locator-type="email">rajat@isical.ac.in</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp526/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Bhattacharya, A., De, R. K.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp526</dc:identifier>
<dc:title><![CDATA[Bi-correlation clustering algorithm for determining a set of co-regulated genes]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2801</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2795</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2802?rss=1">
<title><![CDATA[Multiple testing in genome-wide association studies via hidden Markov models]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2802?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Genome-wide association studies (GWAS) interrogate common genetic variation across the entire human genome in an unbiased manner and hold promise in identifying genetic variants with moderate or weak effect sizes. However, conventional testing procedures, which are mostly <I>P</I>-value based, ignore the dependency and therefore suffer from loss of efficiency. The goal of this article is to exploit the dependency information among adjacent single nucleotide polymorphisms (SNPs) to improve the screening efficiency in GWAS.</p>
<p><b>Results:</b> We propose to model the linear block dependency in the SNP data using hidden Markov models (HMMs). A compound decision&ndash;theoretic framework for testing HMM-dependent hypotheses is developed. We propose a powerful data-driven procedure [pooled local index of significance (PLIS)] that controls the false discovery rate (FDR) at the nominal level. PLIS is shown to be optimal in the sense that it has the smallest false negative rate (FNR) among all valid FDR procedures. By re-ranking significance for all SNPs with dependency considered, PLIS gains higher power than conventional <I>P</I>-value based methods. Simulation results demonstrate that PLIS dominates conventional FDR procedures in detecting disease-associated SNPs. Our method is applied to analysis of the SNP data from a GWAS of type 1 diabetes. Compared with the Benjamini&ndash;Hochberg (BH) procedure, PLIS yields more accurate results and has better reproducibility of findings.</p>
<p><b>Conclusion:</b> The genomic rankings based on our procedure are substantially different from the rankings based on the <I>P</I>-values. By integrating information from adjacent locations, the PLIS rankings benefit from the increased signal-to-noise ratio, hence our procedure often has higher statistical power and better reproducibility. It provides a promising direction in large-scale GWAS.</p>
<p><b>Availability:</b> An R package PLIS has been developed to implement the PLIS procedure. Source codes are available upon request and will be available on CRAN (<inter-ref locator="http://cran.r-project.org/" locator-type="url">http://cran.r-project.org/</inter-ref>).</p>
<p><b>Contact:</b> <inter-ref locator="zhiwei@njit.edu" locator-type="email">zhiwei@njit.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp476/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Wei, Z., Sun, W., Wang, K., Hakonarson, H.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp476</dc:identifier>
<dc:title><![CDATA[Multiple testing in genome-wide association studies via hidden Markov models]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2808</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2802</prism:startingPage>
<prism:section>GENETICS AND POPULATION ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2809?rss=1">
<title><![CDATA[Quantifying cancer progression with conjunctive Bayesian networks]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2809?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Cancer is an evolutionary process characterized by accumulating mutations. However, the precise timing and the order of genetic alterations that drive tumor progression remain enigmatic.</p>
<p><b>Results:</b> We present a specific probabilistic graphical model for the accumulation of mutations and their interdependencies. The Bayesian network models cancer progression by an explicit unobservable accumulation process in time that is separated from the observable but error-prone detection of mutations. Model parameters are estimated by an Expectation-Maximization algorithm and the underlying interaction graph is obtained by a simulated annealing procedure. Applying this method to cytogenetic data for different cancer types, we find multiple complex oncogenetic pathways deviating substantially from simplified models, such as linear pathways or trees. We further demonstrate how the inferred progression dynamics can be used to improve genetics-based survival predictions which could support diagnostics and prognosis.</p>
<p><b>Availability:</b> The software package ct-cbn is available under a GPL license on the web site <inter-ref locator="cbg.ethz.ch/software/ct-cbn" locator-type="url">cbg.ethz.ch/software/ct-cbn</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="moritz.gerstung@bsse.ethz.ch" locator-type="email">moritz.gerstung@bsse.ethz.ch</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Gerstung, M., Baudis, M., Moch, H., Beerenwinkel, N.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp505</dc:identifier>
<dc:title><![CDATA[Quantifying cancer progression with conjunctive Bayesian networks]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2815</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2809</prism:startingPage>
<prism:section>GENETICS AND POPULATION ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2816?rss=1">
<title><![CDATA[Accessible methods for the dynamic time-scale decomposition of biochemical systems]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2816?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The growing complexity of biochemical models asks for means to rationally dissect the networks into meaningful and rather independent subnetworks. Such foregoing should ensure an understanding of the system without any heuristics employed. Important for the success of such an approach is its accessibility and the clarity of the presentation of the results.</p>
<p><b>Results:</b> In order to achieve this goal, we developed a method which is a modification of the classical approach of time-scale separation. This modified method as well as the more classical approach have been implemented for time-dependent application within the widely used software COPASI. The implementation includes different possibilities for the representation of the results including 3D-visualization.</p>
<p><b>Availability:</b> The methods are included in COPASI which is free for academic use and available at <inter-ref locator="www.copasi.org" locator-type="url">www.copasi.org</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="irina.surovtsova@bioquant.uni-heidelberg.de" locator-type="email">irina.surovtsova@bioquant.uni-heidelberg.de</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp451/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Surovtsova, I., Simus, N., Lorenz, T., Konig, A., Sahle, S., Kummer, U.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp451</dc:identifier>
<dc:title><![CDATA[Accessible methods for the dynamic time-scale decomposition of biochemical systems]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2823</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2816</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2824?rss=1">
<title><![CDATA[Modified variational Bayes EM estimation of hidden Markov tree model of cell lineages]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2824?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Human pluripotent stem cell lines persist in culture as a heterogeneous population of SSEA3 positive and SSEA3 negative cells. Tracking individual stem cells in real time can elucidate the kinetics of cells switching between the SSEA3 positive and negative substates. However, identifying a cell's substate at all time points within a cell lineage tree is technically difficult.</p>
<p><b>Results:</b> A variational Bayesian Expectation Maximization (EM) with smoothed probabilities (VBEMS) algorithm for hidden Markov trees (HMT) is proposed for incomplete tree structured data. The full posterior of the HMT parameters is determined and the underflow problems associated with previous algorithms are eliminated. Example results for the prediction of the types of cells in synthetic and real stem cell lineage trees are presented.</p>
<p><b>Availability:</b>The Matlab code for the VBEMS algorithm is freely available at <inter-ref locator="http://www.acse.dept.shef.ac.uk/repository/vbems_lineage_tree/VBEMS.ZIP" locator-type="url">http://www.acse.dept.shef.ac.uk/repository/vbems_lineage_tree/VBEMS.ZIP</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="visakan@sheffield.ac.uk" locator-type="email">visakan@sheffield.ac.uk</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp456/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Olariu, V., Coca, D., Billings, S. A., Tonge, P., Gokhale, P., Andrews, P. W., Kadirkamanathan, V.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp456</dc:identifier>
<dc:title><![CDATA[Modified variational Bayes EM estimation of hidden Markov tree model of cell lineages]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2830</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2824</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2831?rss=1">
<title><![CDATA[A hypergraph-based learning algorithm for classifying gene expression and arrayCGH data with prior knowledge]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2831?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Incorporating biological prior knowledge into predictive models is a challenging data integration problem in analyzing high-dimensional genomic data. We introduce a hypergraph-based semi-supervised learning algorithm called <I>HyperPrior</I> to classify gene expression and array-based comparative genomic hybridization (arrayCGH) data using biological knowledge as constraints on graph-based learning. <I>HyperPrior</I> is a robust two-step iterative method that alternatively finds the optimal labeling of the samples and the optimal weighting of the features, guided by constraints encoding prior knowledge. The prior knowledge for analyzing gene expression data is that cancer-related genes tend to interact with each other in a protein&ndash;protein interaction network. Similarly, the prior knowledge for analyzing arrayCGH data is that probes that are spatially nearby in their layout along the chromosomes tend to be involved in the same amplification or deletion event. Based on the prior knowledge, <I>HyperPrior</I> imposes a consistent weighting of the correlated genomic features in graph-based learning.</p>
<p><b>Results:</b> We applied <I>HyperPrior</I> to test two arrayCGH datasets and two gene expression datasets for both cancer classification and biomarker identification. On all the datasets, <I>HyperPrior</I> achieved competitive classification performance, compared with SVMs and the other baselines utilizing the same prior knowledge. <I>HyperPrior</I> also identified several discriminative regions on chromosomes and discriminative subnetworks in the PPI, both of which contain cancer-related genomic elements. Our results suggest that <I>HyperPrior</I> is promising in utilizing biological prior knowledge to achieve better classification performance and more biologically interpretable findings in gene expression and arrayCGH data.</p>
<p><b>Availability:</b> <inter-ref locator="http://compbio.cs.umn.edu/HyperPrior" locator-type="url">http://compbio.cs.umn.edu/HyperPrior</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="kuang@cs.umn.edu" locator-type="email">kuang@cs.umn.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp467/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Tian, Z., Hwang, T., Kuang, R.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp467</dc:identifier>
<dc:title><![CDATA[A hypergraph-based learning algorithm for classifying gene expression and arrayCGH data with prior knowledge]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2838</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2831</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2839?rss=1">
<title><![CDATA[TagDust--a program to eliminate artifacts from next generation sequencing data]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2839?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Next-generation parallel sequencing technologies produce large quantities of short sequence reads. Due to experimental procedures various types of artifacts are commonly sequenced alongside the targeted RNA or DNA sequences. Identification of such artifacts is important during the development of novel sequencing assays and for the downstream analysis of the sequenced libraries.</p>
<p><b>Results:</b> Here we present TagDust, a program identifying artifactual sequences in large sequencing runs. Given a user-defined cutoff for the false discovery rate, TagDust identifies all reads explainable by combinations and partial matches to known sequences used during library preparation. We demonstrate the quality of our method on sequencing runs performed on Illumina's Genome Analyzer platform.</p>
<p><b>Availability:</b> Executables and documentation are available from <inter-ref locator="http://genome.gsc.riken.jp/osc/english/software/" locator-type="url">http://genome.gsc.riken.jp/osc/english/software/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="timolassmann@gmail.com" locator-type="email">timolassmann@gmail.com</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Lassmann, T., Hayashizaki, Y., Daub, C. O.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp527</dc:identifier>
<dc:title><![CDATA[TagDust--a program to eliminate artifacts from next generation sequencing data]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2840</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2839</prism:startingPage>
<prism:section>GENOME ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2841?rss=1">
<title><![CDATA[Updates to the RMAP short-read mapping software]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2841?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> We report on a major new version of the RMAP software for mapping reads from short-read sequencing technology. General improvements to accuracy and space requirements are included, along with novel functionality. Included in the RMAP software package are tools for mapping paired-end reads, mapping using more sophisticated use of quality scores, collecting ambiguous mapping locations and mapping bisulfite-treated reads.</p>
<p><b>Availability:</b> The applications described in this note are available for download at <inter-ref locator="http://www.cmb.usc.edu/people/andrewds/rmap" locator-type="url">http://www.cmb.usc.edu/people/andrewds/rmap</inter-ref> and are distributed as Open Source software under the GPLv3.0. The software has been tested on Linux and OS X platforms.</p>
<p><b>Contact:</b> <inter-ref locator="andrewds@usc.edu" locator-type="email">andrewds@usc.edu</inter-ref>; <inter-ref locator="mzhang@cshl.edu" locator-type="email">mzhang@cshl.edu</inter-ref></p>
<p>The RMAP algorithm was introduced by (Smith <I>et al.</I>, <cross-ref type="bib" refid="B8">2008</cross-ref>) as one of the earliest available programs for mapping reads from the Illumina second-generation sequencing technology. One important contribution of RMAP was to incorporate the use of quality scores directly into the mapping process: read positions with too low a quality score were not considered while mapping, and that quality score cutoff could be adjusted by the user. Subsequently, numerous mapping algorithm have appeared (Langmead <I>et al.</I>, <cross-ref type="bib" refid="B2">2009</cross-ref>; Li,H. <I>et al.</I>, <cross-ref type="bib" refid="B3">2008</cross-ref>; Li,R. <I>et al.</I>, <cross-ref type="bib" refid="B4">2008</cross-ref>; Lin <I>et al.</I>, <cross-ref type="bib" refid="B5">2008</cross-ref>; Schatz, <cross-ref type="bib" refid="B7">2009</cross-ref>; Yanovsky <I>et al.</I>, <cross-ref type="bib" refid="B9">2008</cross-ref>), with improvements in both efficiency and breadth of functionality (e.g. ability to map paired-end reads; integrated SNP calling). Investigators requiring solutions to mapping problems now have many options. As new applications of short-read sequencing emerge, many variations on the analysis task of read mapping emerge. Diversity in performance characteristics of existing mapping tools becomes potentially valuable.</p>
<p>We report the first major update to RMAP. The basic algorithmic framework in RMAP is still to preprocess reads and scan the genome, but several modifications have been made and much additional functionality has been included. Importantly, RMAP has a memory footprint that depends on the number of reads being mapped. This feature allows RMAP to be used effectively in cluster environments with commodity nodes, because partitioning the reads allows natural parallelizations with linear reduction in memory requirements per processor core used.</p>
<p>Included in this release of the RMAP software package is functionality for mapping paired-end reads, making more sophisticated use of quality scores, collecting mapping locations for ambiguously mapping reads and mapping bisulfite-treated reads.</p>
]]></description>
<dc:creator><![CDATA[Smith, A. D., Chung, W.-Y., Hodges, E., Kendall, J., Hannon, G., Hicks, J., Xuan, Z., Zhang, M. Q.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp533</dc:identifier>
<dc:title><![CDATA[Updates to the RMAP short-read mapping software]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2842</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2841</prism:startingPage>
<prism:section>SEQUENCE ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2843?rss=1">
<title><![CDATA[3D-SURFER: software for high-throughput protein surface comparison and analysis]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2843?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> We present 3D-SURFER, a web-based tool designed to facilitate high-throughput comparison and characterization of proteins based on their surface shape. As each protein is effectively represented by a vector of 3D Zernike descriptors, comparison times for a query protein against the entire PDB take, on an average, only a couple of seconds. The web interface has been designed to be as interactive as possible with displays showing animated protein rotations, CATH codes and structural alignments using the CE program. In addition, geometrically interesting local features of the protein surface, such as pockets that often correspond to ligand binding sites as well as protrusions and flat regions can also be identified and visualized.</p>
<p><b>Availability:</b> 3D-SURFER is a web application that can be freely accessed from: <inter-ref locator="http://dragon.bio.purdue.edu/3d-surfer" locator-type="url">http://dragon.bio.purdue.edu/3d-surfer</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="dkihara@purdue.edu" locator-type="email">dkihara@purdue.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp542/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[La, D., Esquivel-Rodriguez, J., Venkatraman, V., Li, B., Sael, L., Ueng, S., Ahrendt, S., Kihara, D.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp542</dc:identifier>
<dc:title><![CDATA[3D-SURFER: software for high-throughput protein surface comparison and analysis]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2844</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2843</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2845?rss=1">
<title><![CDATA[COMPASS: a program for generating serial samples under an infinite sites model]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2845?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> The program <I>COMPASS</I> can generate samples that have been collected at various points in time from a population that is evolving according to a Wright&ndash;Fisher model. The samples are generated using coalescence simulations permitting various demographic scenarios and the program uses an infinite sites model to generate polymorphism data for the samples. By generating serially sampled population-genetic data, <I>COMPASS</I> allows investigating properties of polymorphism data that has been collected at different time points, and aid in making inference from ancient polymorphism data.</p>
<p><b>Availability:</b> The program and the manual are available at: <inter-ref locator="http://www.egs.uu.se/evbiol/Research/JakobssonLab/compass.html" locator-type="url">http://www.egs.uu.se/evbiol/Research/JakobssonLab/compass.html</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="mattias.jakobsson@ebc.uu.se" locator-type="email">mattias.jakobsson@ebc.uu.se</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Jakobsson, M.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp534</dc:identifier>
<dc:title><![CDATA[COMPASS: a program for generating serial samples under an infinite sites model]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2847</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2845</prism:startingPage>
<prism:section>GENETICS AND POPULATION ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2848?rss=1">
<title><![CDATA[iBioSim: a tool for the analysis and design of genetic circuits]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2848?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> <ty>iBioSim</ty> is a tool that supports learning of genetic circuit models, efficient abstraction-based analysis of these models and the design of synthetic genetic circuits. <ty>iBioSim</ty> includes project management features and a graphical user interface that facilitate the development and maintenance of genetic circuit models as well as both experimental and simulation data records.</p>
<p><b>Availability:</b> <ty>iBioSim</ty> is available for download for Windows, Linux, and MacOS at <inter-ref locator="http://www.async.ece.utah.edu/iBioSim/" locator-type="url">http://www.async.ece.utah.edu/iBioSim/</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="myers@ece.utah.edu" locator-type="email">myers@ece.utah.edu</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Myers, C. J., Barker, N., Jones, K., Kuwahara, H., Madsen, C., Nguyen, N.-P. D.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp457</dc:identifier>
<dc:title><![CDATA[iBioSim: a tool for the analysis and design of genetic circuits]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2849</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2848</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2850?rss=1">
<title><![CDATA[WEbcoli: an interactive and asynchronous web application for in silico design and analysis of genome-scale E.coli model]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2850?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> WEbcoli is a <I>WEb</I> application for <I>in silico</I> designing, analyzing and engineering <I>Escherichia coli</I> metabolism. It is devised and implemented using advanced web technologies, thereby leading to enhanced usability and dynamic web accessibility. As a main feature, the WEbcoli system provides a user-friendly rich web interface, allowing users to virtually design and synthesize mutant strains derived from the genome-scale wild-type <I>E.coli</I> model and to customize pathways of interest through a graph editor. In addition, constraints-based flux analysis can be conducted for quantifying metabolic fluxes and charactering the physiological and metabolic states under various genetic and/or environmental conditions.</p>
<p><b>Availability:</b> WEbcoli is freely accessible at <inter-ref locator="http://webcoli.org" locator-type="url">http://webcoli.org</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="cheld@nus.edu.sg" locator-type="email">cheld@nus.edu.sg</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Jung, T.-S., Yeo, H. C., Reddy, S. G., Cho, W.-S., Lee, D.-Y.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp496</dc:identifier>
<dc:title><![CDATA[WEbcoli: an interactive and asynchronous web application for in silico design and analysis of genome-scale E.coli model]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2852</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2850</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2853?rss=1">
<title><![CDATA[ERNEST: a toolbox for chemical reaction network theory]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2853?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> ERNEST Reaction Network Equilibria Study Toolbox is a MATLAB package which, by checking various different criteria on the structure of a chemical reaction network, can exclude the multistationarity of the corresponding reaction system. The results obtained are independent of the rate constants of the reactions, and can be used for model discrimination.</p>
<p><b>Availability and Implementation:</b> The software, implemented in MATLAB, is available under the GNU GPL free software license from <inter-ref locator="http://people.sissa.it/~altafini/papers/SoAl09/" locator-type="url">http://people.sissa.it/~altafini/papers/SoAl09/</inter-ref>. It requires the MATLAB Optimization Toolbox.</p>
<p><b>Contact:</b> <inter-ref locator="altafini@sissa.it" locator-type="email">altafini@sissa.it</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Soranzo, N., Altafini, C.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp513</dc:identifier>
<dc:title><![CDATA[ERNEST: a toolbox for chemical reaction network theory]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2854</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2853</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2855?rss=1">
<title><![CDATA[integrOmics: an R package to unravel relationships between two omics datasets]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2855?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> With the availability of many &lsquo;omics&rsquo; data, such as transcriptomics, proteomics or metabolomics, the integrative or joint analysis of multiple datasets from different technology platforms is becoming crucial to unravel the relationships between different biological functional levels. However, the development of such an analysis is a major computational and technical challenge as most approaches suffer from high data dimensionality. New methodologies need to be developed and validated.</p>
<p><b>Results:</b> <ty>integrOmics</ty> efficiently performs integrative analyses of two types of &lsquo;omics&rsquo; variables that are measured on the same samples. It includes a regularized version of canonical correlation analysis to enlighten correlations between two datasets, and a sparse version of partial least squares (PLS) regression that includes simultaneous variable selection in both datasets. The usefulness of both approaches has been demonstrated previously and successfully applied in various integrative studies.</p>
<p><b>Availability:</b> <ty>integrOmics</ty> is freely available from <inter-ref locator="http://CRAN.R-project.org/" locator-type="url">http://CRAN.R-project.org/</inter-ref> or from the web site companion (<inter-ref locator="http://math.univ-toulouse.fr/biostat" locator-type="url">http://math.univ-toulouse.fr/biostat</inter-ref>) that provides full documentation and tutorials.</p>
<p><b>Contact:</b> <inter-ref locator="k.lecao@uq.edu.au" locator-type="email">k.lecao@uq.edu.au</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp515/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Le Cao, K.-A., Gonzalez, I., Dejean, S.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:20 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp515</dc:identifier>
<dc:title><![CDATA[integrOmics: an R package to unravel relationships between two omics datasets]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2856</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2855</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2857?rss=1">
<title><![CDATA[Analyzing biological network parameters with CentiScaPe]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2857?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> The increasing availability of large network datasets along with the progresses in experimental high-throughput technologies have prompted the need for tools allowing easy integration of experimental data with data derived form network computational analysis. In order to enrich experimental data with network topological parameters, we have developed the Cytoscape plug-in CentiScaPe. The plug-in computes several network centrality parameters and allows the user to analyze existing relationships between experimental data provided by the users and node centrality values computed by the plug-in. CentiScaPe allows identifying network nodes that are relevant from both experimental and topological viewpoints. CentiScaPe also provides a Boolean logic-based tool that allows easy characterization of nodes whose topological relevance depends on more than one centrality. Finally, different graphic outputs and the included description of biological significance for each computed centrality facilitate the analysis by the end users not expert in graph theory, thus allowing easy node categorization and experimental prioritization.</p>
<p><b>Availability:</b> CentiScaPe can be downloaded via the Cytoscape web site: <inter-ref locator="http://chianti.ucsd.edu/cyto_web/plugins/index.php" locator-type="url">http://chianti.ucsd.edu/cyto_web/plugins/index.php</inter-ref>. Tutorial, centrality descriptions and example data are available at: <inter-ref locator="http://profs.sci.univr.it/~scardoni/centiscape/centiscapepage.php" locator-type="url">http://profs.sci.univr.it/~scardoni/centiscape/centiscapepage.php</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="giovanni.scardoni@gmail.com" locator-type="email">giovanni.scardoni@gmail.com</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp517/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Scardoni, G., Petterlini, M., Laudanna, C.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:21 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp517</dc:identifier>
<dc:title><![CDATA[Analyzing biological network parameters with CentiScaPe]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2859</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2857</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2860?rss=1">
<title><![CDATA[PathBuilder--open source software for annotating and developing pathway resources]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2860?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> We have developed PathBuilder, an open-source web application to annotate biological information pertaining to signaling pathways and to create web-based pathway resources. PathBuilder enables annotation of molecular events including protein&ndash;protein interactions, enzyme&ndash;substrate relationships and protein translocation events either manually or through automated importing of data from other databases. Salient features of PathBuilder include automatic validation of data formats, built-in modules for visualization of pathways, automated import of data from other pathway resources, export of data in several standard data exchange formats and an application programming interface for retrieving existing pathway datasets.</p>
<p><b>Availability:</b> PathBuilder is freely available for download at <inter-ref locator="http://pathbuilder.sourceforge.net/" locator-type="url">http://pathbuilder.sourceforge.net/</inter-ref> under the terms of GNU lesser general public license (LGPL: <inter-ref locator="http://www.gnu.org/copyleft/lesser.html" locator-type="url">http://www.gnu.org/copyleft/lesser.html</inter-ref>). The software is platform independent and has been tested on Windows and Linux platforms.</p>
<p><b>Contact:</b> <inter-ref locator="pandey@jhmi.edu" locator-type="email">pandey@jhmi.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp453/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Kandasamy, K., Keerthikumar, S., Raju, R., Keshava Prasad, T. S., Ramachandra, Y. L., Mohan, S., Pandey, A.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:21 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp453</dc:identifier>
<dc:title><![CDATA[PathBuilder--open source software for annotating and developing pathway resources]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2862</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2860</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2863?rss=1">
<title><![CDATA[A report on the 2009 SIG on short read sequencing and algorithms (Short-SIG)]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2863?rss=1</link>
<description><![CDATA[]]></description>
<dc:creator><![CDATA[Brudno, M., Medvedev, P., Stoye, J., De La Vega, F. M.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:21 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp525</dc:identifier>
<dc:title><![CDATA[A report on the 2009 SIG on short read sequencing and algorithms (Short-SIG)]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2864</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2863</prism:startingPage>
<prism:section>REPORT</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2865?rss=1">
<title><![CDATA[Pindel: a pattern growth approach to detect break points of large deletions and medium sized insertions from paired-end short reads]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2865?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> There is a strong demand in the genomic community to develop effective algorithms to reliably identify genomic variants. Indel detection using next-gen data is difficult and identification of long structural variations is extremely challenging.</p>
<p><b>Results:</b> We present Pindel, a pattern growth approach, to detect breakpoints of large deletions and medium-sized insertions from paired-end short reads. We use both simulated reads and real data to demonstrate the efficiency of the computer program and accuracy of the results.</p>
<p><b>Availability:</b> The binary code and a short user manual can be freely downloaded from <inter-ref locator="http://www.ebi.ac.uk/~kye/pindel/" locator-type="url">http://www.ebi.ac.uk/~kye/pindel/</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="k.ye@lumc.nl" locator-type="email">k.ye@lumc.nl</inter-ref>; <inter-ref locator="zn1@sanger.ac.uk" locator-type="email">zn1@sanger.ac.uk</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Ye, K., Schulz, M. H., Long, Q., Apweiler, R., Ning, Z.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:21 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp394</dc:identifier>
<dc:title><![CDATA[Pindel: a pattern growth approach to detect break points of large deletions and medium sized insertions from paired-end short reads]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2871</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2865</prism:startingPage>
<prism:section>GENOME ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2872?rss=1">
<title><![CDATA[De novo transcriptome assembly with ABySS]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2872?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Whole transcriptome shotgun sequencing data from non-normalized samples offer unique opportunities to study the metabolic states of organisms. One can deduce gene expression levels using sequence coverage as a surrogate, identify coding changes or discover novel isoforms or transcripts. Especially for discovery of novel events, <I>de novo</I> assembly of transcriptomes is desirable.</p>
<p><b>Results:</b> Transcriptome from tumor tissue of a patient with follicular lymphoma was sequenced with 36 base pair (bp) single- and paired-end reads on the Illumina Genome Analyzer II platform. We assembled ~194 million reads using ABySS into 66 921 contigs 100 bp or longer, with a maximum contig length of 10 951 bp, representing over 30 million base pairs of unique transcriptome sequence, or roughly 1% of the genome.</p>
<p><b>Availability and Implementation:</b> Source code and binaries of ABySS are freely available for download at <inter-ref locator="http://www.bcgsc.ca/platform/bioinfo/software/abyss" locator-type="url">http://www.bcgsc.ca/platform/bioinfo/software/abyss</inter-ref>. Assembler tool is implemented in C++. The parallel version uses Open MPI. ABySS-Explorer tool is implemented in Java using the Java universal network/graph framework.</p>
<p><b>Contact:</b> <inter-ref locator="ibirol@bcgsc.ca" locator-type="email">ibirol@bcgsc.ca</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Birol, I., Jackman, S. D., Nielsen, C. B., Qian, J. Q., Varhol, R., Stazyk, G., Morin, R. D., Zhao, Y., Hirst, M., Schein, J. E., Horsman, D. E., Connors, J. M., Gascoyne, R. D., Marra, M. A., Jones, S. J. M.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:21 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp367</dc:identifier>
<dc:title><![CDATA[De novo transcriptome assembly with ABySS]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2877</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2872</prism:startingPage>
<prism:section>SEQUENCE ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2878?rss=1">
<title><![CDATA[Increasing the coverage of a metapopulation consensus genome by iterative read mapping and assembly]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2878?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Most microbial species can not be cultured in the laboratory. Metagenomic sequencing may still yield a complete genome if the sequenced community is enriched and the sequencing coverage is high. However, the complexity in a natural population may cause the enrichment culture to contain multiple related strains. This diversity can confound existing strict assembly programs and lead to a fragmented assembly, which is unnecessary if we have a related reference genome available that can function as a scaffold.</p>
<p><b>Results:</b> Here, we map short metagenomic sequencing reads from a population of strains to a related reference genome, and compose a genome that captures the consensus of the population's sequences. We show that by iteration of the mapping and assembly procedure, the coverage increases while the similarity with the reference genome decreases. This indicates that the assembly becomes less dependent on the reference genome and approaches the consensus genome of the multi-strain population.</p>
<p><b>Contact:</b> <inter-ref locator="dutilh@cmbi.ru.nl" locator-type="email">dutilh@cmbi.ru.nl</inter-ref></p>
<p><b>Supplementary Information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp377/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Dutilh, B. E., Huynen, M. A., Strous, M.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:21 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp377</dc:identifier>
<dc:title><![CDATA[Increasing the coverage of a metapopulation consensus genome by iterative read mapping and assembly]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2881</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2878</prism:startingPage>
<prism:section>SEQUENCE ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2882?rss=1">
<title><![CDATA[ISOLATE: a computational strategy for identifying the primary origin of cancers using high-throughput sequencing]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/21/2882?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> One of the most deadly cancer diagnoses is the carcinoma of unknown primary origin. Without the knowledge of the site of origin, treatment regimens are limited in their specificity and result in high mortality rates. Though supervised classification methods have been developed to predict the site of origin based on gene expression data, they require large numbers of previously classified tumors for training, in part because they do not account for sample heterogeneity, which limits their application to well-studied cancers.</p>
<p><b>Results:</b> We present ISOLATE, a new statistical method that simultaneously predicts the primary site of origin of cancers and addresses sample heterogeneity, while taking advantage of new high-throughput sequencing technology that promises to bring higher accuracy and reproducibility to gene expression profiling experiments. ISOLATE makes predictions <I>de novo</I>, without having seen any training expression profiles of cancers with identified origin. Compared with previous methods, ISOLATE is able to predict the primary site of origin, de-convolve and remove the effect of sample heterogeneity and identify differentially expressed genes with higher accuracy, across both synthetic and clinical datasets. Methods such as ISOLATE are invaluable tools for clinicians faced with carcinomas of unknown primary origin.</p>
<p><b>Availability:</b> ISOLATE is available for download at: <inter-ref locator="http://morrislab.med.utoronto.ca/software" locator-type="url">http://morrislab.med.utoronto.ca/software</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="gerald.quon@utoronto.ca" locator-type="email">gerald.quon@utoronto.ca</inter-ref>; <inter-ref locator="quaid.morris@utoronto.ca" locator-type="email">quaid.morris@utoronto.ca</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp378/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Quon, G., Morris, Q.]]></dc:creator>
<dc:date>Fri, 23 Oct 2009 06:34:21 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp378</dc:identifier>
<dc:title><![CDATA[ISOLATE: a computational strategy for identifying the primary origin of cancers using high-throughput sequencing]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>21</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2889</prism:endingPage>
<prism:publicationDate>2009-11-01</prism:publicationDate>
<prism:startingPage>2882</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2625?rss=1">
<title><![CDATA[TargetMiner: microRNA target prediction with systematic identification of tissue-specific negative examples]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2625?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Prediction of microRNA (miRNA) target mRNAs using machine learning approaches is an important area of research. However, most of the methods suffer from either high false positive or false negative rates. One reason for this is the marked deficiency of negative examples or miRNA non-target pairs. Systematic identification of non-target mRNAs is still not addressed properly, and therefore, current machine learning approaches are compelled to rely on artificially generated negative examples for training.</p>
<p><b>Results:</b> In this article, we have identified ~300 tissue-specific negative examples using a novel approach that involves expression profiling of both miRNAs and mRNAs, miRNA&ndash;mRNA structural interactions and seed-site conservation. The newly generated negative examples are validated with pSILAC dataset, which elucidate the fact that the identified non-targets are indeed non-targets.These high-throughput tissue-specific negative examples and a set of experimentally verified positive examples are then used to build a system called TargetMiner, a support vector machine (SVM)-based classifier. In addition to assessing the prediction accuracy on cross-validation experiments, TargetMiner has been validated with a completely independent experimental test dataset. Our method outperforms 10 existing target prediction algorithms and provides a good balance between sensitivity and specificity that is not reflected in the existing methods. We achieve a significantly higher sensitivity and specificity of 69% and 67.8% based on a pool of 90 feature set and 76.5% and 66.1% using a set of 30 selected feature set on the completely independent test dataset.</p>
<p>In order to establish the effectiveness of the systematically generated negative examples, the SVM is trained using a different set of negative data generated using the method in Yousef <I>et al.</I> A significantly higher false positive rate (70.6%) is observed when tested on the independent set, while all other factors are kept the same. Again, when an existing method (NBmiRTar) is executed with the our proposed negative data, we observe an improvement in its performance. These clearly establish the effectiveness of the proposed approach of selecting the negative examples systematically.</p>
<p><b>Availability:</b> TargetMiner is now available as an online tool at <inter-ref locator="www.isical.ac.in/~bioinfo_miu" locator-type="url">www.isical.ac.in/~bioinfo_miu</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="sanghami@isical.ac.in" locator-type="email">sanghami@isical.ac.in</inter-ref>; <inter-ref locator="rmitra_t@isical.ac.in" locator-type="email">rmitra_t@isical.ac.in</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp503/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Bandyopadhyay, S., Mitra, R.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp503</dc:identifier>
<dc:title><![CDATA[TargetMiner: microRNA target prediction with systematic identification of tissue-specific negative examples]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2631</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2625</prism:startingPage>
<prism:section>GENOME ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2632?rss=1">
<title><![CDATA[T-REKS: identification of Tandem REpeats in sequences with a K-meanS based algorithm]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2632?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Over the last years a number of evidences have been accumulated about high incidence of tandem repeats in proteins carrying fundamental biological functions and being related to a number of human diseases. At the same time, frequently, protein repeats are strongly degenerated during evolution and, therefore, cannot be easily identified. To solve this problem, several computer programs which were based on different algorithms have been developed. Nevertheless, our tests showed that there is still room for improvement of methods for accurate and rapid detection of tandem repeats in proteins.</p>
<p><b>Results:</b> We developed a new program called T-REKS for <I>ab initio</I> identification of the tandem repeats. It is based on clustering of lengths between identical short strings by using a <I>K</I>-means algorithm. Benchmark of the existing programs and T-REKS on several sequence datasets is presented. Our program being linked to the Protein Repeat DataBase opens the way for large-scale analysis of protein tandem repeats. T-REKS can also be applied to the nucleotide sequences.</p>
<p><b>Availability:</b> The algorithm has been implemented in JAVA, the program is available upon request at <inter-ref locator="http://bioinfo.montp.cnrs.fr/?r=t-reks" locator-type="url">http://bioinfo.montp.cnrs.fr/?r=t-reks</inter-ref>. Protein Repeat DataBase generated by using T-REKS is accessible at <inter-ref locator="http://bioinfo.montp.cnrs.fr/?r=repeatDB" locator-type="url">http://bioinfo.montp.cnrs.fr/?r=repeatDB</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="julien.jorda@crbm.cnrs.fr" locator-type="email">julien.jorda@crbm.cnrs.fr</inter-ref>; <inter-ref locator="andrey.kajava@crbm.cnrs.fr" locator-type="email">andrey.kajava@crbm.cnrs.fr</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp482/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Jorda, J., Kajava, A. V.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp482</dc:identifier>
<dc:title><![CDATA[T-REKS: identification of Tandem REpeats in sequences with a K-meanS based algorithm]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2638</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2632</prism:startingPage>
<prism:section>SEQUENCE ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2639?rss=1">
<title><![CDATA[Enhancement of beta-sheet assembly by cooperative hydrogen bonds potential]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2639?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The roughness of energy landscapes is a major obstacle to protein structure prediction, since it forces conformational searches to spend much time struggling to escape numerous traps. Specifically, beta-sheet formation is prone to stray, since many possible combinations of hydrogen bonds are dead ends in terms of beta-sheet assembly. It has been shown that cooperative terms for backbone hydrogen bonds ease this problem by augmenting hydrogen bond patterns that are consistent with beta sheets. Here, we present a novel cooperative hydrogen-bond term that is both effective in promoting beta sheets and computationally efficient. In addition, the new term is differentiable and operates on all-atom protein models.</p>
<p><b>Results:</b> Energy optimization of poly-alanine chains under the new term led to significantly more beta-sheet content than optimization under a non-cooperative term. Furthermore, the optimized structure included very few non-native patterns.</p>
<p><b>Availability:</b> The new term is implemented within the MESHI package and is freely available at <inter-ref locator="http://cs.bgu.ac.il/~meshi" locator-type="url">http://cs.bgu.ac.il/~meshi</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="chen.keasar@gmail.com" locator-type="email">chen.keasar@gmail.com</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp449/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Levy-Moonshine, A., Amir, E.-a. D., Keasar, C.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp449</dc:identifier>
<dc:title><![CDATA[Enhancement of beta-sheet assembly by cooperative hydrogen bonds potential]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2645</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2639</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2646?rss=1">
<title><![CDATA[Partition function and base pairing probabilities for RNA-RNA interaction prediction]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2646?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The RNA&ndash;RNA interaction problem (RIP) consists in finding the energetically optimal structure of two RNA molecules that bind to each other. The standard model allows secondary structures in both partners as well as additional base pairs between the two RNAs subject to certain restrictions that ensure that RIP is solvabale by a polynomial time dynamic programming algorithm. RNA&ndash;RNA binding, like RNA folding, is typically not dominated by the ground state structure. Instead, a large ensemble of alternative structures contributes to the interaction thermodynamics.</p>
<p><b>Results:</b> We present here an <I>O</I>(<I>N</I><sup>6</sup>) time and <I>O</I>(<I>N</I><sup>4</sup>) dynamics programming algorithm for computing the full partition function for RIP which is based on the combinatorial notion of &lsquo;tight structures&rsquo;. Albeit equivalent to recent work by H. Chitsaz and collaborators, our approach in addition provides a full-fledged computation of the base pairing probabilities, which relies on the notion of a decomposition tree for joint structures. In practise, our implementation is efficient enough to investigate, for instance, the interactions of small bacterial RNAs and their target mRNAs.</p>
<p><b>Availability:</b> The program <ty>rip</ty> is implemented in C. The source code is available for download from <inter-ref locator="http://www.combinatorics.cn/cbpc/rip.html" locator-type="url">http://www.combinatorics.cn/cbpc/rip.html</inter-ref> and <inter-ref locator="http://www.bioinf.uni-leipzig.de/Software/rip.html" locator-type="url">http://www.bioinf.uni-leipzig.de/Software/rip.html</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="duck@santafe.edu" locator-type="email">duck@santafe.edu</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp481/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Huang, F. W. D., Qin, J., Reidys, C. M., Stadler, P. F.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp481</dc:identifier>
<dc:title><![CDATA[Partition function and base pairing probabilities for RNA-RNA interaction prediction]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2654</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2646</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2655?rss=1">
<title><![CDATA[A new taxonomy-based protein fold recognition approach based on autocross-covariance transformation]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2655?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Fold recognition is an important step in protein structure and function prediction. Traditional sequence comparison methods fail to identify reliable homologies with low sequence identity, while the taxonomic methods are effective alternatives, but their prediction accuracies are around 70%, which are still relatively low for practical usage.</p>
<p><b>Results:</b> In this study, a simple and powerful method is presented for taxonomic fold recognition, which combines support vector machine (SVM) with autocross-covariance (ACC) transformation. The evolutionary information represented in the form of position-specific score matrices is converted into a series of fixed-length vectors by ACC transformation and these vectors are then input to a SVM classifier for fold recognition. The sequence-order effect can be effectively captured by this scheme. Experiments are performed on the widely used D-B dataset and the corresponding extended dataset, respectively. The proposed method, called ACCFold, gets an overall accuracy of 70.1% on the D-B dataset, which is higher than major existing taxonomic methods by 2&ndash;14%. Furthermore, the method achieves an overall accuracy of 87.6% on the extended dataset, which surpasses major existing taxonomic methods by 9&ndash;17%. Additionally, our method obtains an overall accuracy of 80.9% for 86-folds and 77.2% for 199-folds. These results demonstrate that the ACCFold method provides the state-of-the-art performance for taxonomic fold recognition.</p>
<p><b>Availability:</b> The source code for ACC transformation is freely available at <inter-ref locator="http://www.iipl.fudan.edu.cn/demo/accpkg.html" locator-type="url">http://www.iipl.fudan.edu.cn/demo/accpkg.html</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="sgzhou@fudan.edu.cn" locator-type="email">sgzhou@fudan.edu.cn</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp500/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Dong, Q., Zhou, S., Guan, J.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp500</dc:identifier>
<dc:title><![CDATA[A new taxonomy-based protein fold recognition approach based on autocross-covariance transformation]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2662</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2655</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2663?rss=1">
<title><![CDATA[MISTRAL: a tool for energy-based multiple structural alignment of proteins]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2663?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> The steady growth of the number of available protein structures has constantly motivated the development of new algorithms for detecting structural correspondences in proteins. Detecting structural equivalences in two or more proteins is computationally demanding as it typically entails the exploration of the combinatorial space of all possible amino acid pairings in the parent proteins. The search is often aided by the introduction of various constraints such as considering protein fragments, rather than single amino acids, and/or seeking only sequential correspondences in the given proteins. An additional challenge is represented by the difficulty of associating to a given alignment, a reliable a priori measure of its statistical significance.</p>
<p><b>Results:</b> Here, we present and discuss MISTRAL (Multiple STRuctural ALignment), a novel strategy for multiple protein alignment based on the minimization of an energy function over the low-dimensional space of the relative rotations and translations of the molecules. The energy minimization avoids combinatorial searches and returns pairwise alignment scores for which a reliable a priori statistical significance can be given.</p>
<p><b>Availability:</b> MISTRAL is freely available for academic users as a standalone program and as a web service at <inter-ref locator="http://ipht.cea.fr/protein.php" locator-type="url">http://ipht.cea.fr/protein.php</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="michelet@sissa.it" locator-type="email">michelet@sissa.it</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp506/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Micheletti, C., Orland, H.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp506</dc:identifier>
<dc:title><![CDATA[MISTRAL: a tool for energy-based multiple structural alignment of proteins]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2669</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2663</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2670?rss=1">
<title><![CDATA[Statistical lower bounds on protein copy number from fluorescence expression images]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2670?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Fluorescence imaging has become a commonplace for quantitatively measuring mRNA or protein expression in cells and tissues. However, such expression data are usually relative&mdash;absolute concentrations or molecular copy numbers are typically not known. While this is satisfactory for many applications, for certain kinds of quantitative network modeling and analysis of expression noise, absolute measures of expression are necessary.</p>
<p><b>Results:</b> We propose two methods for estimating molecular copy numbers from single uncalibrated expression images of tissues. These methods rely on expression variability between cells, due either to steady-state fluctuations or unequal distribution of molecules during cell division, to make their estimates. We apply these methods to 152 protein fluorescence expression images of <I>Drosophila melanogaster</I> embryos during early development, generating copy number estimates for 14 genes in the segmentation network. We also analyze the effects of noise on our estimators and compare with empirical findings. Finally, we confirm an observation of Bar-Even <I>et al.</I>, made in the much different setting of <I>Saccharomyces cerevisiae</I>, that steady-state expression variance tends to scale with mean expression.</p>
<p><b>Availability:</b> The data are all drawn from FlyEx (explained within), and is available at <inter-ref locator="http://flyex.ams.sunysb.edu/FlyEx/" locator-type="url">http://flyex.ams.sunysb.edu/FlyEx/</inter-ref>. Data and MATLAB codes for all algorithms described in this article are available at <inter-ref locator="http://www.perkinslab.ca/pubs/ZP2009.html" locator-type="url">http://www.perkinslab.ca/pubs/ZP2009.html</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="tperkins@ohri.ca" locator-type="email">tperkins@ohri.ca</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Zamparo, L., Perkins, T. J.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp415</dc:identifier>
<dc:title><![CDATA[Statistical lower bounds on protein copy number from fluorescence expression images]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2676</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2670</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2677?rss=1">
<title><![CDATA[Multi-dimensional correlations for gene coexpression and application to the large-scale data of Arabidopsis]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2677?rss=1</link>
<description><![CDATA[
<p><b>Background:</b> Recent improvements in DNA microarray techniques have made a large variety of gene expression data available in public databases. This data can be used to evaluate the strength of gene coexpression by calculating the correlation of expression patterns among different genes between many experiments. However, gene expression levels differ significantly across various tissues in higher organisms, as well as in different cellular location in eukaryotes in different cell state. Thus the usual correlation measure can only evaluate the difference of tissues or cellular localizations, and cannot adequately elucidate the functional relationship from the coexpression of genes.</p>
<p><b>Method:</b> We propose a new measure of coexpression by expanding the generally used correlation into a multidimensional one. We used principal component analyses to identify the major factors of gene expression correlation, and then re-calculate the correlation by subtracting the major components in order to remove biases cased by a few experiments. The repeated subtractions of the major components yielded a set of correlation values for each pair of genes. We observed the correlation changes when the first ten principal components were subtracted step-by-step in large-scale Arabidopsis expression data.</p>
<p><b>Results:</b> We found two extreme patterns of correlation changes, corresponding to stable and fragile coexpression. Our new indexes provided a good means to determine the functional relationships of the genes, by examining a few examples, and higher performance of Gene Ontology term prediction by using the support vector machine and the multidimensional correlation.</p>
<p><b>Availability:</b> The results are available from the expression detail pages in ATTED-II (<inter-ref locator="http://atted.jp" locator-type="url">http://atted.jp</inter-ref>).</p>
<p><b>Contact:</b> <inter-ref locator="kinosita@hgc.jp" locator-type="email">kinosita@hgc.jp</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp442/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Kinoshita, K., Obayashi, T.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp442</dc:identifier>
<dc:title><![CDATA[Multi-dimensional correlations for gene coexpression and application to the large-scale data of Arabidopsis]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2684</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2677</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2685?rss=1">
<title><![CDATA[A modified LOESS normalization applied to microRNA arrays: a comparative evaluation]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2685?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Microarray normalization is a fundamental step in removing systematic bias and noise variability caused by technical and experimental artefacts. Several approaches, suitable for large-scale genome arrays, have been proposed and shown to be effective in the reduction of systematic errors. Most of these methodologies are based on specific assumptions that are reasonable for whole-genome arrays, but possibly unsuitable for small microRNA (miRNA) platforms. In this work, we propose a novel normalization (loessM), and we investigate, through simulated and real datasets, the influence that normalizations for two-colour miRNA arrays have on the identification of differentially expressed genes.</p>
<p><b>Results:</b> We show that normalizations usually applied to large-scale arrays, in several cases, modify the actual structure of miRNA data, leading to large portions of false positives and false negatives. Nevertheless, loessM is able to outperform other techniques in most experimental scenarios. Moreover, when usual assumptions on differential expression distribution are missed, channel effect has a strikingly negative influence on small arrays, bias that cannot be removed by normalizations but rather by an appropriate experimental design. We find that the combination of loessM with eCADS, an experimental design based on biological replicates dye-swap recently proposed for channel-effect reduction, gives better results in most of the experimental conditions in terms of specificity/sensitivity both on simulated and real data.</p>
<p><b>Availability:</b> LoessM R function is freely available at <inter-ref locator="http://gefu.cribi.unipd.it/papers/miRNA-simulation/" locator-type="url">http://gefu.cribi.unipd.it/papers/miRNA-simulation/</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="chiara.romualdi@unipd.it" locator-type="email">chiara.romualdi@unipd.it</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp443/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Risso, D., Massa, M. S., Chiogna, M., Romualdi, C.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp443</dc:identifier>
<dc:title><![CDATA[A modified LOESS normalization applied to microRNA arrays: a comparative evaluation]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2691</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2685</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2692?rss=1">
<title><![CDATA[Moderated effect size and P-value combinations for microarray meta-analyses]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2692?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> With the proliferation of microarray experiments and their availability in the public domain, the use of meta-analysis methods to combine results from different studies increases. In microarray experiments, where the sample size is often limited, meta-analysis offers the possibility to considerably increase the statistical power and give more accurate results.</p>
<p><b>Results:</b> A moderated effect size combination method was proposed and compared with other meta-analysis approaches. All methods were applied to real publicly available datasets on prostate cancer, and were compared in an extensive simulation study for various amounts of inter-study variability. Although the proposed moderated effect size combination improved already existing effect size approaches, the <I>P</I>-value combination was found to provide a better sensitivity and a better gene ranking than the other meta-analysis methods, while effect size methods were more conservative.</p>
<p><b>Availability:</b> An R package metaMA is available on the CRAN.</p>
<p><b>Contact:</b> <inter-ref locator="guillemette.marot@jouy.inra.fr" locator-type="email">guillemette.marot@jouy.inra.fr</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Marot, G., Foulley, J.-L., Mayer, C.-D., Jaffrezic, F.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp444</dc:identifier>
<dc:title><![CDATA[Moderated effect size and P-value combinations for microarray meta-analyses]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2699</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2692</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2700?rss=1">
<title><![CDATA[Gene ranking and biomarker discovery under correlation]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2700?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Biomarker discovery and gene ranking is a standard task in genomic high-throughput analysis. Typically, the ordering of markers is based on a stabilized variant of the <I>t</I>-score, such as the moderated <I>t</I> or the SAM statistic. However, these procedures ignore gene&ndash;gene correlations, which may have a profound impact on the gene orderings and on the power of the subsequent tests.</p>
<p><b>Results:</b> We propose a simple procedure that adjusts gene-wise <I>t</I>-statistics to take account of correlations among genes. The resulting correlation-adjusted <I>t</I>-scores (&lsquo;cat&rsquo; scores) are derived from a predictive perspective, i.e. as a score for variable selection to discriminate group membership in two-class linear discriminant analysis. In the absence of correlation the cat score reduces to the standard <I>t</I>-score. Moreover, using the cat score it is straightforward to evaluate groups of features (i.e. gene sets). For computation of the cat score from small sample data, we propose a shrinkage procedure. In a comparative study comprising six different synthetic and empirical correlation structures, we show that the cat score improves estimation of gene orderings and leads to higher power for fixed true discovery rate, and vice versa. Finally, we also illustrate the cat score by analyzing metabolomic data.</p>
<p><b>Availability:</b> The shrinkage cat score is implemented in the R package &lsquo;st&rsquo;, which is freely available under the terms of the GNU General Public License (version 3 or later) from CRAN (<inter-ref locator="http://cran.r-project.org/web/packages/st/" locator-type="url">http://cran.r-project.org/web/packages/st/</inter-ref>).</p>
<p><b>Contact:</b> <inter-ref locator="strimmer@uni-leipzig.de" locator-type="email">strimmer@uni-leipzig.de</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Zuber, V., Strimmer, K.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp460</dc:identifier>
<dc:title><![CDATA[Gene ranking and biomarker discovery under correlation]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2707</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2700</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2708?rss=1">
<title><![CDATA[Methods for labeling error detection in microarrays based on the effect of data perturbation on the regression model]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2708?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Mislabeled samples often appear in gene expression profile because of the similarity of different sub-type of disease and the subjective misdiagnosis. The mislabeled samples deteriorate supervised learning procedures. The LOOE-sensitivity algorithm is an approach for mislabeled sample detection for microarray based on data perturbation. However, the failure of measuring the perturbing effect makes the LOOE-sensitivity algorithm a poor performance. The purpose of this article is to design a novel detection method for mislabeled samples of microarray, which could take advantage of the measuring effect of data perturbations.</p>
<p><b>Results:</b> To measure the effect of data perturbation, we define an index named perturbing influence value (PIV), based on the support vector machine (SVM) regression model. The Column Algorithm (CAPIV), Row Algorithm (RAPIV) and progressive Row Algorithm (PRAPIV) based on the PIV value are proposed to detect the mislabeled samples. Experimental results obtained by using six artificial datasets and five microarray datasets demonstrate that all proposed methods in this article are superior to LOOE-sensitivity. Moreover, compared with the simple SVM and CL-stability, the PRAPIV algorithm shows an increase in precision and high recall.</p>
<p><b>Availability:</b> The program and source code (in JAVA) are publicly available at <inter-ref locator="http://ccst.jlu.edu.cn/CSBG/PIVS/index.htm" locator-type="url">http://ccst.jlu.edu.cn/CSBG/PIVS/index.htm</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="blanzier@dit.unitn.it" locator-type="email">blanzier@dit.unitn.it</inter-ref>; <inter-ref locator="ycliang@jlu.edu.cn" locator-type="email">ycliang@jlu.edu.cn</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Zhang, C., Wu, C., Blanzieri, E., Zhou, Y., Wang, Y., Du, W., Liang, Y.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp478</dc:identifier>
<dc:title><![CDATA[Methods for labeling error detection in microarrays based on the effect of data perturbation on the regression model]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2714</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2708</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2715?rss=1">
<title><![CDATA[info-gibbs: a motif discovery algorithm that directly optimizes information content during sampling]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2715?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Discovering <I>cis</I>-regulatory elements in genome sequence remains a challenging issue. Several methods rely on the optimization of some target scoring function. The information content (IC) or relative entropy of the motif has proven to be a good estimator of transcription factor DNA binding affinity. However, these information-based metrics are usually used as <I>a posteriori</I> statistics rather than during the motif search process itself.</p>
<p><b>Results:</b> We introduce here info-gibbs, a Gibbs sampling algorithm that efficiently optimizes the IC or the log-likelihood ratio (LLR) of the motif while keeping computation time low. The method compares well with existing methods like MEME, BioProspector, Gibbs or GAME on both synthetic and biological datasets. Our study shows that motif discovery techniques can be enhanced by directly focusing the search on the motif IC or the motif LLR.</p>
<p><b>Availability:</b> <inter-ref locator="http://rsat.ulb.ac.be/rsat/info-gibbs" locator-type="url">http://rsat.ulb.ac.be/rsat/info-gibbs</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="defrance@bigre.ulb.ac.be" locator-type="email">defrance@bigre.ulb.ac.be</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp490/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Defrance, M., van Helden, J.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp490</dc:identifier>
<dc:title><![CDATA[info-gibbs: a motif discovery algorithm that directly optimizes information content during sampling]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2722</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2715</prism:startingPage>
<prism:section>GENE EXPRESSION</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2723?rss=1">
<title><![CDATA[An optimization model for metabolic pathways]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2723?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Different mathematical methods have emerged in the post-genomic era to determine metabolic pathways. These methods can be divided into stoichiometric methods and path finding methods. In this paper we detail a novel optimization model, based upon integer linear programming, to determine metabolic pathways. Our model links reaction stoichiometry with path finding in a single approach. We test the ability of our model to determine 40 annotated <I>Escherichia coli</I> metabolic pathways. We show that our model is able to determine 36 of these 40 pathways in a computationally effective manner.</p>
<p><b>Contact:</b> <inter-ref locator="john.beasley@brunel.ac.uk" locator-type="email">john.beasley@brunel.ac.uk</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp441/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Planes, F. J., Beasley, J. E.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp441</dc:identifier>
<dc:title><![CDATA[An optimization model for metabolic pathways]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2729</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2723</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2730?rss=1">
<title><![CDATA[The Integrated Genome Browser: free software for distribution and exploration of genome-scale datasets]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2730?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> Experimental techniques that survey an entire genome demand flexible, highly interactive visualization tools that can display new data alongside foundation datasets, such as reference gene annotations. The Integrated Genome Browser (IGB) aims to meet this need. IGB is an open source, desktop graphical display tool implemented in Java that supports real-time zooming and panning through a genome; layout of genomic features and datasets in moveable, adjustable tiers; incremental or genome-scale data loading from remote web servers or local files; and dynamic manipulation of quantitative data via genome graphs.</p>
<p><b>Availability:</b> The application and source code are available from <inter-ref locator="http://igb.bioviz.org" locator-type="url">http://igb.bioviz.org</inter-ref> and <inter-ref locator="http://genoviz.sourceforge.net" locator-type="url">http://genoviz.sourceforge.net</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="aloraine@uncc.edu" locator-type="email">aloraine@uncc.edu</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Nicol, J. W., Helt, G. A., Blanchard, S. G., Raja, A., Loraine, A. E.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp472</dc:identifier>
<dc:title><![CDATA[The Integrated Genome Browser: free software for distribution and exploration of genome-scale datasets]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2731</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2730</prism:startingPage>
<prism:section>GENOME ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2732?rss=1">
<title><![CDATA[SnoopCGH: software for visualizing comparative genomic hybridization data]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2732?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> Array-based comparative genomic hybridization (CGH) technology is used to discover and validate genomic structural variation, including copy number variants, insertions, deletions and other structural variants (SVs). The visualization and summarization of the array CGH data outputs, potentially across many samples, is an important process in the identification and analysis of SVs. We have developed a software tool for SV analysis using data from array CGH technologies, which is also amenable to short-read sequence data.</p>
<p><b>Availability and implementation:</b> SnoopCGH is written in java and is available from <inter-ref locator="http://snoopcgh.sourceforge.net/" locator-type="url">http://snoopcgh.sourceforge.net/</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="jg10@sanger.ac.uk" locator-type="email">jg10@sanger.ac.uk</inter-ref>; <inter-ref locator="tc5@sanger.ac.uk" locator-type="email">tc5@sanger.ac.uk</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Almagro-Garcia, J., Manske, M., Carret, C., Campino, S., Auburn, S., MacInnis, B. L, Maslen, G., Pain, A., Newbold, C. I, Kwiatkowski, D. P, Clark, T. G]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp488</dc:identifier>
<dc:title><![CDATA[SnoopCGH: software for visualizing comparative genomic hybridization data]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2733</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2732</prism:startingPage>
<prism:section>GENOME ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2734?rss=1">
<title><![CDATA[YADA: a tool for taking the most out of high-resolution spectra]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2734?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> YADA can deisotope and decharge high-resolution mass spectra from large peptide molecules, link the precursor monoisotopic peak information to the corresponding tandem mass spectrum, and account for different co-fragmenting ion species (multiplexed spectra). We describe how YADA enables a pipeline consisting of ProLuCID and DTASelect for analyzing large-scale middle-down proteomics data.</p>
<p><b>Availability:</b> <inter-ref locator="http://fields.scripps.edu/yada" locator-type="url">http://fields.scripps.edu/yada</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="paulo@pcarvalho.com" locator-type="email">paulo@pcarvalho.com</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp489/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Carvalho, P. C., Xu, T., Han, X., Cociorva, D., Barbosa, V. C., Yates, J. R.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp489</dc:identifier>
<dc:title><![CDATA[YADA: a tool for taking the most out of high-resolution spectra]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2736</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2734</prism:startingPage>
<prism:section>SEQUENCE ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2737?rss=1">
<title><![CDATA[ShotgunFunctionalizeR: an R-package for functional comparison of metagenomes]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2737?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> Microorganisms are ubiquitous in nature and constitute intrinsic parts of almost every ecosystem. A culture-independent and powerful way to study microbial communities is metagenomics. In such studies, functional analysis is performed on fragmented genetic material from multiple species in the community. The recent advances in high-throughput sequencing have greatly increased the amount of data in metagenomic projects. At present, there is an urgent need for efficient statistical tools to analyse these data. We have created ShotgunFunctionalizeR, an R-package for functional comparison of metagenomes. The package contains tools for importing, annotating and visualizing metagenomic data produced by shotgun high-throughput sequencing. ShotgunFunctionalizeR contains several statistical procedures for assessing functional differences between samples, both for individual genes and for entire pathways. In addition to standard and previously published methods, we have developed and implemented a novel approach based on a Poisson model. This procedure is highly flexible and thus applicable to a wide range of different experimental designs. We demonstrate the potential of ShotgunFunctionalizeR by performing a regression analysis on metagenomes sampled at multiple depths in the Pacific Ocean.</p>
<p><b>Availability:</b> <inter-ref locator="http://shotgun.zool.gu.se" locator-type="url">http://shotgun.zool.gu.se</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="dalevi@chalmers.se" locator-type="email">dalevi@chalmers.se</inter-ref>; <inter-ref locator="erik.kristiansson@zool.gu.se" locator-type="email">erik.kristiansson@zool.gu.se</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp508/DC1" locator-type="url">supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Kristiansson, E., Hugenholtz, P., Dalevi, D.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp508</dc:identifier>
<dc:title><![CDATA[ShotgunFunctionalizeR: an R-package for functional comparison of metagenomes]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2738</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2737</prism:startingPage>
<prism:section>SEQUENCE ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2739?rss=1">
<title><![CDATA[Retrieve-ensembl-seq: user-friendly and large-scale retrieval of single or multi-genome sequences from Ensembl]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2739?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> The preparation of an appropriate sequence dataset is the starting point of all genomic analyses. We present <I>retrieve-ensembl-seq</I>, an application that considerably eases the retrieval of sequences from the Ensembl database, via our user-friendly web site or web services. The user provides Ensembl identifiers or gene names, and the program returns corresponding upstream, downstream, intronic, exonic, UTR or whole gene sequences. <I>retrieve-ensembl-seq</I> also offers a multiple organism mode to retrieve sequences from homologous genes at any taxonomical level. And we introduce various original filters such as the masking of coding fragments and the avoidance of sequence redundancy for genes with multiple transcripts. <I>retrieve-ensembl-seq</I> is included in the software suite regulatory sequence analysis tools (RSAT), allowing instant submission of retrieved sequences to further analysis tools.</p>
<p><b>Availability:</b> <I>retrieve-ensembl-seq</I> is integrated in the RSAT suite: <inter-ref locator="http://rsat.ulb.ac.be/rsat" locator-type="url">http://rsat.ulb.ac.be/rsat</inter-ref>. Web site: <inter-ref locator="http://rsat.ulb.ac.be/rsat/retrieve-ensembl-seq_form.cgi" locator-type="url">http://rsat.ulb.ac.be/rsat/retrieve-ensembl-seq_form.cgi</inter-ref>. Web services: <inter-ref locator="http://rsat.ulb.ac.be/rsat/web_services/RSATWS.wsdl" locator-type="url">http://rsat.ulb.ac.be/rsat/web_services/RSATWS.wsdl</inter-ref>. Stand-alone distribution: freely available under an academic licence to download from the RSAT web site. The complete manual, a convenient tutorial and demos are available from the RSAT website. Additional help can be found on the RSAT public forum.</p>
<p><b>Contact:</b> <inter-ref locator="oly@bigre.ulb.ac.be" locator-type="email">oly@bigre.ulb.ac.be</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Sand, O., Thomas-Chollier, M., van Helden, J.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp519</dc:identifier>
<dc:title><![CDATA[Retrieve-ensembl-seq: user-friendly and large-scale retrieval of single or multi-genome sequences from Ensembl]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2740</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2739</prism:startingPage>
<prism:section>SEQUENCE ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2741?rss=1">
<title><![CDATA[massXpert 2: a cross-platform software environment for polymer chemistry modelling and simulation/analysis of mass spectrometric data]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2741?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> Since the middle of the 90s, mass spectrometry has evolved into an almost indispensable tool in structural studies on an ever-growing variety of (bio-)polymers, of which proteins, sugars and nucleic acids are the most prominent. Since the first public release of <I>massXpert</I>, the advances of mass spectrometry have motivated continuous and thorough maintenance of that software, in the form of two full software rewrites, culminating with <I>massXpert 2</I>, which we describe in this report. We shall describe the profound changes in <I>massXpert</I> that were performed so as to keep up with the technical advances in mass spectrometry since a decade.</p>
<p><b>Availability:</b> The <I>massXpert 2</I> software is an open source and free software project hosted at <inter-ref locator="http://www.massxpert.org" locator-type="url">http://www.massxpert.org</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="rusconi@mnhn.fr" locator-type="email">rusconi@mnhn.fr</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp504/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Rusconi, F.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp504</dc:identifier>
<dc:title><![CDATA[massXpert 2: a cross-platform software environment for polymer chemistry modelling and simulation/analysis of mass spectrometric data]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2742</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2741</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2743?rss=1">
<title><![CDATA[PiSQRD: a web server for decomposing proteins into quasi-rigid dynamical domains]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2743?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> The PiSQRD web resource can be used to subdivide protein structures in quasi-rigid dynamical domains. The latter are groups of amino acids behaving as approximately rigid units in the course of protein equilibrium fluctuations. The PiSQRD server takes as input a biomolecular structure and the desired fraction of protein internal fluctuations that must be accounted for by the relative rigid-body motion of the dynamical domains. Next, the lowest energy modes of fluctuation of the protein (optionally provided by the user) are calculated and used to identify the rigid subunits. The resulting optimal subdivision is returned through a web page containing both interactive graphics and detailed data output.</p>
<p><b>Availability:</b> The PiSQRD web server, which requires Java, is available free of charge for academic users at <inter-ref locator="http://pisqrd.escience-lab.org" locator-type="url">http://pisqrd.escience-lab.org</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="potestio@sissa.it" locator-type="email">potestio@sissa.it</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Aleksiev, T., Potestio, R., Pontiggia, F., Cozzini, S., Micheletti, C.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp512</dc:identifier>
<dc:title><![CDATA[PiSQRD: a web server for decomposing proteins into quasi-rigid dynamical domains]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2744</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2743</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2745?rss=1">
<title><![CDATA[ANCHOR: web server for predicting protein binding regions in disordered proteins]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2745?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> ANCHOR is a web-based implementation of an original method that takes a single amino acid sequence as an input and predicts protein binding regions that are disordered in isolation but can undergo disorder-to-order transition upon binding. The server incorporates the result of a general disorder prediction method, IUPred and can carry out simple motif searches as well.</p>
<p><b>Availability:</b> The web server is available at <inter-ref locator="http://anchor.enzim.hu" locator-type="url">http://anchor.enzim.hu</inter-ref>. The program package is freely available for academic users.</p>
<p><b>Contact:</b> <inter-ref locator="zsuzsa@enzim.hu" locator-type="email">zsuzsa@enzim.hu</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Dosztanyi, Z., Meszaros, B., Simon, I.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp518</dc:identifier>
<dc:title><![CDATA[ANCHOR: web server for predicting protein binding regions in disordered proteins]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2746</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2745</prism:startingPage>
<prism:section>STRUCTURAL BIOINFORMATICS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2747?rss=1">
<title><![CDATA[PopABC: a program to infer historical demographic parameters]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2747?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> PopABC is a computer package for inferring the pattern of demographic divergence of closely related populations and species. The software performs coalescent simulation in the framework of approximate Bayesian computation (ABC). PopABC can also be used to perform Bayesian model choice to discriminate between different demographic scenarios. The program can be used either for research or for education and teaching purposes.</p>
<p><b>Availability and Implementation:</b> Source code and binaries are freely available at <inter-ref locator="http://www.reading.ac.uk/~sar05sal/software.htm" locator-type="url">http://www.reading.ac.uk/~sar05sal/software.htm</inter-ref>. The program was implemented in C and can run on UNIX, MacOSX and Windows operating systems.</p>
<p><b>Contact:</b> <inter-ref locator="joao.lopes@reading.ac.uk" locator-type="email">joao.lopes@reading.ac.uk</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp487/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Lopes, J. S., Balding, D., Beaumont, M. A.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp487</dc:identifier>
<dc:title><![CDATA[PopABC: a program to infer historical demographic parameters]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2749</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2747</prism:startingPage>
<prism:section>GENETICS AND POPULATION ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2750?rss=1">
<title><![CDATA[GRIMP: a web- and grid-based tool for high-speed analysis of large-scale genome-wide association using imputed data]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2750?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> The current fast growth of genome-wide association studies (GWAS) combined with now common computationally expensive imputation requires the online access of large user groups to high-performance computing resources capable of analyzing rapidly and efficiently millions of genetic markers for ten thousands of individuals. Here, we present a web-based interface&mdash;called GRIMP&mdash;to run publicly available genetic software for extremely large GWAS on scalable super-computing grid infrastructures. This is of major importance for the enlargement of GWAS with the availability of whole-genome sequence data from the 1000 Genomes Project and for future whole-population efforts.</p>
<p><b>Contact:</b> <inter-ref locator="ta.knoch@taknoch.org" locator-type="email">ta.knoch@taknoch.org</inter-ref>; <inter-ref locator="f.rivadeneira@erasmusmc.nl" locator-type="email">f.rivadeneira@erasmusmc.nl</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Estrada, K., Abuseiris, A., Grosveld, F. G., Uitterlinden, A. G., Knoch, T. A., Rivadeneira, F.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:51 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp497</dc:identifier>
<dc:title><![CDATA[GRIMP: a web- and grid-based tool for high-speed analysis of large-scale genome-wide association using imputed data]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2752</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2750</prism:startingPage>
<prism:section>GENETICS AND POPULATION ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2753?rss=1">
<title><![CDATA[CoCoa: a software tool for estimating the coefficient of coancestry from multilocus genotype data]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2753?rss=1</link>
<description><![CDATA[
<p><b>Motivation:</b> Phenotypic data collected in breeding programs and marker-trait association studies are often analyzed by means of linear mixed models. In these models, the covariance between the genetic background effects of all genotypes under study is modeled by means of pairwise coefficients of coancestry. Several marker-based coancestry estimation procedures allow to estimate this covariance matrix, but generally introduce a certain amount of bias when the examined genotypes are part of a breeding program. CoCoa implements the most commonly used marker-based coancestry estimation procedures and as such, allows to select the best fitting covariance structure for the phenotypic data at hand. This better model fit translates into an increased power and improved type I error control in association studies and an improved accuracy in phenotypic prediction studies. The presented software package also provides an implementation of the new Weighted Alikeness in State (WAIS) estimator for use in hybrid breeding programs. Besides several matrix manipulation tools, CoCoa implements two different bending heuristics, in case the inverse of an ill-conditioned coancestry matrix estimate is needed.</p>
<p><b>Availability and Implementation:</b> The software package CoCoa is freely available at <inter-ref locator="http://webs.hogent.be/cocoa" locator-type="url">http://webs.hogent.be/cocoa</inter-ref>. Source code, manual, binaries for 32 and 64-bit Linux systems and an installer for Microsoft Windows are provided. The core components of CoCoa are written in C++, while the graphical user interface is written in Java.</p>
<p><b>Contact:</b> <inter-ref locator="steven.maenhout@hogent.be" locator-type="email">steven.maenhout@hogent.be</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Maenhout, S., De Baets, B., Haesaert, G.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp499</dc:identifier>
<dc:title><![CDATA[CoCoa: a software tool for estimating the coefficient of coancestry from multilocus genotype data]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2754</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2753</prism:startingPage>
<prism:section>GENETICS AND POPULATION ANALYSIS</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2755?rss=1">
<title><![CDATA[FBA-SimVis: interactive visualization of constraint-based metabolic models]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2755?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> FBA-SimVis is a VANTED plug-in for the constraint-based analysis of metabolic models with special focus on the visual exploration of metabolic flux data resulting from model analysis. The program provides a user-friendly environment for model reconstruction, constraint-based model analysis, and interactive visualization of the simulation results. With the ability to quantitatively analyse metabolic fluxes in an interactive and visual manner, FBA-SimVis supports a comprehensive understanding of constraint-based metabolic flux models in both overview and detail.</p>
<p><b>Availability:</b> Software with manual and tutorials are freely available at <inter-ref locator="http://fbasimvis.ipk-gatersleben.de/" locator-type="url">http://fbasimvis.ipk-gatersleben.de/</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="grafahr@ipk-gatersleben.de" locator-type="email">grafahr@ipk-gatersleben.de</inter-ref></p>
<p><b>Supplementary information:</b> Examples and <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp408/DC1" locator-type="url">supplementary data</inter-ref> are available at <inter-ref locator="http://fbasimvis.ipk-gatersleben.de/" locator-type="url">http://fbasimvis.ipk-gatersleben.de/</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Grafahrend-Belau, E., Klukas, C., Junker, B. H., Schreiber, F.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp408</dc:identifier>
<dc:title><![CDATA[FBA-SimVis: interactive visualization of constraint-based metabolic models]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2757</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2755</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2758?rss=1">
<title><![CDATA[FRED--a framework for T-cell epitope detection]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2758?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> Over the last decade, immunoinformatics has made significant progress. Computational approaches, in particular the prediction of T-cell epitopes using machine learning methods, are at the core of modern vaccine design. Large-scale analyses and the integration or comparison of different methods become increasingly important. We have developed FRED, an extendable, open source software framework for key tasks in immunoinformatics. In this, its first version, FRED offers easily accessible prediction methods for MHC binding and antigen processing as well as general infrastructure for the handling of antigen sequence data and epitopes. FRED is implemented in Python in a modular way and allows the integration of external methods.</p>
<p><b>Availability:</b> FRED is freely available for download at <inter-ref locator="http://www-bs.informatik.uni-tuebingen.de/Software/FRED" locator-type="url">http://www-bs.informatik.uni-tuebingen.de/Software/FRED</inter-ref>.</p>
<p><b>Contact:</b> <inter-ref locator="feldhahn@informatik.uni-tuebingen.de" locator-type="email">feldhahn@informatik.uni-tuebingen.de</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Feldhahn, M., Donnes, P., Thiel, P., Kohlbacher, O.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp409</dc:identifier>
<dc:title><![CDATA[FRED--a framework for T-cell epitope detection]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2759</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2758</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2760?rss=1">
<title><![CDATA[Caleydo: connecting pathways and gene expression]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2760?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> Understanding the relationships between pathways and the altered expression of their components in disease conditions can be addressed in a visual data analysis process. Caleydo uses novel visualization techniques to support life science experts in their analysis of gene expression data in the context of pathways and functions of individual genes. Pathways and gene expression visualizations are placed in a 3D scene where selected entities (i.e. genes) are visually connected. This allows Caleydo to seamlessly integrate interactive gene expression visualization with cross-database pathway exploration.</p>
<p><b>Availability:</b> The Caleydo visualization framework is freely available on <inter-ref locator="www.caleydo.org" locator-type="url">www.caleydo.org</inter-ref> for non-commercial use. It runs on Windows and Linux and requires a 3D capable graphics card.</p>
<p><b>Contact:</b> <inter-ref locator="caleydo@icg.tugraz.at" locator-type="email">caleydo@icg.tugraz.at</inter-ref>; <inter-ref locator="streit@icg.tugraz.at" locator-type="email">streit@icg.tugraz.at</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp432/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Streit, M., Lex, A., Kalkusch, M., Zatloukal, K., Schmalstieg, D.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp432</dc:identifier>
<dc:title><![CDATA[Caleydo: connecting pathways and gene expression]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2761</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2760</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2762?rss=1">
<title><![CDATA[The SNP ratio test: pathway analysis of genome-wide association datasets]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2762?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> We present a tool that assesses the enrichment of significant associations from genome-wide association studies (GWAS) in a pathway context. The SNP ratio test (SRT) compares the proportion of significant to all SNPs within genes that are part of a pathway and computes an empirical <I>P</I>-value based on comparisons to ratios in datasets where the assignment of case/control status has been randomized. We applied the SRT to a Parkinson's disease GWAS dataset, using the KEGG database, revealing significance for Parkinson's disease and related pathways.</p>
<p><b>Availability:</b> <inter-ref locator="https://sourceforge.net/projects/snpratiotest/" locator-type="url">https://sourceforge.net/projects/snpratiotest/</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="codushlaine@gmail.com" locator-type="email">codushlaine@gmail.com</inter-ref>; <inter-ref locator="colm.odushlaine@tcd.ie" locator-type="email">colm.odushlaine@tcd.ie</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp448/DC1" locator-type="url">Supplementary data</inter-ref> are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[O'Dushlaine, C., Kenny, E., Heron, E. A., Segurado, R., Gill, M., Morris, D. W., Corvin, A.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp448</dc:identifier>
<dc:title><![CDATA[The SNP ratio test: pathway analysis of genome-wide association datasets]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2763</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2762</prism:startingPage>
<prism:section>SYSTEMS BIOLOGY</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2764?rss=1">
<title><![CDATA[Expertomica metabolite profiling: getting more information from LC-MS using the stochastic systems approach]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2764?rss=1</link>
<description><![CDATA[
<p>Mass spectrometers are sophisticated, fine instruments which are essential in a variety applications. However, the data they produce are usually interpreted in a rather primitive way, without considering the accuracy of this data and the potential errors in identifying peaks. Our new approach corrects this situation by dividing the LC-MS output into three components: (i) signature of the analyte, (ii) random noise and (iii) systemic noise. The systemic noise is related to the instrument and to the particular experiment; its characteristics change in time and depend on the analyzed substance. Working with these components allows us to quantify the probability of peak errors and, at the same time, to retrieve some peaks which get lost in the noise when using the existing methods. Our software tool, Expertomica metabolite profiling, automatically evaluates the given instrument, detects compounds and calculates the probability of individual peaks. It does not need any artificial user-defined parameters or thresholds.</p>
<p><b>Availability:</b> MATLAB scripts with a simple graphical user interface are free to download from <inter-ref locator="http://sourceforge.net/projects/expertomica-eda/" locator-type="url">http://sourceforge.net/projects/expertomica-eda/</inter-ref>. The software reads data exported by most Thermo and Agilent spectrometers, and it can also read the more general JCAMP-DX ASCII format. Other formats will be supported on request, assuming that the user can provide representative data samples.</p>
<p><b>Contact:</b> <inter-ref locator="urban@greentech.cz" locator-type="email">urban@greentech.cz</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Urban, J., Vanek, J., Soukup, J., Stys, D.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp427</dc:identifier>
<dc:title><![CDATA[Expertomica metabolite profiling: getting more information from LC-MS using the stochastic systems approach]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2767</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2764</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2768?rss=1">
<title><![CDATA[A System for Information Management in BioMedical Studies--SIMBioMS]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2768?rss=1</link>
<description><![CDATA[
<p><b>Summary:</b> SIMBioMS is a web-based open source software system for managing data and information in biomedical studies. It provides a solution for the collection, storage, management and retrieval of information about research subjects and biomedical samples, as well as experimental data obtained using a range of high-throughput technologies, including gene expression, genotyping, proteomics and metabonomics. The system can easily be customized and has proven to be successful in several large-scale multi-site collaborative projects. It is compatible with emerging functional genomics data standards and provides data import and export in accepted standard formats. Protocols for transferring data to durable archives at the European Bioinformatics Institute have been implemented.</p>
<p><b>Availability:</b> The source code, documentation and initialization scripts are available at <inter-ref locator="http://simbioms.org." locator-type="url">http://simbioms.org.</inter-ref></p>
<p><b>Contact:</b> <inter-ref locator="support@simbioms.org" locator-type="email">support@simbioms.org</inter-ref>; <inter-ref locator="mariak@ebi.ac.uk" locator-type="email">mariak@ebi.ac.uk</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Krestyaninova, M., Zarins, A., Viksna, J., Kurbatova, N., Rucevskis, P., Neogi, S. G., Gostev, M., Perheentupa, T., Knuuttila, J., Barrett, A., Lappalainen, I., Rung, J., Podnieks, K., Sarkans, U., McCarthy, M. I, Brazma, A.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp420</dc:identifier>
<dc:title><![CDATA[A System for Information Management in BioMedical Studies--SIMBioMS]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2769</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2768</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2770?rss=1">
<title><![CDATA[Comment on 'MeSH-up: effective MeSH text classification for improved document retrieval']]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2770?rss=1</link>
<description><![CDATA[
<p><b>Contact:</b> <inter-ref locator="neveola@ncbi.nlm.nih.gov" locator-type="email">neveola@ncbi.nlm.nih.gov</inter-ref></p>
<p><b>Supplementary information:</b> <inter-ref locator="http://bioinformatics.oxfordjournals.org/cgi/content/full/btp483/DC1" locator-type="url">Supplementary data </inter-ref>are available at <I>Bioinformatics</I> online.</p>
]]></description>
<dc:creator><![CDATA[Neveol, A., Mork, J. G., Aronson, A. R.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp483</dc:identifier>
<dc:title><![CDATA[Comment on 'MeSH-up: effective MeSH text classification for improved document retrieval']]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2771</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2770</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2772?rss=1">
<title><![CDATA[Response to comment on 'MeSH-up: effective MeSH text classification for improved document retrieval']]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2772?rss=1</link>
<description><![CDATA[
<p><b>Contact:</b> <inter-ref locator="trieschn@ewi.utwente.nl" locator-type="email">trieschn@ewi.utwente.nl</inter-ref>; <inter-ref locator="dolf@trieschnigg.nl" locator-type="email">dolf@trieschnigg.nl</inter-ref></p>
<p>As developers and primary users of MTI and MetaMap, N&eacute;v&eacute;ol <I>et al.</I> made a number of interesting comments on our recent publication in <I>Bioinformatics</I>. However, some of the results and conclusions found in the reply seem premature and lack proper clarification.</p>
]]></description>
<dc:creator><![CDATA[Trieschnigg, D., Pezik, P., Lee, V., de Jong, F., Kraaij, W., Rebholz-Schuhmann, D.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp484</dc:identifier>
<dc:title><![CDATA[Response to comment on 'MeSH-up: effective MeSH text classification for improved document retrieval']]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2772</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2772</prism:startingPage>
<prism:section>DATA AND TEXT MINING</prism:section>
</item>

<item rdf:about="http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2773?rss=1">
<title><![CDATA[Corrigendum for Elliott,B. et al., 'PathCase pathways database system', Bioinformatics, Nov. 2008, 24(21), pp. 2526-2533]]></title>
<link>http://bioinformatics.oxfordjournals.org/cgi/content/short/25/20/2773?rss=1</link>
<description><![CDATA[
<p>Contact: <inter-ref locator="tekin@case.edu" locator-type="email">tekin@case.edu</inter-ref></p>
]]></description>
<dc:creator><![CDATA[Elliott, B., Kirac, M., Cakmak, A., Yavas, G., Mayes, S., Cheng, E., Wang, Y., Gupta, C., Ozsoyoglu, G., Ozsoyoglu, Z. M.]]></dc:creator>
<dc:date>Thu, 08 Oct 2009 22:47:52 PDT</dc:date>
<dc:identifier>info:doi/10.1093/bioinformatics/btp520</dc:identifier>
<dc:title><![CDATA[Corrigendum for Elliott,B. et al., 'PathCase pathways database system', Bioinformatics, Nov. 2008, 24(21), pp. 2526-2533]]></dc:title>
<dc:publisher>Oxford University Press</dc:publisher>
<prism:number>20</prism:number>
<prism:volume>25</prism:volume>
<prism:endingPage>2773</prism:endingPage>
<prism:publicationDate>2009-10-15</prism:publicationDate>
<prism:startingPage>2773</prism:startingPage>
<prism:section>DATABASES AND ONTOLOGIES</prism:section>
</item>

</rdf:RDF>