<html xmlns:v="urn:schemas-microsoft-com:vml" xmlns:o="urn:schemas-microsoft-com:office:office" xmlns:w="urn:schemas-microsoft-com:office:word" xmlns:x="urn:schemas-microsoft-com:office:excel" xmlns:p="urn:schemas-microsoft-com:office:powerpoint" xmlns:a="urn:schemas-microsoft-com:office:access" xmlns:dt="uuid:C2F41010-65B3-11d1-A29F-00AA00C14882" xmlns:s="uuid:BDC6E3F0-6DA3-11d1-A2A3-00AA00C14882" xmlns:rs="urn:schemas-microsoft-com:rowset" xmlns:z="#RowsetSchema" xmlns:b="urn:schemas-microsoft-com:office:publisher" xmlns:ss="urn:schemas-microsoft-com:office:spreadsheet" xmlns:c="urn:schemas-microsoft-com:office:component:spreadsheet" xmlns:odc="urn:schemas-microsoft-com:office:odc" xmlns:oa="urn:schemas-microsoft-com:office:activation" xmlns:html="http://www.w3.org/TR/REC-html40" xmlns:q="http://schemas.xmlsoap.org/soap/envelope/" xmlns:rtc="http://microsoft.com/officenet/conferencing" xmlns:D="DAV:" xmlns:Repl="http://schemas.microsoft.com/repl/" xmlns:mt="http://schemas.microsoft.com/sharepoint/soap/meetings/" xmlns:x2="http://schemas.microsoft.com/office/excel/2003/xml" xmlns:ppda="http://www.passport.com/NameSpace.xsd" xmlns:ois="http://schemas.microsoft.com/sharepoint/soap/ois/" xmlns:dir="http://schemas.microsoft.com/sharepoint/soap/directory/" xmlns:ds="http://www.w3.org/2000/09/xmldsig#" xmlns:dsp="http://schemas.microsoft.com/sharepoint/dsp" xmlns:udc="http://schemas.microsoft.com/data/udc" xmlns:xsd="http://www.w3.org/2001/XMLSchema" xmlns:sub="http://schemas.microsoft.com/sharepoint/soap/2002/1/alerts/" xmlns:ec="http://www.w3.org/2001/04/xmlenc#" xmlns:sp="http://schemas.microsoft.com/sharepoint/" xmlns:sps="http://schemas.microsoft.com/sharepoint/soap/" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:udcs="http://schemas.microsoft.com/data/udc/soap" xmlns:udcxf="http://schemas.microsoft.com/data/udc/xmlfile" xmlns:udcp2p="http://schemas.microsoft.com/data/udc/parttopart" xmlns:wf="http://schemas.microsoft.com/sharepoint/soap/workflow/" xmlns:dsss="http://schemas.microsoft.com/office/2006/digsig-setup" xmlns:dssi="http://schemas.microsoft.com/office/2006/digsig" xmlns:mdssi="http://schemas.openxmlformats.org/package/2006/digital-signature" xmlns:mver="http://schemas.openxmlformats.org/markup-compatibility/2006" xmlns:m="http://schemas.microsoft.com/office/2004/12/omml" xmlns:mrels="http://schemas.openxmlformats.org/package/2006/relationships" xmlns:spwp="http://microsoft.com/sharepoint/webpartpages" xmlns:ex12t="http://schemas.microsoft.com/exchange/services/2006/types" xmlns:ex12m="http://schemas.microsoft.com/exchange/services/2006/messages" xmlns:pptsl="http://schemas.microsoft.com/sharepoint/soap/SlideLibrary/" xmlns:spsl="http://microsoft.com/webservices/SharePointPortalServer/PublishedLinksService" xmlns:Z="urn:schemas-microsoft-com:" xmlns:tax="http://schemas.microsoft.com/sharepoint/taxonomy/soap/" xmlns:tns="http://schemas.microsoft.com/sharepoint/soap/recordsrepository/" xmlns:spsup="http://microsoft.com/webservices/SharePointPortalServer/UserProfileService" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:st="" xmlns="http://www.w3.org/TR/REC-html40">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=us-ascii">
<meta name="Generator" content="Microsoft Word 14 (filtered medium)">
<style><!--
/* Font Definitions */
@font-face
        {font-family:Calibri;
        panose-1:2 15 5 2 2 2 4 3 2 4;}
/* Style Definitions */
p.MsoNormal, li.MsoNormal, div.MsoNormal
        {margin:0cm;
        margin-bottom:.0001pt;
        font-size:11.0pt;
        font-family:"Calibri","sans-serif";
        mso-fareast-language:EN-US;}
a:link, span.MsoHyperlink
        {mso-style-priority:99;
        color:blue;
        text-decoration:underline;}
a:visited, span.MsoHyperlinkFollowed
        {mso-style-priority:99;
        color:purple;
        text-decoration:underline;}
span.EmailStyle17
        {mso-style-type:personal;
        font-family:"Calibri","sans-serif";
        color:windowtext;}
span.EmailStyle18
        {mso-style-type:personal;
        font-family:"Arial","sans-serif";
        color:black;
        font-weight:normal;
        font-style:normal;}
span.EmailStyle19
        {mso-style-type:personal-reply;
        font-family:"Calibri","sans-serif";
        color:#1F497D;}
.MsoChpDefault
        {mso-style-type:export-only;
        font-size:10.0pt;}
@page WordSection1
        {size:612.0pt 792.0pt;
        margin:72.0pt 72.0pt 72.0pt 72.0pt;}
div.WordSection1
        {page:WordSection1;}
--></style><!--[if gte mso 9]><xml>
<o:shapedefaults v:ext="edit" spidmax="1026" />
</xml><![endif]--><!--[if gte mso 9]><xml>
<o:shapelayout v:ext="edit">
<o:idmap v:ext="edit" data="1" />
</o:shapelayout></xml><![endif]-->
</head>
<body lang="EN-SG" link="blue" vlink="purple">
<div class="WordSection1">
<p class="MsoNormal" style="background:white"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">Hi Carson,<o:p></o:p></span></p>
<p class="MsoNormal" style="background:white"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"> <o:p></o:p></span></p>
<p class="MsoNormal" style="background:white"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">I am Prashant a Bioinformatics postdoctoral fellow from Prof B Venkatesh</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">’s</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">
 lab, IMCB, A*STAR. I am using </span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">MAKER-</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">tool
 to annotate an invertebrate genome (~2Gb). During annotation process, we found several instances of split genes</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG"> even though we have full-length reference
 protein sequences from very closely related species</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">. Hence we decided to look at one of the loc</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">i</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">
 to understand the reason behind it and to optimize the parameters.<o:p></o:p></span></p>
<p class="MsoNormal" style="background:white"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"><o:p> </o:p></span></p>
<p class="MsoNormal" style="background:white"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">We
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">looked at</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"> a gene ~110kb long
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">and</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"> codes for
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">a
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">~1200 amino acid protein. We have a highly identical
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">reference protein
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">(>90% identity and 100% coverage)</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG"> from
 another species</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">.
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">In addition we also have</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"> a high coverage
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">Trinity
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">transcript assembly
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">from our species</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">. Still, this gene
 is split into 4 fragments during evidence-based </span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">MAKER</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">
 run. On closer a look, we found that the above mentioned closely related protein is not aligned by exonerate (protein2genome) even though it is the closest protein to this gene in our dataset.
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">It looks like the program is giving more weightage to transcripts which are typically fragments of the gene. So we are at a loss as to how to predict
 this gene in full.</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"><o:p></o:p></span></p>
<p class="MsoNormal" style="background:white"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"><o:p> </o:p></span></p>
<p class="MsoNormal" style="background:white"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">For your reference,
</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">I am herewith enclosing</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"> maker_opts.ctl
 file and maker_bopts.ctl. I will be glad to share the scaffold sequence and other input files if required.<o:p></o:p></span></p>
<p class="MsoNormal" style="background:white"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"><o:p> </o:p></span></p>
<p class="MsoNormal" style="background:white"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG">Can you please help me to understand the reason behind MAKER not able to use</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">
 the full-length reference</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"> protein for gene prediction</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black;mso-fareast-language:EN-SG">
 and how we can overcome this problem.</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:#222222;mso-fareast-language:EN-SG"><o:p></o:p></span></p>
<p class="MsoNormal"><span style="font-size:10.0pt;font-family:"Arial","sans-serif""><o:p> </o:p></span></p>
<p class="MsoNormal"><span style="font-size:10.0pt;font-family:"Arial","sans-serif"">Thanks
<span style="color:black">for your time and help.<o:p></o:p></span></span></p>
<p class="MsoNormal"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black"><o:p> </o:p></span></p>
<p class="MsoNormal"><span style="font-size:10.0pt;font-family:"Arial","sans-serif";color:black">Best</span><span style="font-size:10.0pt;font-family:"Arial","sans-serif""> regards,<o:p></o:p></span></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal"><b><u><span lang="EN-US" style="font-size:9.0pt;color:#0E24F2;mso-fareast-language:EN-SG"><a href="mailto:prashantns@imcb.a-star.edu.sg">Prashant Shingate,
<span style="text-decoration:none">PhD</span></a></span></u></b><b><span lang="EN-US" style="font-size:9.0pt;color:#1F497D;mso-fareast-language:EN-SG">
</span></b><b><span lang="EN-US" style="font-size:9.0pt;color:black;mso-fareast-language:EN-SG">::
</span></b><b><span lang="EN-US" style="font-size:9.0pt;color:#1F497D;mso-fareast-language:EN-SG">Research Fellow :: Comparative and Medical Genomics Lab :: Institute of Molecular and Cell Biology (IMCB) :: Agency for Science, Technology and Research (A*STAR)</span></b><span style="font-size:9.0pt;color:#1F497D;mso-fareast-language:EN-SG"><o:p></o:p></span></p>
<p class="MsoNormal"><span lang="EN-US" style="font-size:9.0pt;color:#1F497D;mso-fareast-language:EN-SG">61 Biopolis Drive :: #05-04 Proteos :: Singapore 138673 :: DID (+65) 6586 9570 :: Fax (+65) 6779 1117</span><span lang="EN-US" style="font-size:9.0pt;color:#0E24F2;mso-fareast-language:EN-SG">::
<a href="http://www.imcb.a-star.edu.sg/"><span style="color:#0E24F2">http://www.imcb.a-star.edu.sg/</span></a></span><span style="font-size:9.0pt;color:#0E24F2;mso-fareast-language:EN-SG"><o:p></o:p></span></p>
<p class="MsoNormal" style="text-autospace:none"><b><span lang="EN-GB" style="font-size:9.0pt;color:red;mso-fareast-language:EN-SG">We advance science and develop innovative technology to further economic growth and improve lives. 
<o:p></o:p></span></b></p>
<p class="MsoNormal"><span style="mso-fareast-language:EN-SG"><o:p> </o:p></span></p>
<p class="MsoNormal"><o:p> </o:p></p>
</div>
<br>
<font face="Arial" color="Gray" size="1"><br>
Note: This message may contain confidential information. If this Email/Fax has been sent to you by mistake, please notify the sender and delete it immediately. Thank you.<br>
</font>
</body>
</html>