<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/archiving/1.2/JATS-archivearticle1.dtd">
<article article-type="brief-report" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-title-group>
        <journal-title>microPublication Biology</journal-title>
      </journal-title-group>
      <issn pub-type="epub">2578-9430</issn>
      <publisher>
        <publisher-name>Caltech Library</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.17912/micropub.biology.000371</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>New Finding</subject>
        </subj-group>
        <subj-group subj-group-type="subject">
          <subject>Genotype Data</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>Drosophila</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>
          <italic>Drosophila grimshawi</italic>
           &amp;#x2013; 
          <italic>Rheb</italic>
        </article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <name>
            <surname>Rele</surname>
            <given-names>Chinmay P.</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">1</xref>
          <xref ref-type="corresp" rid="cor1">§</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Williams</surname>
            <given-names>Jared</given-names>
          </name>
          <xref ref-type="aff" rid="aff2">2</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Reed</surname>
            <given-names>Laura K</given-names>
          </name>
          <xref ref-type="aff" rid="aff1">1</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Youngblom</surname>
            <given-names>James J</given-names>
          </name>
          <xref ref-type="aff" rid="aff2">2</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Leung</surname>
            <given-names>Wilson</given-names>
          </name>
          <xref ref-type="aff" rid="aff3">3</xref>
        </contrib>
        <aff id="aff1">
          <label>1</label>
          The University of Alabama, Tuscaloosa, AL 35487 
        </aff>
        <aff id="aff2">
          <label>2</label>
          California State University Stanislaus, Turlock, CA 95382 
        </aff>
        <aff id="aff3">
          <label>3</label>
          Washington University in St. Louis, St. Louis, MO 63130
        </aff>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Price</surname>
            <given-names>Donald</given-names>
          </name>
        </contrib>
      </contrib-group>
      <author-notes>
        <corresp id="cor1">
          <label>§</label>
          Correspondence to: Chinmay P. Rele (
          <email>cprele@ua.edu</email>
          )
        </corresp>
        <fn fn-type="con">
          <p>CR: Data curation, Software, Validation, Visualization, Writing - original draft, Writing - review and editing, Formal analysis, Investigation</p>
          <p>JW: Formal analysis, Investigation, Writing - original draft</p>
          <p>LR: Supervision, Funding acquisition, Conceptualization, Project administration</p>
          <p>JY: Supervision, Writing - review and editing</p>
          <p>WL: Data curation, Software, Validation, Visualization, Writing - review and editing</p>
        </fn>
      </author-notes>
      <pub-date date-type="pub" publication-format="electronic">
        <day>16</day>
        <month>2</month>
        <year>2021</year>
      </pub-date>
      <pub-date date-type="collection" publication-format="electronic">
        <year>2021</year>
      </pub-date>
      <volume>2021</volume>
      <elocation-id>10.17912/micropub.biology.000371</elocation-id>
      <history>
        <date date-type="received">
          <day>9</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>28</day>
          <month>1</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>31</day>
          <month>1</month>
          <year>2021</year>
        </date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2021 by the authors</copyright-statement>
        <copyright-year>2021</copyright-year>
        <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
        </license>
      </permissions>
    </article-meta>
  </front>
  <body>
    <fig position="anchor" id="f1">
      <label>Figure 1</label>
      <caption>
        <p>
          (A) Synteny of genomic neighborhood of 
          <italic>Rheb</italic>
           in both 
          <italic>D. melanogaster </italic>
          as well as 
          <italic>D. grimshawi</italic>
          . (B) Gene Model in Apollo: A screenshot of the Apollo instance housing the gene model, containing student annotations, Dmel proteins, Gnomon annotations, transdecoder genes, RNA-Seq tracks and splice junctions; (C) Dot Plot of gene in 
          <italic>D. melanogaster</italic>
           (
          <italic>x</italic>
          -axis) vs. the gene in 
          <italic>D. grimshawi </italic>
          (
          <italic>y</italic>
          -axis); (D) Low sequence conservation near the start of the third coding exon, which is more obvious in other species, but still existent in 
          <italic>D. grimshawi</italic>
          .
        </p>
      </caption>
      <graphic xlink:href="25789430-2021-micropub.biology.000371"/>
    </fig>
    <sec>
      <title>Description</title>
      <p>
        <underline>Introduction</underline>
      </p>
      <p>
        The Ras homolog enriched in brain (
        <italic>Rheb</italic>
        ) encodes a Ras homolog (Karassek 
        <italic>et al.</italic>
         2010). Ras is family of genes that make proteins involved in cell signaling pathways that control cell growth and cell death (Banerjee and Resat 2016).
        <italic/>
        The gene model reported here (dgri_Rheb) was developed for the May 2011 assembly of 
        <italic>D. grimshawi </italic>
        Agencourt dgri_caf1/DgriCAF1 (GCA_000005155.1) to describe the ortholog to 
        <italic>D. melanogaster Rheb</italic>
        (FBgn0041191) at the locus previously annotated as XM_001989756.1. The general protocol and datasets for the genome browser tracks used to establish this reported gene model are reported in Rele 
        <italic>et al.</italic>
         2020. Additional tools and resources used in generating and confirming this model include HISAT (Kim 
        <italic>et al.</italic>
         2015), BEDTools (Quinlan 
        <italic>et al.</italic>
         2010), and the Sequence Read Archive (trace.ncbi.nlm.nih.gov/Traces/sra/?study=SRP073087)
        <italic>.</italic>
      </p>
      <p>
        <underline>Synteny</underline>
      </p>
      <p>
        The 
        <italic>Rheb</italic>
         gene on chromosome 3R in 
        <italic>D. melanogaster</italic>
         is surrounded by the genes 
        <italic>CG12746</italic>
        , 
        <italic>CG2931</italic>
        , 
        <italic>CRMP</italic>
        , and 
        <italic>CG2926</italic>
        . Upon a 
        <italic>tblastn</italic>
         search, the 
        <italic>Rheb</italic>
         ortholog gene in 
        <italic>D. grimshawi</italic>
        , on scaffold 14906, is surrounded by the genes XM_001989754.1, XM_001989755.1, XM_001989575.1, and XM_001989576.1 (orthologous to 
        <italic>Cenp-C</italic>
         , 
        <italic>CLS</italic>
        , 
        <italic>Nup93-2</italic>
        , and 
        <italic>CG2519) </italic>
        in
        <italic> D. melanogaster</italic>
        , Figure 1A). Though none of these flanking genes appear to be orthologous between the two species, we determined this region to contain the ortholog for 
        <italic>Rheb</italic>
         in 
        <italic>D. grimshawi</italic>
         because this location had a substantially better 
        <italic>blastp</italic>
         hit to the 
        <italic>Rheb</italic>
         protein sequence than to the second-best hit.
      </p>
      <p>
        <underline>Gene Model</underline>
      </p>
      <p>
        This gene model contains two isoforms of the 
        <italic>Rheb</italic>
         protein in 
        <italic>D. grimshawi</italic>
        , Rheb-PA and &amp;#xAD;Rheb-PB (Figure 1B). Each of these isoforms contains five identical coding exons. The model in 
        <italic>D. melanogaste</italic>
        r and 
        <italic>D. grimshawi</italic>
         have the same length and number of exons, and are similar in peptide sequence. However, there is a dissimilarity at the start of the third exon; but the peptides replacing the ones in 
        <italic>D. melanogaster</italic>
         have similar properties. The coordinates of the corrected gene model can be found in NCBI at GenBank/BankIt using the accession BK014396 and archived in CaltechData 
        <ext-link ext-link-type="uri" xlink:href="https://data.caltech.edu/records/1884">here</ext-link>
        .
      </p>
      <p>
        <underline>Special Characters of Gene Model</underline>
      </p>
      <p>
        <italic>Improper alignment at start of coding exon three</italic>
        : As shown in Figure 1D, there is a stretch of amino acids (Figure 1D) that are not identical (black color), but similar (gray/white), between 
        <italic>D. melanogaster</italic>
         and 
        <italic>D. grimshawi</italic>
        . This pattern is also evident in a few other species as compared to 
        <italic>D. melanogaster</italic>
         (Figure 1D). Though this is more obvious in 
        <italic>D. kikkawai, D. serrata, D. obscura, D. pseudoobscura, D. persimilis</italic>
        , and
        <italic> D. miranda </italic>
        (Figure 1D) as compared to 
        <italic>D. grimshawi</italic>
         (Figure 1D), it nonetheless exists.
      </p>
      <p>
        <italic>Changes in the splice donor site for coding exon four</italic>
        : Rheb-PA in 
        <italic>D. grimshawi </italic>
        has a canonical GT splice donor site at the end of coding exon four. In contrast, the end of coding exon four of Rheb-PA in 
        <italic>D. melanogaster</italic>
        , and in most of the other 
        <italic>Drosophila</italic>
         species across the genus 
        <italic>Sophophora</italic>
        , use a non-canonical GC splice donor site.
      </p>
      <p>Extended data:</p>
      <p>
        Fasta (.faa and .fna) and GFF files are archived and available on CaltechData:

        <ext-link ext-link-type="uri" xlink:href="https://data.caltech.edu/records/1884">D_grimshawi_Rheb_geneModel_gff_faa_fna</ext-link>
        .
This file contains
      </p>
      <list list-type="bullet">
        <list-item>
          <p>
            Peptide Sequence of 
            <italic>Rheb</italic>
             in 
            <italic>D. grimshawi</italic>
          </p>
        </list-item>
        <list-item>
          <p>
            Nucleotide Sequence of 
            <italic>Rheb</italic>
             in 
            <italic>D. grimshawi</italic>
          </p>
        </list-item>
        <list-item>
          <p>
            GFF of 
            <italic>Rheb</italic>
             in 
            <italic>D. grimshawi</italic>
          </p>
        </list-item>
      </list>
    </sec>
  </body>
  <back>
    <ack>
      <sec>
        <title>Acknowledgments</title>
        <p>this.convertHTML(ack)</p>
      </sec>
      <sec>
        <title>Funding</title>
        <p>This material is based upon work supported by the National Science Foundation under Grant No. IUSE-1915544 to LKR and the National Institute of General Medical Sciences of the National Institute of Health Award R25GM130517 to LKR. The Genomics Education Partnership is fully financed by Federal moneys. The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health.</p>
      </sec>
    </ack>
    <ref-list>
      <ref id="R1">
        <mixed-citation>Aspuria P. J., and F. Tamanoi, 2004. The Rheb family of GTP-binding proteins. Cell. Signal. Volume 16, Issue 10: 1105-1112.</mixed-citation>
      </ref>
      <ref id="R2">
        <mixed-citation>Banerjee K. , Resat H. 2016. Constitutive activation of STAT3 in breast cancer cells: A review. Int. J. Cancer 138: 2570&amp;#x2013;2578</mixed-citation>
      </ref>
      <ref id="R3">
        <mixed-citation>Karassek S., C. Berghaus, M. Schwarten, C. G. Goemans, N. Ohse, et al. 2010. Ras homolog enriched in brain (Rheb) enhances apoptotic signaling. J. Biol. Chem. 285: 33979&amp;#x2013;91</mixed-citation>
      </ref>
      <ref id="R4">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kim</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Langmead</surname>
              <given-names>B</given-names>
            </name>
            <name>
              <surname>Salzberg</surname>
              <given-names>SL</given-names>
            </name>
          </person-group>
          <year>2015</year>
          <month>3</month>
          <day>9</day>
          <article-title>HISAT: a fast spliced aligner with low memory requirements.</article-title>
          <source>Nat Methods</source>
          <volume>12</volume>
          <issue>4</issue>
          <issn>1548-7091</issn>
          <fpage>357</fpage>
          <lpage>360}</lpage>
          <pub-id pub-id-type="doi">10.1038/nmeth.3317</pub-id>
          <pub-id pub-id-type="pmid">25751142</pub-id>
        </element-citation>
      </ref>
      <ref id="R5">
        <mixed-citation>NCBI Expression Archives &amp;#x201C;Sequence Read Archive : NCBI/NLM/NIH.&amp;#x201D; National Center for Biotechnology Information, U.S. National Library of Medicine, trace.ncbi.nlm.nih.gov/Traces/sra/?study=SRP073087</mixed-citation>
      </ref>
      <ref id="R6">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Quinlan</surname>
              <given-names>AR</given-names>
            </name>
            <name>
              <surname>Hall</surname>
              <given-names>IM</given-names>
            </name>
          </person-group>
          <year>2010</year>
          <month>1</month>
          <day>28</day>
          <article-title>BEDTools: a flexible suite of utilities for comparing genomic features.</article-title>
          <source>Bioinformatics</source>
          <volume>26</volume>
          <issue>6</issue>
          <issn>1367-4803</issn>
          <fpage>841</fpage>
          <lpage>842}</lpage>
          <pub-id pub-id-type="doi">10.1093/bioinformatics/btq033</pub-id>
          <pub-id pub-id-type="pmid">20110278</pub-id>
        </element-citation>
      </ref>
      <ref id="R7">
        <mixed-citation>Rele CP, Sandlin KM, Leung W, Reed LK. 2020. Manual annotation of genes within drosophila species: the genomics education partnership protocol. bioRxiv: 2020.12.10.420521.</mixed-citation>
      </ref>
    </ref-list>
  </back>
</article>