<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/archiving/1.2/JATS-archivearticle1.dtd">
<article article-type="brief-report" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-title-group>
        <journal-title>microPublication Biology</journal-title>
      </journal-title-group>
      <issn pub-type="epub">2578-9430</issn>
      <publisher>
        <publisher-name>Caltech Library</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.17912/micropub.biology.001836</article-id>
      <article-id pub-id-type="accession" assigning-authority="wormbase">WBPaper00069590</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>new finding</subject>
        </subj-group>
        <subj-group subj-group-type="subject">
          <subject>genomic</subject>
        </subj-group>
        <subj-group subj-group-type="species">
          <subject>c. elegans</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>
          Location and organization of a complex, integrated transgenic array in a 
          <italic>Caenorhabditis elegans</italic>
           strain
          <italic/>
          carrying 
          <italic>hlh-29p::gfp</italic>
        </article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <name>
            <surname>Anderson</surname>
            <given-names>Simon</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation">Investigation</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology">Methodology</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing - original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft">Writing - original draft</role>
          <xref ref-type="aff" rid="aff1">1</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Barnard-Kubow</surname>
            <given-names>Karen </given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology">Methodology</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing - review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing-review-editing">Writing - review &amp; editing</role>
          <xref ref-type="aff" rid="aff1">1</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Johnson</surname>
            <given-names>Casonya</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision">Supervision</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/onceptualization">Conceptualization</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing - review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/Writing-review-editing">Writing - review &amp; editing</role>
          <xref ref-type="aff" rid="aff1">1</xref>
          <xref ref-type="aff" rid="aff2">2</xref>
          <xref ref-type="corresp" rid="cor1">§</xref>
        </contrib>
        <aff id="aff1">
          <label>1</label>
          Biology, James Madison University
        </aff>
        <aff id="aff2">
          <label>2</label>
          Office of Integrative Activities, Research Capacity &amp; Competitiveness, National Science Foundation
        </aff>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <anonymous/>
        </contrib>
      </contrib-group>
      <author-notes>
        <corresp id="cor1">
          <label>§</label>
          Correspondence to: Casonya Johnson (
          <email>casjohns@nsf.gov</email>
          )
        </corresp>
        <fn fn-type="coi-statement">
          <p>The authors declare that there are no conflicts of interest present.</p>
        </fn>
      </author-notes>
      <pub-date date-type="pub" publication-format="electronic">
        <day>8</day>
        <month>5</month>
        <year>2026</year>
      </pub-date>
      <pub-date date-type="collection" publication-format="electronic">
        <year>2026</year>
      </pub-date>
      <volume>2026</volume>
      <elocation-id>10.17912/micropub.biology.001836</elocation-id>
      <history>
        <date date-type="received">
          <day>2</day>
          <month>9</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>24</day>
          <month>4</month>
          <year>2026</year>
        </date>
        <date date-type="accepted">
          <day>4</day>
          <month>5</month>
          <year>2026</year>
        </date>
      </history>
      <permissions>
        <copyright-statement>Copyright: © 2026 by the authors</copyright-statement>
        <copyright-year>2026</copyright-year>
        <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>This is an open-access article distributed under the terms of the Creative Commons Attribution License, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
        </license>
      </permissions>
      <abstract>
        <p>
          Hairy/Enhancer of Split (HES) proteins are critical for animal development and for the regulation of human diseases. The 
          <italic>
            <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?mode=Info&amp;id=6239">Caenorhabditis elegans</ext-link>
          </italic>
           genome encodes six HES orthologs, including 
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">HLH-29</ext-link>
          . We used Nanopore sequencing on the MinION platform to define the location and organization of an integrated transgenic array expressing green fluorescent protein driven by the 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          </italic>
           promoter. The array, 
          <italic>ardIS501</italic>
          , is at least 188.5 kb long, is inserted into Chromosome III of Bristol 
          <ext-link ext-link-type="wormbase" xlink:href="WBStrain00000001">N2</ext-link>
          , and contains at least 26 copies of 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
            p::gfp
          </italic>
           and 11 copies of 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
            (
            <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
            )
          </italic>
          . The coding sequences 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00021592">Y46E12A.2</ext-link>
            .1
          </italic>
           and 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00194738">Y46E12A.5</ext-link>
            .1
          </italic>
           are deleted in this strain, with no observable phenotypes.
        </p>
      </abstract>
      <funding-group>
        <award-group>
          <funding-source>
            <institution-wrap>
              <institution>U.S. National Science Foundation (United States)</institution>
              <institution-id>https://ror.org/021nxhr62</institution-id>
            </institution-wrap>
          </funding-source>
          <award-id>2016342</award-id>
          <principal-award-recipient>Casonya Johnson</principal-award-recipient>
        </award-group>
      </funding-group>
    </article-meta>
  </front>
  <body>
    <fig position="anchor" id="f1">
      <label>
        Figure 1. Integration and chromosomal arrangement of 
        <italic>ardIS501</italic>
      </label>
      <caption>
        <p>
          <bold>
            A. Arrangement of 
            <italic>ardIS501</italic>
             into Chromosome III.
          </bold>
           This IGV screenshot shows the location of the insertion of 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
            p::gfp(S65C)::
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
          </italic>
          and 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
            (
            <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
            ) 
          </italic>
          into chromosome III of the wild-type 
          <italic>
            <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/Taxonomy/Browser/wwwtax.cgi?mode=Info&amp;id=6239">C. elegans</ext-link>
          </italic>
           strain, 
          <ext-link ext-link-type="wormbase" xlink:href="WBStrain00000001">N2</ext-link>
          . Integration of the concatemer deleted 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00021592">Y46E12A.2</ext-link>
            .1
          </italic>
           and 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00194738">Y46E12A.5</ext-link>
            .1
          </italic>
          , as shown in the bottom track. Contig 37 extends 136 kb into the insertion from the upstream end and Contig 45 extends 53 kb into the insertion from the downstream end. The first 463 kb of Contig 37 and the last 332 kb of Contig 45 map to the reference genome.
        </p>
        <p>
          <bold>B. Schematic of the Contig 37 and Contig 45 sections of the insertion.</bold>
           These portions of the insertion shown comprise 188.5 kb, containing 26 copies of 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
            p::gfp(S65C)::
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
          </italic>
           and 11 copies of 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
            (
            <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
            )
          </italic>
           that are likely to be transcribed (here “likely to be transcribed” means that most of the promoter region and the majority of the protein coding region is present). An unknown amount of DNA is present between Contigs 37 and 45. The top row of features represents the forward strand of Chromosome III, the bottom row represents the reverse strand. The coordinates below the contig features refer to coordinates specific to the contig, not coordinates on Chromosome III.
        </p>
        <p>
          <bold>C. Overlaps between assembled contigs.</bold>
           (i.)
          <bold/>
          Schematic of overlap between Contig 67 and 37. Contig 67 (spanning 56 kb) was called by NECAT as an independent contig. Upon manual review and interrogation with dot plots (not shown) it appears that Contig 67 is within Contig 37. (ii).
          <bold/>
          Schematic of tandem overlap between
          <bold/>
          Contig 64 and Contig 70. The 3'-end of Contig 64 overlaps the 5'-end of Contig 70 by 21 kb.
        </p>
        <p>
          D. 
          <bold>Schematic of Contig 48 and Contig 50</bold>
          . Contig 48 and Contig 50 are representative of the variation among the 26 contigs that were assembled in this study. Contig 48 spans 266 kb and contains 72 copies of 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
            p::gfp(S65C)::
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
          </italic>
           and one copy of 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
            (
            <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
            )
          </italic>
           that are likely to be transcribed.&amp;nbsp; Note that the two 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          </italic>
           sequences near the left of Contig 48 are truncated copies of the gene that lack upstream promoter regions and are unlikely to be transcribed.&amp;nbsp; Contig 50 spans 226.7 kb and contains 47 copies of 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
            p::gfp(S65C)::
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
          </italic>
           and 6 copies of 
          <italic>
            <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
            (
            <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
            )
          </italic>
          .&amp;nbsp; These were the two longest contigs in the assembly, at a combined length of 492.7 kb; however, neither contig could reliably be connected to the 3' end of Contig 37 or the 5' end of Contig 45, rendering us unable to confirm their location within Chromosome III.
        </p>
      </caption>
    </fig>
    <graphic xlink:href="25789430-2026-micropub.biology.001836"/>
    <sec>
      <title>Description</title>
      <p>
        Previously, we used an uncharacterized integrated transcriptional reporter to identify cells and tissues that express the gene encoding 
        <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">HLH-29</ext-link>
         (McMiller et al., 2007; Hale et al., 2014; White et al., 2012; Quach et al., 2013; Haeussler et al. 2021), a transcription factor that is responsive to Notch signaling (Neves and Priess, 2005
        <bold>) </bold>
        and one of six orthologs of the mammalian Hairy/Enhancer of Split (HES) proteins. Transgenic lines were generated by microinjection of a complex array of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and linearized 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
         (Fire, 1986; Kramer et al., 1990), as previously described (Mello et al., 1991; Hobert, 2002), outcrossed six times to 
        <ext-link ext-link-type="wormbase" xlink:href="WBStrain00000001">N2</ext-link>
        , and then maintained as heterozygotes for greater than 100 generations. Genetic mapping and quantitative PCR to identify the site of integration and 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        copy number, respectively, were inconclusive, suggesting only that the insertion was not on chromosome I or chromosome X. In this present study, we used third generation long read sequencing on the Oxford Nanopore platform to determine the site of integration, as well as the copy number, orientation, and order of the genes contained within the array.
      </p>
      <p>
        MinION Nanopore sequencing of genomic DNA from mixed-stage, genetically homozygous, transgenic populations produced a read length totaling 4.57 GB with 25% of the 582,770 reads exceeding 10.6 kb. The reads ranged from 1 bp to 210,269 bp, with a mean read length of 8,731 bp and a median read length of 4,864 bp. There were 200 reads over 100 kb. For reads ranging from 100 kb to 210 kb, 12 were longer than 150 kb. The complex array containing 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
         is inserted into Chromosome III, between bases 1,756,475 and 1,759,577 in WBcel235 (
        <xref ref-type="fig" rid="f1">Figure 1A</xref>
        ). The insertion event resulted in the deletion of 3.1 kb from the chromosome (
        <xref ref-type="fig" rid="f1">Figure 1A</xref>
        ) which deletes two genes of unknown function: 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00021592">Y46E12A.2</ext-link>
        </italic>
        . and 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00194738">Y46E12A.5</ext-link>
        </italic>
         (Hashimshony et al., 2015). Transgenic animals appear phenotypically unaffected by the deletion.
      </p>
      <p>
        The reads assembled to 135,928 bp of the left end (Contig 37) and 52,651 bp of the right end (Contig 45) of the insertion. Contig 37 contains 20 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and eight copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
         that are likely to be transcribed, while Contig 45 contains six copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and three copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          ) 
        </italic>
        (
        <xref ref-type="fig" rid="f1">Figure 1B</xref>
        ). Summing the regions of Contigs 37 and 45 that do not map to the reference genome gives a minimum length for the insertion of 188,579 bp, containing 26 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and 11 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
         (
        <xref ref-type="fig" rid="f1">Figure 1B</xref>
        ).
      </p>
      <p>
        In total, we assembled 26 contigs, some with significant overlap, and determined the length, 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        copy number, and 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
         copy number of each. We were not able to identify a single read that spanned the entire length of the insertion, nor were we able to assemble the reads and the 26 contigs to describe the full structure that links the 3'-end of Contig 37 to the 5'-end of Contig 45. However, we were able to map Contig 67 to chromosome III, within Contig 37 (
        <xref ref-type="fig" rid="f1">Figure 1C</xref>
        .i). Contig 67 spans 56 kb, containing eight copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and two copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          ).
        </italic>
         The 26 assembled contigs ranged in length from 4.9 kb to 266 bp, containing between 1 and 72 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        , and between 0 and 8 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          ). 
        </italic>
        We noted several other instances of overlap among the contigs; for example, there is a 20 kb tandem overlap between Contig 64 and Contig 70 (
        <xref ref-type="fig" rid="f1">Figure 1C</xref>
        .ii), and a 37.5 kb inverted overlap between Contig 57 and Contig 59 (not shown). Each of these contigs was called by NECAT as being separate sections of concatemeric chromosomal DNA, despite sharing genetic content over approximately 20kb and 37.5 kb, respectively. This high degree of similarity over a significant length of the DNA indicates that the two pairs of contigs are likely connected within a portion of concatemeric DNA, though none of the contigs could reliably be connected to Chromosome III via Contig 37 or Contig 45. It should be noted that, with the exception of Contig 67, &amp;nbsp;the ends of Contig 37 and Contig 45 were not found to overlap to a significant degree with any of the 24 other contigs.
      </p>
      <p>
        Finally, we noted that there was not a correlation between the number of copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
         within a contig
        <italic>. </italic>
        For example, Contig 48 was the longest assembled contig, spanning 266 kb that contained 72 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        , but only 1 copy of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
        .
        <italic/>
        In contrast,
        <italic/>
        Contig 50 spanned 226.7 kb, with 47 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and 6 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
         (
        <xref ref-type="fig" rid="f1">Figure 1D</xref>
        ),
        <italic/>
        failed to map to either Contig 37 or Contig 45. Collectively, based on the summation of the contigs and accounting for overlapping segments, our data suggest that the transgenic array spans greater than 454.5 kb and contains 98 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and 12 copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
        . However, the overlap between contigs and our inability to assemble reads to span the entire length of the insertion suggest that simple summation of the 26 generated contigs will not produce an accurate estimate of the total length of the inserted concatemer, and that computerized assembly of long reads generated via MinION Nanopore may produce separate contigs requiring human review or further processing to facilitate more complete assemblage.
      </p>
    </sec>
    <sec>
      <title>Methods</title>
      <p>
        <bold>DNA extraction</bold>
      </p>
      <p>
        The strain carrying an integrated concatemer of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
          p::gfp(S65C)::
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
        and 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
         (McMiller et al., 2007) was created as described in McMiller and Johnson, 2005, outcrossed 10X, and maintained as a heterozygous population for greater than 100 generations (Lewis and Fleming, 1995). Prior to genomic DNA extractions, homozygous populations were generated by manual selection of hermaphrodites producing 100% roller progeny over multiple generations. DNA was extracted from approximately 200 μL packed, adult-stage hermaphrodites using the Monarch HMW DNA Extraction Kit for Tissue (New England BioLab, T3060G). DNA quality and quantity was checked using a Nanodrop spectrophotometer and a Qubit 3.0 Fluorometer.
      </p>
      <p>
        <bold>Library prep, sequencing, and basecalling</bold>
      </p>
      <p>The DNA library was generated using 1 μg of purified genomic DNA. The DNA was cleaned using Ampure XP magnetic beads and then prepped for MinION sequencing using the SQK-LSK110 Ligation Sequencing Kit (Nanopore). Seventy-five microliters of solution containing 12 μL prepped DNA, 37.5 μL sequencing buffer, and 25.5 μL loading beads was loaded onto a FLO-MIN106 flow cell and sequenced over 41 hours. The binary FAST5 file output from the sequencer was fed into Guppy Basecaller (Nanopore, version cpu_4.5.4_linux64) using a minimum quality score of seven.</p>
      <p>
        <bold>Mapping raw reads and assembly of de novo contigs</bold>
      </p>
      <p>
        Raw and polished basecalled reads (output as a FASTQ file) were mapped to the WBcel235 Bristol 
        <ext-link ext-link-type="wormbase" xlink:href="WBStrain00000001">N2</ext-link>
         reference genome using minimap2 (version 2.22). Basecalled reads were also assembled into de novo contigs using NECAT (version necat_20200803_Linux-amd64), with the genome size set to 100 Mb with a minimum read length of 3 kb. Read and contigs were mapped using the option “-ax map-ont”. The raw reads were deposited in NCBI's SRA (
        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA964757">PRJNA964757</ext-link>
        ).
      </p>
      <p>
        <bold>BLAST analysis and visualization</bold>
      </p>
      <p>
        The original transgene was designed to contain the 
        <italic>gfp(S65C)</italic>
         coding sequence (JX171292.1, bases 2779-3648) immediately preceded by sequences 1000 bases upstream of the chromosomal 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
        </italic>
         coding sequence (referred to hereafter as 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
        </italic>
         promoter: bases 17,549,640 to 17,548,640 on the X chromosome of WBcel235). The 
        <italic>gfp(S65C) </italic>
        coding sequence is terminated by the 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
           (myosin-4)
        </italic>
         terminator (JX171292.1, bases 3785-4519). The transgene was also designed to contain 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          )
        </italic>
         (WBVar00248869), derived from the cloning vector pRF-4 (Wormbase), kindly provided by Dr. Andrew Fire (available from Addgene, Inc., Cambridge, MA). Sequenced contigs were analyzed using BLAST (https://blast.ncbi.nlm.nih.gov/Blast.cgi) to first identify and count the occurrence of 
        <italic>gfp(S65C)</italic>
        , and then GFP-containing contigs were analyzed to identify the locations of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00001968">hlh-29</ext-link>
        </italic>
         promoters, 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00006789">unc-54</ext-link>
        </italic>
         3' UTRs (terminator), and copies of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
          (
          <ext-link ext-link-type="wormbase" xlink:href="WBVar00248869">su1006</ext-link>
          ).
        </italic>
         Raw reads, assembled contigs, and their mapping to the reference genome were visualized using the Broad Institute's Integrative Genomics Viewer (IGV). The structure of each contig (the location and orientation of 
        <italic>
          <ext-link ext-link-type="wormbase" xlink:href="WBGene00004397">rol-6</ext-link>
        </italic>
        and GFP elements) was visualized in Desmos graphing calculator using data obtained from BLAST analyses.
      </p>
    </sec>
  </body>
  <back>
    <ref-list>
      <ref id="R1">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fire</surname>
              <given-names>Andrew</given-names>
            </name>
          </person-group>
          <year>1986</year>
          <month>10</month>
          <day>1</day>
          <article-title>
            Integrative transformation of
                    
            <italic>Caenorhabditis elegans</italic>
          </article-title>
          <source>The EMBO Journal</source>
          <volume>5</volume>
          <issue>10</issue>
          <issn>0261-4189</issn>
          <fpage>2673</fpage>
          <lpage>2680</lpage>
          <pub-id pub-id-type="doi">10.1002/j.1460-2075.1986.tb04550.x</pub-id>
        </element-citation>
      </ref>
      <ref id="R2">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hale</surname>
              <given-names>JJ</given-names>
            </name>
            <name>
              <surname>Amin</surname>
              <given-names>NM</given-names>
            </name>
            <name>
              <surname>George</surname>
              <given-names>C</given-names>
            </name>
            <name>
              <surname>Via</surname>
              <given-names>Z</given-names>
            </name>
            <name>
              <surname>Shi</surname>
              <given-names>H</given-names>
            </name>
            <name>
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <year>2014</year>
          <month>2</month>
          <day>7</day>
          <article-title>A role of the LIN-12/Notch signaling pathway in diversifying the non-striated egg-laying muscles in C. elegans.</article-title>
          <source>Dev Biol</source>
          <volume>389</volume>
          <issue>2</issue>
          <issn>0012-1606</issn>
          <fpage>137</fpage>
          <lpage>148</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ydbio.2014.02.001</pub-id>
          <pub-id pub-id-type="pmid">24512688</pub-id>
        </element-citation>
      </ref>
      <ref id="R3">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Haeussler</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Yeroslaviz</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Rolland</surname>
              <given-names>SG</given-names>
            </name>
            <name>
              <surname>Luehr</surname>
              <given-names>S</given-names>
            </name>
            <name>
              <surname>Lambie</surname>
              <given-names>EJ</given-names>
            </name>
            <name>
              <surname>Conradt</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <year>2021</year>
          <month>3</month>
          <day>30</day>
          <article-title>Genome-wide RNAi screen for regulators of UPRmt in Caenorhabditis elegans mutants with defects in mitochondrial fusion.</article-title>
          <source>G3 (Bethesda)</source>
          <pub-id pub-id-type="doi">10.1093/g3journal/jkab095</pub-id>
          <pub-id pub-id-type="pmid">33784383</pub-id>
        </element-citation>
      </ref>
      <ref id="R4">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hashimshony</surname>
              <given-names>T</given-names>
            </name>
            <name>
              <surname>Feder</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Levin</surname>
              <given-names>M</given-names>
            </name>
            <name>
              <surname>Hall</surname>
              <given-names>BK</given-names>
            </name>
            <name>
              <surname>Yanai</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <year>2014</year>
          <month>12</month>
          <day>10</day>
          <article-title>Spatiotemporal transcriptomics reveals the evolutionary history of the endoderm germ layer.</article-title>
          <source>Nature</source>
          <volume>519</volume>
          <issue>7542</issue>
          <issn>0028-0836</issn>
          <fpage>219</fpage>
          <lpage>222</lpage>
          <pub-id pub-id-type="doi">10.1038/nature13996</pub-id>
          <pub-id pub-id-type="pmid">25487147</pub-id>
        </element-citation>
      </ref>
      <ref id="R5">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Hobert</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <year>2002</year>
          <month>4</month>
          <day>1</day>
          <article-title>PCR fusion-based approach to create reporter gene constructs for expression analysis in transgenic C. elegans.</article-title>
          <source>Biotechniques</source>
          <volume>32</volume>
          <issue>4</issue>
          <issn>0736-6205</issn>
          <fpage>728</fpage>
          <lpage>730</lpage>
          <pub-id pub-id-type="doi">10.2144/02324bm01</pub-id>
          <pub-id pub-id-type="pmid">11962590</pub-id>
        </element-citation>
      </ref>
      <ref id="R6">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kramer</surname>
              <given-names>J M</given-names>
            </name>
            <name>
              <surname>French</surname>
              <given-names>R P</given-names>
            </name>
            <name>
              <surname>Park</surname>
              <given-names>E C</given-names>
            </name>
            <name>
              <surname>Johnson</surname>
              <given-names>J J</given-names>
            </name>
          </person-group>
          <year>1990</year>
          <month>5</month>
          <day>1</day>
          <article-title>The Caenorhabditis elegans rol-6 gene, which interacts with the sqt-1 collagen gene to determine organismal morphology, encodes a collagen.</article-title>
          <source>Molecular and Cellular Biology</source>
          <volume>10</volume>
          <issue>5</issue>
          <issn>0270-7306</issn>
          <fpage>2081</fpage>
          <lpage>2089</lpage>
          <pub-id pub-id-type="doi">10.1128/mcb.10.5.2081</pub-id>
        </element-citation>
      </ref>
      <ref id="R7">
        <mixed-citation>Lewis JA, Fleming JT. Basic culture methods. In: Epstein HF, Shakes DC, eds. Caenorhabditis Elegans, Modern Biological Analysis of an Organism. Academic Press; 1995:3-29.</mixed-citation>
      </ref>
      <ref id="R8">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>McMiller</surname>
              <given-names>Tracee L.</given-names>
            </name>
            <name>
              <surname>Johnson</surname>
              <given-names>Casonya M.</given-names>
            </name>
          </person-group>
          <year>2005</year>
          <month>8</month>
          <day>1</day>
          <article-title>Molecular characterization of HLH-17, a C. elegans bHLH protein required for normal larval development</article-title>
          <source>Gene</source>
          <volume>356</volume>
          <issn>0378-1119</issn>
          <fpage>1</fpage>
          <lpage>10</lpage>
          <pub-id pub-id-type="doi">10.1016/j.gene.2005.05.003</pub-id>
        </element-citation>
      </ref>
      <ref id="R9">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>McMiller</surname>
              <given-names>Tracee L.</given-names>
            </name>
            <name>
              <surname>Sims</surname>
              <given-names>Denise</given-names>
            </name>
            <name>
              <surname>Lee</surname>
              <given-names>Tameshia</given-names>
            </name>
            <name>
              <surname>Williams</surname>
              <given-names>Tiffany</given-names>
            </name>
            <name>
              <surname>Johnson</surname>
              <given-names>Casonya M.</given-names>
            </name>
          </person-group>
          <year>2007</year>
          <month>1</month>
          <day>1</day>
          <article-title>Molecular characterization of the Caenorhabditis elegans REF-1 family member, hlh-29/hlh-28</article-title>
          <source>Biochimica et Biophysica Acta (BBA) - Gene Structure and Expression</source>
          <volume>1769</volume>
          <issue>1</issue>
          <issn>0167-4781</issn>
          <fpage>5</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.1016/j.bbaexp.2006.12.001</pub-id>
        </element-citation>
      </ref>
      <ref id="R10">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Mello</surname>
              <given-names>CC</given-names>
            </name>
            <name>
              <surname>Kramer</surname>
              <given-names>JM</given-names>
            </name>
            <name>
              <surname>Stinchcomb</surname>
              <given-names>D</given-names>
            </name>
            <name>
              <surname>Ambros</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <year>1991</year>
          <month>12</month>
          <day>1</day>
          <article-title>Efficient gene transfer in C.elegans: extrachromosomal maintenance and integration of transforming sequences.</article-title>
          <source>EMBO J</source>
          <volume>10</volume>
          <issue>12</issue>
          <issn>0261-4189</issn>
          <fpage>3959</fpage>
          <lpage>3970</lpage>
          <pub-id pub-id-type="pmid">1935914</pub-id>
        </element-citation>
      </ref>
      <ref id="R11">
        <element-citation publication-type="comparative study">
          <person-group person-group-type="author">
            <name>
              <surname>Neves</surname>
              <given-names>A</given-names>
            </name>
            <name>
              <surname>Priess</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <year>2005</year>
          <month>6</month>
          <day>1</day>
          <article-title>The REF-1 family of bHLH transcription factors pattern C. elegans embryos through Notch-dependent and Notch-independent pathways.</article-title>
          <source>Dev Cell</source>
          <volume>8</volume>
          <issue>6</issue>
          <issn>1534-5807</issn>
          <fpage>867</fpage>
          <lpage>879</lpage>
          <pub-id pub-id-type="doi">10.1016/j.devcel.2005.03.012</pub-id>
          <pub-id pub-id-type="pmid">15935776</pub-id>
        </element-citation>
      </ref>
      <ref id="R12">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Quach</surname>
              <given-names>Thanh K.</given-names>
            </name>
            <name>
              <surname>Chou</surname>
              <given-names>Han Ting</given-names>
            </name>
            <name>
              <surname>Wang</surname>
              <given-names>Kun</given-names>
            </name>
            <name>
              <surname>Milledge</surname>
              <given-names>Gaolin Zheng</given-names>
            </name>
            <name>
              <surname>Johnson</surname>
              <given-names>Casonya M.</given-names>
            </name>
          </person-group>
          <year>2013</year>
          <month>3</month>
          <day>22</day>
          <article-title>Genome-Wide Microarrray Analysis Reveals Roles for the REF-1 Family Member HLH-29 in Ferritin Synthesis and Peroxide Stress Response</article-title>
          <source>PLoS ONE</source>
          <volume>8</volume>
          <issue>3</issue>
          <issn>1932-6203</issn>
          <fpage>e59719</fpage>
          <lpage>e59719</lpage>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0059719</pub-id>
        </element-citation>
      </ref>
      <ref id="R13">
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>White</surname>
              <given-names>Ana</given-names>
            </name>
            <name>
              <surname>Fearon</surname>
              <given-names>Abegail</given-names>
            </name>
            <name>
              <surname>Johnson</surname>
              <given-names>Casonya M.</given-names>
            </name>
          </person-group>
          <year>2012</year>
          <month>2</month>
          <day>8</day>
          <article-title>
            HLH-29 regulates ovulation in 
            <italic>C. elegans</italic>
             by targeting genes in the inositol triphosphate signaling pathway
          </article-title>
          <source>Biology Open</source>
          <volume>1</volume>
          <issue>3</issue>
          <issn>2046-6390</issn>
          <fpage>261</fpage>
          <lpage>268</lpage>
          <pub-id pub-id-type="doi">10.1242/bio.2012046</pub-id>
        </element-citation>
      </ref>
    </ref-list>
  </back>
</article>