
<!DOCTYPE article
  PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Archiving and Interchange DTD with MathML3 v1.3 20210610//EN" "JATS-archivearticle1-3-mathml3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="1.3" article-type="research-article" xml:lang="en"><processing-meta tagset-family="jats" base-tagset="archiving" mathml-version="3.0" table-model="xhtml"><custom-meta-group><custom-meta assigning-authority="highwire" xlink:type="simple"><meta-name>recast-jats-build</meta-name><meta-value>1d2b230b09</meta-value></custom-meta></custom-meta-group></processing-meta><front><journal-meta><journal-id journal-id-type="hwp">jitc</journal-id><journal-id journal-id-type="nlm-ta">J Immunother Cancer</journal-id><journal-id journal-id-type="publisher-id">jitc</journal-id><journal-title-group><journal-title>Journal for ImmunoTherapy of Cancer</journal-title><abbrev-journal-title abbrev-type="publisher">J Immunother Cancer</abbrev-journal-title><abbrev-journal-title>J Immunother Cancer</abbrev-journal-title></journal-title-group><issn pub-type="epub">2051-1426</issn><publisher><publisher-name>BMJ Publishing Group Ltd</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">jitc-2019-000299</article-id><article-id pub-id-type="doi">10.1136/jitc-2019-000299</article-id><article-id pub-id-type="pmid">32527930</article-id><article-id pub-id-type="apath" assigning-authority="highwire">/jitc/8/1/e000299.atom</article-id><article-categories><subj-group subj-group-type="heading"><subject>Immune cell therapies and immune cell engineering</subject></subj-group><subj-group subj-group-type="collection" assigning-authority="publisher"><subject>Open access</subject></subj-group><subj-group subj-group-type="collection" assigning-authority="publisher"><subject>Immune Cell Therapies and Immune Cell Engineering</subject></subj-group><subj-group subj-group-type="collection" assigning-authority="highwire"><subject>Special collections</subject><subj-group><subject>JITC</subject><subj-group><subject>Immune Cell Therapies and Immune Cell Engineering</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="collection" assigning-authority="highwire"><subject>Special collections</subject><subj-group><subject>Open access</subject></subj-group></subj-group><series-title>Original research</series-title></article-categories><title-group><article-title>Nanopore sequencing as a scalable, cost-effective platform for analyzing polyclonal vector integration sites following clinical T cell therapy</article-title></title-group><contrib-group><contrib contrib-type="author" id="author-74226321" xlink:type="simple"><contrib-id contrib-id-type="orcid" authenticated="false">http://orcid.org/0000-0002-0311-6725</contrib-id><name name-style="western"><surname>Zhang</surname><given-names>Ping</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" id="author-74227149" xlink:type="simple"><contrib-id contrib-id-type="orcid" authenticated="false">http://orcid.org/0000-0001-8149-6703</contrib-id><name name-style="western"><surname>Ganesamoorthy</surname><given-names>Devika</given-names></name><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author" id="author-74227166" xlink:type="simple"><contrib-id contrib-id-type="orcid" authenticated="false">http://orcid.org/0000-0003-3802-908X</contrib-id><name name-style="western"><surname>Nguyen</surname><given-names>Son Hoang</given-names></name><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author" id="author-74227177" xlink:type="simple"><name name-style="western"><surname>Au</surname><given-names>Raymond</given-names></name><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author" id="author-74227108" xlink:type="simple"><contrib-id contrib-id-type="orcid" authenticated="false">http://orcid.org/0000-0002-4300-455X</contrib-id><name name-style="western"><surname>Coin</surname><given-names>Lachlan J</given-names></name><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author" corresp="yes" id="author-74227196" xlink:type="simple"><contrib-id contrib-id-type="orcid" authenticated="false">http://orcid.org/0000-0001-9567-382X</contrib-id><name name-style="western"><surname>Tey</surname><given-names>Siok-Keen</given-names></name><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="aff" rid="aff6">6</xref></contrib></contrib-group><aff id="aff1">
<label>1</label>
<institution content-type="department" xlink:type="simple">Department of Immunology</institution>, <institution xlink:type="simple">QIMR Berghofer Medical Research Institute</institution>, <addr-line content-type="city">Herston</addr-line>, <addr-line content-type="state">Queensland</addr-line>, <country>Australia</country>
</aff><aff id="aff2">
<label>2</label>
<institution content-type="department" xlink:type="simple">Institute for Molecular Bioscience</institution>, <institution xlink:type="simple">University of Queensland</institution>, <addr-line content-type="city">Brisbane</addr-line>, <addr-line content-type="state">Queensland</addr-line>, <country>Australia</country>
</aff><aff id="aff3">
<label>3</label>
<institution content-type="department" xlink:type="simple">Department of Clinical Pathology</institution>, <institution xlink:type="simple">The University of Melbourne</institution>, <addr-line content-type="city">Melbourne</addr-line>, <addr-line content-type="state">Victoria</addr-line>, <country>Australia</country>
</aff><aff id="aff4">
<label>4</label>
<institution content-type="department" xlink:type="simple">Department of Infectious Disease</institution>, <institution xlink:type="simple">Imperial College London</institution>, <addr-line content-type="city">London</addr-line>, <addr-line content-type="state">London</addr-line>, <country>UK</country>
</aff><aff id="aff5">
<label>5</label>
<institution content-type="department" xlink:type="simple">Department of Haematology and Bone Marrow Transplantation</institution>, <institution xlink:type="simple">Royal Brisbane and Women's Hospital</institution>, <addr-line content-type="city">Herston</addr-line>, <addr-line content-type="state">Queensland</addr-line>, <country>Australia</country>
</aff><aff id="aff6">
<label>6</label>
<institution content-type="department" xlink:type="simple">Faculty of Medicine</institution>, <institution xlink:type="simple">University of Queensland</institution>, <addr-line content-type="city">Brisbane</addr-line>, <addr-line content-type="state">Queensland</addr-line>, <country>Australia</country>
</aff><author-notes><corresp>
<label>Correspondence to</label> Siok-Keen Tey; <email xlink:type="simple">siok.tey@qimrberghofer.edu.au</email>
</corresp><fn fn-type="other"><p>PZ and DG are joint first authors.</p></fn><fn fn-type="other"><p>LJC and S-KT are joint senior authors.</p></fn></author-notes><pub-date date-type="pub" iso-8601-date="2020-06" pub-type="ppub" publication-format="print"><month>6</month><year>2020</year></pub-date><pub-date date-type="pub" iso-8601-date="2020-06-10" pub-type="epub-original" publication-format="electronic"><day>10</day><month>6</month><year>2020</year></pub-date><pub-date iso-8601-date="2019-12-20T04:54:25-08:00" pub-type="hwp-received"><day>20</day><month>12</month><year>2019</year></pub-date><pub-date iso-8601-date="2019-12-20T04:54:25-08:00" pub-type="hwp-created"><day>20</day><month>12</month><year>2019</year></pub-date><pub-date iso-8601-date="2020-06-10T22:01:22-07:00" pub-type="epub"><day>10</day><month>6</month><year>2020</year></pub-date><volume>8</volume><issue>1</issue><elocation-id>e000299</elocation-id><history><date date-type="accepted" iso-8601-date="2020-03-28"><day>28</day><month>03</month><year>2020</year></date></history><permissions><copyright-statement>© Author(s) (or their employer(s)) 2020. Re-use permitted under CC BY-NC. No commercial re-use. See rights and permissions. Published by BMJ.</copyright-statement><copyright-year>2020</copyright-year><license license-type="open-access" xlink:href="http://creativecommons.org/licenses/" xlink:type="simple"><ali:license_ref xmlns:ali="http://www.niso.org/schemas/ali/1.0/" start_date="2020-06-10">http://creativecommons.org/licenses/by-nc/4.0/</ali:license_ref><license-p>This is an open access article distributed in accordance with the Creative Commons Attribution Non Commercial (CC BY-NC 4.0) license, which permits others to distribute, remix, adapt, build upon this work non-commercially, and license their derivative works on different terms, provided the original work is properly cited, appropriate credit is given, any changes made indicated, and the use is non-commercial. See <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by-nc/4.0/" xlink:type="simple">http://creativecommons.org/licenses/by-nc/4.0/</ext-link>.</license-p></license></permissions><self-uri content-type="pdf" xlink:href="jitc-2019-000299.pdf" xlink:type="simple"/><abstract><sec><title>Background</title><p>Analysis of vector integration sites in gene-modified cells can provide critical information on clonality and potential biological impact on nearby genes. Current short-read next-generation sequencing methods require specialized instruments and large batch runs.</p></sec><sec><title>Methods</title><p>We used nanopore sequencing to analyze the vector integration sites of T cells transduced by the gammaretroviral vector, SFG.iCasp9.2A.ΔCD19. DNA from oligoclonal cell lines and polyclonal clinical samples were restriction enzyme digested with two 6-cutters, <italic toggle="yes">NcoI</italic> and <italic toggle="yes">BspHI</italic>; and the flanking genomic DNA amplified by inverse PCR or cassette ligation PCR. Following nested PCR and barcoding, the amplicons were sequenced on the Oxford Nanopore platform. Reads were filtered for quality, trimmed, and aligned. Custom tool was developed to cluster reads and merge overlapping clusters.</p></sec><sec><title>Results</title><p>Both inverse PCR and cassette ligation PCR could successfully amplify flanking genomic DNA, with cassette ligation PCR showing less bias. The 4.8 million raw reads were grouped into 12,186 clusters and 6410 clones. The 3′long terminal repeat (LTR)-genome junction could be resolved within a 5-nucleotide span for a majority of clusters and within one nucleotide span for clusters with ≥5 reads. The chromosomal distributions of the insertional sites and their predilection for regions proximate to transcription start sites were consistent with previous reports for gammaretroviral vector integrants as analyzed by short-read next-generation sequencing.</p></sec><sec><title>Conclusion</title><p>Our study shows that it is feasible to use nanopore sequencing to map polyclonal vector integration sites. The assay is scalable and requires minimum capital, which together enable cost-effective and timely analysis. Further refinement is required to reduce amplification bias and improve single nucleotide resolution.</p></sec></abstract><kwd-group><kwd>genetics</kwd><kwd>oncology</kwd><kwd>immunology</kwd><kwd>cell engineering</kwd><kwd>immunotherapy, adoptive</kwd></kwd-group><funding-group specific-use="FundRef"><award-group id="funding-1" xlink:type="simple"><funding-source xlink:type="simple">
<institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/501100001077</institution-id><institution xlink:type="simple">Royal Brisbane and Women's Hospital Foundation</institution></institution-wrap>
</funding-source></award-group><award-group id="funding-2" xlink:type="simple"><funding-source xlink:type="simple">
<institution-wrap><institution-id institution-id-type="FundRef">http://dx.doi.org/10.13039/501100000925</institution-id><institution xlink:type="simple">National Health and Medical Research Council</institution></institution-wrap>
</funding-source><award-id xlink:type="simple">Early Career Fellowship: APP1054786</award-id><award-id xlink:type="simple">Project Grant: APP1053135</award-id></award-group><award-group id="funding-3" xlink:type="simple"><funding-source xlink:type="simple">
<institution-wrap><institution xlink:type="simple">Metro North Hospital and Health Service (Brisbane)</institution></institution-wrap>
</funding-source><award-id xlink:type="simple">Clinician Research Fellowship</award-id></award-group></funding-group><custom-meta-group><custom-meta xlink:type="simple"><meta-name>special-feature</meta-name><meta-value>unlocked</meta-value></custom-meta><custom-meta xlink:type="simple"><meta-name>special-property</meta-name><meta-value>contains-inline-supplementary-material</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Gene modification can be highly efficient and effective in conferring specific biological traits to a cellular therapeutic. In a majority of cases, gene modification involves the integration of one or more copies of a transgene into the host cell genome, which is passed down to all its progenies. Although targeted transgene integration using CRISPR/cas9 and other genome editing techniques hold great promise and may well be the path of the future,<xref ref-type="bibr" rid="R1 R2">1 2</xref> the vast majority of current gene-modified cellular therapeutics use gammaretroviral, lentiviral, or non-viral vectors that are non-targeted and can integrate at multiple sites, with some predilection for open chromatin and transcriptionally active regions.<xref ref-type="bibr" rid="R3 R4 R5 R6">3–6</xref> Analysis of vector integration sites can provide critical information on the clonality of gene-modified cells and potential biological impacts of specific transgene insertion sites, including the potential for insertional mutagenesis through the inactivation of tumor suppressor genes or activation of proto-oncogenes, such as <italic toggle="yes">LMO2</italic>
<xref ref-type="bibr" rid="R7 R8">7 8</xref> and <italic toggle="yes">EVI1</italic>;<xref ref-type="bibr" rid="R9">9</xref> or alternatively, enhanced therapeutic efficacy, such as enhanced chimeric antigen receptor (CAR) T cell function through transgene disruption of <italic toggle="yes">TET2</italic>.<xref ref-type="bibr" rid="R10">10</xref>
</p><p>In general, the analysis of transgene integration sites involves PCR amplification of the flanking genomic sequences, followed by sequencing of the PCR amplicons. This can be achieved by a number of methods, with one of the most commonly used being linear-amplification mediated PCR (LAM-PCR) or similar methodology followed by short-read high-throughput sequencing on Illumina or similar platforms.<xref ref-type="bibr" rid="R3 R11 R12">3 11 12</xref> These next-generation sequencing platforms can generate a very large number of high-quality reads per flow cell, and thus provide economy of scale. However, the flow cells are expensive, the cost per run is high, and it is therefore necessary to pool a large number of samples to be cost efficient. In addition, short-read lengths can result in inefficient genome alignment. Oxford Nanopore sequencing is a relatively new sequencing platform which directly sequences a strand of DNA as it passes through a nanopore,<xref ref-type="bibr" rid="R13 R14">13 14</xref> and is capable of ultralong reads, as long as two Mb. Additionally, the sequencing flow cells from Oxford Nanopore Technologies are relatively inexpensive and sequencing can be performed in any laboratory without the need for dedicated sequencing equipment. Hence, it may be a cost-efficient platform for integration site analysis for smaller cell therapy centers where there are low sample volumes and potentially limited access to high-cost sequencing instruments.</p><p>We recently conducted a phase I clinical trial using T cells that were transduced with a gammaretroviral vector that carried the inducible caspase 9 (<italic toggle="yes">iCasp9</italic>) safety switch.<xref ref-type="bibr" rid="R15">15</xref> In order to understand the in vivo clonal dynamics of the infused T cells, we developed a method to analyze the vector integration sites in patient samples using inverse PCR followed by nanopore sequencing.<xref ref-type="bibr" rid="R15 R16">15 16</xref> In the current paper, we describe in detail the inverse PCR methodology and an improved methodology using cassette ligation PCR, which has less bias, both followed by nanopore sequencing. We show that nanopore sequencing can be a readily accessible platform for vector integration site analysis. It has some limitations in regard to read quality and single nucleotide resolution, both of which are partially offset by the longer read lengths and are likely to improve with newer generations of nanopore sequencers and refinement in methodology.</p></sec><sec id="s2" sec-type="materials"><title>Materials and methods</title><sec id="s2-1"><title>Retroviral vector and gene-modified cells</title><p>The gammaretroviral vector, SFG.iCasp9.2A.ΔCD19, has been previously described.<xref ref-type="bibr" rid="R17">17</xref> It encodes a safety switch, inducible caspase 9 (<italic toggle="yes">iCasp9</italic>), and truncated CD19 (ΔCD19), which enables the detection of transduced cells by flow cytometry. The vector was pseudotyped with Gibbon ape leukemia virus envelope.<xref ref-type="bibr" rid="R17">17</xref> Patient samples and generation of transduced Jurkat cell clones are described in the <xref ref-type="supplementary-material" rid="SP1">online supplementary information</xref>.</p><supplementary-material id="SP1" position="float" orientation="portrait" xlink:type="simple"><object-id pub-id-type="publisher-id">SP1</object-id><object-id pub-id-type="doi">10.1136/jitc-2019-000299.supp1</object-id><label>Supplementary data</label><p>
<inline-supplementary-material id="SS1" xlink:href="jitc-2019-000299supp001.pdf" mime-subtype="pdf" mimetype="application" xlink:type="simple"/>
</p></supplementary-material></sec><sec id="s2-2"><title>DNA extraction and restriction enzyme digestion</title><p>Genomic DNA was extracted using Purelink genomic DNA mini kit (Invitrogen, Waltham, MA) according to the manufacturer’s instructions. Genomic DNA was digested with two 6-cutter restriction enzymes which generate compatible cohesive ends (underlined): <italic toggle="yes">NcoI</italic>, which cuts at C/<underline>CATG</underline>G and <italic toggle="yes">BspHI</italic>, which cuts at T/<underline>CATG</underline>A (both from New England BioLabs, Ipswich, MA). <italic toggle="yes">NcoI</italic> has three cut sites and <italic toggle="yes">BspHI</italic> has one cut site within the transgene, with the most distal cut site generated by <italic toggle="yes">NcoI</italic> at 1185 base pair (bp) from the junction between the vector insert and the flanking genomic DNA (<xref ref-type="fig" rid="F1">figure 1A</xref>). Note that these restriction enzymes do not have any cut sites within the 5′ and 3′ long terminal repeats (LTR), which flank the transgene and are identical in sequence and orientation. This assay design avoids restriction enzyme digestion within the 5′LTR, which can result in the downstream amplification of the internal transgene sequence, producing non-informative reads. The resulting DNA fragments were circularized for inverse PCR or ligated to linker cassettes for downstream PCR amplification.</p><fig position="float" id="F1" orientation="portrait"><object-id pub-id-type="publisher-id">F1</object-id><label>Figure 1</label><caption><p>Schematic for PCR amplification of flanking genomic sequences. (A) Genomic DNA is digested with two 6-cutter restriction enzymes, <italic toggle="yes">NcoI</italic> and <italic toggle="yes">BspHI</italic>, which together are anticipated to cut at approximately 2 kb intervals. There are four restriction sites within the transgene sequence, the most distal of which is 1185 bp from the 3′LTR / genomic junction. <italic toggle="yes">NcoI</italic> and <italic toggle="yes">BspHI</italic> generate identical 4-nucleotide 5′ overhangs: 5′-CATG-3′, which can be circularized for inverse PCR or ligated to linker cassettes. (B) Inverse PCR begins with circularization with T4 DNA ligase, followed by PCR amplification of the unknown flanking genomic sequences using primers targeting the 3′LTR and the 3′LTR/distal transgene junction, indicated by continuous arrows. This is followed by nested PCR, indicated by dotted arrows, which incorporates tailing sequences for subsequent barcoding. The combined lengths of the dotted lines in the inner circle indicate the minimum theoretical length prior to the addition of tailing sequences and barcodes. (C) The ligation cassette comprises two partially complementary strands: a 27-nucleotide strand and a 14-nucleotide strand, the latter with a mismatched A at the 3′ end and a 5′overhang (5′-ATG-3′). Before cassette ligation, the genomic DNA fragments are filled with a single ddCTP to prevent elongation or ligation at the recessed 3′ end. Cassette ligation results in a nick on this strand, indicated by ‘X’. During the first cycle of PCR, fragments containing flanking genomic DNA are amplified by a primer spanning the transgene/3′LTR. The longer cassette strand does not prime because its complementary shorter strand has not ligated; whereas the shorter cassette strand does not prime because only 10 nucleotides are complementary to the longer cassette strand, resulting in a low annealing temperature. This cassette design limits the amplification of non-flanking genomic DNA and reduces PCR blocking by the shorter cassette strand. Subsequent cycles are primed by both the transgene/3′LTR primer and the longer cassette strand.</p></caption><graphic xlink:href="jitc-2019-000299f01" position="float" orientation="portrait" xlink:type="simple"/></fig></sec><sec id="s2-3"><title>Inverse PCR</title><p>Inverse PCR was performed as previously described.<xref ref-type="bibr" rid="R15 R16">15 16</xref> In brief, DNA fragments were circularized in a dilute mixture of 1 ng/µL DNA in T4 DNA ligase buffer with one cohesive end unit/μL T4 DNA ligase (New England Biolabs) for 16 hours at 16°C. The ligation product was purified by ethanol precipitation. The first PCR reaction was 35 cycles, using a forward primer that was complementary to the distal 3′LTR and directed towards the flanking genomic DNA; and a reverse primer complementary to the junction between the distal transgene and 3′LTR (<xref ref-type="fig" rid="F1">figure 1B</xref>). The PCR mixture was as follows: 50–400 ng circularized DNA template, forward and reverse primers (100 nM each), dNTP (250 nM), 1.25 Unit HotStart Taq DNA polymerase (Qiagen, Hilden, Germany), 1X PCR buffer, and 1X Q-Solution (Qiagen), in a final reaction volume of 50 µL. A 0.5 µL aliquot of the first PCR product was amplified in a nested PCR reaction for 35 cycles, and tailing sequences were added for barcoding and nanopore sequencing. All PCR reactions were performed on a Bio-Rad T100 thermal cycler (Bio-Rad Laboratories, Hercules, CA). Primer sequences and thermocycling conditions are listed in <xref ref-type="supplementary-material" rid="SP1">online supplementary table S1</xref>.</p></sec><sec id="s2-4"><title>Cassette ligation PCR</title><p>Cassette ligation PCR was performed according to the schema in <xref ref-type="fig" rid="F1">figure 1C</xref>. The restriction enzymes generated 5′ overhangs. A single dideoxy-CTP (ddCTP) was filled in to prevent elongation of the recessed 3′ ends using the following reaction mixture: <italic toggle="yes">NcoI/BspHI</italic> digested DNA 16.7 ng/µL, ddCTP 33 µM (GE Healthcare, Chicago, IL), DNA polymerase I, large (Klenow) fragment 0.167 U/µL (New England BioLabs) in CutSmart buffer (New England BioLabs) in a final reaction volume of 15 µL. The mixture was incubated at 25°C for 30 min, heat inactivated at 75°C for 20 min, and purified by ethanol precipitation.</p><p>Linker cassettes were made by annealing two single-stranded DNAs: 5′-ATGTCCCATGGTCA-3′ and 5′-CATAGTTGTTCCACTCCGACCATGGGA-3′ (both at 20 µM) in Tris-HCl (50 mM) with MgCl<sub>2</sub> (5 mM). The mixture was heated to 95°C for 5 min, then gradually cooled to room temperature by turning off the heating block. The linker cassettes were aliquoted, stored at –20°C, and used without repeated freeze/thaw. The ddCTP-filled in DNA fragments were ligated to the linker cassettes using the following reaction mixture: DNA 5 ng/µL, linker cassette 500 nM, and T7 DNA ligase 30 U/µL in T7 ligase buffer (New England BioLabs). The mixture was incubated at 25°C for 30 min, heat inactivated at 65°C for 10 min, and purified by ethanol precipitation. Because the 3′ recessed end of the DNA fragments had a ddCTP, this reaction resulted in ligation of the longer linker cassette strand and a nick in the shorter linker cassette strand. The first PCR reaction was 30 cycles in 50 µL: the forward primer was complementary to the junction between the transgene and the 3′LTR to minimize non-informative reads from 5′LTR priming; and the reverse primer was identical to the longer linker cassette strand. The unligated linker cassette strand was short (14 nucleotides) relative to the ligated cassette strand (27 nucleotides), which reduced unwanted PCR priming of non-flanking genomic fragments. A 0.5 µL aliquot of the first PCR product was amplified 30 cycles in a nested PCR reaction (50 µL) which included tailing sequences for barcoding and nanopore sequencing.</p></sec><sec id="s2-5"><title>Fragment size estimation by agarose gel electrophoresis</title><p>Fragment size estimation was performed by agarose gel electrophoresis and imaged on Vilber Lourmat Ebox CX5 (Vilber Lourmat). The nested PCR products (8 µL) were run on 1% agarose gel. To check for specificity of the amplicons, the PCR products were digested with <italic toggle="yes">SmaI,</italic> which has cut sites within the 3′LTR and distal transgene, generating DNA fragments of 244 bp and 391 bp from inverse PCR amplicons and fragments of 244 bp from cassette ligation PCR amplicons (<xref ref-type="fig" rid="F2">figure 2</xref>).</p><fig position="float" id="F2" orientation="portrait"><object-id pub-id-type="publisher-id">F2</object-id><label>Figure 2</label><caption><p>Schematic and agarose gel electrophoresis of PCR amplification products. (A) Schematic representations of PCR amplicons from inverse PCR (upper) and cassette ligation PCR (lower). The theoretical minimum lengths including the tailing sequences (22 bp x 2) are 929 bp and 406 bp, respectively. (B) 1% agarose gel electrophoresis of inverse PCR (left) and cassette ligation PCR (right) products. Lane 0: non-transduced genomic DNA (negative control). A small proportion of bands (especially sample 5A) were smaller than the theoretical minimum lengths. (C) 2% agarose gel electrophoresis of PCR products after <italic toggle="yes">SmaI</italic> digestion. Arrows point to the expected specific bands.</p></caption><graphic xlink:href="jitc-2019-000299f02" position="float" orientation="portrait" xlink:type="simple"/></fig></sec><sec id="s2-6"><title>Nanopore sequencing</title><p>Sequencing libraries were prepared according to 1D PCR barcoding amplicons protocol from Oxford Nanopore Technologies (ONT, Oxford UK). First, PCR amplicons from inverse PCR and cassette ligation PCR were barcoded using PCR barcodes provided by the supplier. Barcoding PCR mixture was as follows: 24 µL of nested PCR product (0.5 nM), 25 µL of LongAmp Taq master mix (New England Biolabs), and 1 µL of PCR barcode (ONT). Reactions were amplified in a thermal cycler with the following conditions: 95°C for 3 min, 15 cycles of amplification at 95°C for 15 s, 62°C for 15 s, and 65°C for 4 min, followed by final extension of 65°C for 1 min. Barcoded PCR products were purified using 0.8 X Agencourt AMPure XP beads (Beckman Coulter, Brea, CA). Concentrations of purified PCR products were measured using Qubit High Sensitivity Kit (Thermo Fisher, Waltham MA). Based on the concentrations, PCR products were pooled using 10 times more polyclonal clinical samples as compared with oligoclonal samples to increase sequencing coverage. Sequencing libraries were prepared from pooled barcoded PCR products according to manufacturer’s instruction. Briefly, end repair was performed in the following mixture: 48 µL of pooled PCR product, 3.5 µL of NEBNext FFPE DNA repair buffer, 2 µL of NEBNext FFPE DNA repair mix, 3.5 µL of Ultra II End-prep reaction buffer, and 3 µL of Ultra II End-prep enzyme mix (all from New England Biolabs); the mixture was incubated at 20°C for 15 min and 65°C for 15 min. End repaired products were purified with 1X Ampure XP beads (Agencourt) and eluted in 60 µL of nuclease-free water. Purified end-repaired products were ligated with 25 µL Ligation Buffer (ONT), 10 µL NEBNext Quick T4 DNA Ligase (New England Biolabs), and 5 µL Adapter Mix (ONT) and incubated at room temperature for 30 min. Ligated products were purified with 0.4X Ampure XP beads (Agencourt) and Short Fragment Buffer (ONT) and final sequencing library was eluted in Elution Buffer (ONT). Sequencing library was loaded into a single ONT PromethION flowcell and sequenced for 40 hours.</p></sec><sec id="s2-7"><title>Sequence data analysis</title><p>A flow diagram for sequence data analysis is outlined in <xref ref-type="fig" rid="F3">figure 3</xref>. Analysis parameters and custom scripts are provided in <xref ref-type="supplementary-material" rid="SP1">online supplementary information</xref>. Sequencing reads were base-called and demultiplexed using Guppy basecaller V.2.3.7 (ONT). Reads were classified based on the read quality score as pass (≥7) or fail (&lt;7) by the basecaller. Adapters and sample barcodes were trimmed using Porechop V.0.2.4 (<ext-link ext-link-type="uri" xlink:href="https://github.com/rrwick/Porechop" xlink:type="simple">https://github.com/rrwick/Porechop</ext-link>). Reads that were shorter than the combined lengths of the predicted flanking sequences of the amplicons (885 bp for inverse PCR and 362 bp for cassette ligation PCR) were excluded from analysis. For inverse PCR, filtered reads were aligned to hg38 genome and both flanking sequences (ie, 3′LTR and distal transgene sequence), with masking of the distal transgene sequence using BWA mem (V.0.7.15).<xref ref-type="bibr" rid="R18">18</xref> For cassette ligation PCR, the flanking cassette sequence was short and difficult to align; hence, this was first trimmed with Porechop and the trimmed reads were then aligned to hg38 genome and flanking 3′LTR with BWA mem (V.0.7.15).<xref ref-type="bibr" rid="R18">18</xref> Note that as a result of cassette trimming, the final reads for cassette ligation PCR were 27 bp shorter than the original filtered reads. To determine which of the two ends represented the 3′LTR-genome junction, we developed a tool called FlankDetect (<ext-link ext-link-type="uri" xlink:href="https://github.com/mdcao/japsa" xlink:type="simple">https://github.com/mdcao/japsa</ext-link>) (V.1.9-10b) (<xref ref-type="supplementary-material" rid="SP1">online supplementary information</xref>), which identifies reads which contain the flanking sequences and reports the integration site that flanks the junctional 3′LTR sequence. This tool also assigns clonality by clustering reads based on the flanking integration sites. Reads which have integration sites within 10 bp of each other are clustered together. During clustering, alignments that were not primary alignment and less than mapping quality of 20 were excluded from further analysis. To eliminate false clusters, Bedtools (V.2.26.0) merge option was used to merge any overlapping clusters which contain reads that align to the same region. The integration site that is most frequently observed within all the reads that are merged together is retained as the integration site of the clone.</p><fig position="float" id="F3" orientation="portrait"><object-id pub-id-type="publisher-id">F3</object-id><label>Figure 3</label><caption><p>Flowchart for nanopore sequencing analysis. Tools used for analysis are italicized.</p></caption><graphic xlink:href="jitc-2019-000299f03" position="float" orientation="portrait" xlink:type="simple"/></fig></sec><sec id="s2-8"><title>Annotation of integration sites</title><p>Genomic locations of transcription start site (TSS), exonic regions, intronic regions, and intergenic regions were extracted from GENCODE V.28 gene annotation file using custom scripts (<xref ref-type="supplementary-material" rid="SP1">online supplementary information</xref>). Genomic annotation of integration site was performed using Bedtools (V.2.26.0) intersect option. Genomic distance of the integration site from TSS was calculated using custom scripts (<xref ref-type="supplementary-material" rid="SP1">online supplementary information</xref>).</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Amplification of flanking DNA by inverse PCR and cassette ligation PCR</title><p>The amplicons from inverse PCR and cassette ligation PCR were predicted to have a sandwich structure: the flanking genomic sequence in the middle, which would be contiguous with the 3′LTR on one end, and the sticky-end ligated distal transgene sequence or linker cassette sequence on the other end (<xref ref-type="fig" rid="F2">figure 2A</xref>). The theoretical minimum lengths of productive amplicons, including the tailing sequences, were 929 bp for inverse PCR and 406 bp for cassette ligation PCR. We performed flanking sequence amplification on non-transduced peripheral blood mononuclear cells (PBMC), and SFG.iCasp9.2A.ΔCD19-transduced Jurkat cell clones and polyclonal clinical samples from our previously published phase I clinical trial.<xref ref-type="bibr" rid="R15">15</xref> There was no significant amplification of negative control non-transduced PBMC by inverse PCR (<xref ref-type="fig" rid="F2">figure 2A</xref>., lane 0A) but there was some amplification by cassette ligation PCR (<xref ref-type="fig" rid="F2">figure 2A</xref>, lane 0B). As expected, inverse PCR and cassette ligation PCR on transgenic Jurkat cell clones (clones 1 and 2) resulted in single PCR fragments (<xref ref-type="fig" rid="F2">figure 2B</xref>: lanes 1A, 1B, 2A, 2B); and a 1:1 mixture of the two Jurkat cell clones resulted in a combination of the two bands (lanes 3A and 3B). Amplification of a polyclonal SFG.iCasp9.2A.ΔCD19-transduced clinical cell product yielded a polyclonal smear (lanes 4A and 4B), as did amplification of patient PBMC collected at Day 369 after T cell infusion (lanes 5A and 5B). However, amplification of patient PBMC from Day 1332 after T cell infusion showed a dominant band with inverse PCR and a polyclonal smear with cassette ligation PCR (lanes 6A and 6B), suggesting a possibility of bias in DNA fragment circularization or PCR amplification with the former. The inverse PCR amplicons in lanes 4A and 5A also contained bands that were shorter than the minimum theoretical length of 929 bp. These were later shown on nanopore sequencing to contain 3′LTR and transgene sequences without any intervening genomic DNA, which was consistent with the circularization of degraded DNA fragments near the 3′LTR.</p></sec><sec id="s3-2"><title>Specificity of PCR amplification</title><p>A combination of two 6-cutters (<italic toggle="yes">NcoI</italic> and <italic toggle="yes">BspHI</italic>) is expected to cut at approximately every 2048 bp (ie, 4<sup>6</sup>/2), generating an estimated 1.5×10<sup>6</sup> DNA fragments per diploid human cell, which has a genome of approximately 3×10<sup>9</sup> bp. Given that a majority of transgenic T cells carry only a small number of transgene inserts per cell, this would mean that only a tiny fraction (&lt;0.005%) of the DNA fragments would include a transgene flanking sequence. Non-specific amplification of non-flanking sequences is therefore a challenge. As shown in <xref ref-type="fig" rid="F2">figure 2A</xref>, specific PCR amplicons following both inverse PCR and cassette ligation PCR should contain a <italic toggle="yes">SmaI</italic> restriction site within the 3′LTR flanking sequence, with inverse PCR amplicons having an additional <italic toggle="yes">SmaI</italic> restriction site at the transgene end. Thus, <italic toggle="yes">SmaI</italic> restriction enzyme digestion of specific PCR amplicons is anticipated to yield a 244 bp DNA fragment from the 3′LTR end and, in the case of inverse PCR, an additional 391 bp DNA fragment from the transgene end, along with flanking genomic DNA fragments of variable lengths. We digested the PCR products with <italic toggle="yes">SmaI</italic> and confirmed that the amplicons from SFG.iCasp9.2A.ΔCD19-transduced samples were specific, with the generation of 244 bp and 391 bp fragments from inverse PCR and a 244 bp fragment from cassette ligation PCR (<xref ref-type="fig" rid="F2">figure 2C</xref>). In contrast, <italic toggle="yes">SmaI</italic> digestion of PCR products from negative control non-transduced genomic DNA did not result in any specific 244 bp or 391 bp fragments (<xref ref-type="fig" rid="F2">figure 2C</xref>, lanes 0A and 0B).</p></sec><sec id="s3-3"><title>Nanopore output and read filtering</title><p>All 12 paired PCR products from the six samples were pooled into one nanopore sequencing run. In order to ensure adequate read-depth, the amount of input DNA was limited to the equivalent of less than 10,000 transduced cells per sample (see <xref ref-type="supplementary-material" rid="SP1">online supplementary table S2</xref>). Because the Jurkat samples were clonal and hence required fewer total reads, they were pooled with the polyclonal patient samples at a ratio of 1:10. The sequencing run produced 23.4 million reads in total and 59% of reads were classified as passing quality score (read quality ≥7). Approximately 6% of the pass reads could not be demultiplexed and were excluded. In most of the samples, &gt;90% of the resulting reads were longer than the minimum theoretical length of 885 bp for inverse PCR and 362 bp for cassette ligation PCR after adapter trimming. A vast majority of the length-filtered reads were specific, with 95% (range 89%–98%) having both expected flanking sequences: the junctional 3′LTR flank on one end and the cassette or transgene sequence on the other end. <xref ref-type="table" rid="T1">Table 1</xref> summarizes the number of reads retained after each data analysis step.</p><table-wrap position="float" id="T1" orientation="portrait"><object-id pub-id-type="publisher-id">T1</object-id><label>Table 1</label><caption><p>Number and proportion of reads after filtering and alignment</p></caption><table frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom" rowspan="2" colspan="2"/><td align="left" valign="bottom" rowspan="2" colspan="1">Sample ID</td><td align="left" valign="bottom" rowspan="1" colspan="1">Pass reads</td><td align="left" valign="bottom" colspan="2" rowspan="1">Adapter trimmed reads</td><td align="left" valign="bottom" colspan="2" rowspan="1">Reads &gt;minimum theoretical length</td><td align="left" valign="bottom" colspan="2" rowspan="1">Reads with both flanks</td><td align="left" valign="bottom" colspan="2" rowspan="1">Aligned reads</td></tr><tr><td align="left" valign="bottom" rowspan="1" colspan="1">Number of reads</td><td align="left" valign="bottom" rowspan="1" colspan="1">Number of reads</td><td align="left" valign="bottom" rowspan="1" colspan="1">% of pass reads</td><td align="left" valign="bottom" rowspan="1" colspan="1">Number of reads</td><td align="left" valign="bottom" rowspan="1" colspan="1">% of adapter trimmed reads</td><td align="left" valign="bottom" rowspan="1" colspan="1">Number of reads</td><td align="left" valign="bottom" rowspan="1" colspan="1">% of reads &gt;minimum theoretical length</td><td align="left" valign="bottom" rowspan="1" colspan="1">Number of reads</td><td align="left" valign="bottom" rowspan="1" colspan="1">% of reads with both flanks</td></tr></thead><tbody><tr><td align="left" valign="middle" rowspan="6" colspan="1">Inverse PCR</td><td align="left" valign="middle" rowspan="3" colspan="1">Jurkat cells</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1A</td><td align="char" char="." valign="top" rowspan="1" colspan="1">56,043</td><td align="char" char="." valign="top" rowspan="1" colspan="1">50,396</td><td align="char" char="." valign="top" rowspan="1" colspan="1">89.9</td><td align="char" char="." valign="top" rowspan="1" colspan="1">48,451</td><td align="char" char="." valign="top" rowspan="1" colspan="1">96.1</td><td align="char" char="." valign="top" rowspan="1" colspan="1">44,776</td><td align="char" char="." valign="top" rowspan="1" colspan="1">92.4</td><td align="char" char="." valign="top" rowspan="1" colspan="1">44,475</td><td align="char" char="." valign="top" rowspan="1" colspan="1">99.3</td></tr><tr><td align="char" char="." valign="top" rowspan="1" colspan="1">2A</td><td align="char" char="." valign="top" rowspan="1" colspan="1">272,138</td><td align="char" char="." valign="top" rowspan="1" colspan="1">249,196</td><td align="char" char="." valign="top" rowspan="1" colspan="1">91.6</td><td align="char" char="." valign="top" rowspan="1" colspan="1">237,487</td><td align="char" char="." valign="top" rowspan="1" colspan="1">95.3</td><td align="char" char="." valign="top" rowspan="1" colspan="1">232,040</td><td align="char" char="." valign="top" rowspan="1" colspan="1">97.7</td><td align="char" char="." valign="top" rowspan="1" colspan="1">218,894</td><td align="char" char="." valign="top" rowspan="1" colspan="1">94.3</td></tr><tr><td align="char" char="." valign="top" rowspan="1" colspan="1">3A</td><td align="char" char="." valign="top" rowspan="1" colspan="1">157,759</td><td align="char" char="." valign="top" rowspan="1" colspan="1">146,228</td><td align="char" char="." valign="top" rowspan="1" colspan="1">92.7</td><td align="char" char="." valign="top" rowspan="1" colspan="1">139,974</td><td align="char" char="." valign="top" rowspan="1" colspan="1">95.7</td><td align="char" char="." valign="top" rowspan="1" colspan="1">136,263</td><td align="char" char="." valign="top" rowspan="1" colspan="1">97.3</td><td align="char" char="." valign="top" rowspan="1" colspan="1">129,181</td><td align="char" char="." valign="top" rowspan="1" colspan="1">94.8</td></tr><tr><td align="left" valign="middle" rowspan="3" colspan="1">Clinical samples</td><td align="char" char="." valign="top" rowspan="1" colspan="1">4A</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,949,817</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,800,452</td><td align="char" char="." valign="top" rowspan="1" colspan="1">92.3</td><td align="char" char="." valign="top" rowspan="1" colspan="1">581,723</td><td align="char" char="." valign="top" rowspan="1" colspan="1">32.3</td><td align="char" char="." valign="top" rowspan="1" colspan="1">519,444</td><td align="char" char="." valign="top" rowspan="1" colspan="1">89.3</td><td align="char" char="." valign="top" rowspan="1" colspan="1">327,685</td><td align="char" char="." valign="top" rowspan="1" colspan="1">63.1</td></tr><tr><td align="char" char="." valign="top" rowspan="1" colspan="1">5A</td><td align="char" char="." valign="top" rowspan="1" colspan="1">3,102,548</td><td align="char" char="." valign="top" rowspan="1" colspan="1">2,889,377</td><td align="char" char="." valign="top" rowspan="1" colspan="1">93.1</td><td align="char" char="." valign="top" rowspan="1" colspan="1">231,456</td><td align="char" char="." valign="top" rowspan="1" colspan="1">8.0</td><td align="char" char="." valign="top" rowspan="1" colspan="1">213,196</td><td align="char" char="." valign="top" rowspan="1" colspan="1">92.1</td><td align="char" char="." valign="top" rowspan="1" colspan="1">146,956</td><td align="char" char="." valign="top" rowspan="1" colspan="1">68.9</td></tr><tr><td align="char" char="." valign="top" rowspan="1" colspan="1">6A</td><td align="char" char="." valign="top" rowspan="1" colspan="1">2,868,949</td><td align="char" char="." valign="top" rowspan="1" colspan="1">2,645,501</td><td align="char" char="." valign="top" rowspan="1" colspan="1">92.2</td><td align="char" char="." valign="top" rowspan="1" colspan="1">2,377,721</td><td align="char" char="." valign="top" rowspan="1" colspan="1">89.9</td><td align="char" char="." valign="top" rowspan="1" colspan="1">2,338,293</td><td align="char" char="." valign="top" rowspan="1" colspan="1">98.3</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,724,250</td><td align="char" char="." valign="top" rowspan="1" colspan="1">73.7</td></tr><tr><td align="left" valign="middle" rowspan="6" colspan="1">Cassette ligation PCR</td><td align="left" valign="middle" rowspan="3" colspan="1">Jurkat cells</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1B</td><td align="char" char="." valign="top" rowspan="1" colspan="1">91,891</td><td align="char" char="." valign="top" rowspan="1" colspan="1">84,230</td><td align="char" char="." valign="top" rowspan="1" colspan="1">91.7</td><td align="char" char="." valign="top" rowspan="1" colspan="1">78,796</td><td align="char" char="." valign="top" rowspan="1" colspan="1">93.5</td><td align="char" char="." valign="top" rowspan="1" colspan="1">73,476</td><td align="char" char="." valign="top" rowspan="1" colspan="1">93.2</td><td align="char" char="." valign="top" rowspan="1" colspan="1">70,763</td><td align="char" char="." valign="top" rowspan="1" colspan="1">96.3</td></tr><tr><td align="char" char="." valign="top" rowspan="1" colspan="1">2B</td><td align="char" char="." valign="top" rowspan="1" colspan="1">150,027</td><td align="char" char="." valign="top" rowspan="1" colspan="1">135,417</td><td align="char" char="." valign="top" rowspan="1" colspan="1">90.3</td><td align="char" char="." valign="top" rowspan="1" colspan="1">129,610</td><td align="char" char="." valign="top" rowspan="1" colspan="1">95.7</td><td align="char" char="." valign="top" rowspan="1" colspan="1">125,634</td><td align="char" char="." valign="top" rowspan="1" colspan="1">96.9</td><td align="char" char="." valign="top" rowspan="1" colspan="1">118,086</td><td align="char" char="." valign="top" rowspan="1" colspan="1">94.0</td></tr><tr><td align="char" char="." valign="top" rowspan="1" colspan="1">3B</td><td align="char" char="." valign="top" rowspan="1" colspan="1">131,303</td><td align="char" char="." valign="top" rowspan="1" colspan="1">111,739</td><td align="char" char="." valign="top" rowspan="1" colspan="1">85.1</td><td align="char" char="." valign="top" rowspan="1" colspan="1">110,416</td><td align="char" char="." valign="top" rowspan="1" colspan="1">98.8</td><td align="char" char="." valign="top" rowspan="1" colspan="1">102,695</td><td align="char" char="." valign="top" rowspan="1" colspan="1">93.0</td><td align="char" char="." valign="top" rowspan="1" colspan="1">97,443</td><td align="char" char="." valign="top" rowspan="1" colspan="1">94.9</td></tr><tr><td align="left" valign="middle" rowspan="3" colspan="1">Clinical samples</td><td align="char" char="." valign="top" rowspan="1" colspan="1">4B</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,488,028</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,373,853</td><td align="char" char="." valign="top" rowspan="1" colspan="1">92.3</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,272,524</td><td align="char" char="." valign="top" rowspan="1" colspan="1">92.6</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,234,596</td><td align="char" char="." valign="top" rowspan="1" colspan="1">97.0</td><td align="char" char="." valign="top" rowspan="1" colspan="1">856,189</td><td align="char" char="." valign="top" rowspan="1" colspan="1">69.3</td></tr><tr><td align="char" char="." valign="top" rowspan="1" colspan="1">5B</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,333,591</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,203,536</td><td align="char" char="." valign="top" rowspan="1" colspan="1">90.2</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,072,963</td><td align="char" char="." valign="top" rowspan="1" colspan="1">89.2</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,040,570</td><td align="char" char="." valign="top" rowspan="1" colspan="1">97.0</td><td align="char" char="." valign="top" rowspan="1" colspan="1">726,298</td><td align="char" char="." valign="top" rowspan="1" colspan="1">69.8</td></tr><tr><td align="char" char="." valign="top" rowspan="1" colspan="1">6B</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,228,503</td><td align="char" char="." valign="top" rowspan="1" colspan="1">1,137,012</td><td align="char" char="." valign="top" rowspan="1" colspan="1">92.6</td><td align="char" char="." valign="top" rowspan="1" colspan="1">945,077</td><td align="char" char="." valign="top" rowspan="1" colspan="1">83.1</td><td align="char" char="." valign="top" rowspan="1" colspan="1">926,182</td><td align="char" char="." valign="top" rowspan="1" colspan="1">98.0</td><td align="char" char="." valign="top" rowspan="1" colspan="1">435,600</td><td align="char" char="." valign="top" rowspan="1" colspan="1">47.0</td></tr></tbody></table></table-wrap></sec><sec id="s3-4"><title>Sequence alignment and clustering</title><p>Greater than 94% of reads containing the expected flanking sequences from the transduced Jurkat cell lines (samples 1, 2, and 3) could be uniquely aligned to the genome (<xref ref-type="table" rid="T1">table 1</xref>). The genome alignment rate was lower for the polyclonal clinical samples, with 47%–74% (median 69%) of reads with the expected flanking sequences being successfully aligned. A majority of reads that could not be aligned to genomic DNA were only marginally longer than the minimum theoretical lengths of the PCR amplicons and were therefore too short to be uniquely aligned (<xref ref-type="fig" rid="F4">figure 4A</xref>). Long unaligned reads generally lacked the anticipated flanking 3′LTR/transgene or cassette sequences and therefore represented non-specific amplicons. A significant proportion of inverse PCR amplicons in samples 4 and 5 were below the minimum theoretical lengths. Alignment of three dominant clones (560 bp, 388 bp, and 318 bp) showed that these consisted of the terminal regions of the flanking 3′LTR and transgene sequences, without any intervening genomic DNA (<xref ref-type="fig" rid="F4">figure 4B</xref>), in an orientation that was consistent with the circularization and PCR amplification of degraded DNA fragments within the transgene/3′LTR region (<xref ref-type="fig" rid="F4">figure 4C</xref>).</p><fig position="float" id="F4" orientation="portrait"><object-id pub-id-type="publisher-id">F4</object-id><label>Figure 4</label><caption><p>Read alignment and clustering. (A) Read-length distribution for the polyclonal clinical samples by inverse PCR (top row) and cassette ligation PCR (bottom row) relative to their respective minimum theoretical lengths of 885 and 335 bp (after cassette trimming). Shown are reads that were below the minimum theoretical length (black), reads that were above the minimum theoretical length but did not have the expected flanking sequences (orange), and reads with the expected flanking sequences that were aligned (green) or unaligned (blue) to genomic DNA. (B) Schematic representation of the dominant short inverse PCR amplicons in samples 4A (i and ii) and 5A (iii). Note that the junctions between the 3′LTR and transgene were formed by circularization of DNA fragments and were not the native junction. (C) Schematic representation of the formation of short amplicons from DNA fragments. (D) Distribution of number of reads per cluster. Shown are data for all 12 samples. (E) Span of 3′LTR-genome junction for clusters that contained two to four reads. ‘0’ indicates identical 3′LTR-genome junction for all reads within the cluster. (F) Span of 3′LTR-genome junction that includes 80% of reads in clusters that include five or more reads. (G) Number of clusters per clone after merging clusters with overlapping read alignment.</p></caption><graphic xlink:href="jitc-2019-000299f04" position="float" orientation="portrait" xlink:type="simple"/></fig><p>Aligned reads with 3′LTR-genome junctions that were within 10 bp of each other were clustered together using our customized tool, FlankDetect. The 4,895,820 reads were grouped into 12,186 clusters. Each cluster consisted of 1 to &gt;10<sup>6</sup> reads: 59% of clusters had single reads, 24% of clusters had 2–10 reads, 7% of clusters had 11–100 reads, and the remaining 10% of clusters had &gt;100 reads (<xref ref-type="fig" rid="F4">figure 4D</xref>). For clusters with two to four reads, the 3′LTR -genome junction was identical in 24% of the clusters. The junction varied by one nucleotide in 28% of clusters, and by two to three nucleotides in 18% of clusters (<xref ref-type="fig" rid="F4">figure 4E</xref>). Overall, for clusters with two to four reads, the spread of 3′LTR -genome junctions was within five nucleotides in 88% of the clusters, but a few clusters had a spread of 10 to 15 nucleotides. For clusters with ≥5 reads, we defined R80 as the span of 3′LTR -genome junction that contained at least 80% of reads within the cluster: 15% of clusters had R80 of 0 nucleotides, meaning 80% of the reads had identical 3′LTR-genome junction; and 80% of clusters had R80 of 1 nucleotide (<xref ref-type="fig" rid="F4">figure 4F</xref>). Overall, for clusters with five or more reads, 97% had an R80 of ≤5 nucleotide, meaning 80% of reads within the clusters were within a span of five nucleotides, although there were isolated clusters with a spread of up to 40 nucleotides.</p><p>We observed that a proportion of the clusters were very proximate to each other. In some cases, the read alignments were very closely matched but the clusters were considered separate because the 3′LTR-genome junction was assigned to opposite ends of the read, which would suggest an underlying alignment error. In order to avoid splitting clonal integration sites into multiple artificial clones, clusters with overlapping read alignments were merged and considered as belonging to the same clone. Using this merging algorithm, we identified 6410 unique vector integration clones: 4440 clones (69%) consisted of only one cluster, 697 clones (11%) consisted of two clusters, 383 clones (6%) consisted of four clusters, and the remaining 890 clones (14%) consisted of four to 18 clusters (<xref ref-type="fig" rid="F4">figure 4G</xref>).</p></sec><sec id="s3-5"><title>Clonal composition by inverse PCR and cassette ligation PCR</title><p>Samples 1 and 2 each contained a unique vector integration site, which were detected by both inverse PCR and cassette ligation PCR. Note that both samples had a degree of subclonal contamination, which was more prominent on cassette ligation PCR than inverse PCR. Sample 3 consisted of an equal mixture of samples 1 and 2 but there was a dominance of the integration site from sample 2, with the bias being more pronounced by inverse PCR (<xref ref-type="fig" rid="F5">figure 5A</xref>). The clinical samples were polyclonal: the cell product (sample 4) was anticipated to be the most clonally diverse, with some degree of clonal dominance emerging in the postinfusion patient samples (samples 5 and 6).<xref ref-type="bibr" rid="R15">15</xref> The number of unique vector integration sites identified in samples 4, 5, and 6 were 979, 196, and 602 by inverse PCR and 2258, 1251, and 669 by cassette ligation PCR, with the starting materials containing approximately 7500, 4700, and 2500 <italic toggle="yes">iCasp9</italic>-transduced cells. In all three samples, clonal skewing was more pronounced with inverse PCR than cassette ligation PCR: the top 10 integration sites in samples 4, 5, and 6 accounted for 49%, 93%, and &gt;99%, respectively, of the total aligned reads by inverse PCR; as compared with 7%, 58%, and 76% of the total aligned reads by cassette ligation PCR (<xref ref-type="fig" rid="F5">figure 5B</xref>). A proportion of the integration sites were detected by both techniques but their percentage representation within the sample differed between the two techniques, and a majority of integration sites were mapped by only one of the techniques (<xref ref-type="fig" rid="F5">figure 5C</xref>). The very large clone representing 97% of reads in sample 6 by inverse PCR, represented only 0.1% of the reads by cassette ligation PCR. This clone also had higher clonal representation by inverse PCR relative to cassette ligation PCR in samples 4 and 5 (0.08% vs 0.02%; and 0.44% vs 0.15%), suggesting amplification bias.</p><fig position="float" id="F5" orientation="portrait"><object-id pub-id-type="publisher-id">F5</object-id><label>Figure 5</label><caption><p>Clonal composition of vector integration sites. (A) Distribution of vector integration sites as a proportion of total aligned reads in <italic toggle="yes">iCasp9</italic>-transduced Jurkat cell clones. Shown are paired analysis by inverse PCR (top row) and cassette ligation PCR (bottom row). Samples 1 and 2 were two separate Jurkat cell clones, and sample 3 was a 1:1 mix of samples 1 and 2. Green and blue indicate different clones. Light green and light blue indicate subclones. (B) Distribution of vector integration sites as a proportion of total aligned reads in polyclonal clinical samples. Shown are paired analysis by inverse PCR (top row) and cassette ligation PCR (bottom row). Sample 4 was <italic toggle="yes">iCasp9</italic>-transduced cell product; and samples 5 and 6 were PBMC obtained at day +369 and +1332 after cell infusion, respectively. The top 10 clones for each sample are shown in color; with the remainder represented in white. The color representation is random and does not correspond to the same clones across different pie charts. (C) Overlap of unique vector integration sites identified by inverse PCR and cassette ligation PCR in the polyclonal clinical samples.<xref ref-type="fig" rid="F5">figure 5C</xref> was plotted with R V.3.5.3 (venneuler package).</p></caption><graphic xlink:href="jitc-2019-000299f05" position="float" orientation="portrait" xlink:type="simple"/></fig></sec><sec id="s3-6"><title>Location of integration sites within the genome</title><p>Vector integration sites were identified within all chromosomes, with higher representations within the larger chromosomes, as these represented a larger component of the total genome (<xref ref-type="fig" rid="F6">figure 6A</xref>). A majority (61%–68%) of integration sites were intragenic, with 55%–58% within the introns, and 6%–12% within the exons; with the remaining 32%–39% of integration sites being intergenic (<xref ref-type="fig" rid="F6">figure 6B</xref>). There was a predilection for vector integration near TSS (<xref ref-type="fig" rid="F6">figure 6C</xref>), which was consistent with other reports.<xref ref-type="bibr" rid="R3 R5 R6">3 5 6</xref> There was no predilection for vector integration near LTR73 and LTR76, which are human endogenous retrovirus sequences with some sequence similarity to the SFG vector LTR (<xref ref-type="supplementary-material" rid="SP1">online supplementary figure S1</xref>).</p><fig position="float" id="F6" orientation="portrait"><object-id pub-id-type="publisher-id">F6</object-id><label>Figure 6</label><caption><p>Distribution of unique vector integration sites within the genome as detected by inverse PCR (top) and cassette ligation PCR (bottom). Integration sites are annotated by (A) chromosomes, (B) gene coding regions (exons, introns, and intergenic), and (C) distance to transcription start sites (TSS). Median values were presented.</p></caption><graphic xlink:href="jitc-2019-000299f06" position="float" orientation="portrait" xlink:type="simple"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><p>Analysis of vector integration sites is currently restricted to highly specialized academic institutions where it is used largely as a research tool. However, gene-modified cellular therapeutics, especially CAR T cells, are rapidly entering routine clinical practice and vector integration site analysis would be required from time-to-time to monitor for the emergence of dominant clones. Many smaller clinical centers do not have access to expensive sequencing instrument and, furthermore, while short-read next-generation sequencing is cost effective for large batches, the cost per batch is very high. As a result, centers with low sample volumes will need to either run smaller batches at significantly higher cost per sample, or accumulate samples over a very long period of time for cost-effective batching, which reduces the timeliness of the analysis. In this paper, we showed that nanopore sequencing platform could be successfully utilized to map polyclonal vector integration sites.</p><p>Nanopore sequencing has been used by others to identify the transgene integration site in transgenic animals.<xref ref-type="bibr" rid="R19">19</xref> In this setting, the transgene integrates within a single locus in the host cell genome but the changes are complex because microinjection of linearized DNA fragments into the pronucleus of zygotes typically results in multiple copies of the transgene inserted in tandem, often with complex internal structure, including transgene inversions, and contamination by <italic toggle="yes">Escherichia Coli</italic> genomic DNA, together with large deletions and other structural changes in the flanking host cell genome.<xref ref-type="bibr" rid="R19 R20">19 20</xref> Long-read whole genome sequencing by nanopore or other platforms can simultaneously identify the integration site and define these large, complex and tandem changes which are very difficult to resolve by short-read sequencing.<xref ref-type="bibr" rid="R19">19</xref> In contrast, retrovirus-mediated transgene integration in clinical cell therapy is cleaner: each transgene integration site contains a single copy rather than tandem copies of the vector insert, without any large structural changes to the flanking genome. However, retrovirus-mediated somatic gene modification involves hundreds of thousands of parental cells, each with one or more distinct integration event, which results in a very large number of unique integration sites. These vector integration sites cannot be studied by whole genome sequencing; instead, some form of amplification or capture of the vector integrant together with the flanking genomic DNA is essential.</p><p>We used two different methods to amplify flanking genomic DNA: inverse PCR and cassette ligation PCR. Both methods used the same nested PCR primers at the 3′LTR flank (<xref ref-type="supplementary-material" rid="SP1">online supplementary table S1</xref>). The SFG backbone in SFG.iCasp9.2A.ΔCD19 was derived from Moloney Murine Leukemia Virus,<xref ref-type="bibr" rid="R21 R22">21 22</xref> which did not in evolution infect human and has minimum sequence similarity with human endogenous retroviruses (<ext-link ext-link-type="uri" xlink:href="http://dfam.org" xlink:type="simple">http://dfam.org</ext-link>).<xref ref-type="bibr" rid="R23">23</xref> Thus, although elements from endogenous retroviruses constitute up to 8% of the human genome,<xref ref-type="bibr" rid="R24">24</xref> the 3′LTR flank and the primers used in this analysis are specific to the vector. There are two human endogenous retrovirus sequences, LTR73 and LTR76, which have a degree of sequence similarity to the vector LTR; however, any non-specific amplicons that may arise from mispriming of these LTRs will be excluded from analysis because their degree of similarity to the vector LTR is &lt;50%, which is below the 80% threshold set by our FlankDetect script.</p><p>Inverse PCR was slightly less demanding technically but has a higher potential for bias because efficient circularization is limited to DNA fragments of 300 bp to 3 kb, and secondary structure formation can further limit circularization efficiency. There is also competition between intramolecular circularization and intermolecular ligation, although this can be partially minimized using a dilute DNA ligation mix. In order to reduce bias, we adapted a previously described cassette ligation PCR method<xref ref-type="bibr" rid="R25">25</xref> to amplify the flanking genomic sequences with high efficiency and specificity. This method had significantly less bias compared with the inverse PCR method but it was not completely bias-free as an equal mix of the two Jurkat clones did not produce equal representations of reads from each clone, although was less skewed than inverse PCR.</p><p>Our analysis considered clusters with any degree of overlap in read alignments as belonging to the same vector integration site. It is possible that this could erroneously merge proximate but distinct vector integration sites, resulting in an underestimation of clonal diversity. We have developed our clustering protocol to err on the side of over-clustering because a key function of vector integration site analysis is to detect clonal dominance, which can sometimes indicate autonomous growth or insertional mutagenesis, and it is therefore important to avoid splitting single integration sites into multiple artificial clones. The number of unique integration sites mapped in our study was consistent with those using LAM-PCR followed by next-generation short-read sequencing, which typically detects around 200 to 8000 unique integration sites from 10<sup>3</sup> to 10<sup>6</sup> transduced T cells.<xref ref-type="bibr" rid="R3 R5 R6">3 5 6</xref> However, in our analysis of polyclonal clinical samples using inverse PCR and cassette ligation PCR in parallel, only 7% of unique vector integration sites could be detected by both methods. This low level of overlap was likely a result of both PCR amplification bias and sampling artifact. Gene-modified T cells, including <italic toggle="yes">iCasp9</italic>-transduced T cells, have been shown to be highly polyclonal by T cell receptor<xref ref-type="bibr" rid="R15 R26">15 26</xref> and vector integration site analysis.<xref ref-type="bibr" rid="R3 R15">3 15</xref> We and others have detected 10<sup>3</sup> to 10<sup>4</sup> unique clonotypes within aliquots of infused cell products and postinfusion patient samples in T cell therapy trials using gammaretroviral vectors.<xref ref-type="bibr" rid="R3 R6 R15">3 6 15</xref> The actual clonal richness is likely much higher if a very large number of cells can be sampled and sequenced at depth without bias. The likelihood of a particular clone being randomly sampled twice is a function of its clonal frequency and the sample size. In this study, the amount of input DNA in the polyclonal clinical samples represented &lt;0.001% of the total pool of transduced cells; hence, our observation that only a small proportion of clones could be detected by both inverse PCR and cassette ligation PCR was consistent with the anticipated low likelihood of a particular clone being randomly sampled into both reaction mixtures. Nonetheless, the large differences in the clonal size of the identified overlapping clones would suggest that there was also significant contribution from amplification or sequencing bias.</p><p>In studies using gene-modified T cells, clonality can also be assessed by T cell receptor clonotype analysis. Although this remains an expensive assay, it is somewhat more accessible and can be outsourced to commercial entities. T cell receptor clonotype can provide a good indication of the clonal diversity of the transduced cells because clones bearing the same vector integration sites will bear the same T cell receptor clonotype. In our previous publication, clonal diversity as determined by vector integration site analysis using inverse PCR followed by nanopore sequencing closely correlated with clonal diversity by T cell receptor analysis.<xref ref-type="bibr" rid="R15">15</xref> However, T cell receptor analysis does not provide any information on the nature of the vector integration sites and cells with the same T cell receptor clonotype can sometimes carry different vector integration sites through separate transduction events.<xref ref-type="bibr" rid="R15 R27">15 27</xref>
</p><p>The amount of data that can be generated and the feasibility to scale as required make nanopore sequencing an attractive option for analysis of vector integration sites. In this report, we reused an ONT PromethION flow cell and obtained 15 Gb of sequencing data, which was sufficient to analyze six polyclonal and six oligoclonal samples, with &gt;5500 unique integration sites identified. Based on this estimate, the smaller ONT MinION flow cell, which costs around US$500–900 and capable of generating 20–30 Gb of sequencing data, could be used to sequence 12 polyclonal samples; whereas the larger ONT PromethION flow cell, which costs around US$1600–2000 and capable of generating around 80–100 Gb of sequencing data, would be suitable for larger batches. There is also now a very small ONT Flongle that is capable of 1.8 Gb of sequencing data at a cost of US$90 each, which may be suitable for single sample analysis. The sequencing cost for short-read next-generation sequencing is highly dependent on scale: larger, higher throughput instruments are much more cost efficient per unit of sequencing data but the cost per run is much higher. For example, short-read Illumina sequencing instruments come in a range of sizes, each with a choice of kits with different levels of output and cycle lengths. The cost for 150-cycle or 300-cycle kits that are typically used for this application ranges from US$1050–1200 for 3.5–5 Gb of sequencing data on an Illumina MiSeq instrument; to US$1250–5300 for 20–120 Gb of sequencing data on the larger Illumina NextSeq instrument; and US$6500–12,000 for 375–750 Gb of sequencing data on the even larger Illumina HiSeq instrument. Instrument access charges typically add 30–100% to the sequencing cost.</p><p>The data obtained from the different sequencing platforms cannot be directly compared: short-read next-generation sequencing provides better read quality than nanopore sequencing but their short-read lengths can limit their capacity to be uniquely aligned, especially when part of the read has been taken up by the flanking vector sequence. This caveat aside, the sequencing cost for 12 samples, yielding 20 Gb of sequencing data, is estimated at US$1650–2540 on an Illumina NextSeq, which consists of US$1250 for a mid-output 150-cycle kit plus 30–100% in facility charges; as compared with US$500–900 on a Nanopore MinIon, which has negligible capital cost and no access charges. The reagent cost for library preparation is around US$60–80 per sample for both nanopore and short-read next-generation sequencing.</p><p>A distinct advantage of nanopore sequencing is its low cost of entry as it does not require any dedicated sequencing instrument, making it highly feasible for smaller centers. These features are of immense relevance in the context of current developments in the CAR T cell field, which have seen their emergence from large dedicated academic research centers into routine implementation in smaller clinical centers where the ability to perform vector integration site analysis in a timely manner, with flexibility of scale, can be clinically important. The total assay time is under 4 days: one-and-a-half days to complete ligation and nested PCR, and 2 days for library preparation, sequencing, and data analysis.</p><p>The main drawback of nanopore sequencing is its high error rate. This limits its ability to confidently map the 3′LTR-genome junction at single nucleotide resolution. Nonetheless, a majority of clusters could be resolved within a 5-nucleotide span and 94% of clusters with five or more reads could be resolved within one nucleotide span. The resolution will likely improve with evolution in the technology platform and refinement in the assay design and data analysis. At present, the higher error rate also meant that relatively long stretches of flanking DNA sequence are required for successful alignment. The length of the flanking DNA sequence is predetermined by the position of the restriction site and hence integration sites that are very close to the restriction sites will always be very difficult to align. However, it may be possible to perform parallel analysis using different sets of restriction enzymes or tagmentation without restriction enzymes to increase the proportion of aligned reads.<xref ref-type="bibr" rid="R5 R6">5 6</xref>
</p><p>In summary, we have developed a readily accessible, highly scalable, low cost, and low capital method to analyze vector integration sites within a polyclonal sample using nanopore sequencing. This platform has the potential to become a practical alternative to short-read next-generation sequencing, especially for smaller clinical centers with low volume throughput where flexibility of scale and timeliness of results are important.</p></sec></body><back><ack><p>The authors acknowledge the advice from Dr Edmund Chang, previously at the Center for Cell and Gene Therapy, Baylor College of Medicine, Houston, Texas, USA, who suggested using nanopore sequencing for this purpose. The authors are grateful to the patients and their families for their participation in the associated phase I clinical trial.</p></ack><fn-group><fn fn-type="other"><label>Contributors</label><p>LJC and S-KT designed the study. PZ, DG, and RA performed experiments. DG, SHN, and LJC performed analysis of sequencing data; and PZ and S-KT analyzed the annotated data. PZ, DG, LJC, and S-KT wrote the manuscript.</p></fn><fn fn-type="other"><label>Funding</label><p>This work was supported by a Project Grant (APP1053135) from the National Health and Medical Research Council (NHMRC, Australia) and Royal Brisbane and Women's Hospital Foundation. S-KT was supported by an NHMRC Early Career Fellowship (APP1054786) and Metro North Hospital and Health Service Clinician Research Fellowship. LJC was supported by an NHMRC Career Development Fellowship (APP1130084).</p></fn><fn fn-type="conflict"><label>Competing interests</label><p>None declared.</p></fn><fn fn-type="other"><label>Patient consent for publication</label><p>Written informed consent was obtained from all subjects.</p></fn><fn fn-type="other"><label>Ethics approval</label><p>The associated clinical trial and use of study samples were prospectively approved by the Human Research Ethics Committee (Institutional Review Board) of Royal Brisbane and Women's Hospital. The clinical trial was conducted in accordance with the Declaration of Helsinki and the Australian National Statement on Ethical Conduct in Human Research.</p></fn><fn fn-type="other"><label>Provenance and peer review</label><p>Not commissioned; externally peer reviewed.</p></fn><fn fn-type="other"><label>Data availability statement</label><p>Data are available upon reasonable request</p></fn></fn-group><ref-list><title>References</title><ref id="R1"><label>1</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Eyquem</surname> <given-names>J</given-names>
</string-name>, <string-name name-style="western">
<surname>Mansilla-Soto</surname> <given-names>J</given-names>
</string-name>, <string-name name-style="western">
<surname>Giavridis</surname> <given-names>T</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Targeting a car to the TRAC locus with CRISPR/Cas9 enhances tumour rejection</article-title>. <source>Nature</source> <year>2017</year>;<volume>543</volume>:<fpage>113</fpage>–<lpage>7</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1038/nature21405" xlink:type="simple">doi:10.1038/nature21405</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/28225754</pub-id>
</mixed-citation></ref><ref id="R2"><label>2</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Dunbar</surname> <given-names>CE</given-names>
</string-name>, <string-name name-style="western">
<surname>High</surname> <given-names>KA</given-names>
</string-name>, <string-name name-style="western">
<surname>Joung</surname> <given-names>JK</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Gene therapy comes of age</article-title>. <source>Science</source> <year>2018</year>;<volume>359</volume>:<elocation-id>eaan4672</elocation-id>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1126/science.aan4672" xlink:type="simple">doi:10.1126/science.aan4672</ext-link>
</mixed-citation></ref><ref id="R3"><label>3</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Chang</surname> <given-names>EC</given-names>
</string-name>, <string-name name-style="western">
<surname>Liu</surname> <given-names>H</given-names>
</string-name>, <string-name name-style="western">
<surname>West</surname> <given-names>JA</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Clonal dynamics in vivo of virus integration sites of T cells expressing a safety switch</article-title>. <source>Mol Ther</source> <year>2016</year>;<volume>24</volume>:<fpage>736</fpage>–<lpage>45</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1038/mt.2015.217" xlink:type="simple">doi:10.1038/mt.2015.217</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/26639404</pub-id>
</mixed-citation></ref><ref id="R4"><label>4</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Recchia</surname> <given-names>A</given-names>
</string-name>, <string-name name-style="western">
<surname>Bonini</surname> <given-names>C</given-names>
</string-name>, <string-name name-style="western">
<surname>Magnani</surname> <given-names>Z</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Retroviral vector integration deregulates gene expression but has no consequence on the biology and function of transplanted T cells</article-title>. <source>Proc Natl Acad Sci U S A</source> <year>2006</year>;<volume>103</volume>:<fpage>1457</fpage>–<lpage>62</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1073/pnas.0507496103" xlink:type="simple">doi:10.1073/pnas.0507496103</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/16432223</pub-id>
</mixed-citation></ref><ref id="R5"><label>5</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Hamada</surname> <given-names>M</given-names>
</string-name>, <string-name name-style="western">
<surname>Nishio</surname> <given-names>N</given-names>
</string-name>, <string-name name-style="western">
<surname>Okuno</surname> <given-names>Y</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Integration mapping of piggyBac-Mediated CD19 chimeric antigen receptor T cells analyzed by novel Tagmentation-Assisted PCR</article-title>. <source>EBioMedicine</source> <year>2018</year>;<volume>34</volume>:<fpage>18</fpage>–<lpage>26</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1016/j.ebiom.2018.07.008" xlink:type="simple">doi:10.1016/j.ebiom.2018.07.008</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/30082227</pub-id>
</mixed-citation></ref><ref id="R6"><label>6</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Cattoglio</surname> <given-names>C</given-names>
</string-name>, <string-name name-style="western">
<surname>Maruggi</surname> <given-names>G</given-names>
</string-name>, <string-name name-style="western">
<surname>Bartholomae</surname> <given-names>C</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>High-Definition mapping of retroviral integration sites defines the fate of allogeneic T cells after donor lymphocyte infusion</article-title>. <source>PLoS One</source> <year>2010</year>;<volume>5</volume>:<elocation-id>e15688</elocation-id>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1371/journal.pone.0015688" xlink:type="simple">doi:10.1371/journal.pone.0015688</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/21203516</pub-id>
</mixed-citation></ref><ref id="R7"><label>7</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Hacein-Bey-Abina</surname> <given-names>S</given-names>
</string-name>, <string-name name-style="western">
<surname>Garrigue</surname> <given-names>A</given-names>
</string-name>, <string-name name-style="western">
<surname>Wang</surname> <given-names>GP</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Insertional oncogenesis in 4 patients after retrovirus-mediated gene therapy of SCID-X1</article-title>. <source>J Clin Invest</source> <year>2008</year>;<volume>118</volume>:<fpage>3132</fpage>–<lpage>42</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1172/JCI35700" xlink:type="simple">doi:10.1172/JCI35700</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/18688285</pub-id>
</mixed-citation></ref><ref id="R8"><label>8</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Howe</surname> <given-names>SJ</given-names>
</string-name>, <string-name name-style="western">
<surname>Mansour</surname> <given-names>MR</given-names>
</string-name>, <string-name name-style="western">
<surname>Schwarzwaelder</surname> <given-names>K</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Insertional mutagenesis combined with acquired somatic mutations causes leukemogenesis following gene therapy of SCID-X1 patients</article-title>. <source>J Clin Invest</source> <year>2008</year>;<volume>118</volume>:<fpage>3143</fpage>–<lpage>50</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1172/JCI35798" xlink:type="simple">doi:10.1172/JCI35798</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/18688286</pub-id>
</mixed-citation></ref><ref id="R9"><label>9</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Stein</surname> <given-names>S</given-names>
</string-name>, <string-name name-style="western">
<surname>Ott</surname> <given-names>MG</given-names>
</string-name>, <string-name name-style="western">
<surname>Schultze-Strasser</surname> <given-names>S</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Genomic instability and myelodysplasia with monosomy 7 consequent to EVI1 activation after gene therapy for chronic granulomatous disease</article-title>. <source>Nat Med</source> <year>2010</year>;<volume>16</volume>:<fpage>198</fpage>–<lpage>204</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1038/nm.2088" xlink:type="simple">doi:10.1038/nm.2088</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/20098431</pub-id>
</mixed-citation></ref><ref id="R10"><label>10</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Fraietta</surname> <given-names>JA</given-names>
</string-name>, <string-name name-style="western">
<surname>Nobles</surname> <given-names>CL</given-names>
</string-name>, <string-name name-style="western">
<surname>Sammons</surname> <given-names>MA</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Disruption of TET2 promotes the therapeutic efficacy of CD19-targeted T cells</article-title>. <source>Nature</source> <year>2018</year>;<volume>558</volume>:<fpage>307</fpage>–<lpage>12</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1038/s41586-018-0178-z" xlink:type="simple">doi:10.1038/s41586-018-0178-z</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/29849141</pub-id>
</mixed-citation></ref><ref id="R11"><label>11</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Paruzynski</surname> <given-names>A</given-names>
</string-name>, <string-name name-style="western">
<surname>Arens</surname> <given-names>A</given-names>
</string-name>, <string-name name-style="western">
<surname>Gabriel</surname> <given-names>R</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Genome-Wide high-throughput integrome analyses by nrLAM-PCR and next-generation sequencing</article-title>. <source>Nat Protoc</source> <year>2010</year>;<volume>5</volume>:<fpage>1379</fpage>–<lpage>95</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1038/nprot.2010.87" xlink:type="simple">doi:10.1038/nprot.2010.87</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/20671722</pub-id>
</mixed-citation></ref><ref id="R12"><label>12</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Schmidt</surname> <given-names>M</given-names>
</string-name>, <string-name name-style="western">
<surname>Schwarzwaelder</surname> <given-names>K</given-names>
</string-name>, <string-name name-style="western">
<surname>Bartholomae</surname> <given-names>C</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>High-Resolution insertion-site analysis by linear amplification-mediated PCR (LAM-PCR)</article-title>. <source>Nat Methods</source> <year>2007</year>;<volume>4</volume>:<fpage>1051</fpage>–<lpage>7</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1038/nmeth1103" xlink:type="simple">doi:10.1038/nmeth1103</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/18049469</pub-id>
</mixed-citation></ref><ref id="R13"><label>13</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Ameur</surname> <given-names>A</given-names>
</string-name>, <string-name name-style="western">
<surname>Kloosterman</surname> <given-names>WP</given-names>
</string-name>, <string-name name-style="western">
<surname>Hestand</surname> <given-names>MS</given-names>
</string-name>
</person-group>. <article-title>Single-Molecule sequencing: towards clinical applications</article-title>. <source>Trends Biotechnol</source> <year>2019</year>;<volume>37</volume>:<fpage>72</fpage>–<lpage>85</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1016/j.tibtech.2018.07.013" xlink:type="simple">doi:10.1016/j.tibtech.2018.07.013</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/30115375</pub-id>
</mixed-citation></ref><ref id="R14"><label>14</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Lu</surname> <given-names>H</given-names>
</string-name>, <string-name name-style="western">
<surname>Giordano</surname> <given-names>F</given-names>
</string-name>, <string-name name-style="western">
<surname>Ning</surname> <given-names>Z</given-names>
</string-name>
</person-group>. <article-title>Oxford nanopore MinION sequencing and genome assembly</article-title>. <source>Genomics Proteomics Bioinformatics</source> <year>2016</year>;<volume>14</volume>:<fpage>265</fpage>–<lpage>79</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1016/j.gpb.2016.05.004" xlink:type="simple">doi:10.1016/j.gpb.2016.05.004</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/27646134</pub-id>
</mixed-citation></ref><ref id="R15"><label>15</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Zhang</surname> <given-names>P</given-names>
</string-name>, <string-name name-style="western">
<surname>Raju</surname> <given-names>J</given-names>
</string-name>, <string-name name-style="western">
<surname>Ullah</surname> <given-names>MA</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Phase I trial of inducible caspase 9 T cells in adult stem cell transplant demonstrates massive clonotypic proliferative potential and long-term persistence of transgenic T cells</article-title>. <source>Clin Cancer Res</source> <year>2019</year>;<volume>25</volume>:<fpage>1749</fpage>–<lpage>55</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1158/1078-0432.CCR-18-3069" xlink:type="simple">doi:10.1158/1078-0432.CCR-18-3069</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/30765390</pub-id>
</mixed-citation></ref><ref id="R16"><label>16</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Pavlopoulos</surname> <given-names>A</given-names>
</string-name>
</person-group>. <article-title>Identification of DNA sequences that flank a known region by inverse PCR</article-title>. <source>Methods Mol Biol</source> <year>2011</year>;<volume>772</volume>:<fpage>267</fpage>–<lpage>75</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1007/978-1-61779-228-1_16" xlink:type="simple">doi:10.1007/978-1-61779-228-1_16</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/22065444</pub-id>
</mixed-citation></ref><ref id="R17"><label>17</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Tey</surname> <given-names>S-K</given-names>
</string-name>, <string-name name-style="western">
<surname>Dotti</surname> <given-names>G</given-names>
</string-name>, <string-name name-style="western">
<surname>Rooney</surname> <given-names>CM</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Inducible caspase 9 suicide gene to improve the safety of allodepleted T cells after haploidentical stem cell transplantation</article-title>. <source>Biol Blood Marrow Transplant</source> <year>2007</year>;<volume>13</volume>:<fpage>913</fpage>–<lpage>24</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1016/j.bbmt.2007.04.005" xlink:type="simple">doi:10.1016/j.bbmt.2007.04.005</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/17640595</pub-id>
</mixed-citation></ref><ref id="R18"><label>18</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Holstein</surname> <given-names>M</given-names>
</string-name>, <string-name name-style="western">
<surname>Mesa-Nuñez</surname> <given-names>C</given-names>
</string-name>, <string-name name-style="western">
<surname>Miskey</surname> <given-names>C</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Efficient non-viral gene delivery into human hematopoietic stem cells by minicircle sleeping Beauty transposon vectors</article-title>. <source>Mol Ther</source> <year>2018</year>;<volume>26</volume>:<fpage>1137</fpage>–<lpage>53</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1016/j.ymthe.2018.01.012" xlink:type="simple">doi:10.1016/j.ymthe.2018.01.012</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/29503198</pub-id>
</mixed-citation></ref><ref id="R19"><label>19</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Nicholls</surname> <given-names>PK</given-names>
</string-name>, <string-name name-style="western">
<surname>Bellott</surname> <given-names>DW</given-names>
</string-name>, <string-name name-style="western">
<surname>Cho</surname> <given-names>T-J</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Locating and characterizing a transgene integration site by nanopore sequencing</article-title>. <source>G3</source> <year>2019</year>;<volume>9</volume>:<fpage>1481</fpage>–<lpage>6</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1534/g3.119.300582" xlink:type="simple">doi:10.1534/g3.119.300582</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/30837263</pub-id>
</mixed-citation></ref><ref id="R20"><label>20</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Goodwin</surname> <given-names>LO</given-names>
</string-name>, <string-name name-style="western">
<surname>Splinter</surname> <given-names>E</given-names>
</string-name>, <string-name name-style="western">
<surname>Davis</surname> <given-names>TL</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Large-Scale discovery of mouse transgenic integration sites reveals frequent structural variation and insertional mutagenesis</article-title>. <source>Genome Res</source> <year>2019</year>;<volume>29</volume>:<fpage>494</fpage>–<lpage>505</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1101/gr.233866.117" xlink:type="simple">doi:10.1101/gr.233866.117</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/30659012</pub-id>
</mixed-citation></ref><ref id="R21"><label>21</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Büeler</surname> <given-names>H</given-names>
</string-name>, <string-name name-style="western">
<surname>Mulligan</surname> <given-names>RC</given-names>
</string-name>
</person-group>. <article-title>Induction of antigen-specific tumor immunity by genetic and cellular vaccines against MAGE: enhanced tumor protection by coexpression of granulocyte-macrophage colony-stimulating factor and B7-1</article-title>. <source>Mol Med</source> <year>1996</year>;<volume>2</volume>:<fpage>545</fpage>–<lpage>55</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1007/BF03401639" xlink:type="simple">doi:10.1007/BF03401639</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/8898371</pub-id>
</mixed-citation></ref><ref id="R22"><label>22</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Rivière</surname> <given-names>I</given-names>
</string-name>, <string-name name-style="western">
<surname>Brose</surname> <given-names>K</given-names>
</string-name>, <string-name name-style="western">
<surname>Mulligan</surname> <given-names>RC</given-names>
</string-name>
</person-group>. <article-title>Effects of retroviral vector design on expression of human adenosine deaminase in murine bone marrow transplant recipients engrafted with genetically modified cells</article-title>. <source>Proc Natl Acad Sci U S A</source> <year>1995</year>;<volume>92</volume>:<fpage>6733</fpage>–<lpage>7</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1073/pnas.92.15.6733" xlink:type="simple">doi:10.1073/pnas.92.15.6733</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/7624312</pub-id>
</mixed-citation></ref><ref id="R23"><label>23</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Hubley</surname> <given-names>R</given-names>
</string-name>, <string-name name-style="western">
<surname>Finn</surname> <given-names>RD</given-names>
</string-name>, <string-name name-style="western">
<surname>Clements</surname> <given-names>J</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>The Dfam database of repetitive DNA families</article-title>. <source>Nucleic Acids Res</source> <year>2016</year>;<volume>44</volume>:<fpage>D81</fpage>–<lpage>9</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1093/nar/gkv1272" xlink:type="simple">doi:10.1093/nar/gkv1272</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/26612867</pub-id>
</mixed-citation></ref><ref id="R24"><label>24</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Lander</surname> <given-names>ES</given-names>
</string-name>, <string-name name-style="western">
<surname>Linton</surname> <given-names>LM</given-names>
</string-name>, <string-name name-style="western">
<surname>Birren</surname> <given-names>B</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Initial sequencing and analysis of the human genome</article-title>. <source>Nature</source> <year>2001</year>;<volume>409</volume>:<fpage>860</fpage>–<lpage>921</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1038/35057062" xlink:type="simple">doi:10.1038/35057062</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/11237011</pub-id>
</mixed-citation></ref><ref id="R25"><label>25</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Iwahana</surname> <given-names>H</given-names>
</string-name>, <string-name name-style="western">
<surname>Tsujisawa</surname> <given-names>T</given-names>
</string-name>, <string-name name-style="western">
<surname>Katashima</surname> <given-names>R</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Pcr with end trimming and cassette ligation: a rapid method to clone exon-intron boundaries and a 5'-upstream sequence of genomic DNA based on a cDNA sequence</article-title>. <source>PCR Methods Appl</source> <year>1994</year>;<volume>4</volume>:<fpage>19</fpage>–<lpage>25</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1101/gr.4.1.19" xlink:type="simple">doi:10.1101/gr.4.1.19</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/9018312</pub-id>
</mixed-citation></ref><ref id="R26"><label>26</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Di Stasi</surname> <given-names>A</given-names>
</string-name>, <string-name name-style="western">
<surname>Tey</surname> <given-names>S-K</given-names>
</string-name>, <string-name name-style="western">
<surname>Dotti</surname> <given-names>G</given-names>
</string-name>, <etal>et al</etal>
</person-group>. <article-title>Inducible apoptosis as a safety switch for adoptive cell therapy</article-title>. <source>N Engl J Med</source> <year>2011</year>;<volume>365</volume>:<fpage>1673</fpage>–<lpage>83</lpage>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.1056/NEJMoa1106152" xlink:type="simple">doi:10.1056/NEJMoa1106152</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/22047558</pub-id>
</mixed-citation></ref><ref id="R27"><label>27</label><mixed-citation publication-type="journal" xlink:type="simple">
<person-group person-group-type="author">
<string-name name-style="western">
<surname>Zhang</surname> <given-names>P</given-names>
</string-name>, <string-name name-style="western">
<surname>Tey</surname> <given-names>S-K</given-names>
</string-name>
</person-group>. <article-title>Adoptive T cell therapy following haploidentical hematopoietic stem cell transplantation</article-title>. <source>Front Immunol</source> <year>2019</year>;<volume>10</volume>:<elocation-id>1854</elocation-id>.<ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.3389/fimmu.2019.01854" xlink:type="simple">doi:10.3389/fimmu.2019.01854</ext-link>
<pub-id pub-id-type="pmid" xlink:type="simple">http://www.ncbi.nlm.nih.gov/pubmed/31447852</pub-id>
</mixed-citation></ref></ref-list></back></article>