<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Bioeng. Biotechnol.</journal-id>
<journal-title>Frontiers in Bioengineering and Biotechnology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Bioeng. Biotechnol.</abbrev-journal-title>
<issn pub-type="epub">2296-4185</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fbioe.2020.00235</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Bioengineering and Biotechnology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Linker and N-Terminal Domain Engineering of Pyrrolysyl-tRNA Synthetase for Substrate Range Shifting and Activity Enhancement</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Jiang</surname> <given-names>Han-Kai</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/886998/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Lee</surname> <given-names>Man-Nee</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/917012/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Tsou</surname> <given-names>Jo-Chu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Chang</surname> <given-names>Kuan-Wen</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Tseng</surname> <given-names>Hsueh-Wei</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Chen</surname> <given-names>Kuang-Po</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Yaw-Kuen</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Wang</surname> <given-names>Yane-Shih</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/809653/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Institute of Biological Chemistry, Academia Sinica</institution>, <addr-line>Taipei</addr-line>, <country>Taiwan</country></aff>
<aff id="aff2"><sup>2</sup><institution>Chemical Biology and Molecular Biophysics Program, Taiwan International Graduate Program, Academia Sinica</institution>, <addr-line>Taipei</addr-line>, <country>Taiwan</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Chemistry, National Tsing Hua University</institution>, <addr-line>Hsinchu</addr-line>, <country>Taiwan</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Applied Chemistry, National Chiao Tung University</institution>, <addr-line>Hsinchu</addr-line>, <country>Taiwan</country></aff>
<aff id="aff5"><sup>5</sup><institution>Institute of Biochemical Sciences, National Taiwan University</institution>, <addr-line>Taipei</addr-line>, <country>Taiwan</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Chenguang Fan, University of Arkansas, United States</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Wenshe R. Liu, Texas A&#x0026;M University, United States; Akiyoshi Nakamura, National Institute of Advanced Industrial Science and Technology (AIST), Japan</p></fn>
<corresp id="c001">&#x002A;Correspondence: Yane-Shih Wang, <email>yaneshihwang@gate.sinica.edu.tw</email></corresp>
<fn fn-type="other" id="fn004"><p>This article was submitted to Synthetic Biology, a section of the journal Frontiers in Bioengineering and Biotechnology</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>07</day>
<month>04</month>
<year>2020</year>
</pub-date>
<pub-date pub-type="collection">
<year>2020</year>
</pub-date>
<volume>8</volume>
<elocation-id>235</elocation-id>
<history>
<date date-type="received">
<day>14</day>
<month>01</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>03</month>
<year>2020</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2020 Jiang, Lee, Tsou, Chang, Tseng, Chen, Li and Wang.</copyright-statement>
<copyright-year>2020</copyright-year>
<copyright-holder>Jiang, Lee, Tsou, Chang, Tseng, Chen, Li and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>The <italic>Methanosarcina mazei</italic> pyrrolysyl-tRNA synthetase (PylRS)&#x22C5;tRNA<sup>Pyl</sup> pair can be used to incorporate non-canonical amino acids (ncAAs) into proteins at installed amber stop codons. Although engineering of the PylRS active site generates diverse binding pockets, the substrate ranges are found similar in charging lysine and phenylalanine analogs. To expand the diversity of the ncAA side chains that can be incorporated <italic>via</italic> the PylRS&#x22C5;tRNA<sup>Pyl</sup> pair, exploring remote interactions beyond the active site is an emerging approach in expanding the genetic code research. In this work, remote interactions between tRNA<sup>Pyl</sup>, the tRNA binding domain of PylRS, and/or an introduced non-structured linker between the N- and C-terminus of PylRS were studied. The substrate range of the PylRS&#x22C5;tRNA<sup>Pyl</sup> pair was visualized by producing <italic>sfGFP-UAG</italic> gene products, which also indicated amber suppression efficiencies and substrate specificity. The unstructured loop linking the N-terminal and C-terminal domains (CTDs) of PylRS has been suggested to regulate the interaction between PylRS and tRNA<sup>Pyl</sup>. In exploring the detailed role of the loop region, different lengths of the linker were inserted into the junction between the N-terminal and the C-terminal domains of PylRS to unearth the impact on remote effects. Our findings suggest that the insertion of a moderate-length linker tunes the interface between PylRS and tRNA<sup>Pyl</sup> and subsequently leads to improved suppression efficiencies. The suppression activity and the substrate specificity of PylRS were altered by introducing three mutations at or near the N-terminal domain of PylRS (N-PylRS). Using a N-PylRS&#x22C5;tRNA<sup>Pyl</sup> pair, three ncAA substrates, two <italic>S</italic>-benzyl cysteine and a histidine analog, were incorporated into the protein site specifically.</p>
</abstract>
<kwd-group>
<kwd>non-canonical amino acids</kwd>
<kwd>pyrrolysyl-tRNA synthetase</kwd>
<kwd>linker engineering</kwd>
<kwd>amber codon suppression</kwd>
<kwd>tRNA binding domain</kwd>
</kwd-group>
<counts>
<fig-count count="9"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="29"/>
<page-count count="14"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1">
<title>Introduction</title>
<p>Expanding the genetic code is a pragmatic approach to incorporate over 200 different kinds of non-canonical amino acids (ncAAs) into proteins <italic>in vivo</italic> (<xref ref-type="bibr" rid="B22">Vargas-Rodriguez et al., 2018</xref>). This technology employs a bioorthogonal aminoacyl-tRNA synthetase (AARS)&#x22C5;tRNA pair to decode nonsense or rare codons in living systems genetically (<xref ref-type="bibr" rid="B16">O&#x2019;Donoghue et al., 2012</xref>). One of most used AARS&#x22C5;tRNA systems for genetic code expansion is the pyrrolysyl-tRNA synthetase (PylRS)&#x22C5;tRNA<sup>Pyl</sup> derived from the archaea <italic>Methanosarcina barkeri</italic> (<italic>Mb</italic>) or <italic>Methanosarcina mazei</italic> (<italic>Mm</italic>) or the eubacteria <italic>Desulfitobacterium hafniense</italic> (<italic>Dh</italic>) (<xref ref-type="bibr" rid="B6">Herring et al., 2007</xref>; <xref ref-type="bibr" rid="B13">Neumann et al., 2008</xref>; <xref ref-type="bibr" rid="B29">Yanagisawa et al., 2008</xref>). The PylRS&#x22C5;tRNA<sup>Pyl</sup> pair has a wide range of bio-orthogonality in different species from prokaryotes to eukaryotes (<xref ref-type="bibr" rid="B11">Mukai et al., 2008</xref>; <xref ref-type="bibr" rid="B13">Neumann et al., 2008</xref>; <xref ref-type="bibr" rid="B4">Han et al., 2017</xref>). The <italic>Mm</italic>PylRS&#x22C5;<italic>Mm</italic>tRNA<sup>Pyl</sup> (PylRS&#x22C5;tRNA<sup>Pyl</sup>) pair was naturally evolved for amber TAG codon recoding with slow enzyme kinetic properties (<xref ref-type="bibr" rid="B3">Guo et al., 2014</xref>). Uniquely, PylRS harbors a sophisticated and dynamic active site for recognizing pyrrolysine, a lysine analog modified with a 4-methylpyrroline-ring through an <italic>N</italic><sup>&#x03B5;</sup>-amide bond linkage (<xref ref-type="bibr" rid="B5">Hao et al., 2002</xref>). Various evolved PylRS&#x22C5;tRNA<sup>Pyl</sup> pairs for incorporating lysine and phenylalanine analogs have been reported through directed-evolution and rational design approaches (<xref ref-type="bibr" rid="B11">Mukai et al., 2008</xref>; <xref ref-type="bibr" rid="B13">Neumann et al., 2008</xref>; <xref ref-type="bibr" rid="B24">Wang Y.S. et al., 2012</xref>; <xref ref-type="bibr" rid="B26">Wang et al., 2010</xref>; <xref ref-type="bibr" rid="B3">Guo et al., 2014</xref>). The diverse substrate scope and co-crystal structures of ncAA substrate-PylRS mutants reveal that the substrate can have multiple binding modes and a slower feature in enzymatic kinetic studies (<xref ref-type="bibr" rid="B9">Kavran et al., 2007</xref>; <xref ref-type="bibr" rid="B14">Nozawa et al., 2009</xref>). The directed evolution of full-length PylRS has been studied. However, a systematic investigation of interactions between the C-terminal domain (CTD) and the N-terminal domain (NTD) of the protein and the cognate tRNA, as well as the impact of those interactions of the dynamic substrate range, remains unexplored.</p>
<p>The co-crystal structure of <italic>Mm</italic>PylRS CTD with pyrrolysine revealed a distinct binding mode for the amino acid, which is deeply embedded into the hydrophobic pocket of the catalytic domain. The CTD of PylRS contains the binding domain that harbors tRNA<sup>Pyl</sup> and ATP (<xref ref-type="bibr" rid="B14">Nozawa et al., 2009</xref>). The interplay between tRNA<sup>Pyl</sup> and PylRS plays a key role in affecting enzymatic activity and substrate scope. The G1:C72 base pair and discriminator G73, which are located on the acceptor arm of tRNA<sup>Pyl</sup>, are thought to be required for PylRS recognition (<xref ref-type="bibr" rid="B6">Herring et al., 2007</xref>). Mutations in the D loop, T loop, or variable loop of tRNA<sup>Pyl</sup> spatially perturb its shape, which in turn diminishes the activity of PylRS. The suppression efficiency is slightly influenced by a change in the anticodon loop compared to the D or the T loop, suggesting the inessential element for PylRS recognition (<xref ref-type="bibr" rid="B1">Ambrogelly et al., 2007</xref>).</p>
<p>The anticodon loop and acceptor arm of the tRNA are fundamental and essential elements for endogenous AARSs recognition (<xref ref-type="bibr" rid="B17">Schimmel et al., 1993</xref>; <xref ref-type="bibr" rid="B15">O&#x2019;Donoghue and Luthey-Schulten, 2003</xref>). As opposed to this binding mode, PylRS recognizes its cognate tRNA<sup>Pyl</sup> distinctly. This characteristic helps PylRS to selectively distinguish tRNA<sup>Pyl</sup> in the translational system. The T loop and the variable loop of tRNA<sup>Pyl</sup> have hydrophilic interactions with the PylRS-NTD. The tRNA<sup>Pyl</sup> is oppositely embraced by the NTD and the CTD of PylRS, which is in connection with the postulated flexible loops (<xref ref-type="bibr" rid="B21">Suzuki et al., 2017</xref>; <xref ref-type="fig" rid="F1">Figure 1A</xref>). This compatible binding mode dynamically controls the interaction between PylRS and tRNA<sup>Pyl</sup>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Protein designs of evolved <italic>Mm</italic>PylRS and their linker engineering. <bold>(A)</bold> Illustration of the interaction between <italic>Mm</italic>PylRS and tRNA<sup>Pyl</sup>. R61K/H63Y/S193R mutations (labeled in open red circles) are distributed on the tRNA binding domain of <italic>Mm</italic>PylRS NTD or CTD (labeled as filled blue circle). The detailed interactions from X-ray crystal structures in PylRS-NTD/tRNA (<xref ref-type="bibr" rid="B21">Suzuki et al., 2017</xref>) and PylRS-CTD/tRNA (<xref ref-type="bibr" rid="B14">Nozawa et al., 2009</xref>) are indicated in <xref ref-type="fig" rid="F2">Figures 2</xref>, <xref ref-type="fig" rid="F3">3</xref>. tRNA 2D topology and sequence are labeled in green filled circles. The orange dashed line denotes the inserted linker between P149 and A150. <bold>(B)</bold> Engineered <italic>Mm</italic>PylRS constructs used in this work. N-PylRS represents <italic>Mm</italic>PylRS with R61K/H63Y/S193R mutations; PylRS-D1 represents <italic>Mm</italic>PylRS with insertion of the spacer containing the stop and the start codons between P149 and A150; PylRS-L1 indicates the insertion of SGGGGS linker between P149 and A150; PylRS-L2 for S(GGGGS)<sub>2</sub> linker insertion; PylRS-L3 for S(GGGGS)<sub>3</sub> linker insertion.</p></caption>
<graphic xlink:href="fbioe-08-00235-g001.tif"/>
</fig>
<p>Moreover, the truncation of PylRS NTD significantly precludes the binding specificity of PylRS by making it incapable to charge tRNA<sup>Pyl</sup> (<xref ref-type="bibr" rid="B8">Jiang and Krzycki, 2012</xref>). The mutations on NTD of the evolved chimeric PylRS (chPylRS) have played a crucial role in tuning the binding of tRNA<sup>Pyl</sup> (<xref ref-type="bibr" rid="B21">Suzuki et al., 2017</xref>). The previous study of class II AARS seryl-tRNA synthetase (SerRS) showed that the R76 and the R94 of the NTD of <italic>Mb</italic>SerRS were curial for tRNA recognition, and the alanine mutations of both had abolished the amber suppression efficiency (<xref ref-type="bibr" rid="B7">Jaric et al., 2009</xref>). N-terminal Add-1 domain from an exceptional class I AARS arginyl-tRNA synthetase (ArgRS) of <italic>Saccharomyces cerevisiae</italic> was found to bind the D loop of tRNA<sup>Arg</sup>, which is a rare spatial arrangement among class I AARSs but similar to <italic>Mm</italic>PylRS and <italic>Mb</italic>SerRS (<xref ref-type="bibr" rid="B2">Cavarelli et al., 1998</xref>). The length of NTD extensively affects the orientation of tRNA<sup>Arg</sup> by the positional change of ArgRS (<xref ref-type="bibr" rid="B20">Shimada et al., 2001</xref>). Using directed evolution, certain mutations generated on PylRS NTD accompanied by variations surrounding the catalytic site also led to increased suppression efficiencies as well as substrate specificity (<xref ref-type="bibr" rid="B12">Mukai et al., 2015</xref>). Evolved PylRS harboring three mutations on NTD was found to enhance the suppression efficiency in charging BocK (<bold>1</bold>, <xref ref-type="fig" rid="F1a">Scheme 1</xref>) (<xref ref-type="bibr" rid="B19">Sharma et al., 2018</xref>). The above studies support the idea that the mutations on the NTD might influence the binding mode and the activity of PylRS.</p>
<fig id="F1a" position="float">
<label>SCHEME 1</label>
<caption><p>Chemical structures of the non-canonical amino acids described in this study. ncAA <bold>1</bold>: <italic>N</italic><sup>&#x03B5;</sup>-(<italic>tert</italic>-butoxycarbonyl)-L-lysine (BocK); <bold>2</bold>: <italic>N</italic><sup>&#x03B5;</sup>- (alloyloxycarbonyl)-L-lysine (AlloK); <bold>3</bold>: <italic>S</italic>-(4-methylbenzyl)-L-cysteine (MbzlC); <bold>4</bold>: <italic>S</italic>-(4-methoxylbenzyl)-L-cysteine (MeObzlC); <bold>5</bold>: <italic>N</italic>-&#x03C0;-methyl-L-histidine (3MeH); <bold>6</bold>: <italic>N</italic><sup>&#x03B5;</sup>-(carbobenzyloxy)-L-lysine (CbzK); <bold>7</bold>: <italic>N</italic><sup>&#x03B5;</sup>-(2-chlorocarbobenzyloxy)-L-lysine (ClCbzK); <bold>8</bold>: <italic>N</italic><sup>&#x03B5;</sup>-(carbobenzyloxy)-D-lysine (DCbzK); <bold>9</bold>: <italic>N</italic><sup>&#x03B5;</sup>-(2-chlorocarbobenzyloxy)- D-lysine (DClCbzK); <bold>10</bold>: (<italic>R</italic>)-2-amino-3-(2-benzyloxycarbonylaminoethylselanyl)propanoic acid (SeCbzK); <bold>11</bold>: (<italic>S</italic>)-6-(benzyloxycarbonylamino)-2-hydroxygexanoic acid (CbzKOH).</p></caption>
<graphic xlink:href="fbioe-08-00235-s001.tif"/>
</fig>
<p>Here we report the generation of PylRS variants with mutations beyond the catalytic site, which has allowed us to further decipher the interaction between PylRS and tRNA<sup>Pyl</sup>. Fast screening of a ncAAs library using an amber-codon-installed <italic>superfolder green fluorescent protein</italic> (<italic>sfGFP</italic>) gene allowed us to determine the substrate range and suppression efficiency and, in turn, fine-tuning of the interaction between PylRS and tRNA<sup>Pyl</sup>. We found that extending the length of a linker between the NTD and the CTD of PylRS further probed the management of flexible loop and their effectiveness in ncAA incorporation yield.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="S2.SS1">
<title>General Strains and Plasmid Constructions</title>
<p>Natural amino acids and ncAAs were purchased from Chem Impex Inc (Wood Dale, IL, United States). The ncAA SeCbzK (<bold>10</bold>) (<xref ref-type="bibr" rid="B25">Wang Z.U. et al., 2012</xref>) and CbzKOH (<bold>11</bold>) (<xref ref-type="bibr" rid="B10">Li et al., 2012</xref>; <xref ref-type="bibr" rid="B23">Wang, 2012</xref>) (<xref ref-type="fig" rid="F1a">Scheme 1</xref>) were synthesized by the reported methods. PCR was performed using the KOD hot start polymerase kit (Merck). Oligonucleotide synthesis and DNA sequencing were done by Genomics Inc. (Taipei, Taiwan). The primer sequences are listed in the <xref ref-type="supplementary-material" rid="DS1">Supplementary Materials</xref>. Construction of the pET-<italic>pylT-sfGFP-TAG2</italic> and the pET-<italic>pylT-sfGFP-TAG27</italic> plasmids followed general cloning protocols. The <italic>sfGFP-TAG2</italic> gene was amplified by PCR from pET-<italic>pylT-sfGFP</italic> (<xref ref-type="bibr" rid="B3">Guo et al., 2014</xref>) with the primers sfGFP-TAG2-<italic>Nde</italic>I-F and sfGFP-<italic>Sac</italic>I-R2. The <italic>sfGFP-TAG27</italic> was generated by overlap extension PCR with two fragments (fragment 1: primer sfGFP-<italic>Nde</italic>I-F1 and sfGFP-TAG27-R; fragment 2: sfGFP-TAG27-F and sfGFP-<italic>Sac</italic>I-R2). The overlapped <italic>sfGFP</italic> gene products and pET-<italic>pylT</italic> plasmid were then double-digested with restriction enzyme <italic>Nde</italic>I and <italic>Sac</italic>I, and then T4 DNA ligase was used for DNA ligation.</p>
<p>In the construction of the plasmid pCDF-<italic>N-PylRS</italic> variants, the <italic>PylRS-R61K/H63Y/S193R</italic> (<italic>N-PylRS</italic>) gene was generated by overlap extension PCR with three fragments using the template pCDF-<italic>PylRS</italic>: fragment 1: PylRS-<italic>Nco</italic>I-F and PylRS-R61K/H63Y-R; fragment 2: PylRS-R61K/H63Y-F and PylRS-S193R-R; fragment 3: PylRS-S193R-F and PylRS-<italic>Bam</italic>HI-R. In preparing pCDF-<italic>PylRS-R61K</italic>, pCDF-<italic>PylRS-H63Y</italic>, and pCDF-<italic>PylRS-S193R</italic>, the same procedures were performed with the following primers to produce <italic>PylRS-R61K</italic>, <italic>PylRS- H63Y</italic>, and <italic>PylRS-S193R</italic> genes with pCDF-<italic>PylRS</italic> template and following the overlap extension PCR; <italic>PylRS-R61K</italic> gene: fragment 1, PylRS-<italic>Nco</italic>I-F and PylRS-R61K-R; fragment 2, PylRS-R61K-F and PylRS-<italic>Bam</italic>HI-R; <italic>PylRS-H63Y</italic> gene: fragment 1, PylRS-<italic>Nco</italic>I-F and PylRS-H63Y-R; fragment 2, PylRS-H63Y-F and PylRS-<italic>Bam</italic>HI-R; <italic>PylRS-S193R</italic> gene: fragment 1, PylRS-<italic>Nco</italic>I-F and PylRS-S193R-R; fragment 2, PylRS-S193R-F and PylRS-<italic>Bam</italic>HI-R. In preparing pCDF-<italic>PylRS-ND</italic>, the <italic>PylRS-ND</italic> gene fragment was generated by PCR with two primers, PylRS-<italic>Nco</italic>I-F and PylRS-P149-<italic>Bam</italic>HI-R, and pCDF-<italic>PylRS</italic> was used as a template. In the preparation of pCDF-<italic>PylRS-D1</italic>, the spacer sequence (TGAAAAAAGCGATG), including the TGA stop codon and the ATG start codon, was installed between positions P149 and A150 of the <italic>PylRS</italic> gene. The <italic>PylRS-D1</italic> gene fragment was generated by overlap extension PCR with two fragments using pCDF-<italic>PylRS</italic> as a template. Fragment 1 was generated by the primers PylRS-<italic>Nco</italic>I-F and PylRS-P149SSS-R1; fragment 2 was generated by the primers PylRS-P149SSS-F2 and PylRS-<italic>Bam</italic>HI-R. Different lengths of linker were installed in PylRS variants between sposition 149 and 150. In preparing pCDF-<italic>PylRS-L1</italic>, pCDF-<italic>PylRS-L2</italic>, and pCDF-<italic>PylRS-L3</italic> (<xref ref-type="fig" rid="F1">Figure 1B</xref>), the same procedures were performed by the following primers to produce <italic>PylRS-L1</italic>, <italic>PylRS-L2</italic>, and <italic>PylRS-L3</italic> genes with pCDF-<italic>PylRS</italic> template and following overlap extension PCR: <italic>PylRS-L1</italic> gene, PylRS-<italic>Nco</italic>I-F, and Linker-1XG4S-R1, Linker-1XG4S-F2, and PylRS-<italic>Bam</italic>HI-R; <italic>PylRS-L2</italic> gene: fragment 1, PylRS-<italic>Nco</italic>I-F and Linker-2XG4S-R1; fragment 2, Linker-2XG4S-F2 and Linker-2XG4S-R2; fragment 3, Linker-2XG4S-F3 and PylRS-<italic>Bam</italic>HI-R; <italic>PylRS-L3</italic> gene: fragments 1 and 3 were from the <italic>PylRS-L2</italic> gene; fragment 2, Linker-3XG4S-F2 and Linker-3XG4S-R2.</p>
<p>The pCDF-<italic>N-PylRS</italic> plasmids with the inserted linker, pCDF-<italic>N-PylRS-D1</italic>, pCDF-<italic>N-PylRS-L1</italic>, pCDF-<italic>N-PylRS-L2</italic>, and pCDF-<italic>N-PylRS-L3</italic> (<xref ref-type="fig" rid="F1">Figure 1B</xref>), were then constructed using the procedures mentioned above. pCDF-<italic>ZRS</italic> was derived from pEVOL-<italic>mKRS1-pylT</italic> (<xref ref-type="bibr" rid="B25">Wang Z.U. et al., 2012</xref>). The <italic>N-PylRS</italic> mutations were transplanted to <italic>ZRS</italic> by the methods mentioned earlier to construct pCDF-<italic>N-ZRS</italic>. The linkers were inserted into <italic>ZRS</italic> to generate pCDF-<italic>N-ZRS-D1</italic>, pCDF-<italic>ZRS-L1</italic>, pCDF-<italic>ZRS-L2</italic>, and pCDF-<italic>ZRS-L3</italic> plasmids. All the ligated products were transformed to <italic>E. coli</italic> DH5&#x03B1;, and the colonies were selected for DNA sequencing, respectively.</p>
</sec>
<sec id="S2.SS2">
<title>Expression and Purification of ncAA-Encoded sfGFP</title>
<p>To produce ncAA-encoded sfGFP proteins, the pET-<italic>pylT-sfGFP-TAG2</italic> or pET-<italic>pylT-sfGFP-TAG27</italic> plasmid was co-transformed with different pCDF-<italic>PylRS</italic> variants into <italic>E. coli</italic> BL21 (DE3) individually. After an hour of recovery, the bacteria were spread on a plate containing ampicillin (Amp) (100 &#x03BC;g/ml) and streptomycin (Sm) (100 &#x03BC;g/ml). A single colony was chosen from the plate and cultured in 1 ml LB medium overnight. The cultured bacteria were then transferred to 50 ml fresh LB medium and incubated at 37&#x00B0;C until the OD<sub>595</sub> reached 0.6&#x2013;0.8. Protein expression was induced with the supplement of 1 mM IPTG and ncAA (except for sfGFP-<bold>3</bold> and sfGFP-<bold>4</bold> protein production, where the medium was changed to GMML medium supplemented with 2 mM ncAA) and incubated at 37&#x00B0;C for 12 h. The bacteria were then harvested and resuspended in lysis buffer [1X phosphate-buffered saline (PBS), pH 7.4] and sonicated. After centrifugation (60 min, 20,000 &#x00D7; <italic>g</italic>, 4&#x00B0;C), the supernatant was collected and incubated with 0.5 ml Ni<sup>2+</sup>-NTA resin (Roche) for protein purification. A total of 5 ml lysis buffer and 2.5 ml washing buffer (1X PBS, 5 mM imidazole, pH 7.4) were used to remove proteins bound non-specifically to the resin. The target protein was eluted from the resin with 2.5 ml elution buffer (1X PBS, 200 mM imidazole, pH 7.4). The buffer of the eluted fractions was changed to 1X PBS with Amicon Ultra-15 Centrifugal Filter Units (MWCO 10 kDa). Purified sfGFP was analyzed by 12% sodium dodecyl sulfate&#x2013;polyacrylamide gel electrophoresis (SDS-PAGE) with instant blue staining.</p>
</sec>
<sec id="S2.SS3">
<title>Western Blot Analysis</title>
<p>Whole cells were collected and lysed at 100&#x00B0;C with SDS loading dye for 15 min and then subjected to 12% SDS-PAGE analysis. The gels were stained with InstantBlue<sup>TM</sup> Stain to visualize the target proteins with the expected molecular weight of around 28 kDa. The suppression efficiency of the amber codon in the sfGFP proteins with a C-terminal His tag was observed by western blot with an anti-6X His tag antibody. Western blots were performed using a Trans-Blot Turbo System (Bio-Rad) and an RTA transfer kit. Anti-His (SignalChem, H99-61M-100) and horseradish peroxidase (HRP)-conjugated secondary antibody (Cell Signaling Technology, 7076P2) were used for immunoblotting. After SDS-PAGE analysis, the gel was immersed in the transfer buffer and then blotted with a polyvinylidene fluoride (PVDF) membrane (25 V/1.3 A, 10 min). After the transfer process was finished, the PVDF membrane was washed thrice with phosphate-buffered saline with Tween<sup>&#x00AE;</sup> (PBST) buffer for 5 min. Next, the membrane was blocked with 5% skimmed milk for 1 h at room temperature. Then, the membrane was washed thrice with PBST buffer for 5 min (washing step). The primary antibody (1:1,000 dilution) was added and incubated with the membrane for 1 h at room temperature following the washing step. Subsequently, the HRP-conjugated secondary antibody (1:5,000 dilution) was added and incubated with the membrane for 1 h at room temperature. The membrane was then treated by a washing step. Finally, the WesternBright ECL HRP substrate (Advansta, K-12045-D50) was mixed and spread onto the membrane to visualize the band signals using the ChemiDoc Imaging Systems (Bio-Rad) in bioluminescence detection mode.</p>
</sec>
<sec id="S2.SS4">
<title>Electrospray Ionization-Mass Spectrometry Characterization of sfGFP</title>
<p>The pure protein was diluted with 50% acetonitrile and 1% formic acid. An aliquot corresponding to 1 pmol of the pure protein was injected into an ESI source (Waters LockSpray Exact Mass Ionization Source) with a syringe pump (Harvard Apparatus, MA, United States) and a flow rate of 5 &#x03BC;l/min was held throughout the analysis. The mass of the intact proteins was determined using Waters Synapt G2 HDMS mass spectrometer (Waters, Milford, MA, United States). The acquired spectra were deconvoluted to single-charge state using the MaxEnt1 algorithm of the MassLynx 4.1 software (Waters).</p>
</sec>
<sec id="S2.SS5">
<title>Matrix-Assisted Laser Desorption/Ionization-Time of Flight-Tandem Mass Spectrometry Characterization of sfGFP</title>
<p>Details of in-gel digestion are as follows: after the staining procedure, the gel bands were excised and cut into small pieces. The gel pieces were sequentially washed with 25 mM NH<sub>4</sub>HCO<sub>3</sub>, 40% methanol solution, and 100% acetonitrile before being treated with DTT and then iodoacetamide. Washing of the gel pieces with 25 mM NH<sub>4</sub>HCO<sub>3</sub> and 50% acetonitrile and then drying in a vacuum centrifuge provided the materials for trypsin digestion. A solution of 65 to 100 ng of sequencing-grade modified trypsin (Promega) in 25 mM NH<sub>4</sub>HCO<sub>3</sub> and 10% acetonitrile (25&#x2013;30 &#x03BC;l) was added and incubated with the gel pieces for 12&#x2013;16 hrs at 37&#x00B0;C. The reaction was stopped by adding 1&#x2013;2 &#x03BC;l of 5% formic acid. Details of the MS and data analysis are as follows: the digested samples (0.5 &#x03BC;l) were carefully mixed with the matrix solution (0.5 &#x03BC;l of 5 mg/ml DHB in 0.1% TFA/30% acetonitrile) and 0.5 &#x03BC;l of the mixture was deposited onto a MTP 600/384 AnchorChip (Bruker Daltonics). All mass spectrometry experiments were done using a Bruker Autoflex III MALDI TOF/TOF mass spectrometer (Bremen, Germany) equipped with a 200-Hz SmartBean Laser in positive ion mode with delayed extraction in the reflectron mode. Data acquisition was done manually with FlexControl 3.4, and data processing was performed with Flex-Analysis 3.4 (both Bruker Daltonik). Protein database searches through Mascot, using combined PMF and tandem mass spectrometry MS/MS datasets, were performed <italic>via</italic> Biotools 3.2 (Bruker).</p>
</sec>
<sec id="S2.SS6">
<title>Determination of the Suppression Efficiencies of PylRS</title>
<p>To understand the substrate range of PylRS variants, screening of a 359 ncAAs library was performed. The plasmid pET-<italic>pylT-sfGFP-TAG2</italic> or pET-<italic>pylT-sfGFP-TAG27</italic> and pCDF-<italic>PylRS</italic> variants were co-transformed into <italic>E. coli</italic> BL21 (DE3) individually. The bacteria were spread on a plate supplemented with Amp (100 &#x03BC;g/ml) and Sm (100 &#x03BC;g/ml). The plate was incubated at 37&#x00B0;C overnight. Ten colonies were then inoculated and cultured in 3 ml LB medium at 37&#x00B0;C overnight before 500 &#x03BC;l of each cultured bacteria was transferred to 25 ml of fresh LB medium and incubated at 37&#x00B0;C until the OD<sub>595</sub> reached 0.6&#x2013;0.8. The cells were harvested and washed twice with M9 salts and suspended in M9 medium (M9 salts, 1% glycerol, 2 mM MgSO<sub>4</sub>, and 0.1 mM CaCl<sub>2</sub>) containing 1 mM IPTG. Aliquots (50 &#x03BC;l) of the suspended cells were loaded into a 384-well plate containing a different ncAAs (1 mM) in 359 wells (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table S2</xref>). Cells were incubated in a plate reader (BioTek) at 37&#x00B0;C for 12 h, with continuous monitoring of the fluorescence intensity (excitation 535 nm and emission 595 nm) as well as OD<sub>595</sub>. Twelve wells were used as controls to measure the background signals (six wells without ncAAs and IPTG; six wells without ncAAs but containing IPTG). The fluorescence intensity of sfGFP was divided by the OD<sub>595</sub> following the subtraction of the control signals (containing IPTG but no ncAAs) to generate the relative fluorescence intensity.</p>
</sec>
</sec>
<sec id="S3">
<title>Results</title>
<sec id="S3.SS1">
<title>Designing Active PylRS Variants With Mutations at or Near the N-Terminal Domain and Linker Engineering</title>
<p>To explore novel substrate ranges, this work aimed to generate novel PylRS variants without active site mutations for studying remote effects in altering the interaction between the tRNA and the PylRS NTD or CTD. In a previous study, the evolved PylRS, HarRS, had R61K, H63Y, S193R, N203T, L305H, L309W, N346D, C348S, L367M, Y384F, K429M, K431M, D433G, and G444E mutations. These mutations of HarRS have been found to enhance the activity and the selectivity in charging homoarginine (<xref ref-type="bibr" rid="B12">Mukai et al., 2015</xref>). To understand how the mutations on NTD affect the suppression efficiency of PylRS, the first three mutation sites in HarRS are transplanted to PylRS to generate N-PylRS (R61K/H63Y/S193R) (<xref ref-type="fig" rid="F1">Figure 1</xref>). The R62K and H63Y mutations are in the NTD and at the interface between the PylRS-NTD and the tRNA T loop region (<xref ref-type="fig" rid="F2">Figure 2</xref>). The S193R mutation is in the CTD and is located at the interface with the tRNA D-loop region (<xref ref-type="fig" rid="F3">Figure 3</xref>) based on an overlapped model of the <italic>Dh</italic>PylRS CTD/tRNA<sup>Pyl</sup> co-crystal and the <italic>Mm</italic>PylRS CTD crystal structures. In phage-assisted non-continuous evolution (PANCE) approach for evolving chPylRS, some mutants were found to be active in charging BocK with two separated genes by inserted TGA stop codon and following ATG start codon between NTD and CTD (<xref ref-type="bibr" rid="B21">Suzuki et al., 2017</xref>). The chPylRS was generated by fusing <italic>Mb</italic>PylRS NTD (1&#x2013;149 residues) with the <italic>Mm</italic>PylRS C-terminus (185&#x2013;454 residues). In this work, wild-type <italic>Mm</italic>PylRS (wt-PylRS) was used to translate the inserted mutation between P149 and A150 to form the PylRS-D1 construct (<xref ref-type="fig" rid="F1">Figure 1B</xref>) in generating <italic>Mm</italic>PylRS NTD (1&#x2013;149 residues) and <italic>Mm</italic>PylRS CTD (150&#x2013;454 residues) proteins. The truncated <italic>Mm</italic>PylRS NTD (1&#x2013;149 residues), namely, PylRS-ND, was also generated for comparison.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Structure of <italic>Mm</italic>PylRS NTD complex with tRNA<sup>Pyl</sup>. R61 and H63 located in the PylRS NTD; the yellow dashed lines represent potential hydrogen-bonding interactions. Three such interactions are illustrated between the side chain of R61 and R52 within PylRS NTD and the phosphodiester backbone of 58A and 59U in tRNA<sup>Pyl</sup>. One hydrogen-bonding interaction was found between the side chain of H63 and K85 within the PylRS NTD. The structure is based on the PDB entry 5UD5.</p></caption>
<graphic xlink:href="fbioe-08-00235-g002.tif"/>
</fig>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Structure of <italic>Mm</italic>PylRS CTD and its superimposition with the <italic>Dh</italic>PylRS CTD/tRNA<sup>Pyl</sup> complex. <bold>(A)</bold> S193 is located in the tRNA binding domain of <italic>Mm</italic>PylRS CTD (green). <bold>(B)</bold> The superimposed structure of <italic>Mm</italic>PylRS CTD (green) and <italic>Dh</italic>PylRS CTD&#x22C5;<italic>Dh</italic>tRNA<sup>Pyl</sup> complex (cyan). The structures are based on the PDB entry 2Q7H and 2ZNI.</p></caption>
<graphic xlink:href="fbioe-08-00235-g003.tif"/>
</fig>
<p>To probe the crosstalk between the PylRS NTD and the CTD in charging amino acid substrates, three flexible loops of different lengths were inserted between these domains in PylRS-D1. The linkers were the hexapeptide SGGGGS (PylRS-L1), the tridecapeptide S(GGGGS)<sub>2</sub> (PylRS-L2), and the non-adecapeptide S(GGGGS)<sub>3</sub> (PylRS-L3) (<xref ref-type="fig" rid="F1">Figure 1B</xref>). In addition to these three mutants, we also compared wt-PylRS and PylRS-D1; these five PylRS variants were subjected to test substrate range with the supplement of co-transformed <italic>E. coli</italic> carrying <italic>MmPylRS/tRNA<sup>Pyl</sup></italic> gene cassettes and reporter gene <italic>sfGFP-TAG2</italic> or <italic>sfGFP-TAG27</italic>, respectively. The fluorescence intensities of the <italic>sfGFP-UAG2</italic> and <italic>sfGFP-UAG27</italic> gene products indicated the read-through of the amber codon in response to the ncAA. Generally, the <italic>sfGFP-UAG2</italic> suppression test has 4.7 to 1.6 times higher signal than <italic>sfGFP-UAG27</italic> suppression test in charging ncAA <bold>1</bold> and <bold>2</bold> (<xref ref-type="fig" rid="F1a">Scheme 1</xref>), but the reverse results are seen with ncAA <bold>3</bold>&#x2013;<bold>5</bold>. After producing the <italic>sfGFP-UAG2</italic> and <italic>sfGFP-UAG27</italic> gene products, 359 ncAAs (see <xref ref-type="supplementary-material" rid="DS1">Supplementary Table S1</xref> for structures) were tested as substrates. The screening results (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S15&#x2013;S24</xref>) show various intensities of signals in charging BocK (<bold>1</bold>) and AlloK (<bold>2</bold>) (<xref ref-type="fig" rid="F1a">Scheme 1</xref>), which are considered as good substrates for wt-PylRS recognition (<xref ref-type="bibr" rid="B29">Yanagisawa et al., 2008</xref>). In <italic>sfGFP-UAG2</italic> gene production, PylRS-D1 preserved 34% of activity in charging AlloK (<bold>2</bold>) compared to wt-PylRS. The PylRS variants with linkers generate better activities (<xref ref-type="fig" rid="F4">Figure 4A</xref>). All three PylRS variants (PylRS-L1, PylRS-L2, and PylRS-L3) were rescued by inserted linkers and showed enhanced activity at 120&#x2013;230% compared to the activity of wt-PylRS. In <italic>sfGFP-UAG27</italic> gene production (<xref ref-type="fig" rid="F4">Figure 4B</xref>), however, the activity of all five PylRS variants maintained a similar pattern with less charging of ncAA <bold>1</bold> and <bold>2</bold>. Small signals in charging 3MeH (<bold>5</bold>) (<xref ref-type="fig" rid="F1a">Scheme 1</xref>) were found in wt-PylRS, PylRS-L1, PylRS-L2, and PylRS-3 in this amber suppression test.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>The <italic>sfGFP-UAG2</italic> and <italic>sfGFP-UAG27</italic> gene suppression efficiencies of PylRS enzyme variants. Incorporation efficiencies of PylRS variants (<xref ref-type="fig" rid="F1">Figure 1B</xref>) as measured by fluorescence intensities of sfGFP with an amber mutation at position 2 <bold>(A)</bold> and 27 <bold>(B)</bold>. The proteins were expressed in 1 mM ncAA and IPTG in GMML medium at 37&#x00B0;C for 12 h. The cells were excited at 485 nm and the fluorescence intensities were detected at 535 nm. The cell density was monitored by absorbance at 595 nm. &#x201C;C&#x201D; indicates the Control experiments of cells with the supplement of 1 mM IPTG; 1&#x2013;5 denote the supplement of 1 mM IPTG and ncAA <bold>1</bold>&#x2013;<bold>5</bold> (<xref ref-type="fig" rid="F1a">Scheme 1</xref>). The background signals from cells without adding IPTG were subtracted from each group. The error bars represent the standard deviation of sfGFP production from four repeated experiments.</p></caption>
<graphic xlink:href="fbioe-08-00235-g004.tif"/>
</fig>
<p>The effects of PylRS-R61K, PylRS-H63Y, and PylRS-S193R variants were determined and found to improve the suppression efficiency against ncAA <bold>1</bold>&#x2013;<bold>2</bold> in <italic>sfGFP-UAG2</italic> production compared to wt-PylRS, whereas no fluorescence signals were observed in PylRS-ND (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure S47</xref>). Combining the three beneficial mutations, N-PylRS harboring R61K/H63Y/S193R mutations was evaluated in its substrate range by <italic>sfGFP-UAG2</italic> and <italic>sfGFP-UAG27</italic> gene production (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S25, S26</xref>). Thus, we decided to investigate N-PylRS and its four variants, N-PylRS-D1 and N-PylRS-L1&#x2013;L3 (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S27&#x2013;S34</xref>). Noticeably, N-PylRS showed nearly 5.6 and 4.1 times higher fluorescent signals in charging BocK (<bold>1</bold>) and AlloK (<bold>2</bold>) than wt-PylRS in the <italic>sfGFP-UAG2</italic> gene suppression yield (<xref ref-type="fig" rid="F4">Figure 4A</xref>). In the <italic>sfGFP-UAG27</italic> gene suppression study, N-PylRS was found to recognize ncAA <bold>1</bold>&#x2013;<bold>5</bold>. While AlloK (<bold>2</bold>) is still the best substrate, 3MeH (<bold>5</bold>) has a higher signal than BocK (<bold>1</bold>) (<xref ref-type="fig" rid="F4">Figure 4B</xref>). In addition, N-PylRS was capable of incorporating <italic>S</italic>-benzyl cysteine analogs MbzlC (<bold>3</bold>) and MeObzlC (<bold>4</bold>) in low suppression efficiencies in <italic>sfGFP-UAG27</italic> production. In contrast to PylRS-D1, the substrate specificity profiles of N-PylRS-D1 have revealed abolished fluorescence intensities in charging ncAA <bold>1</bold>&#x2013;<bold>5</bold> in <italic>sfGFP-UAG2</italic> and <italic>sfGFP-UAG27</italic> suppression tests. The N-PylRS-L1&#x2013;L3 variants showed reinstalled signals in <italic>sfGFP-UAG2</italic> suppression with similar activities in charging BocK (<bold>1</bold>) and AlloK (<bold>2</bold>). The <italic>sfGFP-UAG27</italic> gene suppression test in N-PylRS-L1&#x2013;L3 had a gradual decrease in activity along with increasing linker length in charging ncAA <bold>1</bold>&#x2013;<bold>5</bold>.</p>
</sec>
<sec id="S3.SS2">
<title>Substrate Range Study of ZRS and Its Variants</title>
<p>ZRS was evolved from <italic>Mm</italic>PylRS with Y306M/L309A/C348T/T364K/Y384F mutations at the active site (<xref ref-type="bibr" rid="B26">Wang et al., 2010</xref>). To validate the influence on the activity of ZRS by the R61K/H63Y/S193R mutations, as well as the introduction of the linker, these variations in the wt-PylRS study were transplanted and tested on ZRS, which was initially found to incorporate CbzK (<bold>6</bold>) and CbzK analogs (<bold>7</bold>, <bold>10</bold>&#x2013;<bold>11</bold>) (<xref ref-type="fig" rid="F1a">Scheme 1</xref>) (<xref ref-type="bibr" rid="B25">Wang Z.U. et al., 2012</xref>). Thus, ZRS variants, N-ZRS, ZRS-D1, ZRS-L1, ZRS-L2, and ZRS-L3, were constructed for evaluating their effects with active site mutation. The screening results of the substrate range in <italic>sfGFP-UAG2</italic> and <italic>sfGFP-UAG27</italic> suppression for the ZRS and the five variants are shown in <xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S35&#x2013;S46</xref>. NcAA <bold>3</bold>&#x2013;<bold>11</bold> (<xref ref-type="fig" rid="F1a">Scheme 1</xref>) had a positive response and are illustrated in <xref ref-type="fig" rid="F5">Figure 5</xref>.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>The <italic>sfGFP-UAG2</italic> and <italic>sfGFP-UAG27</italic> gene suppression efficiencies of ZRS enzyme variants. Incorporation efficiencies of ZRS variants (<xref ref-type="fig" rid="F1">Figure 1B</xref>) as measured by the fluorescence intensities of sfGFP with amber mutation at position 2 <bold>(A)</bold> and 27 <bold>(B)</bold>. The proteins were expressed in 1 mM ncAA and IPTG in GMML medium at 37&#x00B0;C for 12 h. The cells were excited at 485 nm and the fluorescence intensities were detected at 535 nm. The cell density was monitored by absorbance at 595 nm. &#x201C;C&#x201D; indicate the Control experiments of cells with the supplement of 1 mM IPTG; <bold>3</bold>, <bold>4</bold>, <bold>6</bold>&#x2013;<bold>11</bold> denote the supplement of 1 mM IPTG and ncAA <bold>3</bold>, <bold>4</bold>, <bold>6</bold>&#x2013;<bold>11</bold> (<xref ref-type="fig" rid="F1a">Scheme 1</xref>). Error bars represent the standard deviation of sfGFP production from four repeated experiments.</p></caption>
<graphic xlink:href="fbioe-08-00235-g005.tif"/>
</fig>
<p>CbzK (<bold>6</bold>) was efficiently incorporated into sfGFP in response to the amber codon as reported for ZRS. The CbzK analogs, ClCbzK (<bold>7</bold>), SeCbzK (<bold>10</bold>), and CbzKOH (<bold>11</bold>) (<xref ref-type="fig" rid="F1a">Scheme 1</xref>), also showed similar intensity in the <italic>sfGFP-UAG2</italic> suppression study. Two D-form CbzK analogs, DCbzK (<bold>8</bold>) and DClCbzK (<bold>9</bold>), were positive but had lower signals (<xref ref-type="fig" rid="F5">Figure 5A</xref>). <italic>sfGFP-UAG27</italic> suppression in ncAAs library screening of ZRS showed 12.8 times lower signal in charging CbzK compared to the <italic>sfGFP-UAG2</italic> suppression study but was only 1.6 times lower in charging SeCbzK. The substrate range of N-ZRS remained the same as that of ZRS; nevertheless, the substrate specificity profiles of N-ZRS in the <italic>sfGFP-UAG2</italic> suppression study showed a higher fluorescence intensity as compared to ZRS, especially in charging D-ncAA <bold>8</bold> and <bold>9</bold>. Unexpectedly, <italic>S</italic>-benzyl cysteine analogs ncAA <bold>3</bold> and <bold>4</bold> were also incorporated into sfGFP with low efficiencies by N-ZRS in the <italic>sfGFP-UAG27</italic> suppression study. The ZRS-D1 screening results showed a significant decrease in activity in the <italic>sfGFP-UAG2</italic> and <italic>sfGFP-UAG27</italic> suppression studies compared to ZRS and other ZRS variants. The ZRS-D1 activity with CbzKOH (<bold>11</bold>), however, was the best in the <italic>sfGFP-UAG2</italic> screening and had diminished activity in the <italic>sfGFP-UAG27</italic> screening (<xref ref-type="fig" rid="F5">Figure 5</xref>). The addition of a linker did not raise the suppression efficiencies of ZRS albeit a slight increase in the fluorescence intensities of ZRS-L2 can be observed with ncAA <bold>6</bold> and <bold>10</bold> in response to <italic>sfGFP-UAG2</italic> and <italic>sfGFP-UAG27</italic> (<xref ref-type="fig" rid="F5">Figure 5</xref>).</p>
</sec>
<sec id="S3.SS3">
<title>Western Blotting, Electrospray Ionization-Mass Spectrometry, and Tandem Mass Spectrometry Characterization of ncAA-Encoded sfGFP</title>
<p>Some amber screening results show reverse or different intensity patterns, and western blotting analysis was used to confirm sfGFP protein yield to support the sfGFP fluorescence intensity results. N-ZRS and ZRS-D1 were chosen for analyzing sfGFP-UAG27 and sfGFP-UAG2 protein productions (<xref ref-type="fig" rid="F6">Figure 6A</xref>). An anti-His tag antibody was used to detect the C-terminal-His tag present in full-length sfGFP, which indicates the amount of read-through at the amber stop codon. Western blotting analysis of N-ZRS/sfGFP-UAG27 indicates strong amber read-through for ncAA <bold>6</bold>&#x2013;<bold>8</bold> and <bold>10</bold> and weaker response for ncAA <bold>9</bold> and <bold>11</bold> in SDS-PAGE and anti-His channel. Clearly, sfGFP-<bold>11</bold> showed an additional band at lower molecular weight, near the 25-kDa protein marker in SDS-PAGE, which was also detected by western blotting (<xref ref-type="fig" rid="F6">Figure 6A</xref>). These results are in partial agreement with the sfGFP fluorescent screening. They match for ncAA <bold>3</bold>, <bold>4</bold>, <bold>9</bold>, and <bold>10</bold>, not for ncAA <bold>6</bold>&#x2013;<bold>8</bold> and <bold>11</bold> (<xref ref-type="fig" rid="F5">Figure 5B</xref>). A ZRS-D1/sfGFP-UAG2 analysis (<xref ref-type="fig" rid="F6">Figure 6A</xref>), however, matches well with sfGFP fluorescent screening results (<xref ref-type="fig" rid="F5">Figure 5A</xref>), confirming that ZRS-D1 charges CbzKOH to generate acylated tRNA with high activity. The purified sfGFP-<bold>11</bold><sup>&#x2217;</sup> protein produced by the ZRS-D1&#x22C5;tRNA<sup>Pyl</sup> pair generated two additional major mass peaks because of ester bond cleavage and Cbz group deprotection: 27,773 Da (without the N-terminal Met) and 27,639 Da (without the N-terminal Met and Cbz group) (<xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure S7</xref>). Purified sfGFP-<bold>6</bold>, sfGFP-<bold>7</bold>, and sfGFP-<bold>11</bold>, which were produced by N-ZRS&#x22C5;tRNA<sup>Pyl</sup> pair, were analyzed by electrospray ionization-mass spectrometry (ESI-MS) (<xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="fig" rid="F6">Figure 6B</xref>, <xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S4&#x2013;S6</xref>). The experimental mass of sfGFP-<bold>6</bold> (28,086 and 27,955 Da) and sfGFP-<bold>7</bold> (28,120, and 27,988 Da) matched well to the calculated molecular weight of sfGFP-<bold>6</bold> (28,085 and 27,955 Da) and sfGFP-<bold>7</bold> (28,120 and 27,989 Da). A matrix-assisted laser desorption/ionization-time of flight-tandem mass spectrometry (MALDI-TOF-MS/MS) analysis of peptide <sup>27</sup>XSV<sup>30</sup>R fragments which encoded ncAA <bold>6</bold> and <bold>7</bold> further provides the correct molecular mass and sufficient b and y fragments to indicate ncAA purity at position 27 of the sfGFP (<xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S10</xref>, <xref ref-type="supplementary-material" rid="DS1">S11</xref>). In characterizing the mass of sfGFP-<bold>11</bold>, the replacement of the amino group with a hydroxyl group in the main chain results in additional mass peaks. Three mass peaks, at 27,955, 27,820, and 25,036 Da, were observed in the sfGFP-<bold>11</bold> mass spectrum. The calculated mass of full-length and truncated sfGFP-<bold>11</bold> is 27,955 (-Met) and 25,320 Da, respectively. The full-length sfGFP-<bold>11</bold> mass agrees with the calculated mass, and the peak at 27,820 Da matches the expected mass of sfGFP-<bold>11</bold> with Cbz group deprotection. The mass of sfGFP truncated at 28 position, 25,036 Da, does not fully match the calculated mass 25,057 Da and instead shows a loss of 21 Da, which indicates CbzKOH deletion at 27 position of the truncated sfGFP-<bold>11</bold> (<xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="fig" rid="F6">Figure 6B</xref>, <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure S6</xref>).</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>sfGFP production by ZRS variants and mass characterization. <bold>(A)</bold> Amber suppression of the <italic>sfGFP-UAG27</italic> gene (N-ZRS&#x22C5;tRNA<sup>Pyl</sup> pair) and the <italic>sfGFP-UAG2</italic> gene (ZRS-D1&#x22C5;tRNA<sup>Pyl</sup> pair) product with ncAA <bold>3</bold>&#x2013;<bold>4</bold> and <bold>6</bold>&#x2013;<bold>11</bold>. The sfGFP proteins were produced in <italic>E. coli</italic> BL21 (DE3) coding N-ZRS&#x22C5;tRNA<sup>Pyl</sup> or ZRS-D1&#x22C5;tRNA<sup>Pyl</sup> pair with the supplement of 1 mM IPTG and ncAAs in GMML medium at 37&#x00B0;C for 12 h. The whole-cell lysate was analyzed by SDS-PAGE and western blotting by anti-His tag antibody indicated as &#x03B1;-His6X. <bold>(B)</bold> ESI-MS determination of sfGFP-UAG27 proteins with ncAA <bold>6</bold>, <bold>7</bold>, and <bold>11</bold>. Full-length sfGFP-<bold>6</bold> and sfGFP-<bold>7</bold> proteins were produced by N-ZRS&#x22C5;tRNA<sup>Pyl</sup> pair in <italic>E. coli</italic> BL21 (DE3) with the supplement of 1 mM IPTG and ncAA <bold>6</bold> or <bold>7</bold> in LB medium at 37&#x00B0;C for 12 h. Full-length sfGFP-<bold>11</bold> proteins were produced with the same condition but with 1 mM ncAA <bold>11</bold> and in GMML minimal medium. The calculated molecular masses of sfGFP-<bold>7</bold> are 28,121 and 27,989 Da (&#x2013;Met); the observed molecular masses are 28,120 and 27,989 Da (&#x2013;Met). The calculated molecular masses of sfGFP-<bold>6</bold> are 28,085 and 27,954 Da (&#x2013;Met); the observed molecular masses are 28,085 and 27,955 Da (&#x2013;Met). The calculated molecular masses of sfGFP-<bold>11</bold> are 28,086, 27,955 (&#x2013;Met), and 25,320 Da (truncated sfGFP at 27 position); the observed molecular masses are 27,955 (&#x2013;Met) and 27,820 Da (without Cbz group at 27 position and N-terminal Met residues) and 25,036 Da. The detailed electrospray and deconvoluted mass spectra are shown in <xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S4&#x2013;S6</xref>. ESI-MS determination of sfGFP-UAG2 protein. sfGFP-<bold>11</bold>&#x002A; with ncAA <bold>11</bold> (ZRS-D1&#x22C5;tRNA<sup>Pyl</sup> pair) is shown in <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure S7</xref>.</p></caption>
<graphic xlink:href="fbioe-08-00235-g006.tif"/>
</fig>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Electrospray ionization-mass spectrometry (ESI-MS) analysis of sfGFP proteins.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Protein<sup>1</sup></td>
<td valign="top" align="center">PylRS mutants</td>
<td valign="top" align="left">Calculated mass (Da)</td>
<td valign="top" align="left">Actual mass (Da)</td>
<td valign="top" align="center">ESI-MS<sup>4</sup></td>
<td valign="top" align="center">MALDI-TOF-MS/MS<sup>5</sup></td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">sfGFP-<bold>3</bold></td>
<td valign="top" align="center">N-PylRS</td>
<td valign="top" align="left">28,030, 27,899 (-Met)<sup>2</sup></td>
<td valign="top" align="left">28,030, 27,899</td>
<td valign="top" align="center">S1</td>
<td valign="top" align="center">8A</td>
</tr>
<tr>
<td valign="top" align="left">sfGFP-<bold>4</bold></td>
<td/>
<td valign="top" align="left">28,046, 27,915 (-Met)</td>
<td valign="top" align="left">28,046, 27,915</td>
<td valign="top" align="center">S2</td>
<td valign="top" align="center">S14</td>
</tr>
<tr>
<td valign="top" align="left">sfGFP-<bold>5</bold></td>
<td/>
<td valign="top" align="left">27,974, 27,843 (-Met)</td>
<td valign="top" align="left">27,974, 27,843</td>
<td valign="top" align="center">S3</td>
<td valign="top" align="center">8B</td>
</tr>
<tr>
<td valign="top" align="left">sfGFP-<bold>6</bold></td>
<td valign="top" align="center">N-ZRS</td>
<td valign="top" align="left">28,086, 27,955 (-Met)</td>
<td valign="top" align="left">28,085, 27,955</td>
<td valign="top" align="center">S4</td>
<td valign="top" align="center">S10</td>
</tr>
<tr>
<td valign="top" align="left">sfGFP-<bold>7</bold></td>
<td/>
<td valign="top" align="left">28,120, 27,988 (-Met)</td>
<td valign="top" align="left">28,120, 27,989</td>
<td valign="top" align="center">S5</td>
<td valign="top" align="center">S11</td>
</tr>
<tr>
<td valign="top" align="left">sfGFP-<bold>11</bold></td>
<td/>
<td valign="top" align="left">27,955 (-Met), 27,820<sup>6</sup>, 25,057<sup>7</sup></td>
<td valign="top" align="left">27,955, 27,820, 25,036</td>
<td valign="top" align="center">S6</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
<tr>
<td valign="top" align="left">sfGFP-<bold>3</bold></td>
<td/>
<td valign="top" align="left">27,899 (-Met)</td>
<td valign="top" align="left">27,899, 27,878<sup>3</sup></td>
<td valign="top" align="center">S8</td>
<td valign="top" align="center">S12</td>
</tr>
<tr>
<td valign="top" align="left">sfGFP-<bold>4</bold></td>
<td/>
<td valign="top" align="left">27,915 (-Met)</td>
<td valign="top" align="left">27,916, 27,878<sup>3</sup></td>
<td valign="top" align="center">S9</td>
<td valign="top" align="center">S13</td>
</tr>
<tr>
<td valign="top" align="left">sfGFP-<bold>11</bold><sup>&#x2217;</sup></td>
<td valign="top" align="center">ZRS-D1</td>
<td valign="top" align="left">27,904, 27,773 (-Met), 27,639<sup>8</sup></td>
<td valign="top" align="left">27904, 27,773, 27,639</td>
<td valign="top" align="center">S7</td>
<td valign="top" align="center">&#x2013;</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic>&#x002A;The sfGFP protein was produced from <italic>sfGFP-UAG2</italic> gene. sfGFP-<bold>3</bold>, sfGFP-<bold>4</bold>, sfGFP-<bold>11</bold>, and sfGFP-<bold>11</bold>&#x002A; were produced in GMML medium; sfGFP-<bold>5</bold>, sfGFP-<bold>6</bold>, and sfGFP-<bold>7</bold> were prepared in LB medium. <sup><italic>1</italic></sup>The sfGFP proteins were produced from <italic>sfGFP-UAG27</italic> gene. <sup><italic>2</italic></sup>(&#x2013;Met) indicates full-length sfGFP protein without N-terminus methionine residues. <sup><italic>3</italic></sup>Actual mass of 27,878 Da is full-length sfGFP with tryptophan incorporation at F27 position without N-terminus methionine (calculated mass: 27,878 Da). <sup><italic>4</italic></sup>Full-length sfGFP electrospray and deconvoluted mass spectrometries. <sup><italic>5&#x2009;27</italic></sup>XSV<sup><italic>30</italic></sup>R peptide fragment was selected for MALDI-TOF-MS/MS analysis. <sup><italic>6</italic></sup>27,820 Da is the calculated molecular weight of sfGFP without Cbz group at 27 position and N-terminal Met residues. <sup><italic>7</italic></sup>25,057 Da is the calculated mass of truncated sfGFP at 28 position. <sup><italic>8</italic></sup>27,639 Da is the calculated mass of sfGFP without N-terminal Met and Cbz group on the CbzKOH side chain.</italic></attrib>
</table-wrap-foot>
</table-wrap>
<p>The purified sfGFP-<bold>3</bold> and sfGFP-<bold>4</bold> proteins with ncAA <bold>3</bold> and <bold>4</bold> encoded at 27 position that were produced by the N-ZRS&#x22C5;tRNA<sup>Pyl</sup> pair in <italic>E. coli</italic> were characterized, and they matched the calculated mass (<xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S8</xref>, <xref ref-type="supplementary-material" rid="DS1">S9</xref>). The mass spectra of sfGFP-<bold>3</bold> and sfGFP-<bold>4</bold> show a molecular peak indicating tryptophan incorporation, 27,878 Da. A MALDI-TOF-MS/MS analysis of sfGFP-<bold>3</bold> and sfGFP-<bold>4</bold> also confirmed the presence of ncAA <bold>3</bold> and <bold>4</bold> at position 27 of sfGFP. To confirm the ncAAs screening results mentioned in the N-PylRS&#x22C5;tRNA<sup>Pyl</sup> pair study, sfGFP-<bold>3</bold>, sfGFP-<bold>4</bold>, and sfGFP-<bold>5</bold> were expressed and purified, respectively, and then subjected to ESI-MS analysis (<xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S1&#x2013;S3</xref>). The calculated molecular weight of sfGFP-<bold>3</bold>, sfGFP-<bold>4</bold>, and sfGFP-<bold>5</bold>, generated by N-PylRS, matched the observed mass in the full-length sfGFP (<xref ref-type="fig" rid="F7">Figure 7</xref>). The incorporation of ncAA <bold>3</bold>, <bold>4</bold>, and <bold>5</bold> into sfGFP at position 27 was shown by MALDI-TOF-MS/MS (<xref ref-type="fig" rid="F8">Figure 8</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S12&#x2013;S14</xref>). This multiple evidence indicates that MbzlC (<bold>3</bold>), MeObzlC (<bold>4</bold>), and 3MeH (<bold>5</bold>) are incorporated into proteins by non-active, mutated N-PylRS&#x22C5;tRNA<sup>Pyl</sup> pair site-specifically.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>Deconvoluted ESI-MS spectra of sfGFP containing ncAAs at position 27. Full-length sfGFP-<bold>3</bold>, sfGFP-<bold>4</bold>, and sfGFP-<bold>5</bold> were expressed using the N-PylRS&#x22C5;tRNA<sup>Pyl</sup> pair in the presence of ncAA <bold>3</bold>, <bold>4</bold> (2 mM) or <bold>5</bold> (1 mM), respectively, in GMML medium (sfGFP-<bold>3</bold> and sfGFP-<bold>4)</bold> or LB medium (sfGFP-<bold>5</bold>). The purified protein samples were subjected to ESI-MS for identification of the incorporation of defined ncAA. Deconvoluted ESI-MS of ncAA <bold>3</bold>&#x2013;<bold>5</bold> incorporated sfGFP at position 27 are shown above. sfGFP-X in which X represents one of the ncAA <bold>3</bold>&#x2013;<bold>5</bold> was incorporated into sfGFP at position 27. The calculated molecular masses of sfGFP-<bold>3</bold> are 28,030 and 27,899 Da (-Met); the observed molecular masses are 28,030 and 27,899 Da (-Met). The calculated molecular masses of sfGFP-<bold>4</bold> are 28,046 and 27,915 Da (-Met); the observed molecular masses are 28,046 and 27,915 Da (-Met). The calculated molecular masses of sfGFP-<bold>5</bold> are 27,974 and 27,843 Da (-Met); the observed molecular masses are 27,974 and 27,843 Da (-Met). The detailed electrospray and deconvoluted mass spectra are shown in <xref ref-type="supplementary-material" rid="DS1">Supplementary Figures S1&#x2013;S3</xref>.</p></caption>
<graphic xlink:href="fbioe-08-00235-g007.tif"/>
</fig>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption><p>MALDI-TOF-MS/MS analysis of sfGFP-3 and sfGFP-5. The sfGFP-<bold>3</bold> and sfGFP-<bold>5</bold> proteins were in-gel digested with trypsin and subjected to MALDI-TOF-MS/MS analysis. <bold>(A)</bold> The tandem mass spectrum of the X(<bold>3</bold>)SVR; X denotes a fragment from sfGFP-<bold>3</bold>, with ncAA <bold>3</bold> incorporated at position 27. The calculated molecular mass of the X(<bold>3</bold>)SVR peptide fragment is 567.284 Da and the actual molecular mass is 568.327 Da. Full-length sfGFP-<bold>3</bold> was expressed using N-PylRS in the presence of 2 mM ncAA <bold>3</bold> in GMML medium. <bold>(B)</bold> The tandem mass spectrum of the X(<bold>5</bold>)SVR; X denotes a fragment from sfGFP-<bold>5</bold> with ncAA <bold>5</bold> incorporated at position 27. The calculated molecular mass of the X(<bold>5</bold>)SVR peptide fragment is 511.287 Da and the actual molecular mass is 512.609 Da. Full-length sfGFP-<bold>5</bold> was produced using N-PylRS&#x22C5;tRNA<sup>Pyl</sup> pair in the presence of 1 mM ncAA <bold>5</bold> in LB medium.</p></caption>
<graphic xlink:href="fbioe-08-00235-g008.tif"/>
</fig>
</sec>
</sec>
<sec id="S4">
<title>Discussion</title>
<p>In this study, we showed that the R61K/H63Y/S193R mutations, which are located beyond the catalytic site, increase the suppression efficiencies of PylRS and ZRS toward their preferred substrates. The substrate range of N-PylRS allowed the incorporation of ncAA <bold>3</bold>&#x2013;<bold>5</bold>, two S-benzyl cysteine analogs and a histidine analog, with high efficiency as compared to wt-PylRS. This suggests that the remote mutations tune the interaction between PylRS and tRNA<sup>Pyl</sup>, which leads to the successful incorporation of ncAA <bold>3</bold>&#x2013;<bold>5</bold> despite the active site engineering of PylRS (<xref ref-type="bibr" rid="B28">Xiao et al., 2014</xref>; <xref ref-type="bibr" rid="B18">Sharma et al., 2016</xref>). A similar tuning effect has been observed in PylRS N-terminal mutations by global-directed evolution and PANCE, which results in enhancement of enzyme efficiencies (<xref ref-type="bibr" rid="B19">Sharma et al., 2018</xref>). We chose R61 and H63 of PylRS as they are clustered on the loop adjacent to the extremity of the &#x03B1;-helix. Specifically, the guanidinium side-chain of R61 has a polar interaction with the phosphodiester backbone near 58A of tRNA<sup>Pyl</sup> as well as the R52 residue within the NTD. In addition, the imidazole side-chain of H63 hydrogen bonds with the amino group on the side chain of K85 (<xref ref-type="fig" rid="F2">Figure 2</xref>). The R61K and H63Y mutations may disrupt these interactions. The S193 is located on the tRNA binding domain of the PylRS CTD. Although S193 is relatively far from the NTD, it does not interact with residues alongside the catalytic site. We envision that the S193R mutation moderately tunes the binding between PylRS and tRNA<sup>Pyl</sup> (<xref ref-type="fig" rid="F3">Figure 3</xref>). By placing the R61K/H63Y/S193R mutations on wt-PylRS, the substrate range was shifted to introduce ncAA <bold>3</bold>&#x2013;<bold>5</bold>. We postulate that the catalytic core of wt-PylRS expands locally to harbor ncAA with shorter bulky side-chains owing to the sophisticated regulation with the binding of tRNA<sup>Pyl</sup>. The ZRS shows its best incorporation efficiencies toward ncAA <bold>6</bold>, and it was also found to incorporate ncAA <bold>7</bold>, <bold>3</bold>, and <bold>4</bold> into sfGFP based on the screening results. Unanticipatedly, the substrate range of N-ZRS remained the same as that of ZRS. The fine-tuning effect of the mutations seen with wt-PylRS is not seen with ZRS, which might result from its tightly regulated substrate range of the evolved catalytic pocket. This result also implies the current directed-evolution approach at the PylRS active site which leads to a stabilized local arrangement that prevents it from the tuning effects of N-terminal mutations. This also explains no significant activity enhancement in introducing a linker to N-PylRS and ZRS. Although no significant improvement of an introduced linker was found, the repeated peptide sequence, (GGGGS)<sub>1</sub><sub>&#x2013;</sub><sub>3</sub>, could be evolved to explore additional interaction with tRNA<sup>Pyl</sup> for altering substrate range and activity enhancement. Importantly, the D-form ncAA <bold>8</bold> and <bold>9</bold> gave small but positive signals in ZRS and a yield enhancement in N-ZRS based on fluorescence screening and western blotting analysis. ZRS-D1 with separated NTD and CTD seems tightening up the chiral specificity by releasing the structural remote effects, which results in a losing activity in charging the D-form ncAAs <bold>8</bold> and <bold>9</bold> (<xref ref-type="fig" rid="F5">Figures 5</xref>, <xref ref-type="fig" rid="F6">6A</xref>).</p>
<p>Two different sfGFP proteins, namely, sfGFP-UAG2 and sfGFP-UAG27, were used in this study to compare the incorporation efficiencies of the PylRS variants. Our studies have proven that the former fluorescence intensity of lysine derivatives was considerably stronger than the latter one. This indicates that the serine 2 of sfGFP located on the flexible loop might be suitable for the long and polar side-chains of ncAAs. On the contrary, the latter substrate range of amino acids with bulky and aromatic side-chain derivatives were easier to be observed than the former one. However, western blotting analysis of N-ZRS in producing the sfGFP-UAG27 proteins by installing ncAA <bold>6</bold>&#x2013;<bold>9</bold> (<xref ref-type="fig" rid="F6">Figure 6A</xref>) shows reverse intensity in fluorescent screening. This suggests that the sfGFP variants containing these ncAAs have lost their folded structure, resulting in fluorescent quenching by penetrating water molecules or protein precipitation. Surprisingly, sfGFP-<bold>10</bold> has a higher fluorescent signal than would be expected due to the western-blotting results. This may be due to a smaller bond angle at the selenium atom that causes a bended side-chain and stabilizes the sfGFP &#x03B2;-barrel structure. The characterization of sfGFP-<bold>11</bold> and sfGFP-<bold>11</bold><sup>&#x2217;</sup>, which are produced by N-ZRS and ZRS-D1, also indicate ester bond hydrolysis and partial Cbz group deprotection.</p>
<p>Various PylRS have been discovered in nature to catalyze the acylation reactions between pyrrolysine and tRNA<sup>Pyl</sup>. Previous studies have shown that PylRS can be expressed in the form of either a single polypeptide (<italic>Mm</italic>PylRS or <italic>Mb</italic>PylRS) or separated polypeptides (<italic>Dh</italic>PylRS) (<xref ref-type="bibr" rid="B8">Jiang and Krzycki, 2012</xref>). &#x0394;NPylRS is a group of PylRS which lacks the NTD but which shows decent suppression efficiencies <italic>in vivo</italic> (<xref ref-type="bibr" rid="B27">Willis and Chin, 2018</xref>). Our findings demonstrate that the separated polypeptide of <italic>Mm</italic>PylRS, PylRS-D1, still retains the lower catalytic activity, but this was not the case for N-PylRS-D1. Noticeably, the substrate specificity profiles of N-PylRS-D1 showed a decrease in activity as compared to PylRS-D1. The abolished activity of N-PylRS-D1 implies that the R61K/H63Y/S193R mutations need a linkage between the NTD and the CTD to transfer the remote effect in improving enzyme activity. In addition, our results point out the indispensability of the unstructured flexible loop connecting the NTD and the CTD of PylRS. The separately expressed NTD and CTD of <italic>Mm</italic>PylRS are believed to be functionally reassembled in cells according to the substrate specificity profiles of PylRS-D1, showing the reasonable decrease in activity toward the same substrates in contrast to wt-PylRS. Recombining the linker between the junctions has conspicuously restored the activity of N-PylRS-D1. This suggests that the tuning effect of R61K/H63Y/S193R between PylRS and tRNA<sup>Pyl</sup> could also mutually regulate the interplay between the NTD and the CTD and that the truncation of the flexible loop might perturb their binding mode, leading to a reduction in activity. Increasing the length of a linker leads to an upward trend in the suppression efficiencies of wt-PylRS, whereas this effect is not observed with ZRS. These findings lead us to believe that the identity of the residues in the linker affects PylRS activity <italic>via</italic> tuning flexibility interactions involving the NTD and the CTD or providing beneficial interactions between linker residues and tRNA.</p>
</sec>
<sec id="S5">
<title>Conclusion</title>
<p>Introduction of R61K/H63Y/S193R mutations to wt-PylRS has altered its substrate range for the incorporation of ncAA <bold>3</bold>&#x2013;<bold>5</bold>, which, we propose, arises from the refinement of the dynamics between PylRS and tRNA<sup>Pyl</sup>. The addition of a linker provides extra flexibility to potentially regulate the interaction between NTD and CTD of PylRS and changes the interface between PylRS and tRNA<sup>Pyl</sup>, in turn enhancing the suppression efficiencies. Our findings not only indicate the sophisticated interaction between NTD and CTD of PylRS and tRNA<sup>Pyl</sup> but also reveal the importance of N-terminus engineering in exploring the novel substrate range and improving the suppression efficiency.</p>
</sec>
<sec id="S6">
<title>Data Availability Statement</title>
<p>All datasets generated for this study are included in the article/<xref ref-type="supplementary-material" rid="DS1">Supplementary Material</xref>.</p>
</sec>
<sec id="S7">
<title>Author Contributions</title>
<p>Y-SW: conceptualization, resources, supervision, project administration, and funding acquisition. H-KJ, J-CT, K-WC, H-WT, K-PC, Y-KL, and Y-SW: methodology. Y-SW and H-KJ: validation. H-KJ and M-NL: formal analysis. H-KJ, M-NL, and Y-SW: data curation. H-KJ: writing &#x2013; original draft preparation. Y-SW, Y-KL, and H-KJ: writing &#x2013; review and editing.</p>
</sec>
<sec id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> This research was funded by the Taiwan Protein Project (AS-KPQ-105-TPP) and the Ministry of Science and Technology (MOST), Taiwan (MOST 107-2113-M-001-025-MY3). Y-SW was supported by the Award for Supporting Talent Junior Faculty, MOST and Academia Sinica.</p>
</fn>
</fn-group>
<ack>
<p>We thank Dr. Shu-Yu Lin for the assistance in full-length protein mass spectrometry analysis and data processing that were acquired at the Academia Sinica Common Mass Spectrometry Facilities for the proteomics and protein modification analysis located at the Institute of Biological Chemistry, Academia Sinica, supported by Academia Sinica Core Facility and Innovative Instrument Project (AS-CFII-108-107). We also thank Cheng-Hsilin Hsieh for the technical assistance in MALDI-TOF/TOF mass spectrometry from Genomics Core at the Institute of Molecular Biology, Academia Sinica. We are grateful to Prof. Todd L. Lowary (Institute of Biological Chemistry, Academia Sinica) for critical discussion and helpful suggestions. We thank AS-TIGP for supporting H-KJ with AS-TIGP Research Performance Fellowship Award.</p>
</ack>
<sec id="S10" sec-type="supplementary material"><title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fbioe.2020.00235/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fbioe.2020.00235/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.pdf" id="DS1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ambrogelly</surname> <given-names>A.</given-names></name> <name><surname>Gundllapalli</surname> <given-names>S.</given-names></name> <name><surname>Herring</surname> <given-names>S.</given-names></name> <name><surname>Polycarpo</surname> <given-names>C.</given-names></name> <name><surname>Frauer</surname> <given-names>C.</given-names></name> <name><surname>S&#x00F6;ll</surname> <given-names>D.</given-names></name></person-group> (<year>2007</year>). <article-title>Pyrrolysine is not hardwired for cotranslational insertion at UAG codons.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>104</volume> <fpage>3141</fpage>&#x2013;<lpage>3146</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0611634104</pub-id> <pub-id pub-id-type="pmid">17360621</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cavarelli</surname> <given-names>J.</given-names></name> <name><surname>Delagoutte</surname> <given-names>B.</given-names></name> <name><surname>Eriani</surname> <given-names>G.</given-names></name> <name><surname>Gangloff</surname> <given-names>J.</given-names></name> <name><surname>Moras</surname> <given-names>D.</given-names></name></person-group> (<year>1998</year>). <article-title>L-arginine recognition by yeast arginyl-tRNA synthetase.</article-title> <source><italic>EMBO J.</italic></source> <volume>17</volume> <fpage>5438</fpage>&#x2013;<lpage>5448</lpage>. <pub-id pub-id-type="doi">10.1093/emboj/17.18.5438</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guo</surname> <given-names>L. T.</given-names></name> <name><surname>Wang</surname> <given-names>Y. S.</given-names></name> <name><surname>Nakamura</surname> <given-names>A.</given-names></name> <name><surname>Eiler</surname> <given-names>D.</given-names></name> <name><surname>Kavran</surname> <given-names>J. M.</given-names></name> <name><surname>Wong</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Polyspecific pyrrolysyl-tRNA synthetases from directed evolution.</article-title> <source><italic>Proc. Natl. Acad. Sci. U. S. A.</italic></source> <volume>111</volume> <fpage>16724</fpage>&#x2013;<lpage>16729</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1419737111</pub-id> <pub-id pub-id-type="pmid">25385624</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Han</surname> <given-names>S.</given-names></name> <name><surname>Yang</surname> <given-names>A.</given-names></name> <name><surname>Lee</surname> <given-names>S.</given-names></name> <name><surname>Lee</surname> <given-names>H.-W.</given-names></name> <name><surname>Park</surname> <given-names>C. B.</given-names></name> <name><surname>Park</surname> <given-names>H.-S.</given-names></name></person-group> (<year>2017</year>). <article-title>Expanding the genetic code of Mus musculus.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>8</volume>:<issue>14568</issue>. <pub-id pub-id-type="doi">10.1038/ncomms14568</pub-id> <pub-id pub-id-type="pmid">28220771</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hao</surname> <given-names>B.</given-names></name> <name><surname>Gong</surname> <given-names>W.</given-names></name> <name><surname>Ferguson</surname> <given-names>T. K.</given-names></name> <name><surname>James</surname> <given-names>C. M.</given-names></name> <name><surname>Krzycki</surname> <given-names>J. A.</given-names></name> <name><surname>Chan</surname> <given-names>M. K.</given-names></name></person-group> (<year>2002</year>). <article-title>A new UAG-encoded residue in the structure of a methanogen methyltransferase.</article-title> <source><italic>Science</italic></source> <volume>296</volume> <fpage>1462</fpage>&#x2013;<lpage>1466</lpage>. <pub-id pub-id-type="doi">10.1126/science.1069556</pub-id> <pub-id pub-id-type="pmid">12029132</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Herring</surname> <given-names>S.</given-names></name> <name><surname>Ambrogelly</surname> <given-names>A.</given-names></name> <name><surname>Polycarpo</surname> <given-names>C. R.</given-names></name> <name><surname>Soll</surname> <given-names>D.</given-names></name></person-group> (<year>2007</year>). <article-title>Recognition of pyrrolysine tRNA by the Desulfitobacterium hafniense pyrrolysyl-tRNA synthetase.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>35</volume> <fpage>1270</fpage>&#x2013;<lpage>1278</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkl1151</pub-id> <pub-id pub-id-type="pmid">17267409</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jaric</surname> <given-names>J.</given-names></name> <name><surname>Bilokapic</surname> <given-names>S.</given-names></name> <name><surname>Lesjak</surname> <given-names>S.</given-names></name> <name><surname>Crnkovic</surname> <given-names>A.</given-names></name> <name><surname>Ban</surname> <given-names>N.</given-names></name> <name><surname>Weygand-Durasevic</surname> <given-names>I.</given-names></name></person-group> (<year>2009</year>). <article-title>Identification of amino acids in the N-terminal domain of atypical methanogenic-type seryl-tRNA synthetase critical for tRNA recognition.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>284</volume> <fpage>30643</fpage>&#x2013;<lpage>30651</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M109.044099</pub-id> <pub-id pub-id-type="pmid">19734148</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jiang</surname> <given-names>R. S.</given-names></name> <name><surname>Krzycki</surname> <given-names>J. A.</given-names></name></person-group> (<year>2012</year>). <article-title>PylSn and the homologous N-terminal domain of pyrrolysyl-tRNA synthetase bind the tRNA that is essential for the genetic encoding of pyrrolysine.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>287</volume> <fpage>32738</fpage>&#x2013;<lpage>32746</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M112.396754</pub-id> <pub-id pub-id-type="pmid">22851181</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kavran</surname> <given-names>J. M.</given-names></name> <name><surname>Gundllapalli</surname> <given-names>S.</given-names></name> <name><surname>O&#x2019;Donoghue</surname> <given-names>P.</given-names></name> <name><surname>Englert</surname> <given-names>M.</given-names></name> <name><surname>Soll</surname> <given-names>D.</given-names></name> <name><surname>Steitz</surname> <given-names>T. A.</given-names></name></person-group> (<year>2007</year>). <article-title>Structure of pyrrolysyl-tRNA synthetase, an archaeal enzyme for genetic code innovation.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>104</volume> <fpage>11268</fpage>&#x2013;<lpage>11273</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0704769104</pub-id> <pub-id pub-id-type="pmid">17592110</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>Y.-M.</given-names></name> <name><surname>Yang</surname> <given-names>M.-Y.</given-names></name> <name><surname>Huang</surname> <given-names>Y.-C.</given-names></name> <name><surname>Li</surname> <given-names>Y.-T.</given-names></name> <name><surname>Chen</surname> <given-names>P. R.</given-names></name> <name><surname>Liu</surname> <given-names>L.</given-names></name></person-group> (<year>2012</year>). <article-title>Ligation of expressed protein &#x03B1;-hydrazides via genetic incorporation of an &#x03B1;-hydroxy acid.</article-title> <source><italic>ACS Chem. Biol.</italic></source> <volume>7</volume> <fpage>1015</fpage>&#x2013;<lpage>1022</lpage>. <pub-id pub-id-type="doi">10.1021/cb300020s</pub-id> <pub-id pub-id-type="pmid">22424086</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mukai</surname> <given-names>T.</given-names></name> <name><surname>Kobayashi</surname> <given-names>T.</given-names></name> <name><surname>Hino</surname> <given-names>N.</given-names></name> <name><surname>Yanagisawa</surname> <given-names>T.</given-names></name> <name><surname>Sakamoto</surname> <given-names>K.</given-names></name> <name><surname>Yokoyama</surname> <given-names>S.</given-names></name></person-group> (<year>2008</year>). <article-title>Adding l-lysine derivatives to the genetic code of mammalian cells with engineered pyrrolysyl-tRNA synthetases.</article-title> <source><italic>Biochem. Biophys. Res. Commun.</italic></source> <volume>371</volume> <fpage>818</fpage>&#x2013;<lpage>822</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbrc.2008.04.164</pub-id> <pub-id pub-id-type="pmid">18471995</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mukai</surname> <given-names>T.</given-names></name> <name><surname>Yamaguchi</surname> <given-names>A.</given-names></name> <name><surname>Ohtake</surname> <given-names>K.</given-names></name> <name><surname>Takahashi</surname> <given-names>M.</given-names></name> <name><surname>Hayashi</surname> <given-names>A.</given-names></name> <name><surname>Iraha</surname> <given-names>F.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Reassignment of a rare sense codon to a non-canonical amino acid in <italic>Escherichia coli</italic>.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume> <fpage>8111</fpage>&#x2013;<lpage>8122</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv787</pub-id> <pub-id pub-id-type="pmid">26240376</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Neumann</surname> <given-names>H.</given-names></name> <name><surname>Peak-Chew</surname> <given-names>S. Y.</given-names></name> <name><surname>Chin</surname> <given-names>J. W.</given-names></name></person-group> (<year>2008</year>). <article-title>Genetically encoding N(epsilon)-acetyllysine in recombinant proteins.</article-title> <source><italic>Nat. Chem. Biol.</italic></source> <volume>4</volume> <fpage>232</fpage>&#x2013;<lpage>234</lpage>. <pub-id pub-id-type="doi">10.1038/nchembio.73</pub-id> <pub-id pub-id-type="pmid">18278036</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nozawa</surname> <given-names>K.</given-names></name> <name><surname>O&#x2019;Donoghue</surname> <given-names>P.</given-names></name> <name><surname>Gundllapalli</surname> <given-names>S.</given-names></name> <name><surname>Araiso</surname> <given-names>Y.</given-names></name> <name><surname>Ishitani</surname> <given-names>R.</given-names></name> <name><surname>Umehara</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Pyrrolysyl-tRNA synthetase-tRNA(Pyl) structure reveals the molecular basis of orthogonality.</article-title> <source><italic>Nature</italic></source> <volume>457</volume> <fpage>1163</fpage>&#x2013;<lpage>1167</lpage>. <pub-id pub-id-type="doi">10.1038/nature07611</pub-id> <pub-id pub-id-type="pmid">19118381</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>O&#x2019;Donoghue</surname> <given-names>P.</given-names></name> <name><surname>Luthey-Schulten</surname> <given-names>Z.</given-names></name></person-group> (<year>2003</year>). <article-title>On the evolution of structure in aminoacyl-tRNA synthetases.</article-title> <source><italic>Microbiol. Mol. Biol. Rev.</italic></source> <volume>67</volume> <fpage>550</fpage>&#x2013;<lpage>573</lpage>. <pub-id pub-id-type="doi">10.1128/mmbr.67.4.550-573.2003</pub-id> <pub-id pub-id-type="pmid">14665676</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>O&#x2019;Donoghue</surname> <given-names>P.</given-names></name> <name><surname>Prat</surname> <given-names>L.</given-names></name> <name><surname>Heinemann</surname> <given-names>I. U.</given-names></name> <name><surname>Ling</surname> <given-names>J.</given-names></name> <name><surname>Odoi</surname> <given-names>K.</given-names></name> <name><surname>Liu</surname> <given-names>W. R.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Near-cognate suppression of amber, opal and quadruplet codons competes with aminoacyl-tRNAPyl for genetic code expansion.</article-title> <source><italic>FEBS Lett.</italic></source> <volume>586</volume> <fpage>3931</fpage>&#x2013;<lpage>3937</lpage>. <pub-id pub-id-type="doi">10.1016/j.febslet.2012.09.033</pub-id> <pub-id pub-id-type="pmid">23036644</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schimmel</surname> <given-names>P.</given-names></name> <name><surname>Giege</surname> <given-names>R.</given-names></name> <name><surname>Moras</surname> <given-names>D.</given-names></name> <name><surname>Yokoyama</surname> <given-names>S.</given-names></name></person-group> (<year>1993</year>). <article-title>An operational RNA code for amino acids and possible relationship to genetic code.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>90</volume> <fpage>8763</fpage>&#x2013;<lpage>8768</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.90.19.8763</pub-id> <pub-id pub-id-type="pmid">7692438</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sharma</surname> <given-names>V.</given-names></name> <name><surname>Wang</surname> <given-names>Y.-S.</given-names></name> <name><surname>Liu</surname> <given-names>W. R.</given-names></name></person-group> (<year>2016</year>). <article-title>Probing the catalytic charge-relay system in alanine racemase with genetically encoded histidine mimetics.</article-title> <source><italic>ACS Chem. Biol.</italic></source> <volume>11</volume> <fpage>3305</fpage>&#x2013;<lpage>3309</lpage>. <pub-id pub-id-type="doi">10.1021/acschembio.6b00940</pub-id> <pub-id pub-id-type="pmid">27978711</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sharma</surname> <given-names>V.</given-names></name> <name><surname>Zeng</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>W. W.</given-names></name> <name><surname>Qiao</surname> <given-names>Y.</given-names></name> <name><surname>Kurra</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>W. R.</given-names></name></person-group> (<year>2018</year>). <article-title>Evolving the N-terminal domain of Pyrrolysyl-tRNA synthetase for improved incorporation of noncanonical amino acids.</article-title> <source><italic>ChemBioChem</italic></source> <volume>19</volume> <fpage>26</fpage>&#x2013;<lpage>30</lpage>. <pub-id pub-id-type="doi">10.1002/cbic.201700268</pub-id> <pub-id pub-id-type="pmid">29096043</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shimada</surname> <given-names>A.</given-names></name> <name><surname>Nureki</surname> <given-names>O.</given-names></name> <name><surname>Goto</surname> <given-names>M.</given-names></name> <name><surname>Takahashi</surname> <given-names>S.</given-names></name> <name><surname>Yokoyama</surname> <given-names>S.</given-names></name></person-group> (<year>2001</year>). <article-title>Structural and mutational studies of the recognition of the arginine tRNA-specific major identity element, A20, by arginyl-tRNA synthetase.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>98</volume> <fpage>13537</fpage>&#x2013;<lpage>13542</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.231267998</pub-id> <pub-id pub-id-type="pmid">11698642</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Suzuki</surname> <given-names>T.</given-names></name> <name><surname>Miller</surname> <given-names>C.</given-names></name> <name><surname>Guo</surname> <given-names>L. T.</given-names></name> <name><surname>Ho</surname> <given-names>J. M. L.</given-names></name> <name><surname>Bryson</surname> <given-names>D. I.</given-names></name> <name><surname>Wang</surname> <given-names>Y. S.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Crystal structures reveal an elusive functional domain of pyrrolysyl-tRNA synthetase.</article-title> <source><italic>Nat. Chem. Biol.</italic></source> <volume>13</volume> <fpage>1261</fpage>&#x2013;<lpage>1266</lpage>. <pub-id pub-id-type="doi">10.1038/nchembio.2497</pub-id> <pub-id pub-id-type="pmid">29035363</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vargas-Rodriguez</surname> <given-names>O.</given-names></name> <name><surname>Sevostyanova</surname> <given-names>A.</given-names></name> <name><surname>Soll</surname> <given-names>D.</given-names></name> <name><surname>Crnkovic</surname> <given-names>A.</given-names></name></person-group> (<year>2018</year>). <article-title>Upgrading aminoacyl-tRNA synthetases for genetic code expansion.</article-title> <source><italic>Curr. Opin. Chem. Biol.</italic></source> <volume>46</volume> <fpage>115</fpage>&#x2013;<lpage>122</lpage>. <pub-id pub-id-type="doi">10.1016/j.cbpa.2018.07.014</pub-id> <pub-id pub-id-type="pmid">30059834</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.-S.</given-names></name></person-group> (<year>2012</year>). <article-title><italic>Expanding Genetic Code for Protein Lysine and Phenylalanine Modifications</italic>.</article-title> <comment>Ph.D. thesis</comment>, <publisher-name>Texas A&#x0026;M University</publisher-name>, <publisher-loc>College Station, TX</publisher-loc>.</citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y. S.</given-names></name> <name><surname>Fang</surname> <given-names>X.</given-names></name> <name><surname>Wallace</surname> <given-names>A. L.</given-names></name> <name><surname>Wu</surname> <given-names>B.</given-names></name> <name><surname>Liu</surname> <given-names>W. R.</given-names></name></person-group> (<year>2012</year>). <article-title>A rationally designed pyrrolysyl-tRNA synthetase mutant with a broad substrate spectrum.</article-title> <source><italic>J. Am. Chem. Soc.</italic></source> <volume>134</volume> <fpage>2950</fpage>&#x2013;<lpage>2953</lpage>. <pub-id pub-id-type="doi">10.1021/ja211972x</pub-id> <pub-id pub-id-type="pmid">22289053</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Z. U.</given-names></name> <name><surname>Wang</surname> <given-names>Y. S.</given-names></name> <name><surname>Pai</surname> <given-names>P. J.</given-names></name> <name><surname>Russell</surname> <given-names>W. K.</given-names></name> <name><surname>Russell</surname> <given-names>D. H.</given-names></name> <name><surname>Liu</surname> <given-names>W. R.</given-names></name></person-group> (<year>2012</year>). <article-title>A facile method to synthesize histones with posttranslational modification mimics.</article-title> <source><italic>Biochemistry</italic></source> <volume>51</volume> <fpage>5232</fpage>&#x2013;<lpage>5234</lpage>. <pub-id pub-id-type="doi">10.1021/bi300535a</pub-id> <pub-id pub-id-type="pmid">22697363</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.-S.</given-names></name> <name><surname>Wu</surname> <given-names>B.</given-names></name> <name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Huang</surname> <given-names>Y.</given-names></name> <name><surname>Wan</surname> <given-names>W.</given-names></name> <name><surname>Russell</surname> <given-names>W. K.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>A genetically encoded photocaged N&#x03B5;-methyl-l-lysine.</article-title> <source><italic>Mol. Biosyst.</italic></source> <volume>6</volume> <fpage>1557</fpage>&#x2013;<lpage>1560</lpage>. <pub-id pub-id-type="doi">10.1039/C002155E</pub-id> <pub-id pub-id-type="pmid">20711534</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Willis</surname> <given-names>J. C. W.</given-names></name> <name><surname>Chin</surname> <given-names>J. W.</given-names></name></person-group> (<year>2018</year>). <article-title>Mutually orthogonal pyrrolysyl-tRNA synthetase/tRNA pairs.</article-title> <source><italic>Nat. Chem.</italic></source> <volume>10</volume> <fpage>831</fpage>&#x2013;<lpage>837</lpage>. <pub-id pub-id-type="doi">10.1038/s41557-018-0052-5</pub-id> <pub-id pub-id-type="pmid">29807989</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xiao</surname> <given-names>H.</given-names></name> <name><surname>Peters</surname> <given-names>F. B.</given-names></name> <name><surname>Yang</surname> <given-names>P. Y.</given-names></name> <name><surname>Reed</surname> <given-names>S.</given-names></name> <name><surname>Chittuluru</surname> <given-names>J. R.</given-names></name> <name><surname>Schultz</surname> <given-names>P. G.</given-names></name></person-group> (<year>2014</year>). <article-title>Genetic incorporation of histidine derivatives using an engineered pyrrolysyl-tRNA synthetase.</article-title> <source><italic>ACS Chem. Biol.</italic></source> <volume>9</volume> <fpage>1092</fpage>&#x2013;<lpage>1096</lpage>. <pub-id pub-id-type="doi">10.1021/cb500032c</pub-id> <pub-id pub-id-type="pmid">24506189</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yanagisawa</surname> <given-names>T.</given-names></name> <name><surname>Ishii</surname> <given-names>R.</given-names></name> <name><surname>Fukunaga</surname> <given-names>R.</given-names></name> <name><surname>Kobayashi</surname> <given-names>T.</given-names></name> <name><surname>Sakamoto</surname> <given-names>K.</given-names></name> <name><surname>Yokoyama</surname> <given-names>S.</given-names></name></person-group> (<year>2008</year>). <article-title>Multistep engineering of pyrrolysyl-tRNA synthetase to genetically encode N(epsilon)-(o-azidobenzyloxycarbonyl) lysine for site-specific protein modification.</article-title> <source><italic>Chem. Biol.</italic></source> <volume>15</volume> <fpage>1187</fpage>&#x2013;<lpage>1197</lpage>. <pub-id pub-id-type="doi">10.1016/j.chembiol.2008.10.004</pub-id> <pub-id pub-id-type="pmid">19022179</pub-id></citation></ref>
</ref-list>
</back>
</article>