﻿<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1 20151215//EN" "JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">Explor Drug Sci</journal-id>
<journal-id journal-id-type="publisher-id">EDS</journal-id>
<journal-title-group>
<journal-title>Exploration of Drug Science</journal-title>
</journal-title-group>
<issn pub-type="epub">2836-7677</issn>
<publisher>
<publisher-name>Open Exploration Publishing</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.37349/eds.2024.00053</article-id>
<article-id pub-id-type="manuscript">100853</article-id>
<article-categories>
<subj-group>
<subject>Original Article</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>From canonical to unique: extension of a lipophilicity scale of amino acids to non-standard residues</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-2112-5828</contrib-id>
<name>
<surname>Viayna</surname>
<given-names>Antonio</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role content-type="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role content-type="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role content-type="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing—original draft</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="cor1">
<sup>*</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0009-0009-6719-0746</contrib-id>
<name>
<surname>Matamoros</surname>
<given-names>Paulina</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0009-0000-8370-2515</contrib-id>
<name>
<surname>Blázquez-Ruano</surname>
<given-names>David</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="https://credit.niso.org/contributor-roles/visualization/">Visualization</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-4029-4528</contrib-id>
<name>
<surname>Zamora</surname>
<given-names>William J.</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
<role content-type="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
<role content-type="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/">Project administration</role>
<role content-type="https://credit.niso.org/contributor-roles/resources/">Resources</role>
<role content-type="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing—original draft</role>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing—review &amp; editing</role>
<xref ref-type="aff" rid="I2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="I4">
<sup>4</sup>
</xref>
<xref ref-type="aff" rid="I5">
<sup>5</sup>
</xref>
<xref ref-type="corresp" rid="cor2">
<sup>*</sup>
</xref>
</contrib>
<contrib contrib-type="editor">
<name>
<surname>Tolomelli</surname>
<given-names>Alessandra</given-names>
</name>
<role>Academic Editor</role>
<aff>University of Bologna, Italy</aff>
</contrib>
</contrib-group>
<aff id="I1">
<sup>1</sup>Departament de Nutrició, Ciències de l’Alimentació i Gastronomia, Facultat de Farmàcia i Ciències de l’Alimentació, Institut de Biomedicina (IBUB), Universitat de Barcelona (UB), 08921 Santa Coloma de Gramenet, Spain</aff>
<aff id="I2">
<sup>2</sup>CBio<sup>3</sup> Laboratory, School of Chemistry, University of Costa Rica, 11501-2060 San José, Costa Rica</aff>
<aff id="I3">
<sup>3</sup>CIC bioGUNE, Basque Research and Technology Alliance, 48160 Derio, Spain</aff>
<aff id="I4">
<sup>4</sup>Laboratory of Computational Toxicology and Biological Testing Laboratory (LEBi), University of Costa Rica, 11501-2060 San José, Costa Rica</aff>
<aff id="I5">
<sup>5</sup>Advanced Computing Lab (CNCA), National High Technology Center (CeNAT), 10109 San José, Costa Rica</aff>
<author-notes>
<corresp id="cor1">
<bold>
<sup>*</sup>Correspondence:</bold> Antonio Viayna, Departament de Nutrició, Ciències de l’Alimentació i Gastronomia, Facultat de Farmàcia i Ciències de l’Alimentació, Institut de Biomedicina (IBUB), 08921 Santa Coloma de Gramenet, Spain. <email>toniviayna@ub.edu</email></corresp>
<corresp id="cor2">William J. Zamora, CBio<sup>3</sup> Laboratory, School of Chemistry, University of Costa Rica, 11501-2060 San José, Costa Rica. <email>william.zamoraramirez@ucr.ac.cr</email></corresp>
</author-notes>
<pub-date pub-type="ppub">
<year>2024</year>
</pub-date>
<pub-date pub-type="epub">
<day>30</day>
<month>07</month>
<year>2024</year>
</pub-date>
<volume>2</volume>
<issue>4</issue>
<fpage>389</fpage>
<lpage>407</lpage>
<history>
<date date-type="received">
<day>31</day>
<month>01</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>25</day>
<month>04</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>© The Author(s) 2024.</copyright-statement>
<license xlink:href="https://creativecommons.org/licenses/by/4.0/">
<license-p>This is an Open Access article licensed under a Creative Commons Attribution 4.0 International License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, sharing, adaptation, distribution and reproduction in any medium or format, for any purpose, even commercially, as long as you give appropriate credit to the original author(s) and the source, provide a link to the Creative Commons license, and indicate if changes were made.</license-p>
</license>
</permissions>
<abstract>
<sec>
<title>Aim:</title>
<p id="absp-1">The lipophilicity of amino acids plays a crucial role in delineating their physicochemical properties, offering insights into solubility, binding affinity, and bioavailability, properties that are a cornerstone for the use of peptides as therapeutic agents. In this study, we employ the integral equation formalism polarizable continuum model/Miertus-Scrocco-Tomasi (IEFPCM/MST) implicit solvation model to compute the <italic>n</italic>-octanol/water partition coefficient, serving as a lipophilic descriptor for non-standard amino acids. This approach allows us to expand upon our prior scale developed for canonical amino acids.</p>
</sec>
<sec>
<title>Methods:</title>
<p id="absp-2">Using the IEFPCM/MST implicit solvation model, we extended our previous work on the hydrophobicity scale of amino acids. To this end, we employed two structural models, Model 1 and 2, differentiated solely by their <italic>C</italic>-terminal capping groups using an <italic>N</italic>- or <italic>O</italic>-methyl substituent, respectively.</p>
</sec>
<sec>
<title>Results:</title>
<p id="absp-3">Our findings revealed substantial similarities between the models, validating the lipophilicity values for the non-standard side chains. Differences were observed in fewer cases, indicating an effect of the capping group on the side chain hydrophobicity. This effect is expected as one model contains a hydrogen bond donor (Model 1) while the other one uses a hydrogen bond acceptor (Model 2).</p>
</sec>
<sec>
<title>Conclusions:</title>
<p id="absp-4">Overall, both models exhibit good correlations with the experimental values, with Model 1 showing lower statistical errors. In addition, our predictions were able to correctly predict the experimental hydrophobicity change due to the number of acetylated lysines in peptide pairs determined by HPLC, suggesting that our scale can be employed for proteomics studies that include post-translational modifications beyond acetylation.</p>
</sec>
</abstract>
<abstract abstract-type="graphical">
<p>
<fig id="F0">
<label>Graphical abstract.</label>
<caption>
<p> Lipophilicity of non-standard amino acids</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g000.tif" />
</fig>
</p>
</abstract>
<kwd-group>
<kwd>Partition coefficient</kwd>
<kwd>lipophilicity</kwd>
<kwd>non-natural amino acids</kwd>
<kwd>solvation</kwd>
<kwd>post-translational modifications</kwd>
<kwd>proteomics</kwd>
<kwd>lysine acetylation</kwd>
</kwd-group>
<funding-group>
<award-group id="award001">
<funding-source>
<institution-wrap>
<institution>Ministerio de Ciencia e Innovación&lt;/bold&gt; [PID2020-117646RB-I00, MCIN/AEI/10.13039/501100011033], &lt;bold&gt;Generalitat de Catalunya&lt;/bold&gt; [2021SGR00671], and &lt;bold&gt;Consorci de Serveis Universitaris de Catalunya</institution>
</institution-wrap>
</funding-source>
<award-id>PID2020-117646RB-I00</award-id>
<award-id>MCIN/AEI/10.13039/501100011033]</award-id>
<award-id>&lt;bold&gt;Generalitat de Catalunya&lt;/bold&gt; [2021SGR00671</award-id>
</award-group>
</funding-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p id="p-1">Amino acids are organic molecules that constitute the basic building blocks of proteins. From a functional point of view, mainly directed by their sequence and 3D arrangement, they play a fundamental role in a multitude of biological processes and functions in living organisms, such as enzymatic catalysis, cell signaling, structural support, or immune response, among others [<xref ref-type="bibr" rid="B1">1</xref>].</p>
<p id="p-2">Non-standard amino acids, also known as non-canonical or non-proteinogenic amino acids, deviate from the conventional ones typically present in proteins and synthesized by ribosomes in living organisms. Unlike the standard set of 20 amino acids which are enciphered by the genetic code and commonly incorporated into protein synthesis during translation [<xref ref-type="bibr" rid="B2">2</xref>], non-standard amino acids encompass a wide range of structurally diverse molecules, that may occur naturally or be synthesized artificially. Some non-standard amino acids occur naturally in certain organisms, although they are not part of the standard genetic code. For instance, selenocysteine and pyrrolysine, are examples of non-standard amino acids that are incorporated into proteins in certain bacteria and archaea, respectively [<xref ref-type="bibr" rid="B3">3</xref>].</p>
<p id="p-3">Shifting the focus to the physicochemical aspect of amino acids and/or proteins, is important consider their lipophilicity, a fundamental feature with a clear impact on biology, pharmacology, medicinal chemistry, and drug discovery [<xref ref-type="bibr" rid="B4">4</xref>, <xref ref-type="bibr" rid="B5">5</xref>]. In the context of proteins is important for understanding processes such as protein folding, where hydrophobic amino acids tend to cluster in the protein interior away from the aqueous environment. It also influences ligand binding, affecting the binding affinity and specificity of proteins and contributing to the formation of receptor-ligand interactions and also in protein-protein interactions, promoting the formation of protein complexes, among others. In addition, recent studies have created energy functions based on lipophilicity for membrane-protein studies of receptors, channels, and transporters [<xref ref-type="bibr" rid="B6">6</xref>]. Given these reasons, it is crucial to have tools that permit the quantification of the degree of hydrophobicity of proteins.</p>
<p id="p-4">For proteins, lipophilicity is primarily influenced by the specific features of the amino acid side chains. Consequently, one of the main strategies, involves quantifying the individual hydrophobicity of each amino acid, leading to the development of lipophilicity scales. These scales consider various properties such as partitioning of small molecules in a bulk solvent, employing knowledge-based techniques based on structural data and/or using experimental information coming from biological assays [<xref ref-type="bibr" rid="B7">7</xref>–<xref ref-type="bibr" rid="B9">9</xref>].</p>
<p id="p-5">By employing these scales, it is possible to generate lipophilicity profiles of peptides and/or proteins based on the individual hydrophobicity values of residues, assuming an additivity principle. However, depending on the employed scale, variations can occur not only in the absolute magnitude of residues but also in their relative values. These variations pose difficulties in correlating different scales, as well as reflect discrepancies between materials, methods, and experimental conditions that permit the definition of each scale.</p>
<p id="p-6">In this line, in our previous study [<xref ref-type="bibr" rid="B10">10</xref>], we developed an extensive lipophilicity scale of the 20 standard amino acids based on theoretical computations that took into account the local context of each amino acid in the proteins deposited in the Dunbrak’s rotamer library [<xref ref-type="bibr" rid="B11">11</xref>]. Thus, this scale incorporated the structural features of the conformational landscape of amino acids, as well as the impact of pH, providing a reliable depiction of the pH-adapted lipophilicity profile in peptides and proteins.</p>
<p id="p-7">However, when we move to non-standard amino acids, derivatives that differ in structure or composition from the 20 standard ones usually found in proteins, set a challenge to have new adaptations of the classical lipophilicity scales to be reliably standardized to be applied to those biomolecules with non-canonical modifications.</p>
<p id="p-8">Recent efforts have focused on the impact of the presence of non-canonical amino acids on peptide and protein structure and function. In fact, this new class of amino acids has found an excellent opportunity for use in the design of peptidomimetics. This is mainly because they have been identified naturally and have been found to improve both the stability of the structures and their bioactivity [<xref ref-type="bibr" rid="B12">12</xref>], which clearly points out that all this knowledge promises to deliver new biologically active molecules and therefore that non-standard amino acids (NSAAs) are and will be fundamental in drug discovery. Concerning structure, it has been shown that the presence of such residues decreases the accuracy of structure prediction tools, so it has been recommended to simulate first using the proteinogenic amino acids and then perform the modification to carry out molecular dynamic studies [<xref ref-type="bibr" rid="B13">13</xref>]. Regarding function, non-canonical amino acids have emerged in the field of synthetic biology, focusing mainly on the research of biomaterials looking for adhesion capabilities, also in the design of antimicrobial peptides improving their protease resistance, solubility, and half-life [<xref ref-type="bibr" rid="B14">14</xref>]. Such efforts have led to novel structure/activity studies on modified peptides that present chemoinformatics tools to efficiently characterize the chemical space of these new peptides and thereby better understand their activities, e.g., their antimicrobial activity against multidrug-resistant bacteria [<xref ref-type="bibr" rid="B15">15</xref>].</p>
<p id="p-9">In the context of the lipophilicity for non-canonical amino acids, prominent examples highlighting the significance and relevance of this topic include recent studies by Kubyshkin (2021) [<xref ref-type="bibr" rid="B16">16</xref>] and Oeller et al. (2023) [<xref ref-type="bibr" rid="B17">17</xref>]. The computational work of Oeller et al. introduced the Cambridge solvation post-translational modifications (CamSol-PTM) tool, which offers a rapid and accurate methodology for predicting the solubility of peptides containing non-standard amino acids. Regarding to the experimental work of Kubyshkin, aimed to develop an experimental lipophilicity scale incorporating both coded and non-coded amino acids, using the <italic>n</italic>-octanol/water partition coefficient. This work, based on <italic>N</italic>-acetyl and <italic>O</italic>-methyl amino acid analogs, determined the log<italic>P</italic> for these synthetic compounds using the nuclear magnetic resonance (NMR) technique, which provides a valuable opportunity to validate computational tools for lipophilicity determination. However, it has time constraints in case of generating new chemical modifications due to the experimental protocol to be implemented. Thus, a computational strategy with adequate accuracy to reproduce these experimental values can alleviate the laborious and time-consuming process of the experimental techniques and can offer the advantage of being able to apply a rapid and straightforward strategy to calculate the lipophilicity upon any modification to create a new non-standard amino acid.</p>
<p id="p-10">Therefore, the present work aims to expand our previous work on pH-dependent lipophilicity scale of amino acids [<xref ref-type="bibr" rid="B10">10</xref>], specifically the scale that reproduces the behavior of residues in solvent-like environments (SolvL scale), by extending it to a set of non-standard amino acids presented and experimentally measured by Kubyshkin in 2021 [<xref ref-type="bibr" rid="B16">16</xref>]. The objective is to test, validate, and update our lipophilicity scale to properly account for this descriptor on non-coded amino acids.</p>
</sec>
<sec id="s2">
<title>Materials and methods</title>
<sec id="t2-1">
<title>Dataset</title>
<p id="p-11">In the present article, we selected different non-canonical amino acids (see <xref ref-type="sec" rid="s-suppl">Tables S1</xref>–<xref ref-type="sec" rid="s-suppl">6</xref>) that had been previously investigated and published in an experimental study [<xref ref-type="bibr" rid="B16">16</xref>]. The work presented by Kubyshkin [<xref ref-type="bibr" rid="B16">16</xref>] focused on examining the experimental lipophilicity of non-standard amino acid derivatives originating from methionine, phenylalanine, tyrosine, tryptophan, lysine, and proline using the <italic>n</italic>-octanol/water system. In our study, non-taking into account the standard versions of amino acids, a total of 57 non-canonical amino acids have been investigated. This includes 7 modifications of methionine, 4 of lysine, 9 of phenylalanine, 4 of tyrosine, 25 of proline, and 8 of tryptophan.</p>
<p id="p-12">For each molecule, we considered two variants regarding the <italic>N</italic>- and <italic>C</italic>-terminal capping groups. These end fragments are responsible for mimicking the peptide bond which confers rigidity to these regions, as well as, aiming to mimic the physicochemical behavior of the amino acid when present inside a protein, rather than in an individual state. Our study included in parallel both variants for all amino acids, in order to preserve the original capping groups from our previous study [<xref ref-type="bibr" rid="B10">10</xref>], but also to compare with those used by Kubyshkin [<xref ref-type="bibr" rid="B16">16</xref>] in his experimental study (see <xref ref-type="fig" rid="fig1">Figure 1</xref>).</p>
<fig id="fig1" position="float">
<label>Figure 1</label>
<caption>
<p id="fig1-p-1">Chemical scaffolds of the capping group models used for the amino acids studied in this article: <italic>N</italic>-methyl (in blue), <italic>O</italic>-methyl (in green), and Acetyl group (in red). In the case of proline, scaffolds were slightly diverse, due to the natural features of this amino acid (see <xref ref-type="sec" rid="s-suppl">Figure S1</xref>)</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g001.tif" />
</fig>
<p id="p-13">
<xref ref-type="fig" rid="fig1">Figure 1</xref> shows the first variant, known as “Model 1”, which involves the introduction of an <italic>N</italic>-methyl (NME) group at the <italic>N</italic>-terminal end and an acetyl (ACE) group at the <italic>C</italic>-terminal end of the derivatives. “Model 2” uses the capping groups of the experimental data published in Kubyshkin’s [<xref ref-type="bibr" rid="B16">16</xref>] article, which presents slight modifications. While the <italic>C</italic>-terminal group remains the same, the <italic>N</italic>-terminal end features an <italic>O</italic>-methyl (OME) group instead of the NME group.</p>
<p id="p-14">This a priori small change presumes to have a reasonable impact on the hydrophobicity of the studied compounds. Since the NH to O modification supposes the loss of a hydrogen bond donor interaction and translates into an increase of lipophilicity, like the experimental values of <italic>N</italic>-methylacetamide (log<italic>P</italic> = –1.05) and methyl acetate (log<italic>P</italic> = 0.18) reported by Hansch et al. in 1995 support [<xref ref-type="bibr" rid="B18">18</xref>].</p>
<p id="p-15">Using the DataWarrior software [<xref ref-type="bibr" rid="B19">19</xref>], within the framework of Model 1 diverse simple descriptors were calculated to better capture the chemical diversity of the studied sets. Thanks to that it could be highlighted that, the molecular weights of the explored molecules lie in the range of 168 to 339 g/mol (see <xref ref-type="sec" rid="s-suppl">Figure S2</xref>). The total number of rotatable bonds varies from one to nine (see <xref ref-type="sec" rid="s-suppl">Figure S3</xref>). Additionally, the count of hydrogen bond acceptors spans from four to seven (see <xref ref-type="sec" rid="s-suppl">Figure S4</xref>), while hydrogen bond donors range from one to four (see <xref ref-type="sec" rid="s-suppl">Figure S5</xref>). In the context of Model 2, which involves substituting the NH group with an oxygen atom in one of the capping groups, there is an approximate one-unit increase in molecular weight. Simultaneously, there is a decrease of one unit in the count of hydrogen bond donor, while the number of acceptors remains unchanged. For more detailed information check <xref ref-type="sec" rid="s-suppl">Tables S7</xref>–<xref ref-type="sec" rid="s-suppl">12</xref> in the <xref ref-type="sec" rid="s-suppl">Supplementary material</xref>.</p>
<p id="p-16">Concerning their lipophilicity, if we consider the difference of each non-standard amino acid compared to the original, based on experimental values reported by Kubyshkin [<xref ref-type="bibr" rid="B16">16</xref>] for methionine derivatives, four of them are slightly more lipophilic, and three are more hydrophilic, with variations ranging from plus 0.80 units (most lipophilic) to minus 1.92 (most hydrophilic). In the case of lysine, all derivatives are more hydrophilic than the canonical, with the most marked difference being 2.43 units. Moving to tyrosine, among the four cases, except for a single case (Dopa) that is slightly more hydrophilic, all others are more lipophilic, despite moving in a narrow range from 0.50 (most hydrophilic) to 0.69 (most lipophilic).</p>
<p id="p-17">For phenylalanine, five derivatives are more lipophilic, three are more hydrophilic, and one has the same experimental log<italic>P</italic> value. The variation range spans 2.29 units, from the most hydrophilic to the most lipophilic. A similar situation is observed for tryptophan derivatives, where out of the eight cases, only two derivatives with polar groups (5-amino and 5-hydroxy) are more hydrophilic than the standard residue (1.46 units less than the most hydrophilic and 1.17 units more than the most lipophilic, resulting in a range of 2.63 units). Among the 25 proline cases, except for six instances, all are more lipophilic, with the most lipophilic being 1.59 units greater than standard proline and the most hydrophilic being 0.93 units less lipophilic.</p>
<p id="p-18">We decided not to include some tyrosine derivatives containing iodine atoms in our study. This decision was based on the limitations of the DFT-based integral equation formalism polarizable continuum model/Miertus-Scrocco-Tomasi (IEFPCM/MST) continuum solvation method used for estimating solvation energies, as it lacks parameterization for iodine atoms. However, this method does include parameterization for other halogen atoms like fluorine, chlorine, and bromine, which present minimal differences experimentally when compared to iodine derivatives. Hence, we included molecules containing these three halogen atoms in our study. A similar criterion was taken in the exclusion of selenomethionine from the analysis since the selenium atom is also not included in the IEFPCM/MST current parametrization [<xref ref-type="bibr" rid="B20">20</xref>].</p>
</sec>
<sec id="t2-2">
<title>Conformational studies and log<italic>P</italic> estimations</title>
<p id="p-19">All molecules were designed using Avogadro software (version 1.1.1) [<xref ref-type="bibr" rid="B21">21</xref>]. Then, we employed OpenBabel 2.4.0 genetic algorithm to stochastically conduct a preliminary generation of the preferred conformations of the amino acids based on energy score [<xref ref-type="bibr" rid="B22">22</xref>]. Due to the structural complexity of some molecules (with several rotatable bonds ranging from 1 to 9), we limited the generation of conformers to a maximum of 100 structures, to make a balance between a complete conformational landscape of them, but at the same time deal with an acceptable number of conformers.</p>
<p id="p-20">Then, generated geometries of the conformers in both water and <italic>n</italic>-octanol were optimized using the B3LYP/6-31G(d) level of theory [<xref ref-type="bibr" rid="B23">23</xref>–<xref ref-type="bibr" rid="B25">25</xref>]. The influence of solvent on the geometric parameters was considered by employing the IEFPCM/MST model [<xref ref-type="bibr" rid="B26">26</xref>–<xref ref-type="bibr" rid="B28">28</xref>], integrated into a local version of Gaussian16 [<xref ref-type="bibr" rid="B29">29</xref>]. The minimum energy state of optimized geometries in each solvent was confirmed by inspecting the vibrational frequencies, excluding those conformations presenting negative ones. Afterward, thermal corrections were introduced to estimate the relative free energy of the conformers in water and <italic>n</italic>-octanol. Also, single-point energy calculations were carried out in the gas phase to evaluate the solvation free energy of each conformation. Those redundant conformers that after visual inspection converged in the same geometry were eliminated to avoid weight imbalance between both solvents. Obtaining a final conformational distribution in both solvents (like the one highlighted in <xref ref-type="sec" rid="s-suppl">Figure S6</xref>). Finally, the log<italic>P</italic> value was estimated by considering the Boltzmann-weighted distribution of the conformational families obtained in water and <italic>n</italic>-octanol.</p>
</sec>
<sec id="t2-3">
<title>Capping group reference value based on glycine residue</title>
<p id="p-21">To ensure that the log<italic>P</italic> values obtained from our computations were exclusively influenced by the inherent characteristics of their side chains rather than the capping groups, a reference framework was implemented. This involved considering the computationally predicted log<italic>P</italic> value for glycine, a molecule lacking a heavy atom side chain, but still marked by the influence of capping groups. In the context of the derivatives estimated in Model 1 (incorporating the ACE and NME capping groups), an adjustment was introduced by adding +0.17 log<italic>P</italic> units to the calculated value. This value originated from the disparity observed between the glycine amino acid value as reported by Zamora et al. [<xref ref-type="bibr" rid="B10">10</xref>] in their 2019 publication and the experimental value documented by Fauchère and Pliska [<xref ref-type="bibr" rid="B30">30</xref>] on their published scale. Conversely, within the framework of Model 2 (incorporating the ACE and OME capping groups), a correction was made by subtracting –0.78 log<italic>P</italic> units. This value reflected the difference existing between the log<italic>P</italic> value computed using the IEFPCM/MST approach and the experimental value detailed in Kubyshkin’s article [<xref ref-type="bibr" rid="B16">16</xref>]. Additionally, the structural models used in our previous work [<xref ref-type="bibr" rid="B10">10</xref>] did not contain the terminal methylated amide present in Model 1 of this work. However, the effect of methylation is well-known, leading to an increase of log<italic>P</italic> values by approximately 0.60 units (see <xref ref-type="sec" rid="s-suppl">Table S13</xref>) where we report the computed values for the 20 canonical amino acids using the capping group of the methylated amide). Furthermore, previous research conducted by our group has already explored models featuring methyl groups for hydration computations [<xref ref-type="bibr" rid="B31">31</xref>]. Consequently, for the present work, we decided to add a methyl group to better mimic the protein environment and facilitate comparison with the ester model (Model 2) used by Kubyshkin [<xref ref-type="bibr" rid="B16">16</xref>].</p>
</sec>
</sec>
<sec id="s3">
<title>Results</title>
<p id="p-22">This work focuses on the reproduction of the experimental values obtained for Kubyshkin [<xref ref-type="bibr" rid="B16">16</xref>] using our continuous solvation model. The discussion will be done by amino acid type as follows.</p>
<sec id="t3-1">
<title>Methionine derivates</title>
<p id="p-23">The canonical residue methionine is an essential amino acid for its antioxidant effect by reacting with oxidizing species [<xref ref-type="bibr" rid="B32">32</xref>], therefore, the tuning of its properties, e.g., lipophilicity, may be relevant to enhance its bioactivity. To this end, <xref ref-type="fig" rid="fig2">Figure 2</xref> shows a consistent behavior between Models 1 and 2. Notably, most lipophilic moieties exhibit a congruent (response about the standard methionine residue values). In Model 1, the log<italic>P</italic> value is near zero, while in Model 2 there is a slightly augmented lipophilicity (0.27). More detailed values can be observed in <xref ref-type="sec" rid="s-suppl">Table S14</xref>.</p>
<fig id="fig2" position="float">
<label>Figure 2</label>
<caption>
<p id="fig2-p-1">Partition coefficients for methionine (Met) derivatives using Models 1 (left) and Models 2 (right). Standard Met residue value is present in the central line of each representation. Nonstandard residue values more lipophilic and more hydrophilic than the original one, are represented in yellow and blue bars, respectively. Experimental values are represented in orange bars. Detailed experimental data can be found in <xref ref-type="sec" rid="s-suppl">Table S14</xref></p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g002.tif" />
</fig>
<p id="p-24">Nonstandard residues ethionine (Eth), norvaline (Nva), norleucine (Nle), and trifluoronorleucine (Tfnle) exhibited a more lipophilic profile than methionine, with log<italic>P</italic> values moving between 0.20 and 1.82, considering both models. This behavior is logical, attributable to the aliphatic nature of these derivatives (Nle, Nva, and Eth), or the addition of halogen moieties, exemplified by Tfnle.</p>
<p id="p-25">In the case of hydrophilic derivatives, methionine sulfoxide (MetO) and azidohomoalanine (Aha) a consistent pattern is observed. The introduction of functional groups such as azide or sulfoxide provoked a discernible alteration in the lipophilic profile of methionine, culminating in marked negative values, moving between –0.90 and –1.20, considering both models. This is to be expected due to the high polarity of the oxygen and nitrogen atoms that confer hydrogen bond acceptor properties.</p>
<p id="p-26">One of the most evident divergences between both approximations arises in the case of methoxinine (Mox), characterized by the replacement of the sulfur atom with an oxygen moiety relative to the standard methionine structure. Model 1 gives a sub-zero value of –0.65, whereas Model 2 manifests a migration towards an apolar value of 0.46. This small incongruity may be ascribed, at least in part, to the presence of an <italic>O</italic>-methyl capping group in Model 2, different from the NME capping group featured in Model 1. The computational method IEFPCM/MST elucidates a propensity to increase lipophilicity concerning Model 1, accentuated by the alteration of a nitrogen-hydrogen moiety to oxygen, resulting in the loss of a donor hydrogen bond interaction, a structural modification that IEFPCM/MST tends to penalize towards a more lipophilic value.</p>
<p id="p-27">Although the influence of capping groups is notably adjusted by the previously commented corrections in the methodological section, certain Model 2 values are corrected starting from an overestimated lipophilic value, and therefore exhibiting an inclination towards greater lipophilicity. This tendency is also observed in Eth and Tfnle cases, that present a difference of 1–1.2 log<italic>P</italic> units between Models 1 and 2.</p>
<p id="p-28">According to correspondence with experimental data (<xref ref-type="sec" rid="s-suppl">Table S14</xref>), in Model 1, apart from Aha (+1.09 log<italic>P</italic> units), which contains a chemical group that tends to present difficulties in their estimation, all methionine cases maintain differences lower than 1 log<italic>P</italic> unit. Instead, in Model 2, two cases are above 1 unit of difference, more specifically Tfnle (1.10 units) and Mox (1.11 units), probably ascribed to the presence of groups that exaggerate their lipophilic profile.</p>
</sec>
<sec id="t3-2">
<title>Aromatic derivates</title>
<p id="p-29">In our study, we analyzed modifications of the main aromatic residues, tyrosine, phenylalanine, and tryptophan. These residues have several functions that maintain the structure and function of proteins. Interactions with cations are essential for maintaining bioactive protein conformations [<xref ref-type="bibr" rid="B33">33</xref>]. Thus, any structural modification of these residues will have an impact on both their lipophilicity and aromaticity and thus on the structure/activity relationships.</p>
<sec id="t3-2-1">
<title>Tyrosine derivates</title>
<p id="p-30">Turning our attention to tyrosine derivatives (depicted in <xref ref-type="fig" rid="fig3">Figure 3</xref>), a similar pattern to methionine is observed, the log<italic>P</italic> value tends to augment lipophilicity in Model 2 (0.52), while registering a slightly hydrophilic quotient of –0.02 in Model 1. More detailed values can be consulted in <xref ref-type="sec" rid="s-suppl">Table S15</xref>.</p>
<fig id="fig3" position="float">
<label>Figure 3</label>
<caption>
<p id="fig3-p-1">Partition coefficients for tyrosine (Tyr) derivatives using Models 1 (left) and Models 2 (right). Standard Tyr residue value is present in the central line of each representation. Nonstandard residue values more lipophilic and more hydrophilic than the original one, are represented in yellow and blue bars, respectively. Experimental values are represented in orange bars. Detailed experimental data can be found in <xref ref-type="sec" rid="s-suppl">Table S15</xref></p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g003.tif" />
</fig>
<p id="p-31">Delving into the assessment of the most lipophilic derivatives, a discernible hierarchy emerges, with 3-fluorotyrosine (3-F-Tyr), 3-nitrotyrosine (3-NO<sub>2</sub>-Tyr), and 2,3,5,6-tetrafluorotyrosine (2,3,5,6-tetraFTyr) exhibiting proportional lipophilic tendency. Within Model 1, their log<italic>P</italic> values span from 0.36 to 1.66, while Model 2 assigns values between 0.59 and 2.10—a correlation that is consistently maintained across both models, with the latter consistently indicating a slightly higher lipophilicity.</p>
<p id="p-32">Conversely, a notable disagreement emerges in the characterization of the Dopa derivative. While Model 1 classifies it as a hydrophilic residue compared to the standard tyrosine (–0.78), Model 2 designates an equivalent lipophilicity to the reference amino acid (0.52). Once again, Model 2 tends to give more lipophilic values in certain cases with respect to Model 1. A trend was observed to a greater or lesser extent in the other tyrosine derivatives. From a chemical point of view, the main difference between tyrosine and Dopa is that the latter has an additional hydroxyl group, a hydrophilic group. Therefore, it is expected that Dopa should have a log<italic>P</italic> value more similar to that of Model 1 (–0.78), which is more hydrophilic and closer to the experimental value reported by Kubyshkin (–0.21).</p>
<p id="p-33">In this case, all Model 1 estimations clearly maintain under a 1 log<italic>P</italic> unit difference with respect to the experimental value. The only case with greater deviation is 2,3,5,6-tetraFTyr, present in Model 2, which shows an overestimation of 1.12 units in log<italic>P</italic>, probably due to the simultaneous presence of 4 fluorine atoms in their structure.</p>
</sec>
<sec id="t3-2-2">
<title>Phenylalanine derivates</title>
<p id="p-34">In a similar line with observations in other derivatives, the log<italic>P</italic> value associated with standard phenylalanine (see <xref ref-type="fig" rid="fig4">Figure 4</xref>) reveals a discernible contrast between Model 2 (1.60) and Model 1 (0.61), reflecting a notable increment of one unit in lipophilic propensity within the former. Detailed values can be checked in <xref ref-type="sec" rid="s-suppl">Table S16</xref>.</p>
<fig id="fig4" position="float">
<label>Figure 4</label>
<caption>
<p id="fig4-p-1">Partition coefficient for phenylalanine (Phe) derivatives using Models 1 (left) and Models 2 (right). Standard Phe residue value is present in the central line of each representation. Nonstandard residue values more lipophilic and more hydrophilic than the original one, are represented in yellow and blue bars, respectively. Experimental values are represented in orange bars. Detailed experimental data can be found in <xref ref-type="sec" rid="s-suppl">Table S16</xref></p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g004.tif" />
</fig>
<p id="p-35">The most lipophilic non-standard residues coincide between both models, encompassing 4-fluorophenylalanine (4-F-Phe), 4-chlorophenylalanine (4-Cl-Phe), 4-trifluoromethylphenylalanine (4-CF<sub>3</sub>-Phe), and 4-bromophenylalanine (4-Br-Phe). In Model 1, this subset gives log<italic>P</italic> values ranging from 1.52 to 2.92, while Model 2 attributes values span from 1.79 to 3.92. Despite not being an identical range, a certain proportionality is maintained between the 4 residues (4-F-Phe &lt; 4-Cl-Phe &lt; 4-CF<sub>3</sub>-Phe &lt; 4-Br-Phe). All of them have in common that they are residues with halogen groups where those more lipophilic halogen residues (Br) correspond to those that are less lipophilic (F).</p>
<p id="p-36">Clear disparities appear in two cases. The characterization of methyltyrosine within Model 1 denotes an apolar amino acid, diverging from Model 2’s classification as slightly polar relative to the reference phenylalanine value. Although the absolute values in both models (1.42 vs. 1.48) closely approximate the experimental value of 0.92—which unmistakably denotes an apolar nature—the discrepant classifications stem from Model 2’s overestimation of the lipophilic propensity of standard phenylalanine (valued at 1.60), influencing the classification. Also, a slight discrepancy between models of the amino acid 4-(Acetylamino)phenylalanine is observed, being more hydrophilic in Model 1 than in Model 2 with a difference of 1.53 units between them.</p>
<p id="p-37">Delving into experimental values consonance, just some specific cases present deviations greater than 1 unit of log<italic>P</italic>: 4-azidophenylalanine (2.13 units in Model 1 and 1.32 in Model 2), 4-bromophenylalanine (2.00 units Model 2) and 4-acetamidophenylalanine (1.16 units in Model 2). All cases are in line with other situations observed.</p>
</sec>
<sec id="t3-2-3">
<title>Tryptophan derivates</title>
<p id="p-38">In this specific scenario, differences between Model 1 and Model 2 about the log<italic>P</italic> value assessment for standard tryptophan exhibit a nearly negligible difference. As evidenced in <xref ref-type="fig" rid="fig5">Figure 5</xref>, Model 1 assigns a value of 1.37, while its Model 2 counterpart presents a value of 1.71, illustrating a marginal deviation of merely 0.34 units. It is worth noting that, both of these values closely approximate the experimental measurement (1.20), differing between 0.17 to 0.51 log<italic>P</italic> units, denoting a modest shift towards heightened lipophilicity. More exact values are available in <xref ref-type="sec" rid="s-suppl">Table S17</xref>.</p>
<fig id="fig5" position="float">
<label>Figure 5</label>
<caption>
<p id="fig5-p-1">Partition coefficient for tryptophan (Trp) derivatives using Models 1 (left) and Models 2 (right). Standard Trp residue value is present in the central line of each representation. Nonstandard residue values more lipophilic and more hydrophilic than the original one, are represented in yellow and blue, respectively. Experimental values are represented in orange bars. Detailed experimental data can be found in <xref ref-type="sec" rid="s-suppl">Table S17</xref></p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g005.tif" />
</fig>
<p id="p-39">A clear trend emerges, demonstrating the congruence in residue classification across both models. On one hand, residues exhibiting enhanced polarity relative to standard phenylalanine are characterized by the introduction of aliphatic or halogen substituents. Examples encompass 5-methyltryptophan (5-CH<sub>3</sub>-Trp), 5-fluorotryptophan (5-F-Trp), 5-chlorotryptophan (5-Cl-Trp), 1-methyltryptophan (1-CH<sub>3</sub>-Trp), 6-bromotryptophan (6-Br-Trp), and 5-bromotryptophan (5-Br-Trp), characterized by absolute values ranging from 1.37 to 4.07 in Model 1, and 1.79 to 4.66 in Model 2. On the other hand, polar residues are exemplified by 5-aminotryptophan (5-NH<sub>2</sub>-Trp) and 5-hydroxytryptophan (5-OH-Trp), exhibiting values of –0.24 and 0.42 in Model 1, and 0.01 and 0.28 in Model 2, respectively. While the trend holds true for hydrophilic residues, certain alterations in the order become evident in the case of hydrophobic derivatives, particularly noticeable in the order of bromine and methyl derivatives.</p>
<p id="p-40">In this case, divergent values compared to experimental ones are, in both models, the two compounds with bromine atoms: 5-Br-Trp and 6-Br-Trp, being always too lipophilic. For 5-bromotryptophan, the difference is between 1.56 and 1.73 log<italic>P</italic> units, and for 6-bromotryptohan is between 1.34 and 2.29. The rest of cases maintain values lower than 1 log<italic>P</italic> unit.</p>
</sec>
</sec>
<sec id="t3-3">
<title>Lysine derivates</title>
<p id="p-41">This amino acid represents the most frequently post-translationally modified so it is no coincidence its impact on protein regulation and function [<xref ref-type="bibr" rid="B34">34</xref>]. The reference log<italic>P</italic> value for standard lysine is taken from Zamora et al. [<xref ref-type="bibr" rid="B10">10</xref>], which gives an approximate log<italic>P</italic> of –0.40 for the amide model (the derived experimental log<italic>P</italic> from the Fauchère’s experimental [<xref ref-type="bibr" rid="B30">30</xref>] log<italic>D</italic><sub>7.4</sub> = –3.07 and using a pKa = 10.0 yields an experimental log<italic>P</italic> of –0.47) and 0.17 for the <italic>N</italic>-acetyl-L-amino-acid-<italic>N</italic>-methyl amide (Model 1) residue (see <xref ref-type="sec" rid="s-suppl">Table S13</xref>). Based on that, as can be seen in <xref ref-type="fig" rid="fig6">Figure 6</xref>, most lipophilic nonstandard residue is <italic>S</italic>-allylcysteine (Sac), which have almost identical values in one each model, around ~1.30, respectively. Absolute values can be checked in <xref ref-type="sec" rid="s-suppl">Table S18</xref>.</p>
<fig id="fig6" position="float">
<label>Figure 6</label>
<caption>
<p id="fig6-p-1">Partition coefficients for lysine (Lys) derivatives using Models 1 (left) and Models 2 (right). Standard Lys residue value is present in the central line of each representation. Nonstandard residue values more lipophilic and more hydrophilic than the original one, are represented in yellow and blue, respectively. Experimental values are represented in orange bars. Detailed experimental data can be found in <xref ref-type="sec" rid="s-suppl">Table S18</xref>. For more detailed information from the Lys log<italic>P</italic> reference value (for Models 1 and 2), check <uri xlink:href="http://">Supplementary material</uri></p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g006.tif" />
</fig>
<p id="p-42">However, discrepancies manifest in the two other cases. Concerning <italic>N</italic>-propargyloxycarbonyl-lysine [(Pro)Lys], Model 1 considers it slightly polar (–0.45), whereas Model 2 positions it distinctly as more apolar (0.57), but in both cases more apolar compared to coded lysine (1.11). Let us mention that, these differences, although not negligible, are within the range found even in experimental measurements.</p>
<p id="p-43">According to <italic>N</italic>-acetyl-lysine [(Ac)Lys], Model 1 denotes an extremely hydrophilic characterization of –1.64, while Model 2 persists in –0.39. Chemically insight underscores the incorporation of an ACE group, analogous to (Boc)Lys and [(Pro)Lys], that should provoke a slight increase in the lipophilicity. Consequently, Model 1 tends to excessively accentuate the hydrophilic trait of this residue, while Model 2’s depiction is more aligned with a hydrophobic profile. However, the tendency is to be more hydrophilic than the standard version of the amino acid.</p>
<p id="p-44">In this case, the comparison with experimental data shows that all cases in both Models almost have a perfect fitting, presenting a difference of lower than 1 unit. In Model 1, the most deviated case has a 0.75 units divergence while in Model 2 is 0.68 units.</p>
</sec>
<sec id="t3-4">
<title>Proline derivates</title>
<p id="p-45">In the context of proline residues, their examination was previously undertaken by Matamoros et al. in 2022 [<xref ref-type="bibr" rid="B35">35</xref>], employing the SMD solvation approach [<xref ref-type="bibr" rid="B36">36</xref>], In the current study, we subject these residues to analysis via our IEFPCM/MST methodology. As illustrated in <xref ref-type="fig" rid="fig7">Figure 7</xref> and detailed in <xref ref-type="sec" rid="s-suppl">Table S19</xref>, the outcomes affirm the comparable efficacy of our approach, thus rendering it well-suited and eminently applicable for extending our scale of lipophilicity.</p>
<fig id="fig7" position="float">
<label>Figure 7</label>
<caption>
<p id="fig7-p-1">Partition coefficient for proline (Pro) derivatives using Models 1 (up) and 2 (down). Standard Pro residue value is present in the central line of each representation. Nonstandard residue values more lipophilic and more hydrophilic than the original one, are represented in yellow and blue, respectively. Detailed experimental values can be found in <xref ref-type="sec" rid="s-suppl">Table S19</xref>. For more detailed information from the Pro log<italic>P</italic> reference value (for Models 1 and 2), check <uri xlink:href="http://">Supplementary material</uri></p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g007.tif" />
</fig>
<p id="p-46">Regarding proline, in general, all cases maintain a difference with respect to the experimental value, lower than 2 units of log<italic>P</italic> in both models. Only dehydroproline (Dhp) in Model 1, presents a deviation of 2.26 log<italic>P</italic> units, presenting an excessive hydrophilic profile due to the capacity of performing hydrogen bond interaction of the NH group.</p>
</sec>
<sec id="t3-5">
<title>General correlation between experimental and computational data</title>
<p id="p-47">Regarding the correlation between experimental and computational estimations, <xref ref-type="fig" rid="fig8">Figures 8</xref> and <xref ref-type="fig" rid="fig9">9</xref> reveal a noteworthy similarity between the two models. Both exhibit a correlation coefficient (R<sup>2</sup>) that is moderately acceptable—0.73 for Model 1 and 0.71 for Model 2. Also, the root mean square error (RMSE) for Model 1 is 0.7, while Model 2 stands at 0.9. Furthermore, additional statistical parameters such as MSE and mean unsigned error (MUE) also indicate a consistent pattern across both models. Despite the subtle differences, Model 1 demonstrates a stronger correlation and exhibits lower error when compared to the experimental values. This observation aligns coherently with our previously published findings that utilized similar capping groups as those in Model 1.</p>
<fig id="fig8" position="float">
<label>Figure 8</label>
<caption>
<p id="fig8-p-1">Correlation between calculated log<italic>P</italic> (corrected by eliminating the influence of capping groups of Model 1) (axis X) and experimental log<italic>P</italic> values reported by Kubyshkin (axis Y). Groups of residues are represented in different patterns of colors: methionine (yellow), tyrosine (green), phenylalanine (orange), tryptophan (grey), lysine (blue), and proline (red)</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g008.tif" />
</fig>
<fig id="fig9" position="float">
<label>Figure 9</label>
<caption>
<p id="fig9-p-1">Correlation between calculated log<italic>P</italic> (corrected by eliminating the influence of capping groups of Model 2) (axis X) and experimental log<italic>P</italic> values reported by Kubyshkin (axis Y). Groups of residues are represented in different patterns of colors: methionine (yellow), tyrosine (green), phenylalanine (orange), tryptophan (grey), lysine (blue), and proline (red)</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g009.tif" />
</fig>
<p id="p-48">Delving into specifics, it becomes evident that indistinctly of the model considered, all methionine and tyrosine residues (yellow and green colored dots in <xref ref-type="fig" rid="fig8">Figures 8</xref> and <xref ref-type="fig" rid="fig9">9</xref>, respectively) consistently exhibit present values with a discrepancy not higher than 1.2 log<italic>P</italic> units. Similarly, in the case of lysine is even better, remaining below than 1 log<italic>P</italic> unit in all cases (blue colored dots in <xref ref-type="fig" rid="fig8">Figures 8</xref> and <xref ref-type="fig" rid="fig9">9</xref>). This can be translated into the fact that there is hardly any difference between the experimental values and those reproduced computationally. It’s worth noting that a deviation near 1 log<italic>P</italic> unit can often be attributed to inherent errors within the method itself.</p>
<p id="p-49">As regards the other derivatives, in general trend is maintained, however, certain cases with notably substantial discrepancies have come to light. In the case of the phenylalanine derivatives (orange-colored dots in <xref ref-type="fig" rid="fig8">Figures 8</xref> and <xref ref-type="fig" rid="fig9">9</xref>), the Aha derivative (4-N<sub>3</sub>-Phe) in Model 1, presents a deviation of 2.13 units from the experimental value, though this deviation is somewhat mitigated in Model 2 (1.32 units). An underlying explanation could be associated with the azide group present within the side chain. Despite the group’s net charge being neutral, there exists a subtle polarization distributed across its nitrogen atoms. This charge distribution potentially contributes to deviations and fluctuations in accurately estimating the compound’s lipophilicity [<xref ref-type="bibr" rid="B37">37</xref>–<xref ref-type="bibr" rid="B42">42</xref>]. The difference of 0.81 units in the assessment of the identical residue across Model 1 and Model 2 might arise from the distinct origins of their unadjusted initial values. In Model 1, the original value comes from a measurement involving the NME capping group, introducing a hydrogen bond interaction that doesn’t occur with the OME capping in Model 2. Consequently, this residue could potentially be overestimated as hydrophilic, driven by the presence of the NME capping group. This last aspect is also observed in the most deviated case from the proline dataset (red dots in <xref ref-type="fig" rid="fig8">Figures 8</xref> and <xref ref-type="fig" rid="fig9">9</xref>), Dhp in the case of Model 1 deviates 2.26 units more hydrophilic than the experimental one.</p>
<p id="p-50">Another pattern observed in deviated cases is the presence of bromine atoms, more specifically, in the case of phenylalanine and tryptophan residues (orange and grey colored dots in figures 8 and 9, respectively), 4-Br-Phe, 5-Br-Trp and 6-Br-Trp present a more marked difference. While the rest of the residues present a deviation around 1 log<italic>P</italic> unit, these cases move around 1.34 and 2.29, between both models. The bromine atom is a relatively heavy atom compared to other lighter halogens like fluor and chlorine (deviations around 0–0.8 log<italic>P</italic> units) and it has unique electronic properties due to its larger size and higher atomic number. These factors can influence the interactions of bromine with its surrounding environment, including solvent molecules and other atoms in a molecule.</p>
<p id="p-51">Another potential source of mismatch between experimental and computational results can be attributed to the fact that IEFPCM/MST method is an implicit solvation model, that treats the solvent as a continuous dielectric medium, simplifying the simulation and reducing the computational cost. This approach permits to be more efficient but sometimes can oversimplify the solvent behavior and fail to capture specific solvent-solute interactions accurately. Contrary to that explicit solvation models represent individual solvent molecules, which can sometimes permit a detailed description of these interactions. For instance, the polarized structure-specific backbone charge (PSBC) explicit model has been successful in predicting both the experimental folding of helical peptides [<xref ref-type="bibr" rid="B41">41</xref>] and <italic>β</italic>-sheet structures [<xref ref-type="bibr" rid="B42">42</xref>] thanks to considering the polarizability of backbone hydrogen bonds by implementing the partial charges of backbone hydrogen-bond donor and acceptor atoms during peptide folding simulations. However, despite their differences some bibliography holds that for predicting solvation energies and partition coefficients, both methods can perform quite reasonable results [<xref ref-type="bibr" rid="B43">43</xref>, <xref ref-type="bibr" rid="B44">44</xref>].</p>
</sec>
<sec id="t3-6">
<title>Application of non-standard amino acids in proteomics</title>
<p id="p-52">Acetylation is a relevant post-translational modification that is mainly carried out in both the <italic>ε</italic>-amine on the side chain of lysine and in the <italic>α</italic>-amine of the N-terminus in peptides and proteins [<xref ref-type="bibr" rid="B45">45</xref>]. In health and pathological states, the reversible acetylation of lysine residues plays a crucial role in regulating cellular and developmental processes. These facts make the correct identification of acetylated peptides and proteins a constantly developing field in modern proteomics [<xref ref-type="bibr" rid="B46">46</xref>]. In this context, experimental studies have analyzed the impact of peptide acetylation on chromatographic retention time in reversed phase-high performance liquid chromatography (RP HPLC) in order to create predictive models that suggest an efficient way for the separation of these peptides that will allow their identification [<xref ref-type="bibr" rid="B46">46</xref>].</p>
<p id="p-53">
<xref ref-type="table" rid="t1">Table 1</xref> reports the experimental hydrophobicity index (ΔHI) obtained by Mizero and collaborators [<xref ref-type="bibr" rid="B47">47</xref>], calculated as the difference between the hydrophobicity index for modified (acetylated) and non-modified peptide pairs expressed in % acetonitrile (% ACN). As can be seen, it is evident that the greater the change in the degree of acetylation in the lysines of the peptide pairs, the greater the amount of organic solvent (% ACN) will be necessary.</p>
<table-wrap id="t1">
<label>Table 1</label>
<caption>
<p id="t1-p-1">Variation of the experimental hydrophobicity index (HI) using as separation mode acetonitrile (% ACN) in RP HPLC 0.1 % of formic acid for modified (acetylated) and non-modified peptide pairs</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th>
<bold>Acetylated lysine residues in peptide (number of peptide pairs)</bold>
</th>
<th>
<bold>Experimental hydrophobicity index (ΔHI) in RP HPLC 0.1% formic acid (% ACN)</bold>
</th>
<th>
<bold>Δ(Ac)Lys</bold>
</th>
<th>
<bold>ΔΔHI/Δ(Ac)Lys</bold>
</th>
</tr>
</thead>
<tbody>
<tr>
<td>                    0 (10,632)</td>
<td>                                  5.02</td>
<td>      -</td>
<td>       -</td>
</tr>
<tr>
<td>                    1 (13,791)</td>
<td>                                  9.14</td>
<td>      1</td>
<td>     4.12</td>
</tr>
<tr>
<td>                    2 (2,390)</td>
<td>                                  11.20</td>
<td>      2</td>
<td>     6.18</td>
</tr>
<tr>
<td>                    3 (316)</td>
<td>                                  12.54</td>
<td>      3</td>
<td>     7.52</td>
</tr>
</tbody>
</table>
</table-wrap>
<p id="p-54">
<xref ref-type="fig" rid="fig10">Figure 10</xref> depicts the derivative of the change in the hydrophobic index with respect to the change in (Ac)Lys residues in the modified/non-modified pairs [ΔΔHI/Δ(Ac)Lys] from which the slope permit to obtain the increase in hydrophobicity due to the acetylation of a lysine residue (~1.70 units).</p>
<fig id="fig10" position="float">
<label>Figure 10</label>
<caption>
<p id="fig10-p-1">Representation of the variation of the experimental hydrophobic index (% ACN) by the change in the number of acetylated lysines in peptide pairs as a function of the change of acetylated lysines in peptide pairs</p>
</caption>
<graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="eds-02-100853-g010.tif" />
</fig>
<p id="p-55">In order to further evaluate the reliability of the predictions of the calculations performed in this work, <xref ref-type="table" rid="t2">Table 2</xref> reports the increase of hydrophobicity under the acetylation of lysine residues (Δlog<italic>P</italic><sub>Ac</sub>) using our computations but also those obtained of ChemAxon [<xref ref-type="bibr" rid="B48">48</xref>] and milogP [<xref ref-type="bibr" rid="B49">49</xref>]. Let us mention that HPLC separation systems are carried out under acidic conditions (pH around 2). Therefore, our reported value of –3.07 refers mainly to the partitioning of the ionic species (log<italic>D</italic><sub>2</sub>) and not to the neutral species (log<italic>P</italic>). For acetylated lysine, the reported value corresponds to the log<italic>P</italic>. Thus, since our prediction (~1.43 log<italic>P</italic> units) is close to that obtained experimentally (see <xref ref-type="fig" rid="fig10">Figure 10</xref>), it can be used to efficiently predict experimental HPLC conditions to separate acetylated peptides and thus, be used for proteomic studies.</p>
<table-wrap id="t2">
<label>Table 2</label>
<caption>
<p id="t2-p-1">Partition coefficients (log<italic>P</italic>) values for lysine (Lys) and acetyllysine [(Ac)Lys] using the capping groups of the Model 1 and change in lipophilicity due to acetylation (Δlog<italic>P</italic><sub>Ac</sub>) of lysine residues</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th rowspan="2">                <break />             <bold>Amino acid code</bold></th>
<th colspan="2">                             <bold>Lipophilicity</bold></th>
<th rowspan="2">                  <break />          <bold>Δlog<italic>P</italic><sub>Ac</sub></bold></th>
</tr>
<tr>
<th>        <bold>Lys (log<italic>D</italic><italic><sub>2</sub></italic>)</bold></th>
<th>        <bold>(Ac)Lys (log<italic>P</italic>)</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td>                  This work</td>
<td>              –3.07</td>
<td>                –1.64</td>
<td>            1.43</td>
</tr>
<tr>
<td>                 ChemAxon</td>
<td>              –4.51</td>
<td>                –1.66</td>
<td>            2.85</td>
</tr>
<tr>
<td>                     milogP</td>
<td>              –3.73</td>
<td>                –1.25</td>
<td>            2.48</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s4">
<title>Discussion</title>
<p id="p-56">The lipophilicity of amino acids is one of the main physicochemical properties of these biomolecules as it gives an estimate of solubility, binding propensity, and bioavailability. In this work we show how several structural modifications in residues such as methionine, aromatic, lysine, and proline can tune the hydrophobic properties of these residues, opening a window of possibilities to be used as a guide for the design of peptides and proteins with tailor-made characteristics. The structural models used, based on differences in capping groups showed mostly important similarities, validating the lipophilicity values obtained for the non-standard side chains.</p>
<p id="p-57">Delving into the specifics of the deviations in both number and magnitude, the results presented herein demonstrate considerable promise. Evaluating the proposed models and considering that deviations of up to 2 log<italic>P</italic> units fall within the expected variation for the estimated parameter [<xref ref-type="bibr" rid="B50">50</xref>], we can observe that out of the 126 estimated cases (considering Models 1 and 2) only 3 surpass the threshold of two units. This translates to a deviation rate of less than 2.5% across the dataset. Notably, amino acids such as methionine, tyrosine, and lysine exhibit no instances surpassing this limit. Even employing a stricter criterion for all the sets (deviation exceeding 1 log<italic>P</italic> unit), still 80% of the cases remain within an acceptable range of accuracy. As previously pointed out in this study, the calculated values and associated errors demonstrate promise, aligning well with those reported in previous research on widely studied canonical amino acids with established functional groups [<xref ref-type="bibr" rid="B10">10</xref>]. Once again, the IEFPCM/MST model has demonstrated good accuracy with minimal uncertainties, a performance consistently reflected in the SAMPL blind challenges [<xref ref-type="bibr" rid="B51">51</xref>, <xref ref-type="bibr" rid="B52">52</xref>]</p>
<p id="p-58">Differences were found in fewer cases, which can be expected as one model uses a hydrogen bond donor (Model 1) while the other uses a hydrogen bond acceptor (Model 2), this lies in the effect of the polarizability on the atoms in the backbone which includes the capping groups [<xref ref-type="bibr" rid="B41">41</xref>, <xref ref-type="bibr" rid="B42">42</xref>]. In general, both models correlate well with the experimental values, obtaining lower statistical errors in the case of Model 1.</p>
<p id="p-59">In addition, our predictions were able to efficiently predict the experimental hydrophobicity change due to the number of acetylated lysines in peptide pairs determined by HPLC, opening up the possibility that our scale can be employed for proteomics studies that include post-translational modifications beyond acetylation.</p>
<p id="p-60">Overall, this work represents the first computational work to systematically reproduce the lipophilicity values of non-canonical amino acids, paving the way for these can be easily implemented in computational tools related to the calculation of peptide solubility, aggregation, scoring functions of molecular docking programs and also to efficiently predict the presence of post-translational modifications in the area of proteomics.</p>
</sec>
</body>
<back>
<glossary>
<title>Abbreviations</title>
<def-list>
<def-item>
<term>ACE</term>
<def>
<p>acetyl</p>
</def>
</def-item>
<def-item>
<term>(Ac)Lys</term>
<def>
<p>
<italic>N</italic>-acetyl-lysine</p>
</def>
</def-item>
<def-item>
<term>Aha</term>
<def>
<p>azidohomoalanine</p>
</def>
</def-item>
<def-item>
<term>Eth</term>
<def>
<p>ethionine</p>
</def>
</def-item>
<def-item>
<term>IEFPCM/MST</term>
<def>
<p>integral equation formalism polarizable continuum model/miertus-scrocco-tomasi</p>
</def>
</def-item>
<def-item>
<term>Tfnle</term>
<def>
<p>trifluoronorleucine</p>
</def>
</def-item>
<def-item>
<term>NME</term>
<def>
<p>
<italic>N</italic>-methyl</p>
</def>
</def-item>
<def-item>
<term>OME</term>
<def>
<p>
<italic>O</italic>-methyl</p>
</def>
</def-item>
<def-item>
<term>RP HPLC</term>
<def>
<p>reversed phase-high performance liquid chromatography</p>
</def>
</def-item>
<def-item>
<term>4-Br-Phe</term>
<def>
<p>4-bromophenylalanine</p>
</def>
</def-item>
<def-item>
<term>5-Br-Trp</term>
<def>
<p>5-bromotryptophan</p>
</def>
</def-item>
<def-item>
<term>6-Br-Trp</term>
<def>
<p>6-bromotryptophan</p>
</def>
</def-item>
</def-list>
</glossary>
<sec id="s-suppl" sec-type="supplementary-material">
<title>Supplementary materials</title>
<p>The supplementary materials for this article are available at: <uri xlink:href="https://www.explorationpub.com/uploads/Article/file/100853_sup_1.pdf">https://www.explorationpub.com/uploads/Article/file/100853_sup_1.pdf</uri>.</p>
<supplementary-material id="SD1" content-type="local-data">
<media xlink:href="100853_sup_1.pdf" mimetype="application" mime-subtype="pdf"></media>
</supplementary-material>
</sec>
<sec id="s6">
<title>Declarations</title>
<sec id="t-6-1">
<title>Author contributions</title>
<p>AV and WJZ: Conceptualization, Data curation, Formal analysis, Funding acquisition, Investigation, Methodology, Project administration, Resources, Supervision, Writing—original draft, Writing—review &amp; editing. PM and DBR: Investigation, Data curation, Visualization, Writing—review &amp; editing.</p>
</sec>
<sec id="t-6-2" sec-type="COI-statement">
<title>Conflicts of interest</title>
<p>The authors declare that they have no conflicts of interest.</p>
</sec>
<sec id="t-6-3">
<title>Ethical approval</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-4">
<title>Consent to participate</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-5">
<title>Consent to publication</title>
<p>Not applicable.</p>
</sec>
<sec id="t-6-6" sec-type="data-availability">
<title>Availability of data and materials</title>
<p>The datasets generated and/or analyzed for this study can be found in the NSAAs-Lipophilicity Github repository: <uri xlink:href="https://github.com/tviayna/NSAAs-Lipophilicity">https://github.com/tviayna/NSAAs-Lipophilicity</uri>.</p>
</sec>
<sec id="t-6-7">
<title>Funding</title>
<p>The authors thank the Spanish Ministerio de Ciencia e Innovación [PID2020-117646RB-I00, MCIN/AEI/10.13039/501100011033], Generalitat de Catalunya [2021SGR00671], and Consorci de Serveis Universitaris de Catalunya [CSUC; Molecular Recognition project] for financial support. The authors thank the Vice Chancellor for Research of the University of Costa Rica for its support work via the research project [115-C1-450]. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</p>
</sec>
<sec id="t-6-8">
<title>Copyright</title>
<p>© The Author(s) 2024.</p>
</sec>
</sec>
<ref-list>
<ref id="B1">
<label>1</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>von Heijne</surname>
<given-names>G</given-names>
</name>
</person-group>
<article-title>Protein Evolution and Design</article-title>
<source>Annu Rev Biochem</source>
<year iso-8601-date="2018">2018</year>
<volume>87</volume>
<fpage>101</fpage>
<lpage>3</lpage>
<pub-id pub-id-type="doi">10.1146/annurev-biochem-062917-012013</pub-id>
<pub-id pub-id-type="pmid">29925266</pub-id>
</element-citation>
</ref>
<ref id="B2">
<label>2</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Doig</surname>
<given-names>AJ</given-names>
</name>
</person-group>
<article-title>Frozen, but no accident - why the 20 standard amino acids were selected</article-title>
<source>FEBS J</source>
<year iso-8601-date="2017">2017</year>
<volume>284</volume>
<fpage>1296</fpage>
<lpage>305</lpage>
<pub-id pub-id-type="doi">10.1111/febs.13982</pub-id>
<pub-id pub-id-type="pmid">27926995</pub-id>
</element-citation>
</ref>
<ref id="B3">
<label>3</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chin</surname>
<given-names>JW</given-names>
</name>
</person-group>
<article-title>Expanding and reprogramming the genetic code</article-title>
<source>Nature</source>
<year iso-8601-date="2017">2017</year>
<volume>550</volume>
<fpage>53</fpage>
<lpage>60</lpage>
<pub-id pub-id-type="doi">10.1038/nature24031</pub-id>
<pub-id pub-id-type="pmid">28980641</pub-id>
</element-citation>
</ref>
<ref id="B4">
<label>4</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Efremov</surname>
<given-names>RG</given-names>
</name>
<name>
<surname>Chugunov</surname>
<given-names>AO</given-names>
</name>
<name>
<surname>Pyrkov</surname>
<given-names>TV</given-names>
</name>
<name>
<surname>Priestle</surname>
<given-names>JP</given-names>
</name>
<name>
<surname>Arseniev</surname>
<given-names>AS</given-names>
</name>
<name>
<surname>Jacoby</surname>
<given-names>E</given-names>
</name>
</person-group>
<article-title>Molecular lipophilicity in protein modeling and drug design</article-title>
<source>Curr Med Chem</source>
<year iso-8601-date="2007">2007</year>
<volume>14</volume>
<fpage>393</fpage>
<lpage>415</lpage>
<pub-id pub-id-type="doi">10.2174/092986707779941050</pub-id>
<pub-id pub-id-type="pmid">17305542</pub-id>
</element-citation>
</ref>
<ref id="B5">
<label>5</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>G</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>L</given-names>
</name>
</person-group>
<article-title>Predicting Protein Surface Property with its Surface Hydrophobicity</article-title>
<source>Protein Pept Lett</source>
<year iso-8601-date="2021">2021</year>
<volume>28</volume>
<fpage>938</fpage>
<lpage>44</lpage>
<pub-id pub-id-type="doi">10.2174/0929866528666210222160603</pub-id>
<pub-id pub-id-type="pmid">33618636</pub-id>
</element-citation>
</ref>
<ref id="B6">
<label>6</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weinstein</surname>
<given-names>JY</given-names>
</name>
<name>
<surname>Elazar</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Fleishman</surname>
<given-names>SJ</given-names>
</name>
</person-group>
<article-title>A lipophilicity-based energy function for membrane-protein modelling and design</article-title>
<source>PLoS Comput Biol</source>
<year iso-8601-date="2019">2019</year>
<volume>15</volume>
<elocation-id>e1007318</elocation-id>
<pub-id pub-id-type="doi">10.1371/journal.pcbi.1007318</pub-id>
<pub-id pub-id-type="pmid">31461441</pub-id>
<pub-id pub-id-type="pmcid">PMC6736313</pub-id>
</element-citation>
</ref>
<ref id="B7">
<label>7</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simm</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Einloft</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Mirus</surname>
<given-names>O</given-names>
</name>
<name>
<surname>Schleiff</surname>
<given-names>E</given-names>
</name>
</person-group>
<article-title>50 years of amino acid hydrophobicity scales: revisiting the capacity for peptide classification</article-title>
<source>Biol Res</source>
<year iso-8601-date="2016">2016</year>
<volume>49</volume>
<elocation-id>31</elocation-id>
<pub-id pub-id-type="doi">10.1186/s40659-016-0092-5</pub-id>
<pub-id pub-id-type="pmid">27378087</pub-id>
<pub-id pub-id-type="pmcid">PMC4932767</pub-id>
</element-citation>
</ref>
<ref id="B8">
<label>8</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peters</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Elofsson</surname>
<given-names>A</given-names>
</name>
</person-group>
<article-title>Why is the biological hydrophobicity scale more accurate than earlier experimental hydrophobicity scales?</article-title>
<source>Proteins</source>
<year iso-8601-date="2014">2014</year>
<volume>82</volume>
<fpage>2190</fpage>
<lpage>8</lpage>
<pub-id pub-id-type="doi">10.1002/prot.24582</pub-id>
<pub-id pub-id-type="pmid">24753217</pub-id>
</element-citation>
</ref>
<ref id="B9">
<label>9</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>MacCallum</surname>
<given-names>JL</given-names>
</name>
<name>
<surname>Tieleman</surname>
<given-names>DP</given-names>
</name>
</person-group>
<article-title>Hydrophobicity scales: a thermodynamic looking glass into lipid-protein interactions</article-title>
<source>Trends Biochem Sci</source>
<year iso-8601-date="2011">2011</year>
<volume>36</volume>
<fpage>653</fpage>
<lpage>62</lpage>
<pub-id pub-id-type="doi">10.1016/j.tibs.2011.08.003</pub-id>
<pub-id pub-id-type="pmid">21930386</pub-id>
</element-citation>
</ref>
<ref id="B10">
<label>10</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zamora</surname>
<given-names>WJ</given-names>
</name>
<name>
<surname>Campanera</surname>
<given-names>JM</given-names>
</name>
<name>
<surname>Luque</surname>
<given-names>FJ</given-names>
</name>
</person-group>
<article-title>Development of a Structure-Based, pH-Dependent Lipophilicity Scale of Amino Acids from Continuum Solvation Calculations</article-title>
<source>J Phys Chem Lett</source>
<year iso-8601-date="2019">2019</year>
<volume>10</volume>
<fpage>883</fpage>
<lpage>9</lpage>
<pub-id pub-id-type="doi">10.1021/acs.jpclett.9b00028</pub-id>
<pub-id pub-id-type="pmid">30741551</pub-id>
</element-citation>
</ref>
<ref id="B11">
<label>11</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dunbrack</surname>
<given-names>RL Jr</given-names>
</name>
<name>
<surname>Karplus</surname>
<given-names>M</given-names>
</name>
</person-group>
<article-title>Conformational analysis of the backbone-dependent rotamer preferences of protein sidechains</article-title>
<source>Nat Struct Biol</source>
<year iso-8601-date="1994">1994</year>
<volume>1</volume>
<fpage>334</fpage>
<lpage>40</lpage>
<pub-id pub-id-type="doi">10.1038/nsb0594-334</pub-id>
<pub-id pub-id-type="pmid">7664040</pub-id>
</element-citation>
</ref>
<ref id="B12">
<label>12</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Castro</surname>
<given-names>TG</given-names>
</name>
<name>
<surname>Melle-Franco</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Sousa</surname>
<given-names>CEA</given-names>
</name>
<name>
<surname>Cavaco-Paulo</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Marcos</surname>
<given-names>JC</given-names>
</name>
</person-group>
<article-title>Non-Canonical Amino Acids as Building Blocks for Peptidomimetics: Structure, Function, and Applications</article-title>
<source>Biomolecules</source>
<year iso-8601-date="2023">2023</year>
<volume>13</volume>
<elocation-id>981</elocation-id>
<pub-id pub-id-type="doi">10.3390/biom13060981</pub-id>
<pub-id pub-id-type="pmid">37371561</pub-id>
<pub-id pub-id-type="pmcid">PMC10296201</pub-id>
</element-citation>
</ref>
<ref id="B13">
<label>13</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ochoa</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Fox</surname>
<given-names>T</given-names>
</name>
</person-group>
<article-title>Assessing the fast prediction of peptide conformers and the impact of non-natural modifications</article-title>
<source>J Mol Graph Model</source>
<year iso-8601-date="2023">2023</year>
<volume>125</volume>
<elocation-id>108608</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.jmgm.2023.108608</pub-id>
<pub-id pub-id-type="pmid">37659134</pub-id>
</element-citation>
</ref>
<ref id="B14">
<label>14</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jin</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>OJ</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>SH</given-names>
</name>
</person-group>
<article-title>Incorporation of non-standard amino acids into proteins: challenges, recent achievements, and emerging applications</article-title>
<source>Appl Microbiol Biotechnol</source>
<year iso-8601-date="2019">2019</year>
<volume>103</volume>
<fpage>2947</fpage>
<lpage>58</lpage>
<pub-id pub-id-type="doi">10.1007/s00253-019-09690-6</pub-id>
<pub-id pub-id-type="pmid">30790000</pub-id>
<pub-id pub-id-type="pmcid">PMC6449208</pub-id>
</element-citation>
</ref>
<ref id="B15">
<label>15</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>López-López</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Robles</surname>
<given-names>O</given-names>
</name>
<name>
<surname>Plisson</surname>
<given-names>F</given-names>
</name>
<name>
<surname>Medina-Franco</surname>
<given-names>JL</given-names>
</name>
</person-group>
<article-title>Mapping the structure–activity landscape of non-canonical peptides with MAP4 fingerprinting</article-title>
<source>Digital Discovery</source>
<year iso-8601-date="2023">2023</year>
<volume>2</volume>
<fpage>1494</fpage>
<lpage>505</lpage>
<pub-id pub-id-type="doi">10.1039/D3DD00098B</pub-id>
</element-citation>
</ref>
<ref id="B16">
<label>16</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kubyshkin</surname>
<given-names>V</given-names>
</name>
</person-group>
<article-title>Experimental lipophilicity scale for coded and noncoded amino acid residues</article-title>
<source>Org Biomol Chem</source>
<year iso-8601-date="2021">2021</year>
<volume>19</volume>
<fpage>7031</fpage>
<lpage>40</lpage>
<pub-id pub-id-type="doi">10.1039/d1ob01213d</pub-id>
<pub-id pub-id-type="pmid">34333582</pub-id>
</element-citation>
</ref>
<ref id="B17">
<label>17</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oeller</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>RJD</given-names>
</name>
<name>
<surname>Bolt</surname>
<given-names>HL</given-names>
</name>
<name>
<surname>Gomes</surname>
<given-names>Dos Santos AL</given-names>
</name>
<name>
<surname>Weinmann</surname>
<given-names>AL</given-names>
</name>
<name>
<surname>Nikitidis</surname>
<given-names>A</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Sequence-based prediction of the intrinsic solubility of peptides containing non-natural amino acids</article-title>
<source>Nat Commun</source>
<year iso-8601-date="2023">2023</year>
<volume>14</volume>
<elocation-id>7475</elocation-id>
<pub-id pub-id-type="doi">10.1038/s41467-023-42940-w</pub-id>
<pub-id pub-id-type="pmid">37978172</pub-id>
<pub-id pub-id-type="pmcid">PMC10656490</pub-id>
</element-citation>
</ref>
<ref id="B18">
<label>18</label>
<element-citation publication-type="book">
<person-group person-group-type="author">
<name>
<surname>Hansch</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Leo</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Hoekman</surname>
<given-names>D</given-names>
</name>
</person-group>
<article-title>Exploring QSAR: Hydrophobic, electronic, and steric constants</article-title>
<person-group person-group-type="editor">
<name>
<surname>Hansch</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Leo</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Hoekman</surname>
<given-names>D</given-names>
</name>
</person-group>
<source>Exploring QSAR: Hydrophobic, electronic, and steric constants</source>
<publisher-loc>Washington, DC</publisher-loc>
<publisher-name>American Chemcial Society</publisher-name>
<year iso-8601-date="1995">1995</year>
<comment>p. 6.</comment>
</element-citation>
</ref>
<ref id="B19">
<label>19</label>
<element-citation publication-type="web">
<article-title>DataWarrior V6.0.0 [Internet]</article-title>
<comment>Open Molecules; [cited 2024 Jan 30]. Available from: <uri xlink:href="https://openmolecules.org/datawarrior/">https://openmolecules.org/datawarrior/</uri></comment>
</element-citation>
</ref>
<ref id="B20">
<label>20</label>
<element-citation publication-type="web">
<article-title>Basis Sets [Internet]</article-title>
<comment>Gaussian, Inc.; [cited 2024 Jan 30]. Available from: <uri xlink:href="https://gaussian.com/basissets">https://gaussian.com/basissets</uri></comment>
</element-citation>
</ref>
<ref id="B21">
<label>21</label>
<element-citation publication-type="web">
<article-title>Avogadro: an open-source molecular builder and visualization tool. Version 1.1.1 [Internet]</article-title>
<comment>Avogadro Chemistry; c2022 [cited 2024 Jan 30]. Available from: <uri xlink:href="https://avogadro.cc/releases/avogadro_111/">https://avogadro.cc/releases/avogadro_111/</uri></comment>
</element-citation>
</ref>
<ref id="B22">
<label>22</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>O’Boyle</surname>
<given-names>NM</given-names>
</name>
<name>
<surname>Banck</surname>
<given-names>M</given-names>
</name>
<name>
<surname>James</surname>
<given-names>CA</given-names>
</name>
<name>
<surname>Morley</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Vandermeersch</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Hutchison</surname>
<given-names>GR</given-names>
</name>
</person-group>
<article-title>Open Babel: An open chemical toolbox</article-title>
<source>J Cheminform</source>
<year iso-8601-date="2011">2011</year>
<volume>3</volume>
<elocation-id>33</elocation-id>
<pub-id pub-id-type="doi">10.1186/1758-2946-3-33</pub-id>
<pub-id pub-id-type="pmid">21982300</pub-id>
<pub-id pub-id-type="pmcid">PMC3198950</pub-id>
</element-citation>
</ref>
<ref id="B23">
<label>23</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Parr</surname>
<given-names>R</given-names>
</name>
</person-group>
<article-title>Development of the Colle-Salvetti correlation-energy formula into a functional of the electron density</article-title>
<source>Phys Rev B Condens Matter</source>
<year iso-8601-date="1988">1988</year>
<volume>37</volume>
<fpage>785</fpage>
<lpage>9</lpage>
<pub-id pub-id-type="doi">10.1103/physrevb.37.785</pub-id>
<pub-id pub-id-type="pmid">9944570</pub-id>
</element-citation>
</ref>
<ref id="B24">
<label>24</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Becke</surname>
<given-names>AD</given-names>
</name>
</person-group>
<article-title>Density-functional thermochemistry. III. The role of exact exchange</article-title>
<source>J Chem Phys.</source>
<year iso-8601-date="1993">1993</year>
<volume> 98</volume>
<fpage>5648</fpage>
<lpage>52</lpage>
<pub-id pub-id-type="doi">10.1063/1.464913</pub-id>
</element-citation>
</ref>
<ref id="B25">
<label>25</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stephens</surname>
<given-names>PJ</given-names>
</name>
<name>
<surname>Devlin</surname>
<given-names>FJ</given-names>
</name>
<name>
<surname>Chabalowski</surname>
<given-names>CF</given-names>
</name>
<name>
<surname>Frisch</surname>
<given-names>MJ</given-names>
</name>
</person-group>
<article-title>Ab-Initio Calculation of Vibrational Absorption and Circular-Dichroism Spectra Using Density-Functional Force-Fields</article-title>
<source>J Phys Chem-Us</source>
<year iso-8601-date="1994">1994</year>
<volume>98</volume>
<fpage>11623</fpage>
<lpage>27</lpage>
<pub-id pub-id-type="doi">10.1021/j100096a001</pub-id>
</element-citation>
</ref>
<ref id="B26">
<label>26</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Curutchet</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Orozco</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Luque</surname>
<given-names>FJ</given-names>
</name>
</person-group>
<article-title>Solvation in octanol: Parametrization of the continuum MST model</article-title>
<source>J Comput Chem</source>
<year iso-8601-date="2001">2001</year>
<volume>22</volume>
<fpage>1180</fpage>
<lpage>93</lpage>
<pub-id pub-id-type="doi">10.1002/jcc.1076.abs</pub-id>
</element-citation>
</ref>
<ref id="B27">
<label>27</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Curutchet</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Bidon-Chanal</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Soteras</surname>
<given-names>I</given-names>
</name>
<name>
<surname>Orozco</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Luque</surname>
<given-names>FJ</given-names>
</name>
</person-group>
<article-title>MST continuum study of the hydration free energies of monovalent ionic species</article-title>
<source>J Phys Chem B</source>
<year iso-8601-date="2005">2005</year>
<volume>109</volume>
<fpage>3565</fpage>
<lpage>74</lpage>
<pub-id pub-id-type="doi">10.1021/jp047197s</pub-id>
<pub-id pub-id-type="pmid">16851394</pub-id>
</element-citation>
</ref>
<ref id="B28">
<label>28</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Soteras</surname>
<given-names>I</given-names>
</name>
<name>
<surname>Curutchet</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Bidon-Chanal</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Orozco</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Luque</surname>
<given-names>FJ</given-names>
</name>
</person-group>
<article-title>Extension of the MST model to the IEF formalism: HF and B3LYP parametrizations</article-title>
<source>J Mol Struc-Theochem</source>
<year iso-8601-date="2005">2005</year>
<volume>727</volume>
<fpage>29</fpage>
<lpage>40</lpage>
<pub-id pub-id-type="doi">10.1016/j.theochem.2005.02.029</pub-id>
</element-citation>
</ref>
<ref id="B29">
<label>29</label>
<element-citation publication-type="web">
<person-group person-group-type="author">
<name>
<surname>Frisch</surname>
<given-names>MJ</given-names>
</name>
<name>
<surname>Trucks</surname>
<given-names>GW</given-names>
</name>
<name>
<surname>Schlegel</surname>
<given-names>HB</given-names>
</name>
<name>
<surname>Scuseria</surname>
<given-names>GE</given-names>
</name>
<name>
<surname>Robb</surname>
<given-names>MA</given-names>
</name>
<name>
<surname>Cheeseman</surname>
<given-names>JR</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Gaussian 16, Revision C</article-title>
<comment>01 [software]. 2019 Oct 14 [cited 2024 Jan 30]. Available from: <uri xlink:href="https://gaussian.com/gaussian16/">https://gaussian.com/gaussian16/</uri></comment>
</element-citation>
</ref>
<ref id="B30">
<label>30</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fauchère</surname>
<given-names>JL</given-names>
</name>
<name>
<surname>Pliska</surname>
<given-names>V</given-names>
</name>
</person-group>
<article-title>Hydrophobic Parameters Π of Amino Acid Side Chains from the Partitioning of N-Acetyl-Amino Acid Amides</article-title>
<source>Eur J Med Chem</source>
<year iso-8601-date="1983">1983</year>
<volume>18</volume>
<fpage>369</fpage>
<lpage>75</lpage>
</element-citation>
</ref>
<ref id="B31">
<label>31</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Campanera</surname>
<given-names>JM</given-names>
</name>
<name>
<surname>Barril</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Luque</surname>
<given-names>FJ</given-names>
</name>
</person-group>
<article-title>On the transferability of fractional contributions to the hydration free energy of amino acids</article-title>
<source>Theor Chem Acc</source>
<year iso-8601-date="2013">2013</year>
<volume>132</volume>
<elocation-id>1343</elocation-id>
<pub-id pub-id-type="doi">10.1007/s00214-013-1343-y</pub-id>
</element-citation>
</ref>
<ref id="B32">
<label>32</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lim</surname>
<given-names>JM</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>G</given-names>
</name>
<name>
<surname>Levine</surname>
<given-names>RL</given-names>
</name>
</person-group>
<article-title>Methionine in Proteins: It’s Not Just for Protein Initiation Anymore</article-title>
<source>Neurochem Res</source>
<year iso-8601-date="2019">2019</year>
<volume>44</volume>
<fpage>247</fpage>
<lpage>57</lpage>
<pub-id pub-id-type="doi">10.1007/s11064-017-2460-0</pub-id>
<pub-id pub-id-type="pmid">29327308</pub-id>
<pub-id pub-id-type="pmcid">PMC6446232</pub-id>
</element-citation>
</ref>
<ref id="B33">
<label>33</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pinheiro</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Soteras</surname>
<given-names>I</given-names>
</name>
<name>
<surname>Gelpí</surname>
<given-names>JL</given-names>
</name>
<name>
<surname>Dehez</surname>
<given-names>F</given-names>
</name>
<name>
<surname>Chipot</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Luque</surname>
<given-names>FJ</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Structural and energetic study of cation-π-cation interactions in proteins</article-title>
<source>Phys Chem Chem Phys</source>
<year iso-8601-date="2017">2017</year>
<volume>19</volume>
<fpage>9849</fpage>
<lpage>61</lpage>
<pub-id pub-id-type="doi">10.1039/c6cp08448f</pub-id>
<pub-id pub-id-type="pmid">28352893</pub-id>
</element-citation>
</ref>
<ref id="B34">
<label>34</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y</given-names>
</name>
</person-group>
<article-title>Identification of lysine succinylation as a new post-translational modification</article-title>
<source>Nat Chem Biol</source>
<year iso-8601-date="2011">2011</year>
<volume>7</volume>
<fpage>58</fpage>
<lpage>63</lpage>
<pub-id pub-id-type="doi">10.1038/nchembio.495</pub-id>
<pub-id pub-id-type="pmid">21151122</pub-id>
<pub-id pub-id-type="pmcid">PMC3065206</pub-id>
</element-citation>
</ref>
<ref id="B35">
<label>35</label>
<element-citation publication-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Matamoros</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Pinheiro</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Viayna</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Zamora</surname>
<given-names>WJ</given-names>
</name>
</person-group>
<comment>Towards an understanding of the lipophilicity of non-coded amino acids: computational simulations of proline analogs. IEEE 4th International Conference on BioInspired Processing (BIP); 2022 Nov 15–17; Cartago, Costa Rica. IEEE; pp. 1–5.</comment>
<pub-id pub-id-type="doi">10.1109/BIP56202.2022.10032480</pub-id>
</element-citation>
</ref>
<ref id="B36">
<label>36</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marenich</surname>
<given-names>AV</given-names>
</name>
<name>
<surname>Cramer</surname>
<given-names>CJ</given-names>
</name>
<name>
<surname>Truhlar</surname>
<given-names>DG</given-names>
</name>
</person-group>
<article-title>Universal solvation model based on solute electron density and on a continuum model of the solvent defined by the bulk dielectric constant and atomic surface tensions</article-title>
<source>J Phys Chem B</source>
<year iso-8601-date="2009">2009</year>
<volume>113</volume>
<fpage>6378</fpage>
<lpage>96</lpage>
<pub-id pub-id-type="doi">10.1021/jp810292n</pub-id>
<pub-id pub-id-type="pmid">19366259</pub-id>
</element-citation>
</ref>
<ref id="B37">
<label>37</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Soto</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Mark</surname>
<given-names>AE</given-names>
</name>
</person-group>
<article-title>The Effect of the Neglect of Electronic Polarization in Peptide Folding Simulation</article-title>
<source>J Phys Chem B</source>
<year iso-8601-date="2002">2002</year>
<volume>106</volume>
<fpage>12830</fpage>
<lpage>3</lpage>
<pub-id pub-id-type="doi">10.1021/jp026526i</pub-id>
</element-citation>
</ref>
<ref id="B38">
<label>38</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Truhlar</surname>
<given-names>DG</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Mazack</surname>
<given-names>MJM</given-names>
</name>
<name>
<surname>Löffler</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Provorse</surname>
<given-names>MR</given-names>
</name>
<etal>et al.</etal>
</person-group>
<article-title>Explicit polarization: a quantum mechanical framework for developing next generation force fields</article-title>
<source>Acc Chem Res</source>
<year iso-8601-date="2014">2014</year>
<volume>47</volume>
<fpage>2837</fpage>
<lpage>45</lpage>
<pub-id pub-id-type="doi">10.1021/ar5002186</pub-id>
<pub-id pub-id-type="pmid">25098651</pub-id>
<pub-id pub-id-type="pmcid">PMC4165456</pub-id>
</element-citation>
</ref>
<ref id="B39">
<label>39</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yarne</surname>
<given-names>DA</given-names>
</name>
<name>
<surname>Tuckerman</surname>
<given-names>ME</given-names>
</name>
<name>
<surname>Klein</surname>
<given-names>ML</given-names>
</name>
</person-group>
<article-title>Structural and dynamical behavior of an azide anion in water from ab initio molecular dynamics calculations</article-title>
<source>Chem Phys</source>
<year iso-8601-date="2000">2000</year>
<volume>258</volume>
<fpage>163</fpage>
<lpage>9</lpage>
<pub-id pub-id-type="doi">10.1016/S0301-0104(00)00114-2</pub-id>
</element-citation>
</ref>
<ref id="B40">
<label>40</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>York</surname>
<given-names>DM</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>TS</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>W</given-names>
</name>
</person-group>
<article-title>Quantum Mechanical Study of Aqueous Polarization Effects on Biological Macromolecules</article-title>
<source>J Am Chem Soc</source>
<year iso-8601-date="1996">1996</year>
<volume>118</volume>
<fpage>10940</fpage>
<lpage>1</lpage>
<pub-id pub-id-type="doi">10.1021/ja961937w</pub-id>
</element-citation>
</ref>
<ref id="B41">
<label>41</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Lazim</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Yip</surname>
<given-names>YM</given-names>
</name>
</person-group>
<article-title>Incorporating Polarizability of Backbone Hydrogen Bonds Improved Folding of Short α-Helical Peptides</article-title>
<source>Biophys J</source>
<year iso-8601-date="2019">2019</year>
<volume>117</volume>
<fpage>2079</fpage>
<lpage>86</lpage>
<pub-id pub-id-type="doi">10.1016/j.bpj.2019.10.020</pub-id>
<pub-id pub-id-type="pmid">31685242</pub-id>
<pub-id pub-id-type="pmcid">PMC6895711</pub-id>
</element-citation>
</ref>
<ref id="B42">
<label>42</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Yip</surname>
<given-names>TM</given-names>
</name>
</person-group>
<article-title>Application of the polarized structure-specific backbone charge scheme on the folding of Beta3s</article-title>
<source>Chem Phys Lett</source>
<year iso-8601-date="2021">2021</year>
<volume>781</volume>
<elocation-id>138981</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.cplett.2021.138981</pub-id>
</element-citation>
</ref>
<ref id="B43">
<label>43</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>van der Spoel</surname>
<given-names>D</given-names>
</name>
</person-group>
<article-title>Comparison of Implicit and Explicit Solvent Models for the Calculation of Solvation Free Energy in Organic Solvents</article-title>
<source>J Chem Theory Comput</source>
<year iso-8601-date="2017">2017</year>
<volume>13</volume>
<fpage>1034</fpage>
<lpage>43</lpage>
<pub-id pub-id-type="doi">10.1021/acs.jctc.7b00169</pub-id>
<pub-id pub-id-type="pmid">28245118</pub-id>
</element-citation>
</ref>
<ref id="B44">
<label>44</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Shao</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Ho</surname>
<given-names>J</given-names>
</name>
</person-group>
<article-title>Are Explicit Solvent Models More Accurate than Implicit Solvent Models? A Case Study on the Menschutkin Reaction</article-title>
<source>J Phys Chem A</source>
<year iso-8601-date="2019">2019</year>
<volume>123</volume>
<fpage>5580</fpage>
<lpage>9</lpage>
<pub-id pub-id-type="doi">10.1021/acs.jpca.9b03995</pub-id>
<pub-id pub-id-type="pmid">31244115</pub-id>
</element-citation>
</ref>
<ref id="B45">
<label>45</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ree</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Varland</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Arnesen</surname>
<given-names>T</given-names>
</name>
</person-group>
<article-title>Spotlight on protein N-terminal acetylation</article-title>
<source>Exp Mol Med</source>
<year iso-8601-date="2018">2018</year>
<volume>50</volume>
<fpage>1</fpage>
<lpage>13</lpage>
<pub-id pub-id-type="doi">10.1038/s12276-018-0116-z</pub-id>
<pub-id pub-id-type="pmid">30054468</pub-id>
<pub-id pub-id-type="pmcid">PMC6063853</pub-id>
</element-citation>
</ref>
<ref id="B46">
<label>46</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname>
<given-names>K</given-names>
</name>
<name>
<surname>Mousavi</surname>
<given-names>N</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>X</given-names>
</name>
</person-group>
<article-title>Analysis of Lysine Acetylation and Acetylation-like Acylation In Vitro and In Vivo</article-title>
<source>Curr Protoc</source>
<year iso-8601-date="2023">2023</year>
<volume>3</volume>
<elocation-id>e738</elocation-id>
<pub-id pub-id-type="doi">10.1002/cpz1.738</pub-id>
<pub-id pub-id-type="pmid">37184117</pub-id>
</element-citation>
</ref>
<ref id="B47">
<label>47</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mizero</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Yeung</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Spicer</surname>
<given-names>V</given-names>
</name>
<name>
<surname>Krokhin</surname>
<given-names>OV</given-names>
</name>
</person-group>
<article-title>Peptide retention time prediction for peptides with post-translational modifications: N-terminal (α-amine) and lysine (ε-amine) acetylation</article-title>
<source>J Chromatogr A</source>
<year iso-8601-date="2021">2021</year>
<volume>1657</volume>
<elocation-id>462584</elocation-id>
<pub-id pub-id-type="doi">10.1016/j.chroma.2021.462584</pub-id>
<pub-id pub-id-type="pmid">34619563</pub-id>
</element-citation>
</ref>
<ref id="B48">
<label>48</label>
<element-citation publication-type="web">
<article-title>Marvin Desktop Suite version 23.16.0 [Internet]</article-title>
<comment>Chemaxon Ltd.; c1998–2024 [cited 2024 Jan 30]. Available from: <uri xlink:href="https://chemaxon.com">https://chemaxon.com</uri></comment>
</element-citation>
</ref>
<ref id="B49">
<label>49</label>
<element-citation publication-type="web">
<article-title>Molinspiration Cheminformatics free web services [Internet]</article-title>
<comment>Slovensky Grob: Molinspiration Cheminformatics; c2024 [cited 2024 Jan 30]. Available from: <uri xlink:href="https://www.molinspiration.com/cgi/properties">https://www.molinspiration.com/cgi/properties</uri></comment>
</element-citation>
</ref>
<ref id="B50">
<label>50</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Işık</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Bergazin</surname>
<given-names>TD</given-names>
</name>
<name>
<surname>Fox</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Rizzi</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Chodera</surname>
<given-names>JD</given-names>
</name>
<name>
<surname>Mobley</surname>
<given-names>DL</given-names>
</name>
</person-group>
<article-title>Assessing the accuracy of octanol-water partition coefficient predictions in the SAMPL6 Part II log P Challenge</article-title>
<source>J Comput Aided Mol Des</source>
<year iso-8601-date="2020">2020</year>
<volume>34</volume>
<fpage>335</fpage>
<lpage>70</lpage>
<pub-id pub-id-type="doi">10.1007/s10822-020-00295-0</pub-id>
<pub-id pub-id-type="pmid">32107702</pub-id>
<pub-id pub-id-type="pmcid">PMC7138020</pub-id>
</element-citation>
</ref>
<ref id="B51">
<label>51</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zamora</surname>
<given-names>WJ</given-names>
</name>
<name>
<surname>Pinheiro</surname>
<given-names>S</given-names>
</name>
<name>
<surname>German</surname>
<given-names>K</given-names>
</name>
<name>
<surname>Ràfols</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Curutchet</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Luque</surname>
<given-names>FJ</given-names>
</name>
</person-group>
<article-title>Prediction of the n-octanol/water partition coefficients in the SAMPL6 blind challenge from MST continuum solvation calculations</article-title>
<source>J Comput Aided Mol Des</source>
<year iso-8601-date="2020">2020</year>
<volume>34</volume>
<fpage>443</fpage>
<lpage>51</lpage>
<pub-id pub-id-type="doi">10.1007/s10822-019-00262-4</pub-id>
<pub-id pub-id-type="pmid">31776809</pub-id>
</element-citation>
</ref>
<ref id="B52">
<label>52</label>
<element-citation publication-type="journal">
<person-group person-group-type="author">
<name>
<surname>Viayna</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Pinheiro</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Curutchet</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Luque</surname>
<given-names>FJ</given-names>
</name>
<name>
<surname>Zamora</surname>
<given-names>WJ</given-names>
</name>
</person-group>
<article-title>Prediction of n-octanol/water partition coefficients and acidity constants (pK<sub>a</sub>) in the SAMPL7 blind challenge with the IEFPCM-MST model</article-title>
<source>J Comput Aided Mol Des</source>
<year iso-8601-date="2021">2021</year>
<volume>35</volume>
<fpage>803</fpage>
<lpage>11</lpage>
<pub-id pub-id-type="doi">10.1007/s10822-021-00394-6</pub-id>
<pub-id pub-id-type="pmid">34244905</pub-id>
<pub-id pub-id-type="pmcid">PMC8295120</pub-id>
</element-citation>
</ref>
</ref-list>
</back>
</article>