From b860be0e5f12873c34d6efb367c2d9d722a666a4 Mon Sep 17 00:00:00 2001 From: Giovanni Stracquadanio Date: Thu, 4 Jul 2024 13:42:16 +0100 Subject: [PATCH] new: official release --- .bumpversion.toml | 24 + .devcontainer.json | 37 + .gitignore | 11 + LICENSE | 617 ++ bin/downstream.py | 766 ++ bin/miscellaneous.py | 836 ++ bin/models.py | 824 ++ bin/train.py | 1003 +++ bin/utilities.py | 2241 +++++ conf/base.config | 214 + containers/Dockerfile | 39 + containers/environment.yml | 27 + main.nf | 1744 ++++ nextflow.config | 8 + readme.md | 161 + testdata/1gs5.pdb | 2701 ++++++ testdata/1gs5_Repair_0_ST.fxout | 1 + testdata/MDH-Eukaryota-test.fasta | 300 + testdata/MDH-Human-seed-test.fasta | 3 + testdata/argB-short.fasta | 2 + testdata/argB.fasta | 6 + ...ataset-with-energies-short-sequences.fasta | 62 + testdata/dataset-with-energies.fasta | 7206 +++++++++++++++++ 23 files changed, 18833 insertions(+) create mode 100644 .bumpversion.toml create mode 100644 .devcontainer.json create mode 100644 .gitignore create mode 100644 LICENSE create mode 100755 bin/downstream.py create mode 100755 bin/miscellaneous.py create mode 100755 bin/models.py create mode 100755 bin/train.py create mode 100755 bin/utilities.py create mode 100644 conf/base.config create mode 100644 containers/Dockerfile create mode 100644 containers/environment.yml create mode 100644 main.nf create mode 100644 nextflow.config create mode 100644 readme.md create mode 100644 testdata/1gs5.pdb create mode 100644 testdata/1gs5_Repair_0_ST.fxout create mode 100644 testdata/MDH-Eukaryota-test.fasta create mode 100644 testdata/MDH-Human-seed-test.fasta create mode 100644 testdata/argB-short.fasta create mode 100644 testdata/argB.fasta create mode 100644 testdata/dataset-with-energies-short-sequences.fasta create mode 100644 testdata/dataset-with-energies.fasta diff --git a/.bumpversion.toml b/.bumpversion.toml new file mode 100644 index 0000000..62ceb9d --- /dev/null +++ b/.bumpversion.toml @@ -0,0 +1,24 @@ 
+[tool.bumpversion] +current_version = "1.0.0" +parse = "(?P<major>\\d+)\\.(?P<minor>\\d+)\\.(?P<patch>\\d+)" +serialize = ["{major}.{minor}.{patch}"] +search = "{current_version}" +replace = "{new_version}" +regex = false +ignore_missing_version = false +ignore_missing_files = false +tag = true +sign_tags = false +tag_name = "v{new_version}" +tag_message = "Bump version: {current_version} → {new_version}" +allow_dirty = false +commit = true +message = "Bump version: {current_version} → {new_version}" +commit_args = "" + +[[tool.bumpversion.files]] +filename = "readme.md" + +[[tool.bumpversion.files]] +filename = "containers/Dockerfile" + diff --git a/.devcontainer.json b/.devcontainer.json new file mode 100644 index 0000000..9709b11 --- /dev/null +++ b/.devcontainer.json @@ -0,0 +1,37 @@ +{ + // setup a container to develop a python package using miniconda3 + "name": "prevent-nf", + "dockerFile": "containers/Dockerfile", + "context": ".", + "build": {"args": {"CONDA_FILE": "containers/environment.yml"}}, + + // Set *default* container specific settings.json values. 
+ "settings": { + + "terminal.integrated.profiles.linux": { + "bash": { + "path": "/bin/bash", + } + }, + "terminal.integrated.defaultProfile.windows": "bash", + "python.pythonPath": "/opt/conda/bin/python", + "python.formatting.provider": "black", + "python.formatting.blackPath": "/opt/conda/bin/black", + "[python]": { + "editor.rulers": [ + 90 + ] + }, + }, + + // extensions for vscode + "extensions": [ + "ms-python.python", + "stkb.rewrap", + "donjayamanne.githistory", + "aaron-bond.better-comments", + "gruntfuggly.todo-tree", + "mhutchie.git-graph" + ], + +} \ No newline at end of file diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..6a36724 --- /dev/null +++ b/.gitignore @@ -0,0 +1,11 @@ +work/ +results/ +logs/ +preprocessing/ +postprocessing/ +foldx-downloads/ +.DS_Store +*.pyc +.vscode +.nextflow* +optimizing_input.ipynb \ No newline at end of file diff --git a/LICENSE b/LICENSE new file mode 100644 index 0000000..e10ded3 --- /dev/null +++ b/LICENSE @@ -0,0 +1,617 @@ + GNU AFFERO GENERAL PUBLIC LICENSE + Version 3, 19 November 2007 + + Copyright (C) 2007 Free Software Foundation, Inc. + Everyone is permitted to copy and distribute verbatim copies + of this license document, but changing it is not allowed. + + Preamble + + The GNU Affero General Public License is a free, copyleft license for +software and other kinds of works, specifically designed to ensure +cooperation with the community in the case of network server software. + + The licenses for most software and other practical works are designed +to take away your freedom to share and change the works. By contrast, +our General Public Licenses are intended to guarantee your freedom to +share and change all versions of a program--to make sure it remains free +software for all its users. + + When we speak of free software, we are referring to freedom, not +price. 
Our General Public Licenses are designed to make sure that you +have the freedom to distribute copies of free software (and charge for +them if you wish), that you receive source code or can get it if you +want it, that you can change the software or use pieces of it in new +free programs, and that you know you can do these things. + + Developers that use our General Public Licenses protect your rights +with two steps: (1) assert copyright on the software, and (2) offer +you this License which gives you legal permission to copy, distribute +and/or modify the software. + + A secondary benefit of defending all users' freedom is that +improvements made in alternate versions of the program, if they +receive widespread use, become available for other developers to +incorporate. Many developers of free software are heartened and +encouraged by the resulting cooperation. However, in the case of +software used on network servers, this result may fail to come about. +The GNU General Public License permits making a modified version and +letting the public access it on a server without ever releasing its +source code to the public. + + The GNU Affero General Public License is designed specifically to +ensure that, in such cases, the modified source code becomes available +to the community. It requires the operator of a network server to +provide the source code of the modified version running there to the +users of that server. Therefore, public use of a modified version, on +a publicly accessible server, gives the public access to the source +code of the modified version. + + An older license, called the Affero General Public License and +published by Affero, was designed to accomplish similar goals. This is +a different license, not a version of the Affero GPL, but Affero has +released a new version of the Affero GPL which permits relicensing under +this license. + + The precise terms and conditions for copying, distribution and +modification follow. 
+ + TERMS AND CONDITIONS + + 0. Definitions. + + "This License" refers to version 3 of the GNU Affero General Public License. + + "Copyright" also means copyright-like laws that apply to other kinds of +works, such as semiconductor masks. + + "The Program" refers to any copyrightable work licensed under this +License. Each licensee is addressed as "you". "Licensees" and +"recipients" may be individuals or organizations. + + To "modify" a work means to copy from or adapt all or part of the work +in a fashion requiring copyright permission, other than the making of an +exact copy. The resulting work is called a "modified version" of the +earlier work or a work "based on" the earlier work. + + A "covered work" means either the unmodified Program or a work based +on the Program. + + To "propagate" a work means to do anything with it that, without +permission, would make you directly or secondarily liable for +infringement under applicable copyright law, except executing it on a +computer or modifying a private copy. Propagation includes copying, +distribution (with or without modification), making available to the +public, and in some countries other activities as well. + + To "convey" a work means any kind of propagation that enables other +parties to make or receive copies. Mere interaction with a user through +a computer network, with no transfer of a copy, is not conveying. + + An interactive user interface displays "Appropriate Legal Notices" +to the extent that it includes a convenient and prominently visible +feature that (1) displays an appropriate copyright notice, and (2) +tells the user that there is no warranty for the work (except to the +extent that warranties are provided), that licensees may convey the +work under this License, and how to view a copy of this License. If +the interface presents a list of user commands or options, such as a +menu, a prominent item in the list meets this criterion. + + 1. Source Code. 
+ + The "source code" for a work means the preferred form of the work +for making modifications to it. "Object code" means any non-source +form of a work. + + A "Standard Interface" means an interface that either is an official +standard defined by a recognized standards body, or, in the case of +interfaces specified for a particular programming language, one that +is widely used among developers working in that language. + + The "System Libraries" of an executable work include anything, other +than the work as a whole, that (a) is included in the normal form of +packaging a Major Component, but which is not part of that Major +Component, and (b) serves only to enable use of the work with that +Major Component, or to implement a Standard Interface for which an +implementation is available to the public in source code form. A +"Major Component", in this context, means a major essential component +(kernel, window system, and so on) of the specific operating system +(if any) on which the executable work runs, or a compiler used to +produce the work, or an object code interpreter used to run it. + + The "Corresponding Source" for a work in object code form means all +the source code needed to generate, install, and (for an executable +work) run the object code and to modify the work, including scripts to +control those activities. However, it does not include the work's +System Libraries, or general-purpose tools or generally available free +programs which are used unmodified in performing those activities but +which are not part of the work. For example, Corresponding Source +includes interface definition files associated with source files for +the work, and the source code for shared libraries and dynamically +linked subprograms that the work is specifically designed to require, +such as by intimate data communication or control flow between those +subprograms and other parts of the work. 
+ + The Corresponding Source need not include anything that users +can regenerate automatically from other parts of the Corresponding +Source. + + The Corresponding Source for a work in source code form is that +same work. + + 2. Basic Permissions. + + All rights granted under this License are granted for the term of +copyright on the Program, and are irrevocable provided the stated +conditions are met. This License explicitly affirms your unlimited +permission to run the unmodified Program. The output from running a +covered work is covered by this License only if the output, given its +content, constitutes a covered work. This License acknowledges your +rights of fair use or other equivalent, as provided by copyright law. + + You may make, run and propagate covered works that you do not +convey, without conditions so long as your license otherwise remains +in force. You may convey covered works to others for the sole purpose +of having them make modifications exclusively for you, or provide you +with facilities for running those works, provided that you comply with +the terms of this License in conveying all material for which you do +not control copyright. Those thus making or running the covered works +for you must do so exclusively on your behalf, under your direction +and control, on terms that prohibit them from making any copies of +your copyrighted material outside their relationship with you. + + Conveying under any other circumstances is permitted solely under +the conditions stated below. Sublicensing is not allowed; section 10 +makes it unnecessary. + + 3. Protecting Users' Legal Rights From Anti-Circumvention Law. + + No covered work shall be deemed part of an effective technological +measure under any applicable law fulfilling obligations under article +11 of the WIPO copyright treaty adopted on 20 December 1996, or +similar laws prohibiting or restricting circumvention of such +measures. 
+ + When you convey a covered work, you waive any legal power to forbid +circumvention of technological measures to the extent such circumvention +is effected by exercising rights under this License with respect to +the covered work, and you disclaim any intention to limit operation or +modification of the work as a means of enforcing, against the work's +users, your or third parties' legal rights to forbid circumvention of +technological measures. + + 4. Conveying Verbatim Copies. + + You may convey verbatim copies of the Program's source code as you +receive it, in any medium, provided that you conspicuously and +appropriately publish on each copy an appropriate copyright notice; +keep intact all notices stating that this License and any +non-permissive terms added in accord with section 7 apply to the code; +keep intact all notices of the absence of any warranty; and give all +recipients a copy of this License along with the Program. + + You may charge any price or no price for each copy that you convey, +and you may offer support or warranty protection for a fee. + + 5. Conveying Modified Source Versions. + + You may convey a work based on the Program, or the modifications to +produce it from the Program, in the form of source code under the +terms of section 4, provided that you also meet all of these conditions: + + a) The work must carry prominent notices stating that you modified + it, and giving a relevant date. + + b) The work must carry prominent notices stating that it is + released under this License and any conditions added under section + 7. This requirement modifies the requirement in section 4 to + "keep intact all notices". + + c) You must license the entire work, as a whole, under this + License to anyone who comes into possession of a copy. This + License will therefore apply, along with any applicable section 7 + additional terms, to the whole of the work, and all its parts, + regardless of how they are packaged. 
This License gives no + permission to license the work in any other way, but it does not + invalidate such permission if you have separately received it. + + d) If the work has interactive user interfaces, each must display + Appropriate Legal Notices; however, if the Program has interactive + interfaces that do not display Appropriate Legal Notices, your + work need not make them do so. + + A compilation of a covered work with other separate and independent +works, which are not by their nature extensions of the covered work, +and which are not combined with it such as to form a larger program, +in or on a volume of a storage or distribution medium, is called an +"aggregate" if the compilation and its resulting copyright are not +used to limit the access or legal rights of the compilation's users +beyond what the individual works permit. Inclusion of a covered work +in an aggregate does not cause this License to apply to the other +parts of the aggregate. + + 6. Conveying Non-Source Forms. + + You may convey a covered work in object code form under the terms +of sections 4 and 5, provided that you also convey the +machine-readable Corresponding Source under the terms of this License, +in one of these ways: + + a) Convey the object code in, or embodied in, a physical product + (including a physical distribution medium), accompanied by the + Corresponding Source fixed on a durable physical medium + customarily used for software interchange. 
+ + b) Convey the object code in, or embodied in, a physical product + (including a physical distribution medium), accompanied by a + written offer, valid for at least three years and valid for as + long as you offer spare parts or customer support for that product + model, to give anyone who possesses the object code either (1) a + copy of the Corresponding Source for all the software in the + product that is covered by this License, on a durable physical + medium customarily used for software interchange, for a price no + more than your reasonable cost of physically performing this + conveying of source, or (2) access to copy the + Corresponding Source from a network server at no charge. + + c) Convey individual copies of the object code with a copy of the + written offer to provide the Corresponding Source. This + alternative is allowed only occasionally and noncommercially, and + only if you received the object code with such an offer, in accord + with subsection 6b. + + d) Convey the object code by offering access from a designated + place (gratis or for a charge), and offer equivalent access to the + Corresponding Source in the same way through the same place at no + further charge. You need not require recipients to copy the + Corresponding Source along with the object code. If the place to + copy the object code is a network server, the Corresponding Source + may be on a different server (operated by you or a third party) + that supports equivalent copying facilities, provided you maintain + clear directions next to the object code saying where to find the + Corresponding Source. Regardless of what server hosts the + Corresponding Source, you remain obligated to ensure that it is + available for as long as needed to satisfy these requirements. 
+ + e) Convey the object code using peer-to-peer transmission, provided + you inform other peers where the object code and Corresponding + Source of the work are being offered to the general public at no + charge under subsection 6d. + + A separable portion of the object code, whose source code is excluded +from the Corresponding Source as a System Library, need not be +included in conveying the object code work. + + A "User Product" is either (1) a "consumer product", which means any +tangible personal property which is normally used for personal, family, +or household purposes, or (2) anything designed or sold for incorporation +into a dwelling. In determining whether a product is a consumer product, +doubtful cases shall be resolved in favor of coverage. For a particular +product received by a particular user, "normally used" refers to a +typical or common use of that class of product, regardless of the status +of the particular user or of the way in which the particular user +actually uses, or expects or is expected to use, the product. A product +is a consumer product regardless of whether the product has substantial +commercial, industrial or non-consumer uses, unless such uses represent +the only significant mode of use of the product. + + "Installation Information" for a User Product means any methods, +procedures, authorization keys, or other information required to install +and execute modified versions of a covered work in that User Product from +a modified version of its Corresponding Source. The information must +suffice to ensure that the continued functioning of the modified object +code is in no case prevented or interfered with solely because +modification has been made. 
+ + If you convey an object code work under this section in, or with, or +specifically for use in, a User Product, and the conveying occurs as +part of a transaction in which the right of possession and use of the +User Product is transferred to the recipient in perpetuity or for a +fixed term (regardless of how the transaction is characterized), the +Corresponding Source conveyed under this section must be accompanied +by the Installation Information. But this requirement does not apply +if neither you nor any third party retains the ability to install +modified object code on the User Product (for example, the work has +been installed in ROM). + + The requirement to provide Installation Information does not include a +requirement to continue to provide support service, warranty, or updates +for a work that has been modified or installed by the recipient, or for +the User Product in which it has been modified or installed. Access to a +network may be denied when the modification itself materially and +adversely affects the operation of the network or violates the rules and +protocols for communication across the network. + + Corresponding Source conveyed, and Installation Information provided, +in accord with this section must be in a format that is publicly +documented (and with an implementation available to the public in +source code form), and must require no special password or key for +unpacking, reading or copying. + + 7. Additional Terms. + + "Additional permissions" are terms that supplement the terms of this +License by making exceptions from one or more of its conditions. +Additional permissions that are applicable to the entire Program shall +be treated as though they were included in this License, to the extent +that they are valid under applicable law. 
If additional permissions +apply only to part of the Program, that part may be used separately +under those permissions, but the entire Program remains governed by +this License without regard to the additional permissions. + + When you convey a copy of a covered work, you may at your option +remove any additional permissions from that copy, or from any part of +it. (Additional permissions may be written to require their own +removal in certain cases when you modify the work.) You may place +additional permissions on material, added by you to a covered work, +for which you have or can give appropriate copyright permission. + + Notwithstanding any other provision of this License, for material you +add to a covered work, you may (if authorized by the copyright holders of +that material) supplement the terms of this License with terms: + + a) Disclaiming warranty or limiting liability differently from the + terms of sections 15 and 16 of this License; or + + b) Requiring preservation of specified reasonable legal notices or + author attributions in that material or in the Appropriate Legal + Notices displayed by works containing it; or + + c) Prohibiting misrepresentation of the origin of that material, or + requiring that modified versions of such material be marked in + reasonable ways as different from the original version; or + + d) Limiting the use for publicity purposes of names of licensors or + authors of the material; or + + e) Declining to grant rights under trademark law for use of some + trade names, trademarks, or service marks; or + + f) Requiring indemnification of licensors and authors of that + material by anyone who conveys the material (or modified versions of + it) with contractual assumptions of liability to the recipient, for + any liability that these contractual assumptions directly impose on + those licensors and authors. + + All other non-permissive additional terms are considered "further +restrictions" within the meaning of section 10. 
If the Program as you +received it, or any part of it, contains a notice stating that it is +governed by this License along with a term that is a further +restriction, you may remove that term. If a license document contains +a further restriction but permits relicensing or conveying under this +License, you may add to a covered work material governed by the terms +of that license document, provided that the further restriction does +not survive such relicensing or conveying. + + If you add terms to a covered work in accord with this section, you +must place, in the relevant source files, a statement of the +additional terms that apply to those files, or a notice indicating +where to find the applicable terms. + + Additional terms, permissive or non-permissive, may be stated in the +form of a separately written license, or stated as exceptions; +the above requirements apply either way. + + 8. Termination. + + You may not propagate or modify a covered work except as expressly +provided under this License. Any attempt otherwise to propagate or +modify it is void, and will automatically terminate your rights under +this License (including any patent licenses granted under the third +paragraph of section 11). + + However, if you cease all violation of this License, then your +license from a particular copyright holder is reinstated (a) +provisionally, unless and until the copyright holder explicitly and +finally terminates your license, and (b) permanently, if the copyright +holder fails to notify you of the violation by some reasonable means +prior to 60 days after the cessation. + + Moreover, your license from a particular copyright holder is +reinstated permanently if the copyright holder notifies you of the +violation by some reasonable means, this is the first time you have +received notice of violation of this License (for any work) from that +copyright holder, and you cure the violation prior to 30 days after +your receipt of the notice. 
+ + Termination of your rights under this section does not terminate the +licenses of parties who have received copies or rights from you under +this License. If your rights have been terminated and not permanently +reinstated, you do not qualify to receive new licenses for the same +material under section 10. + + 9. Acceptance Not Required for Having Copies. + + You are not required to accept this License in order to receive or +run a copy of the Program. Ancillary propagation of a covered work +occurring solely as a consequence of using peer-to-peer transmission +to receive a copy likewise does not require acceptance. However, +nothing other than this License grants you permission to propagate or +modify any covered work. These actions infringe copyright if you do +not accept this License. Therefore, by modifying or propagating a +covered work, you indicate your acceptance of this License to do so. + + 10. Automatic Licensing of Downstream Recipients. + + Each time you convey a covered work, the recipient automatically +receives a license from the original licensors, to run, modify and +propagate that work, subject to this License. You are not responsible +for enforcing compliance by third parties with this License. + + An "entity transaction" is a transaction transferring control of an +organization, or substantially all assets of one, or subdividing an +organization, or merging organizations. If propagation of a covered +work results from an entity transaction, each party to that +transaction who receives a copy of the work also receives whatever +licenses to the work the party's predecessor in interest had or could +give under the previous paragraph, plus a right to possession of the +Corresponding Source of the work from the predecessor in interest, if +the predecessor has it or can get it with reasonable efforts. + + You may not impose any further restrictions on the exercise of the +rights granted or affirmed under this License. 
For example, you may +not impose a license fee, royalty, or other charge for exercise of +rights granted under this License, and you may not initiate litigation +(including a cross-claim or counterclaim in a lawsuit) alleging that +any patent claim is infringed by making, using, selling, offering for +sale, or importing the Program or any portion of it. + + 11. Patents. + + A "contributor" is a copyright holder who authorizes use under this +License of the Program or a work on which the Program is based. The +work thus licensed is called the contributor's "contributor version". + + A contributor's "essential patent claims" are all patent claims +owned or controlled by the contributor, whether already acquired or +hereafter acquired, that would be infringed by some manner, permitted +by this License, of making, using, or selling its contributor version, +but do not include claims that would be infringed only as a +consequence of further modification of the contributor version. For +purposes of this definition, "control" includes the right to grant +patent sublicenses in a manner consistent with the requirements of +this License. + + Each contributor grants you a non-exclusive, worldwide, royalty-free +patent license under the contributor's essential patent claims, to +make, use, sell, offer for sale, import and otherwise run, modify and +propagate the contents of its contributor version. + + In the following three paragraphs, a "patent license" is any express +agreement or commitment, however denominated, not to enforce a patent +(such as an express permission to practice a patent or covenant not to +sue for patent infringement). To "grant" such a patent license to a +party means to make such an agreement or commitment not to enforce a +patent against the party. 
+ + If you convey a covered work, knowingly relying on a patent license, +and the Corresponding Source of the work is not available for anyone +to copy, free of charge and under the terms of this License, through a +publicly available network server or other readily accessible means, +then you must either (1) cause the Corresponding Source to be so +available, or (2) arrange to deprive yourself of the benefit of the +patent license for this particular work, or (3) arrange, in a manner +consistent with the requirements of this License, to extend the patent +license to downstream recipients. "Knowingly relying" means you have +actual knowledge that, but for the patent license, your conveying the +covered work in a country, or your recipient's use of the covered work +in a country, would infringe one or more identifiable patents in that +country that you have reason to believe are valid. + + If, pursuant to or in connection with a single transaction or +arrangement, you convey, or propagate by procuring conveyance of, a +covered work, and grant a patent license to some of the parties +receiving the covered work authorizing them to use, propagate, modify +or convey a specific copy of the covered work, then the patent license +you grant is automatically extended to all recipients of the covered +work and works based on it. + + A patent license is "discriminatory" if it does not include within +the scope of its coverage, prohibits the exercise of, or is +conditioned on the non-exercise of one or more of the rights that are +specifically granted under this License. 
You may not convey a covered +work if you are a party to an arrangement with a third party that is +in the business of distributing software, under which you make payment +to the third party based on the extent of your activity of conveying +the work, and under which the third party grants, to any of the +parties who would receive the covered work from you, a discriminatory +patent license (a) in connection with copies of the covered work +conveyed by you (or copies made from those copies), or (b) primarily +for and in connection with specific products or compilations that +contain the covered work, unless you entered into that arrangement, +or that patent license was granted, prior to 28 March 2007. + + Nothing in this License shall be construed as excluding or limiting +any implied license or other defenses to infringement that may +otherwise be available to you under applicable patent law. + + 12. No Surrender of Others' Freedom. + + If conditions are imposed on you (whether by court order, agreement or +otherwise) that contradict the conditions of this License, they do not +excuse you from the conditions of this License. If you cannot convey a +covered work so as to satisfy simultaneously your obligations under this +License and any other pertinent obligations, then as a consequence you may +not convey it at all. For example, if you agree to terms that obligate you +to collect a royalty for further conveying from those to whom you convey +the Program, the only way you could satisfy both those terms and this +License would be to refrain entirely from conveying the Program. + + 13. Remote Network Interaction; Use with the GNU General Public License. 
+ + Notwithstanding any other provision of this License, if you modify the +Program, your modified version must prominently offer all users +interacting with it remotely through a computer network (if your version +supports such interaction) an opportunity to receive the Corresponding +Source of your version by providing access to the Corresponding Source +from a network server at no charge, through some standard or customary +means of facilitating copying of software. This Corresponding Source +shall include the Corresponding Source for any work covered by version 3 +of the GNU General Public License that is incorporated pursuant to the +following paragraph. + + Notwithstanding any other provision of this License, you have +permission to link or combine any covered work with a work licensed +under version 3 of the GNU General Public License into a single +combined work, and to convey the resulting work. The terms of this +License will continue to apply to the part which is the covered work, +but the work with which it is combined will remain governed by version +3 of the GNU General Public License. + + 14. Revised Versions of this License. + + The Free Software Foundation may publish revised and/or new versions of +the GNU Affero General Public License from time to time. Such new versions +will be similar in spirit to the present version, but may differ in detail to +address new problems or concerns. + + Each version is given a distinguishing version number. If the +Program specifies that a certain numbered version of the GNU Affero General +Public License "or any later version" applies to it, you have the +option of following the terms and conditions either of that numbered +version or of any later version published by the Free Software +Foundation. If the Program does not specify a version number of the +GNU Affero General Public License, you may choose any version ever published +by the Free Software Foundation. 
+ + If the Program specifies that a proxy can decide which future +versions of the GNU Affero General Public License can be used, that proxy's +public statement of acceptance of a version permanently authorizes you +to choose that version for the Program. + + Later license versions may give you additional or different +permissions. However, no additional obligations are imposed on any +author or copyright holder as a result of your choosing to follow a +later version. + + 15. Disclaimer of Warranty. + + THERE IS NO WARRANTY FOR THE PROGRAM, TO THE EXTENT PERMITTED BY +APPLICABLE LAW. EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT +HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY +OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO, +THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR +PURPOSE. THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM +IS WITH YOU. SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF +ALL NECESSARY SERVICING, REPAIR OR CORRECTION. + + 16. Limitation of Liability. + + IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING +WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MODIFIES AND/OR CONVEYS +THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY +GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE +USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED TO LOSS OF +DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD +PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER PROGRAMS), +EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF +SUCH DAMAGES. + + 17. Interpretation of Sections 15 and 16. 
+ + If the disclaimer of warranty and limitation of liability provided +above cannot be given local legal effect according to their terms, +reviewing courts shall apply local law that most closely approximates +an absolute waiver of all civil liability in connection with the +Program, unless a warranty or assumption of liability accompanies a +copy of the Program in return for a fee. \ No newline at end of file diff --git a/bin/downstream.py b/bin/downstream.py new file mode 100755 index 0000000..fdb86a7 --- /dev/null +++ b/bin/downstream.py @@ -0,0 +1,766 @@ +# PREVENT: PRotein Engineering by Variational frEe eNergy approximaTion +# Copyright (C) 2024 Giovanni Stracquadanio, Evgenii Lobzaev + +# This program is free software: you can redistribute it and/or modify +# it under the terms of the GNU Affero General Public License as published +# by the Free Software Foundation, either version 3 of the License, or +# (at your option) any later version. + +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU Affero General Public License for more details. + +# You should have received a copy of the GNU Affero General Public License +# along with this program. If not, see . 
+ +#!/usr/bin/env python3 +# -*- coding: utf-8 -*- + +import torch +import torch.nn +from torch.utils.data import DataLoader +from Bio import SeqIO +import numpy as np +import pandas as pd +import typer +import logging +from typing import List +import pickle +from models import TransformerVAE +from utilities import ( + SequenceData, + default_w2i_i2w, + ProteinSequencesDataset, + decode, + get_means_stds, # get means and stds of q(z|x) for a given dataset + sample_tf_using_prior, + sample_tf_using_posterior, + seq2_energy_tf, + predict_energies_using_tf_encoder, + sgd_optimisation, # completely unconstrained optimisation, performed using SGD pytorch + trust_region_optimisation, # optimisation with trust-region, some constraints are put on x0, performed using autograd-minimize + setup_logger, + obtain_best_results, + stats_compute, + present_results_of_protein_analysis + ) + +# typer setup +app = typer.Typer() +tf_app = typer.Typer() # for Transformer VAE models +predictor_app = typer.Typer() # for predictive models (GRU/TF encoder) +protein_app = typer.Typer() # for protein analysis + +app.add_typer(tf_app, name="transformer") +app.add_typer(predictor_app, name="predictor") +app.add_typer(protein_app,name="protanalysis") + + +#### GLOBAL CONST +# output columns for blastp +CSV_COLUMNS = ['qseqid','sseqid','score','bitscore','evalue','pident','ppos','qcovs'] + + +######################################################### VAE ######################## + +# sample from prior distribution +# sample sequence and energy, combine collapse identical sequences (by averaging energy and logp) +@tf_app.command("sample-prior") +def transformer_sample_prior( + pt_name : str, # pytorch file (trained model params) + pickle_name : str, # pickle file (input model params) + pickle_name_for_seq_tuple : str, # pickle filename to save seq_tuple + output_fasta_filename : str, # fasta filename to save VAE samples + n_samples : int = 10000, + seed : int = 0, + max_number_of_steps : int = 100 
+ ) -> None: + + seq_tuple = sample_tf_using_prior( + output_fasta_filename, + pt_name, + pickle_name, + n_samples = n_samples, + seed = seed, + max_number_of_steps = max_number_of_steps + ) + + # seq_tuple: (seq,logp(seq),associated z,id,description,seq certainty) as (list[str],float,numpy,str,str,list) + dict_to_pickle = { + "WT" : None, + "VAE": seq_tuple + } + + # save as pickle + pickle.dump( + dict_to_pickle, + open(pickle_name_for_seq_tuple,"wb") + ) + +# seq2energy prediction: take sampled sequences from "transformer_sample_prior" function +# run through encoder, generate {n_samples} latent variables z, decode energy +@tf_app.command("seq2energy") +def transformer_seq2energy_prior( + output_filename_main : str, # filename of main output + output_filename_template_csv : str, # filename template to save individual energies/elbos/etc + pt_name : str, # pytorch file (trained model params) + pickle_name : str, # pickle file (input model params) + clean_samples_fasta : str, # fasta file with clean samples + n_samples : int = 300, # total number of energies computed for a sequence + batch_size : int = 100, # number of energies computed in a single pass of NN (should divide n_samples evenly) + seed : int = 0 # random seed for sampling + ): + + # call seq2_energy_tf; save dictionary "data" as csv [main output] + data = seq2_energy_tf( + output_filename_template_csv, + pt_name, + pickle_name, + clean_samples_fasta, + n_samples = n_samples, + batch_size = batch_size, + seed = seed + ) + + # create dataframe and save + df = pd.DataFrame(data) + df.to_csv(output_filename_main) + +# sample from posterior distribution +@tf_app.command("sample-seeded") +def transformer_sample_posterior( + pt_name : str, # pytorch file with trained model params + pickle_name : str, # pickle file with input params + pickle_name_for_seq_tuple : str, # filename for a pickle file to save VAE (+WT) results + seed_fasta_file : str, # fasta file with single seed sequence + output_fasta_filename : 
str, # fasta filename to save VAE samples + max_number_of_steps : int = 500, + n_samples : int = 10, + mini_batch_size : int = 10, + seed : int = 0, + T : float = 0.0, + skip_first_element : bool = True + ) -> None: + + seq_tuple = sample_tf_using_posterior( + output_fasta_filename, + pt_name, + pickle_name, + seed_fasta_file, + max_number_of_steps = max_number_of_steps, + n_samples = n_samples, + mini_batch_size = mini_batch_size, + seed = seed, + T = T, + skip_first_element = skip_first_element + ) + + # save tuple + # take WT from seed fasta file + WT = [ + str(record.seq) for record in SeqIO.parse(seed_fasta_file,"fasta") + ][0] + # seq_tuple: (seq,logp(seq),associated z,id,description,seq certainty) as (list[str],float,numpy,str,str,list) + dict_to_pickle = { + "WT" : WT, + "VAE": seq_tuple + } + + # save as pickle + pickle.dump( + dict_to_pickle, + open(pickle_name_for_seq_tuple,"wb") + ) + +# running SGD on energy function +@tf_app.command("sgd-optimization") +def optimize_latent_space( + pt_name : str, # pytorch file with trained model params + pickle_name : str, # pickle file with input params + logger_name : str, # logger name to keep progress (useful for debugging or adapting parameters) + interm_results_template : str, # intermediate results filename template + best_results_filename : str, # best results filename + seed : int = 0, # random seed (important for random starting point) + learning_rate : float = 0.0001, # learning rate for SGD + n_restarts : int = 5, # number of restarts withing a single optimization run + delta_f_tol : float = 0.0001, # tolerance for function change: if function change is smaller, stop the optimisation + max_opt_steps : int = 100, # maximum number of optimisation steps + )->None: + # set random seed + torch.manual_seed(seed) + + # get logger + logger = setup_logger( 'logger', logger_name, level = logging.INFO ) + logger.info(f"Random seed: {seed}") + + # to keep track of best results + best_energy = float('inf') + 
best_results = { + "opt_energy": None, + "opt_z" : None, + "sequences" : None + } + + # loop over attempts + for restart in range(n_restarts): + logger.info(f"Restart : {restart+1}") + logger.info("-"*30) + + # get optimal results (optimal z; optimal energy; list of sequences obtained throughout optimisation) + opt_z, opt_energy, sequences = sgd_optimisation( + pt_name, + pickle_name, + logger, + learning_rate, + delta_f_tol, + max_opt_steps + ) + filename_ = f"{interm_results_template}-restart-{restart}.fasta" + result_string = f"Restart {restart+1}, optimal energy: {opt_energy}; optimisation progress saved in file:{filename_}" + logger.info(result_string) + + # save results + SeqIO.write( + sequences, + filename_, + "fasta" + ) + logger.info("-"*30) + + # determine best results + if opt_energy < best_energy: + best_results["opt_energy"] = opt_energy + best_results["opt_z"] = opt_z + best_results["sequences"] = sequences + #logger.info(f"Best energy:{best_energy:0.7f}, current energy:{opt_energy:0.7f}") + + # redefine best(smallest) energy + best_energy = opt_energy + + + # now we can write best results + result_string = f"Best energy achieved: {best_energy}; optimisation progress saved in file:{best_results_filename}" + logger.info(result_string) + + # save + SeqIO.write( + best_results["sequences"], + best_results_filename, + "fasta" + ) + +# running trust region optimisation on energy function +# here: within N(0,1) but later need to change for N(mu(seq),std(seq)) +##################### KEEPING THIS FOR NOW, MAY DELETE LATER ##################### +@tf_app.command("trust-region-optimization") +def optimize_latent_space_trust_region( + pt_name : str, # pytorch file with trained model params + pickle_name : str, # pickle file with input params + logger_name : str, # logger name to keep progress (useful for debugging or adapting parameters) + output_filename_fasta : str, # FASTA filename for results + pickle_name_for_seq_tuple : str, # pickle filename for results + 
seed_fasta_file : str = None, # FASTA file with a seed sequence (if not provided, prior distribution is used) + max_number_of_steps : int = 100, # maximum number of recurrent steps in sampling procedure (i.e. equal to WT seq length) + n_samples : int = 500, # how many samples to generate from a given Z (should be a multiple of 100!) + seed : int = 0, # random seed (important for random starting point) + )->None: + # set random seed + torch.manual_seed(seed) + np.random.seed(seed) + + # get logger + logger = setup_logger( 'logger', logger_name, level = logging.INFO ) + logger.info(f"Random seed: {seed}") + + # get the model + # instantiate model object + vars = pickle.load(open(pickle_name, "rb" )) + + # set device + device = torch.device("cuda" if torch.cuda.is_available() else "cpu") + + # force cpu, if only cpu is available + vars["device"] = device + logger.info(f"Device used: {device}") + + # instantiate model + model = TransformerVAE(**vars) + + # load trained parameters + checkpoint = torch.load(pt_name,map_location = device) + model.load_state_dict(checkpoint['model_state_dict']) + model.eval() + + # extract mlp2energy + f_z = model.get_submodule("mlp2energy") + + # move to GPU + f_z = f_z.to(device) + model = model.to(device) + + f_z.eval() + + # double precision + model = model.double() + f_z = f_z.double() + + + # batch size is always 1 here + batch_size = 1 + latent_size = vars["latent_size"] + + + # get i2w map and eos_idx + w2i,i2w = default_w2i_i2w() + # create a list of improper tokens + improper_token_list = [ + w2i[''], # + w2i[''], # + w2i[''], # + w2i[''] # + ] + + ##### need to obtain mu/sigma if seed_fasta_file is provided + if seed_fasta_file != None: + + ############## USING SEEDED DISTRIBUTION ################# + + # get max_seq_length from vars dictionary (subtract 1 as 1 is added in dataset constructor) + max_sequence_length = vars["max_seq_length"] - 1 + # dataset and dataloader + dataset = ProteinSequencesDataset( + seed_fasta_file, + 
w2i, + i2w, + device, + max_sequence_length = max_sequence_length + ) + dataloader = DataLoader(dataset, batch_size=1, shuffle=False) + + # check that dataloader contains only 1 element + assert len(dataloader) == 1, "Dataloader should contain a single batch of size 1. Check FASTA file with which you construct dataset." + + # do a forward pass to obtain mu/sigma + with torch.no_grad(): + for batch in dataloader: + # get data (here: batch = 1 sequence) + src = batch['input'] + reference_ = batch["reference"][0] + + # obtain mu and sigma + _,mean,logv,_ = model( + src, # Src in Transformer architecture + src, # Tgt in Transformer architecture + masking_prob = 0.0 # masking probability to mask Tgt + ) + std = torch.exp(0.5 * logv) + + # sample random value (will be a starting point) + z = torch.randn( + [batch_size, latent_size], + dtype = torch.double, + device = device + ) + # [Batch Size, Latent Size] # this is our latent representation + x0 = z * std + mean + + # create bounds: [Batch Size, Latent Size] + left_bound = mean - 3.0 * std + right_bound = mean + 3.0 * std + + logger.info(f"Optimisation run for the seeded distribution for sequence {reference_}") + logger.info(f"mean (as tensor) : {mean}") + logger.info(f"std (as tensor) : {std}") + logger.info(f"x0 (as tensor) : {x0}") + logger.info(f"left_bound (as tensor) : {left_bound}") + logger.info(f"right_bound (as tensor) : {right_bound}") + + # move to CPU and to numpy/list + x0 = np.array( + x0.squeeze(0).tolist() # [batch size = 1, latent size] -> [latent_size] -> move to CPU + ) + left_bound = left_bound.squeeze(0).tolist() + right_bound = right_bound.squeeze(0).tolist() + + bounds = [(left_bound[i],right_bound[i]) for i in range(latent_size)] + + logger.info(f"Initial starting point : {x0}") + logger.info(f"Bounds : {bounds}") + + print("x0 :", x0) + print("bounds:", bounds) + + ############## USING PRIOR DISTRIBUTION ################# + else: + logger.info("Optimisation run for the prior distribution") + 
reference_ = "None" + + # create starting point + # x0 is a random draw from N(0,I) + x0 = np.random.randn(latent_size) + # create bounds: every coordinate of x should be between -3.0 and 3.0 + bounds = [(-3.0,3.0)]*latent_size + + logger.info(f"Initial starting point: {x0}") + logger.info(f"Bounds : {bounds}") + + print("x0 :", x0) + print("bounds:", bounds) + + # call the function -> will return double + z_opt, energy_opt = trust_region_optimisation( + f_z, + x0, + bounds, + logger, + device + ) + + # now we can do sampling using z_opt (which corresponds to energy_opt value) + # record objects list + records = [] + + # sequences list + sequences = [] + + # we will do argmax and categorical sampling + # check how many times we need to do in batches of 100 + n_times = n_samples//100 + + # need to batchify z; right now it is just a list, we need to create a torch.tensor of this list and copy it 100 times + z_tensor = torch.tensor( + [z_opt], + dtype = torch.double, + device = device + ) # should create a tensor of size [1,latent_size] + z_tensor_batch = z_tensor.repeat([100,1]) # should be of size [100,latent_size] where each row is a copy of 1st row + + + with torch.no_grad(): + ############################################## argmax sampling + # sample and convert to numpy + if torch.cuda.is_available(): + logp,indices,z_out,energies,_ = model.sample_from_latent_space( + 1, + max_length = max_number_of_steps, + z = z_tensor, + argmax = True + ) + logp,indices,z_out,energies = logp.cpu().numpy(),indices.cpu().numpy(),z_out.cpu().numpy(),energies.cpu().numpy() + else: + logp,indices,z_out,energies,_ = model.sample_from_latent_space( + 1, + max_length = max_number_of_steps, + z = z_tensor, + argmax = True + ) + logp,indices,z_out,energies = logp.numpy(),indices.numpy(),z_out.numpy(),energies.numpy() + + # decode sequences and append to sequence list + sequences.extend( + decode( + indices, + logp, + z_out, + energies, + i2w, + improper_token_list + ) + ) + 
############################################## categorical sampling (T=1.0) + for _ in range(n_times): + # sample and convert to numpy + if torch.cuda.is_available(): + logp,indices,z_out,energies,_ = model.sample_from_latent_space( + 100, + max_length = max_number_of_steps, + z = z_tensor_batch, + argmax = False + ) + logp,indices,z_out,energies = logp.cpu().numpy(),indices.cpu().numpy(),z_out.cpu().numpy(),energies.cpu().numpy() + else: + logp,indices,z_out,energies,_ = model.sample_from_latent_space( + 100, + max_length = max_number_of_steps, + z = z_tensor_batch, + argmax = False + ) + logp,indices,z_out,energies = logp.numpy(),indices.numpy(),z_out.numpy(),energies.numpy() + + # decode sequences and append to sequence list + sequences.extend( + decode( + indices, + logp, + z_out, + energies, + i2w, + improper_token_list + ) + ) + + # create SeqRecords and save as FASTA + # copied from sample_tf_using_prior + + # sequences we already observed + observed_sequences = [] + + # counter + cnt = 1 + + # seq_tuple: (seq,list(energies),logp(seq),associated z,id,description) as (list[str],list(float),numpy,str,str) + seq_tuple = [] + + # dictionary seq2object + seq2obj = {} + + # combine data to have the following structure: {(seq,all energies, all logps, all zs, id, description)} + for element in sequences: + + # obtain sequence and its logp + seq = "".join(element[0]) # here as string, not as list, list not hashable + associated_energy = element[1] + logp_seq = element[2] + associated_z = element[3] + + # if we haven't seen this sequence yet + if seq not in observed_sequences: + # since we haven't sorted sequences, first element of ${sequences} is the one with argmax // actually it will be first one anyways + if cnt == 1: + id_ = f"seq-{cnt}-argmax" + else: + id_ = f"seq-{cnt}" + # generate new instance of class SequenceData + seq2obj[seq] = SequenceData( + seq, + id_, + associated_energy, + logp_seq, + associated_z + ) + # add to the observed sequences, increase the 
counter + observed_sequences.append(seq) + cnt += 1 + else: + # update an object of type SequenceData (but we need to update a specific object, need a quick lookup!) + # lookup: seq -> SequenceData instance + seq2obj[seq].update_info( + associated_energy, + logp_seq, + associated_z + ) + # once data is combined we need to generate description, add to seq_tuple, add to records + # loop over pairs (seq, SequenceData) + for k,v in seq2obj.items(): + v.generate_description(seedID = reference_) # to have a human readable description + seq_tuple.append(v.toTuple) # append to list as a tuple + records.append(v.toSeqRecord) # append to list as SeqRecord + + + # save records list as FASTA file + SeqIO.write(records,output_filename_fasta,"fasta") + + # seq_tuple: (seq,logp(seq),associated z,id,description,seq certainty) as (list[str],float,numpy,str,str,list) + dict_to_pickle = { + "WT" : None, + "VAE": seq_tuple + } + + # save as pickle + pickle.dump( + dict_to_pickle, + open(pickle_name_for_seq_tuple,"wb") + ) + + +@tf_app.command("estimate-latent-space") +def latent_space_estimation( + output_filename_means : str, # filename for means of q(z|x) + output_filename_stds : str, # filename for stds of q(z|x) + pt_name : str, # pytorch file with pretraine dlayers + pickle_name : str, # pickle file with model inputs + fasta_file : str, # FASTA file with sequences + batch_size : int = 4, # how many sequences to process in a batch + max_sequence_length : int = 500, # max sequence length for Dataset construction + seed : int = 0 + ): + # call function get_means_stds + get_means_stds( + output_filename_means, + output_filename_stds, + pt_name, + pickle_name, + fasta_file, + batch_size = batch_size, + max_sequence_length = max_sequence_length, + seed = seed + ) + +# obtain mu/sigma from a seed sequence -> construct bounds -> call trust_region_optimisation +# @tf_app.command("trust-region-optimization-seeded") +# def optimize_latent_space_trust_region_seeded( +# pt_name : str, # 
pytorch file with trained model params +# pickle_name : str, # pickle file with input params +# seed_fasta : str, # FASTA file with a seed sequence +# logger_name : str, # logger name to keep progress (useful for debugging or adapting parameters) +# best_results_filename : str, # best results filename +# seed : int = 0, # random seed (important for random starting point) +# )->None: +# # set random seed +# torch.manual_seed(seed) +# np.random.seed(seed) + +# # get logger +# logger = setup_logger( 'logger', logger_name, level = logging.INFO ) +# logger.info(f"Random seed: {seed}") + +# # get the model +# # instantiate model object +# vars = pickle.load(open(pickle_name, "rb" )) + +# # set device +# device = torch.device("cuda" if torch.cuda.is_available() else "cpu") + +# # force cpu, if only cpu is available +# vars["device"] = device +# logger.info(f"Device used: {device}") + +# # instantiate model +# model = TransformerVAE(**vars) + +# # load trained parameters +# checkpoint = torch.load(pt_name,map_location = device) +# model.load_state_dict(checkpoint['model_state_dict']) +# model.eval() + +# # extract mlp2energy +# f_z = model.get_submodule("mlp2energy") + +# # move to GPU +# f_z = f_z.to(device) +# model = model.to(device) + +# f_z.eval() + +# # forward pass through encoder to get mu/sigma/z + +# # double precision + +# # create starting point +# # we will be working with a single z, so set batch_size to 1 +# batch_size = 1 +# latent_size = vars["latent_size"] +# x0 = np.random.randn(latent_size) # TODO: check if we need to use (batch_size, latent_size) + +# # create bounds: every coordinate of x should be between -3.0 and 3.0 +# bounds = [(-3.0,3.0)]*latent_size + +# # call the function -> will return double +# x_opt, f_opt = trust_region_optimisation( +# f_z.double(), +# x0, +# bounds, +# logger, +# device +# ) + + + + + +########################################################## PREDICTIVE MODELS ##################### 
+@predictor_app.command("tf-predict-energy") +def predict_energy_tf( + output_filename_fasta : str, # filename to save FASTA + output_filename_csv : str, # filename to save energies CSV + pt_name : str, # pytorch file (trained model params) + pickle_name : str, # pickle file (input model params) + clean_samples_fasta : str, # fasta file with clean samples + seed : int = 0 # random seed for sampling + )->None: + # call seq2_energy_tf; save dictionary "data" as csv + data = predict_energies_using_tf_encoder( + output_filename_fasta, + pt_name, + pickle_name, + clean_samples_fasta, + seed = seed + ) + print("data:") + print(data) + + # create dataframe and save + df = pd.DataFrame(data) + df.to_csv(output_filename_csv,index=False) + +########################################################## OTHER ################################### + +### compute statistics from csv file (which we obtained from blastp and subsequent filtering) +@tf_app.command("csv-stats") +def csv2stats( + csv_file : str, # csv file (output of blastp) + logname : str, # filename for log file + n_samples: int # number of requested samples (a multiple of 100) + ) -> None: + + # logger + logger = setup_logger( 'logger', logname, level = logging.INFO ) + + # obtain identities/similarities/bitscores as lists + identities, similarities, bitscores = obtain_best_results( + csv_file, + CSV_COLUMNS + ) + # if anything is None, we are done + if (identities is None) and (similarities is None) and (bitscores is None): + str_ = "No good samples were generated." 
+ logger.info(str_) + + else: + # assert equal lengths + assert len(identities) == len(similarities) == len(bitscores), "Length mismatch" + n_good = len(identities) + n_good_pct = n_good/n_samples * 100 + str_ = f"Number of requested samples: {n_samples}, number of filtered samples: {n_good} ({n_good_pct:0.2f}%)\n" + str_ += stats_compute(identities,"identity score") + str_ += stats_compute(similarities,"similarity score") + str_ += stats_compute(bitscores,"bitscore") + logger.info(str_) + +# not used +@protein_app.command("prior") +def do_protein_analysis_prior( + pickle_name : str, # pickle filename with with saved sequences + log_name : str, # log name + model_identifier : str # correposnding to best train/validation error, etc + ) -> None: + # some preparations + # copy from enzyme_datasets + amino_acids = ['A','R','N','D','C','Q','E','G','H','I','L','K','M','F','P','S','T','W','Y','V'] + + # create logger + setup_logger( 'logger', log_name, level = logging.INFO ) + logger = logging.getLogger('logger') + + # load pickle with seq_tuple_dict [seq, logp(seq), associated z, id, description] + seq_tuple_dict = pickle.load(open(pickle_name, "rb" )) + seq_tuple = seq_tuple_dict["VAE"] + + + str_ = f"Working with sequences (from the prior) from model: {model_identifier}." 
+ logger.info(str_) + + # start protein analysis + _ = present_results_of_protein_analysis( + seq_tuple, + amino_acids, + logger, + f"prior-samples-{model_identifier}" + ) + logger.info(f"Protein analysis completed.\n") + +# call it +if __name__ == "__main__": + app() + diff --git a/bin/miscellaneous.py b/bin/miscellaneous.py new file mode 100755 index 0000000..6da79e0 --- /dev/null +++ b/bin/miscellaneous.py @@ -0,0 +1,836 @@ +# PREVENT: PRotein Engineering by Variational frEe eNergy approximaTion +# Copyright (C) 2024 Giovanni Stracquadanio, Evgenii Lobzaev + +# This program is free software: you can redistribute it and/or modify +# it under the terms of the GNU Affero General Public License as published +# by the Free Software Foundation, either version 3 of the License, or +# (at your option) any later version. + +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU Affero General Public License for more details. + +# You should have received a copy of the GNU Affero General Public License +# along with this program. If not, see . 
# rebalance training/validation sets to achieve desired proportions
#
# The IDs found in ${pre_validation_fasta_file} form the initial validation set,
# every other ID of ${combined_fasta_file} forms the initial train set.
# IDs are then moved at random (controlled by ${seed}) from the larger-than-required
# set to the other one until the validation set holds int(val_pct * N) records.
# Both sets are written as FASTA and passed to compute_stats() together with the
# fixed filenames "train-set-stats.txt" / "validation-set-stats.txt".
@various_app.command("rebalance-sets")
def rebalance_sets(
        combined_fasta_file       : str,         # contains all clean sequences
        pre_validation_fasta_file : str,         # fasta file which was obtained by mmseqs2 clustering
        train_set_filename        : str,         # filename for train set FASTA file
        validation_set_filename   : str,         # filename for validation set FASTA file
        log_filename              : str,         # filename for log file
        val_pct                   : float = 0.2, # pct of total sequences that should be in validation set
        seed                      : int = 0      # random seed
    ) -> None:

    # inline function: records (in file order) whose ID belongs to ${subset_of_seq_ids}
    def obtain_records(all_records: list, subset_of_seq_ids) -> list:
        # a set gives O(1) membership tests; a list would be scanned once per record
        wanted = set(subset_of_seq_ids)
        return [record for record in all_records if record.id in wanted]

    # inline function: write one set as FASTA and hand it to compute_stats
    def save_set(records: list, fasta_filename: str, stats_filename: str) -> None:
        SeqIO.write(records, fasta_filename, "fasta")
        compute_stats(records, stats_filename)

    # make sure val_pct is in [0.0;0.5]
    assert 0.0<=val_pct<=0.5, "Validation percent argument must be between 0.0 and 0.5"

    # set seed
    random.seed(seed)

    # we will create a logger for this operation
    setup_logger( 'logger', log_filename, level = logging.INFO )
    logger = logging.getLogger('logger')

    ################################## LOAD AS IS: BEFORE REBALANCING #######################

    # all records and their (sorted) IDs
    all_records     = list(SeqIO.parse(combined_fasta_file, "fasta"))
    all_records_ids = sorted(record.id for record in all_records)

    # IDs initially assigned to validation
    pre_val_seq_ids = sorted(record.id for record in SeqIO.parse(pre_validation_fasta_file, "fasta"))

    # IDs initially assigned to train: everything that is not in validation.
    # Lists are kept sorted so that random.sample() is reproducible for a given seed.
    pre_train_seq_ids = sorted(set(all_records_ids) - set(pre_val_seq_ids))

    n_all            = len(all_records_ids)
    n_pre_validation = len(pre_val_seq_ids)
    n_pre_train      = len(pre_train_seq_ids)

    # percentages below divide by n_all, so fail early with a readable message
    if n_all == 0:
        raise ValueError(f"No records found in {combined_fasta_file}: nothing to rebalance.")

    val_pct_effective   = n_pre_validation/n_all * 100
    train_pct_effective = n_pre_train/n_all * 100

    # number of samples required to be in train/validation sets
    required_n_val   = int(val_pct * n_all)
    required_n_train = n_all - required_n_val

    # log this information
    str_  = "Before rebalancing...\n"
    str_ += f"Total number of records : {n_all}\n"
    str_ += f"Number of records in validation file before rebalancing : {n_pre_validation} ({val_pct_effective:0.4f})%\n"
    str_ += f"Number of records in train file before rebalancing : {n_pre_train} ({train_pct_effective:0.4f})%\n"
    str_ += f"Required number of records in validation set : {required_n_val}\n"
    str_ += f"Required number of records in train set : {required_n_train}\n"
    logger.info(str_)

    # fails when IDs are duplicated or when a validation ID is missing from the combined file
    assert n_pre_train + n_pre_validation == n_all, "Total number of records must be equal to number of records in train and validation sets before rebalancing."

    ################################## DECIDE WHAT TO MOVE #######################
    if n_pre_validation > required_n_val:
        # 1. too many sequences in validation set: move the surplus to train set
        n_seq_to_move   = n_pre_validation - required_n_val
        seq_ids_to_move = random.sample(pre_val_seq_ids, n_seq_to_move)
        moved           = set(seq_ids_to_move)
        train_ids       = set(pre_train_seq_ids) | moved
        validation_ids  = set(pre_val_seq_ids) - moved
        headline        = f"Rebalancing from validation set into train set. {n_seq_to_move} will be moved.\n"
        suffix          = " after rebalancing"
    elif n_pre_validation < required_n_val:
        # 2. too few sequences in validation set: move the shortfall from train set
        n_seq_to_move   = required_n_val - n_pre_validation
        seq_ids_to_move = random.sample(pre_train_seq_ids, n_seq_to_move)
        moved           = set(seq_ids_to_move)
        validation_ids  = set(pre_val_seq_ids) | moved
        train_ids       = set(pre_train_seq_ids) - moved
        headline        = f"Rebalancing from train set into validation set. {n_seq_to_move} will be moved.\n"
        suffix          = " after rebalancing"
    else:
        # 3. required pct is already satisfied: save as is
        seq_ids_to_move = None
        train_ids       = pre_train_seq_ids
        validation_ids  = pre_val_seq_ids
        headline        = "No need for rabalancing.\n"
        suffix          = ""

    ################################## BUILD, LOG, SAVE #######################
    train_records      = obtain_records(all_records, train_ids)
    validation_records = obtain_records(all_records, validation_ids)

    n_train_after_rebalancing = len(train_records)
    n_val_after_rebalancing   = len(validation_records)

    val_pct_effective   = n_val_after_rebalancing/n_all * 100
    train_pct_effective = n_train_after_rebalancing/n_all * 100

    str_  = headline
    str_ += f"Number of records in validation file{suffix} : {n_val_after_rebalancing} ({val_pct_effective:0.4f})%\n"
    str_ += f"Number of records in train file{suffix} : {n_train_after_rebalancing} ({train_pct_effective:0.4f})%\n"
    if seq_ids_to_move is not None:
        str_ += "Moved sequences:\n"
        str_ += "".join(f"{seq}\n" for seq in seq_ids_to_move)
    # the summary is logged in every case, including when nothing had to be moved
    logger.info(str_)

    assert n_train_after_rebalancing + n_val_after_rebalancing == n_all, "Total number of records must be equal to number of records in train and validation sets after rebalancing."

    # save both sets and their stats
    save_set(train_records, train_set_filename, "train-set-stats.txt")
    save_set(validation_records, validation_set_filename, "validation-set-stats.txt")
# preprocess input: remove duplicates/ keep sequences of certain length/ remove sequences with non-canonical AA
#
# Records are taken from ${fasta_files} in the given order; the first record seen for an ID wins.
# A record is kept when Lmin <= len(sequence) <= Lmax and pass_filter(record, w2i) accepts it.
# Raises ValueError when no record survives the filtering.
@various_app.command("preprocess-input")
def join_sequences(
        fasta_files     : List[str],     # list of FASTA files to preprocess
        output_filename : str,           # filename for the final output
        logger_name     : str,           # logger filename
        Lmin            : int = 10,      # minimum length threshold for inclusion
        Lmax            : int = 300      # maximum length threshold for inclusion
    ) -> None:

    # we will create a logger for this operation
    setup_logger( 'logger', logger_name, level = logging.INFO )
    logger = logging.getLogger('logger')

    # first pass: merge files, drop duplicated IDs and sequences outside [Lmin, Lmax]
    unique_records = []
    seen_ids       = set()   # set membership is O(1); a list would make this pass quadratic

    for fasta_file in fasta_files:
        # number of records accepted from this file
        local_counter = 0
        for record in SeqIO.parse(fasta_file, "fasta"):
            if record.id in seen_ids:
                continue
            if not (Lmin <= len(record.seq) <= Lmax):
                continue
            unique_records.append(record)
            seen_ids.add(record.id)
            local_counter += 1

        # print info for a file
        logger.info(f"Number of entries in the input file {fasta_file}: {local_counter}")

    # second pass: remove non-canonical AAs
    # create dictionary
    w2i,_ = default_w2i_i2w()

    # run the filter once per record and split into clean/bad
    # (assumes pass_filter returns a boolean - TODO confirm against utilities.pass_filter)
    clean_records = []
    bad_records   = []
    for record in unique_records:
        if pass_filter(record, w2i):
            clean_records.append(record)
        else:
            bad_records.append(record)

    logger.info(f"Number of filtered records : {len(clean_records)}")
    logger.info(f"Number of records with non-canonical AAs : {len(bad_records)}")

    # real min and max lengths (only defined when something is left)
    if clean_records:
        lengths   = [len(record.seq) for record in clean_records]
        Lmin_real = min(lengths)
        Lmax_real = max(lengths)

        str_  = f"Minimum sequence length in the filtered records FASTA file: {Lmin_real}\n"
        str_ += f"Maximum sequence length in filtered records FASTA file : {Lmax_real}"
        logger.info(str_)

    # print IDs of sequences with non canonical AAs
    if bad_records:
        str_  = "(removed) records with non-canonical AAs:\n"
        str_ += "".join(f"\t{r.id}\n" for r in bad_records)
        logger.info(str_)

    # nothing to save: stop with an explicit message instead of failing inside min()
    if not clean_records:
        raise ValueError(
            f"No sequences left after filtering (Lmin={Lmin}, Lmax={Lmax}); {output_filename} was not written."
        )

    # save as new file
    SeqIO.write(
        clean_records,
        output_filename,
        "fasta"
    )
# remove sequences (by ID), listed in ${id_file} from ${input} file and save result in ${output}
# ${id_file} holds one ID per line; records are rebuilt with an empty name before writing
@various_app.command("remove-sequences")
def remove_sequences(
        id_file : str,      # id txt file
        input   : str,      # input FASTA file
        output  : str,      # output FASTA file
    )->None:
    with open(id_file, mode='r', encoding='utf-8') as file:
        ids = set(file.read().splitlines())

    records = [
        SeqRecord(record.seq, id=record.id, description=record.description, name='')
        for record in SeqIO.parse(input, 'fasta')
        if record.id not in ids
    ]
    SeqIO.write(records, output, "fasta")


# split single fasta file (output of mmseqs) into multiple
# obtain elements of various clusters (as FASTA) from a joint FASTA file
#
# A record with an empty sequence marks the start of a new cluster; the records that
# follow it (up to the next marker) are written to {template_name}-{k}.fasta, k = 1,2,...
# Records that appear before the first marker are treated as the first cluster.
# An input without any record produces no output file.
@various_app.command("mmseqs-split")
def mmseq2clusters(
        all_seqs_fasta : str,   # fasta file with all sequences
        template_name  : str    # template for saving clusters: {template}-xxx.fasta

    ) -> None:

    # inline function: write one cluster under its running number
    def save_cluster(cluster_records: list, number: int) -> None:
        SeqIO.write(
            cluster_records,
            f"{template_name}-{number}.fasta",
            "fasta"
        )

    # None means "no cluster opened yet"
    subset_records = None

    # cluster counter
    cnt = 0

    # stream the records; no need to materialise the list and pop(0) from it
    for current_record in SeqIO.parse(all_seqs_fasta, "fasta"):
        if current_record.seq == "":
            # cluster marker: save the cluster collected so far (if any) ...
            if subset_records is not None:
                cnt += 1
                save_cluster(subset_records, cnt)
            # ..., then start a new one
            subset_records = []
        else:
            # member record: open an implicit first cluster if the file has no leading marker
            if subset_records is None:
                subset_records = []
            subset_records.append(current_record)

    # at the end all but last cluster have been saved: save final cluster
    if subset_records is not None:
        cnt += 1
        save_cluster(subset_records, cnt)
#### compute and plot sequence coverage
#
# The first row of the MSA is the query (VAE sample); all other rows are the reference set.
# For every non-gapped query position two percentages (relative to the number of reference
# rows) are computed: rows that are not gapped there, and rows with the same residue as the query.
# Raises ValueError when the alignment has no reference rows.
@various_app.command("sequence-coverage")
def seqcoverage(
        alignment_file : str,  # MSA alignment file
        csv_filename   : str,  # filename for csv (contains coverage information)
        fig_filename_1 : str,  # filename for plot for full coverage
        fig_filename_2 : str,  # filename for plot with exact matches
    ) -> None:

    # inline function: save plots
    def plot(array,seqlbl,yaxislbl,filename):
        fig,ax = plt.subplots(nrows=1,ncols=1,figsize=(8,10))
        try:
            ax.plot(
                range(1,len(array)+1),  # x: sequence position
                np.array(array),        # y: coverage (either exact match or number of non-gapped columns in that position)
                linestyle = '-',
                color     = 'black',
                label     = seqlbl
            )
            ax.set_xlabel("query sequence position")
            ax.set_ylabel(yaxislbl)
            ax.set_xlim(0,len(array)+1)
            ax.set_ylim(0,100)
            ax.legend()

            fig.savefig(filename)
        finally:
            # release the figure; pyplot keeps every figure alive until it is closed
            plt.close(fig)

    # open MSA file
    aln = AlignIO.read(
        alignment_file,
        "fasta"
    )

    # percentages are relative to the number of reference rows, so at least one is required
    msa_len = len(aln) - 1
    if msa_len < 1:
        raise ValueError(
            f"{alignment_file} must contain the query sequence and at least one aligned sequence."
        )

    aln_ex_VAE = aln[1:,:]  # this is MSA excluding VAE sample, which is 1st row of MSA file
    vae_sample = aln[0]     # this is VAE sample

    seq_coverage            = []  # % of reference rows that are not gapped at a given query position
    seq_coverage_full_match = []  # % of reference rows with the same AA at a given query position

    # loop over gapped sequence and consider only non-gapped elements
    for clmn,element in enumerate(str(vae_sample.seq)):
        if element == "-":
            continue

        # extract column from alignment (index is clmn)
        aln_column = aln_ex_VAE[:,clmn] # 'str' type

        # how many non-gapped elements there are
        non_gapped_cnt = len(aln_column) - aln_column.count("-")

        # how many sequences have the same AA in MSA
        element_cnt = aln_column.count(element)

        # append (make numbers relative to length of MSA)
        seq_coverage.append((non_gapped_cnt/msa_len) * 100)
        seq_coverage_full_match.append((element_cnt/msa_len) * 100)

    # save results as csv
    data = {
        "coverage"    : seq_coverage,
        "exact-match" : seq_coverage_full_match
    }
    df = pd.DataFrame(data)
    df.to_csv(csv_filename)

    # plot results
    seqlbl = vae_sample.id

    # full coverage
    plot(
        seq_coverage,
        seqlbl,
        "sequences,%",
        fig_filename_1
    )

    # exact match
    plot(
        seq_coverage_full_match,
        seqlbl,
        "sequences with same AA,%",
        fig_filename_2
    )
#### compute and extract sequence certainty
#
# The FASTA file holds a single record whose ID looks like seq-N-temperature-X; the tuple
# number N-1 of data["VAE"] in the pickle file is taken as the matching entry.
# Both IDs are printed so that the match can be checked by eye.
# Raises IndexError when N-1 is not a valid position in that list.
@various_app.command("sequence-certainty")
def seqcertainty(
        fastafile    : str,   # fasta file with single entry
        picklefile   : str,   # pickle file that contains all information about sequences
        temperature  : float, # temperature for this sequence
        fig_filename : str,   # filename to save pdf file
        csv_filename : str    # filename to save csv file

    ) -> None:
    # extract sequence ID
    id_ = [record.id for record in SeqIO.parse(fastafile,"fasta")][0] # single entry, so we extract first element of list

    # obtain a list of tuples
    # each tuple is (seq,logp(seq),associated z,id,description,seq certainty) as (list[str],float,numpy,str,str,numpy)
    # NOTE: pickle executes arbitrary code on load; only use files produced by this pipeline
    with open(picklefile, "rb") as handle:
        data = pickle.load(handle)
    list_of_tuples = data["VAE"]

    # extract a list item by index
    # seqID = seq-N-temperature-X -> we need N (to be precise N-1)
    index = int(
        id_.split('-')[1]
    ) - 1

    # a negative index would silently wrap around to the end of the list
    if not 0 <= index < len(list_of_tuples):
        raise IndexError(
            f"Sequence {id_} points to entry {index + 1}, but {picklefile} holds {len(list_of_tuples)} entries."
        )

    tpl = list_of_tuples[index]

    # extract seqID and certainty measure from tuple
    seqID     = tpl[3] # string
    certainty = tpl[5] # list

    # for T = 0.0 it is p(best) - p(2nd best option): the higher the value in each position the better
    # for T > 0.0 it is p(best) - p(chosen)         : the lower the value in each position, the better
    # we will plot the quantity 1 - prob difference : the higher the value in each position, the better
    if (temperature == 0.0):
        seq_certainty_np = np.array(certainty)
    else:
        seq_certainty_np = 1.0 - np.array(certainty)

    ### printing just to make sure the extracted sequence is what we need
    str_  = f"Sequence ID from FASTA file : {id_}.\n"
    str_ += f"Sequence ID from pickle file : {seqID}.\n"
    print(str_)

    # plot certainty
    fig,ax = plt.subplots(nrows=1,ncols=1,figsize=(8,10))
    try:
        ax.plot(
            range(1,len(certainty)+1),   # x: sequence position
            seq_certainty_np,            # y: sequence certainty
            linestyle = '-',
            color     = 'black',
            label     = seqID
        )
        ax.set_xlabel("sequence position")
        # y label: sequence certainty
        ax.set_ylabel("sequence certainty")
        ax.set_xlim(0,len(certainty)+1)
        ax.set_ylim(0,1.1) # probability range is [0,1]
        ax.legend()
        fig.savefig(fig_filename)
    finally:
        # release the figure; pyplot keeps every figure alive until it is closed
        plt.close(fig)

    # save csv
    data = {
        "certainty" : seq_certainty_np
    }
    df = pd.DataFrame(data)
    df.to_csv(csv_filename)
#### split FASTA file into individual FASTA files
# every record is written to "{record.id}.fasta" in the working directory
@various_app.command("sequence-split")
def seqsplit(
        master_fasta_file : str # filename of aggregate fastafile
    ) -> None:
    # loop over records and save them individually
    for record in SeqIO.parse(master_fasta_file,"fasta"):
        SeqIO.write(
            [record],
            f"{record.id}.fasta",
            "fasta"
        )

### compute sequence weights from distance matrix
#
# The matrix file has one header row (skipped), then one row per sequence:
# the sequence ID followed by whitespace-separated values.
# weight(seq) = 100 / (average value of its row, excluding the self-entry assumed to be 100).
# With a single sequence there is nothing to average over, so its weight is set to 1.0.
@various_app.command("distmat-weights")
def seq_weights_from_distmat(
        distmat_file : str, # distance matrix from clustalo
        pickle_name  : str, # filename for pickle file (will pass to Dataset construction later)
        csv_name     : str  # filename for csv (will save for the record)
    ) -> None:
    # now open and parse distmat_file
    df_distances = pd.read_csv(
        distmat_file,       # file with matrix that is output of clustalo
        skiprows = [0],     # skip first row, which only contains number of strings
        header   = None,    # no headers
        sep      = r"\s+"   # split everything by 1 or more whitespaces (raw string: "\s" is not a valid str escape)
    )

    # weights: dict
    weights = {}

    # extract column 0 as list
    ids = df_distances.iloc[:,0].to_list()

    # extract everything else as numpy
    identity_matrix = df_distances.iloc[0:,1:].to_numpy()
    N = identity_matrix.shape[0] # number of elements in matrix

    # populate weights: seqID -> weight
    for i,id_ in enumerate(ids):
        if N > 1:
            # we just subtract identity value of a sequence to itself
            avg_identity = (np.sum(identity_matrix[i,:]) - 100.00)/(N-1)
            weights[id_] = 100.0/avg_identity
        else:
            # single sequence: (N-1) == 0, the average is undefined
            weights[id_] = 1.0

    # need to save weights as csv
    df = pd.DataFrame(
        list(weights.items()),
        columns = ['ID','Weight']
    )
    df.to_csv(csv_name)

    # and as pickle (context manager guarantees the file is flushed and closed)
    with open(pickle_name,"wb") as handle:
        pickle.dump(weights, handle)
### compute default sequence weights (assume they are 1.0)
### this is just to have pickle/csv file in line with previous function
@various_app.command("default-weights")
def seq_weights_default(
        fasta_file  : str, # fasta file with sequences
        pickle_name : str, # filename for pickle file (will pass to Dataset construction later)
        csv_name    : str  # filename for csv (will save for the record)
    ) -> None:
    # set default weights to 1.0
    weights = {record.id: 1.0 for record in SeqIO.parse(fasta_file,"fasta")}

    # need to save weights as csv
    df = pd.DataFrame(
        list(weights.items()),
        columns = ['ID','Weight']
    )
    df.to_csv(csv_name)

    # and as pickle (context manager guarantees the file is flushed and closed)
    with open(pickle_name,"wb") as handle:
        pickle.dump(weights, handle)

### append energy term to WT fasta
# every record ID becomes "{id}:{free_energy_wt}"; sequence and description are kept
@foldx_app.command("add-energy-wt")
def append_energy_wt(
        wt_fasta_file     : str,        # input FASTA file
        wt_fasta_filename : str,        # FASTA filename to save
        free_energy_wt    : float = 0.0 # energy value of WT
    ):

    # append Free Energy to ID: id -> id:(free)energy
    new_records = [
        SeqRecord(
            old_record.seq,
            id          = f"{old_record.id}:{free_energy_wt}",
            description = old_record.description
        )
        for old_record in SeqIO.parse(wt_fasta_file,"fasta")
    ]

    # save
    SeqIO.write(new_records,wt_fasta_filename,"fasta")
## function to generate mutants in the appropriate form for FoldX
#
# Uses the first record of ${wt_fasta_file} as wild type. For each of the ${n_mutants} mutants,
# ${n_mutation_sites} distinct positions (never position 0) are drawn with numpy's global RNG
# and passed to mutate(); the returned FoldX string is appended to "individual_list.txt"
# (working directory) and the mutated sequence is stored under the ID "{pdb_reference}_{k}".
# Raises ValueError when more mutation sites are requested than positions are available.
@foldx_app.command("generate-mutants")
def generate_mutants(
        wt_fasta_file    : str,      # FASTA file with WT (doesn't really matter if Free Energy is appended or not)
        pdb_reference    : str,      # PDB reference name
        output_filename  : str,      # FASTA filename for mutants
        n_mutation_sites : int = 5,  # how many mutations to make
        n_mutants        : int = 10, # how many different mutants to generate
        seed             : int = 0,  # random seed to control random sampling
    ):

    # fix seed (global numpy RNG, as in every other sampling step of this function)
    np.random.seed(seed)

    # open WT seq
    wt = [record for record in SeqIO.parse(wt_fasta_file,"fasta")][0]

    # WT sequences as list: ["N","A","L",...]
    wt_seq = list(str(wt.seq))
    wt_id  = wt.id

    print("length of WT:",len(wt_seq))

    # our positions to mutate (don't mutate first one)
    positions_to_mutate = list(range(1,len(wt_seq)))

    # sampling is without replacement, so we cannot ask for more sites than positions
    if n_mutation_sites > len(positions_to_mutate):
        raise ValueError(
            f"Cannot pick {n_mutation_sites} mutation sites out of {len(positions_to_mutate)} available positions."
        )

    # mutant records
    mutant_records = []

    # the context manager closes the list file even if mutate() or sampling fails
    with open("individual_list.txt", "w") as f:
        # loop over mutants
        for i in range(n_mutants):
            # sample which positions in a sequence to mutate
            chosen_positions = np.random.choice(
                positions_to_mutate,        # sample from this list
                size    = n_mutation_sites, # how many samples
                replace = False             # no replacement, as we can't have [1,1,1,...]
            )
            # sort in ascending order
            mutation_sites = sorted(chosen_positions)

            print("Mutation sites:",mutation_sites)

            # get FoldX representation and mutated sequence
            foldx_representation,mutant = mutate(
                copy.deepcopy(wt_seq), # just a copy of our WT
                mutation_sites,        # positions to mutate
                chainA_only = True     # only single chain
            )

            # add FoldX representation
            f.write(foldx_representation)
            f.write('\n')

            # add mutant to FASTA
            # id will follow FoldX convention for easy matching
            description_ = f"reference-uniprot:{wt_id}||refence-pdb:{pdb_reference}||mutations:{foldx_representation}"
            id_          = f"{pdb_reference}_{i+1}"
            print("ID:",id_)
            mutant_record = SeqRecord(
                Seq(
                    "".join(mutant),
                ),
                id          = id_,
                description = description_
            )
            print(mutant_record)
            print("-"*10)

            mutant_records.append(mutant_record)

    # write to FASTA
    SeqIO.write(mutant_records,output_filename,"fasta")
## append energy term to mutant FASTA
#
# ${mutant_file_csv} has no header; column 0 holds record IDs, column 1 the energy estimates.
# Every record ID becomes "{id}:{energy}" and the FASTA file is rewritten under the same name.
# Raises KeyError when a record ID has no row in the CSV file.
@foldx_app.command("add-energy-mutant")
def append_energy_mutants(
        mutant_fasta_file : str, # FASTA file with mutant sequences but no energy
        mutant_file_csv   : str  # CSV file with mutant energy estimates
    ):
    # open and parse mutant_file_csv
    df_energy = pd.read_csv(
        mutant_file_csv,
        header = None,
        sep    = ","
    )

    # energy as lookup: id -> energy
    d_energy = dict(
        zip(
            df_energy.iloc[:,0].to_list(),
            df_energy.iloc[:,1].to_list()
        )
    )

    # now update fasta file
    new_records = []
    for old_record in SeqIO.parse(mutant_fasta_file,"fasta"):
        old_id = old_record.id
        if old_id not in d_energy:
            raise KeyError(f"No energy estimate for {old_id} in {mutant_file_csv}")
        energy_term = d_energy[old_id]

        # the parsed description starts with the ID, so we keep the token after the first space;
        # a header that consists of the ID only has no such token -> empty description
        tokens       = old_record.description.split(" ")
        description_ = tokens[1] if len(tokens) > 1 else ""

        # append Free Energy to ID: id -> id:(free)energy
        id_ = f"{old_id}:{energy_term}"
        print("New ID:",id_)
        new_record = SeqRecord(
            old_record.seq,
            id          = id_,
            description = description_
        )
        print(new_record)
        print("-"*10)

        new_records.append(new_record)

    # save under the same name
    SeqIO.write(new_records,mutant_fasta_file,"fasta")
old_record.seq, + id = id_, + description = description_ + ) + print(new_record) + print("-"*10) + + new_records.append(new_record) + + # save under the same name + SeqIO.write(new_records,mutant_fasta_file,"fasta") + +# call it +if __name__ == "__main__": + app() + + + + \ No newline at end of file diff --git a/bin/models.py b/bin/models.py new file mode 100755 index 0000000..ec6695a --- /dev/null +++ b/bin/models.py @@ -0,0 +1,824 @@ +# PREVENT: PRotein Engineering by Variational frEe eNergy approximaTion +# Copyright (C) 2024 Giovanni Stracquadanio, Evgenii Lobzaev + +# This program is free software: you can redistribute it and/or modify +# it under the terms of the GNU Affero General Public License as published +# by the Free Software Foundation, either version 3 of the License, or +# (at your option) any later version. + +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU Affero General Public License for more details. + +# You should have received a copy of the GNU Affero General Public License +# along with this program. If not, see . + +#!/usr/bin/env python3 +# -*- coding: utf-8 -*- +""" +Various layers and Neural Networks. +# check: +https://github.com/oriondollar/TransVAE/tree/master/transvae +https://github.com/Fraser-Greenlee/transformer-vae + +TODO: +# VAE THAT DECODES BOTH SEQUENCE AND PROPERTY +- Check if we need to use memory_key_padding_mask in line 189/256 (right now mask is used) + Logic: we don't use encoder output, but rather stochastic representation of the encoder output. + Does it make sense to mask out positions from the encoder output? 
# Positional Encoding, taken from pytorch: https://pytorch.org/tutorials/beginner/transformer_tutorial.html
class PositionalEncodingPytorch(nn.Module):
    """Add fixed sinusoidal position information to a sequence-first embedding and apply dropout.

    Even embedding channels hold sin(position * frequency), odd channels hold
    cos(position * frequency). Both even and odd ``d_model`` are supported.
    """

    def __init__(self, d_model: int, dropout: float = 0.1, max_len: int = 5000):
        super().__init__()
        self.dropout = nn.Dropout(p=dropout)

        position = torch.arange(max_len).unsqueeze(1)
        div_term = torch.exp(torch.arange(0, d_model, 2) * (-math.log(10000.0) / d_model))
        pe = torch.zeros(max_len, 1, d_model)
        pe[:, 0, 0::2] = torch.sin(position * div_term)
        # for odd d_model there is one cosine channel less than sine channels,
        # so only the first d_model // 2 frequencies are used (no-op for even d_model)
        pe[:, 0, 1::2] = torch.cos(position * div_term[: d_model // 2])
        # buffer: saved in the state_dict and moved with the module, but not trained
        self.register_buffer('pe', pe)

    def forward(self, x):
        """
        Args:
            x: Tensor, shape [seq_len, batch_size, embedding_dim]
        """
        x = x + self.pe[:x.size(0)]
        return self.dropout(x)

# small MLP (used inside TransformerVAE)
class MLP(nn.Module):
    """Five linear layers with ReLU in between: input_dim -> 64 -> 32 -> 16 -> 4 -> 1."""

    def __init__(self,input_dim):
        super().__init__()

        # input dimensionality
        self.input_dim = input_dim

        # MLP with 5 layers
        # input_dim -> 64 -> 32 -> 16 -> 4 -> 1
        self.layers = nn.Sequential(
            nn.Linear(input_dim,64),
            nn.ReLU(),
            nn.Linear(64,32),
            nn.ReLU(),
            nn.Linear(32,16),   # project to 16-dim vector space
            nn.ReLU(),
            nn.Linear(16,4),    # project to 4-dim vector space
            nn.ReLU(),
            nn.Linear(4,1)      # project to 1-dim vector space (no ReLU is used as target output is mostly negative)
        )

    def forward(self,X):
        """Map X of shape [..., input_dim] to a tensor of shape [..., 1]."""
        out = self.layers(X)
        return out
pad_idx, # pad_idx + sos_idx, # sos idx + eos_idx, # eos idx + unk_idx, # unk idx + device, # device (cpu/gpu) + embedding_size = 512, # embedding dimensionality + latent_size = 64, # latent space dimensionality + num_layers_encoder = 6, # how many blocks to use in encoder + num_layers_decoder = 4, # how many blocks to use in decoder + heads = 8, # embedding size should be divisible by heads + dropout_prob = 0.1, # dropout probability + condition_on_energy = False # whether to scale latent variable z by predicted energy: False means z->energy, z->sequence; True means z->energy, z*energy->sequence + + ): + super(TransformerVAE,self).__init__() + + # variables + self.vocab_size = vocab_size + self.max_seq_length = max_seq_length + self.pad_idx = pad_idx + self.sos_idx = sos_idx + self.eos_idx = eos_idx + self.unk_idx = unk_idx + self.embedding_size = embedding_size + self.latent_size = latent_size + self.num_layers_encoder = num_layers_encoder + self.num_layers_decoder = num_layers_decoder + self.heads = heads + self.dropout_prob = dropout_prob + self.device = device + self.condition_on_energy = condition_on_energy + + # embedding layer + self.embedding = nn.Embedding(vocab_size,embedding_size,padding_idx = pad_idx) + + # positional embedding + self.positional_embedding = PositionalEncodingPytorch(embedding_size,dropout=dropout_prob) + + # MLP: logits -> MLP -> energy + # z size: [Batch, Latent size] -> input_dim: Latent size + self.mlp2energy = MLP( + latent_size + ) + + # transformer + #self.transformer = nn.Transformer(d_model = embedding_size,nhead=heads) + self.transformer_encoder = nn.TransformerEncoder( + nn.TransformerEncoderLayer(embedding_size,heads,batch_first = True,dropout=dropout_prob), # transformer encoder layer + num_layers_encoder # how many layers to have + ) + + self.transformer_decoder = nn.TransformerDecoder( + nn.TransformerDecoderLayer(embedding_size,heads,batch_first = True,dropout=dropout_prob), # transformer decoder layer + 
num_layers_decoder # how many layers to have + ) + + # latent to mean/standard deviation + self.hidden2mean = nn.Linear(embedding_size * max_seq_length, latent_size) + self.hidden2logv = nn.Linear(embedding_size * max_seq_length, latent_size) + + # latent to input to decoder + self.latent2embed = nn.Linear(latent_size, embedding_size * max_seq_length) + + # final step: convert to vocab_size + self.out = nn.Linear(embedding_size, vocab_size) + + def create_pad_mask(self, matrix: torch.tensor, pad_token: int) -> torch.tensor: + # If matrix = [1,2,3,0,0,0] where pad_token=0, the result mask is + # [False, False, False, True, True, True] + return (matrix == pad_token) + + def create_attn_mask(self, size) -> torch.tensor: + # Generates a square matrix where the each row allows one word more to be seen + mask = torch.tril(torch.ones(size, size) == 1) # Lower triangular matrix + mask = mask.float() + mask = mask.masked_fill(mask == 0, float('-inf')) # Convert zeros to -inf + mask = mask.masked_fill(mask == 1, float(0.0)) # Convert ones to 0 + mask = mask.to(self.device) + + # EX for size=5: + # [[0., -inf, -inf, -inf, -inf], + # [0., 0., -inf, -inf, -inf], + # [0., 0., 0., -inf, -inf], + # [0., 0., 0., 0., -inf], + # [0., 0., 0., 0., 0.]] + return mask + + def forward(self,src,tgt,masking_prob = 0.0): + # src : (Batch Size, Src Seq Length) + # tgt : (Batch Size, Tgt Seq Length) + # masking_prob : probability of masking any AA in decoder input (tgt) + + batch_size = src.size(0) + + # get pad masks: [Batch Size, Seq Length] + src_pad_mask = self.create_pad_mask(src,self.pad_idx) + tgt_pad_mask = self.create_pad_mask(tgt,self.pad_idx) + + # replace certain elements in tgt with + if masking_prob > 0.0: + # generate random numbers + prob = torch.rand( + tgt.size(), + dtype = torch.float, + device = self.device + ) + # never replace , + prob[(tgt.data - self.sos_idx) * (tgt.data - self.pad_idx) == 0] = 1 + + # now replace the rest of tokens (AAs) with randomly + tgt[prob < 
masking_prob] = self.unk_idx + + # get attention mask (used in decoder, so applied to tgt) + tgt_attn_mask = self.create_attn_mask(tgt.size(1)) # size(1) is Tgt Seq Length + + # do embedding (dense + positional) -> [ Batch Size, Seq Length, Embedding size ] + src_emb = self.positional_embedding( + self.embedding(src).transpose(0,1) # embedding: [Batch Size, Seq Lengh] - > [Batch Size, Seq Length, Embedding Size] -> (transpose) -> [Seq Length, Batch Size, Embedding Size] + ).transpose(0,1) # [Seq Length, Batch Size, Embedding Size] + + # same + tgt_emb = self.positional_embedding( + self.embedding(tgt).transpose(0,1) + ).transpose(0,1) + + # pass through encoder + # only padding mask is needed here + encoder_out = self.transformer_encoder(src_emb,src_key_padding_mask = src_pad_mask) # size: [Batch Size, Seq Length, Embedding Size] + + # reshape: [Batch Size, Seq Length, Embedding Size] -> [Batch Size, Seq Length * Embedding Size] + encoder_out = encoder_out.reshape(batch_size,self.max_seq_length*self.embedding_size) + + # to mean and standard deviation + mean = self.hidden2mean(encoder_out) + logv = self.hidden2logv(encoder_out) + std = torch.exp(0.5 * logv) + + # do reparametrisation trick + z = torch.randn( + [batch_size, self.latent_size], + dtype = torch.float, + device = self.device + ) + # [Batch Size, Latent Size] # this is our latent representation + z = z * std + mean + + # predict energy from z : [Batch Size, 1] + energy = self.mlp2energy(z) + + # scale energy (this wont change dimensionality of z, so we can pass it safely to self.latent2embed) + # use scaled latent vector z as stochastic memory representation + if self.condition_on_energy: + z_tilda = z * energy + else: + z_tilda = z + + # stochastic representation of encoder output: + # [Batch Size, Latent Size] -> [Batch Size, Seq Lenth * Embedding Size] -> [Batch Size, Seq Length, Embedding Size] + enc_memory_stochastic = 
self.latent2embed(z_tilda).reshape(batch_size,self.max_seq_length,self.embedding_size) + + # pass through decoder + out = self.transformer_decoder( + tgt_emb, + enc_memory_stochastic, + tgt_mask = tgt_attn_mask, # prohibit unwanted attention + tgt_key_padding_mask = tgt_pad_mask, # pad indicies for target (will be ignored) + memory_key_padding_mask = src_pad_mask # pad indices for source (will be ignored) : TODO: DEBATABLE IF NEEDED TO BE USED! + ) + + # [Batch Size, Sequence Length, Embedding Size] -> [Batch, Sequence Length, Vocab Size] + out = self.out(out) + + # convert to logp by applying log_softmax along last dimension + logp = nn.functional.log_softmax( + out, + dim = -1 + ) + + + + return logp, mean, logv, energy + + # do forward pass through encoder only + def __precompute_stochastic_memory( + self, + src, # tensor with numerical representation of seed sequence: dataloader -> batch["input"] + ): + + batch_size = src.size(0) + + # get pad masks + src_pad_mask = self.create_pad_mask(src,self.pad_idx) + # do embedding (dense + positional) -> [ Batch Size, Seq Length, Embedding size ] + src_emb = self.positional_embedding( + self.embedding(src).transpose(0,1) + ).transpose(0,1) + # pass through encoder + encoder_out = self.transformer_encoder(src_emb,src_key_padding_mask = src_pad_mask) # size: [Batch Size, Seq Length, Embedding Size] + + # reshape: [Batch Size, Seq length * Embedding Size] + encoder_out = encoder_out.reshape(batch_size,self.max_seq_length*self.embedding_size) + + # to mean and standard deviation + mean = self.hidden2mean(encoder_out) + logv = self.hidden2logv(encoder_out) + std = torch.exp(0.5 * logv) + + return mean,std,src_pad_mask + + # a pass through decoder + def __get_logits_logp(self,encoder_output,tgt,memory_pad_mask = None): + # ENCODER output is a constant thing [Batch Size, Seq Length, Embedding Size] + # either + # prior(z) -> latent2embed -> reshape + # or + # posterior(z) -> latent2embed -> reshape + + # TGT will be changed in 
# sample from the prior
def sample_from_latent_space(self,
                             batch_size,
                             max_length = 100,
                             z = None,
                             argmax = True
                             ):
    """Decode ``batch_size`` sequences token by token from latent vectors.

    Parameters
    ----------
    batch_size : number of sequences to generate.
    max_length : number of decoding steps (tokens produced per sequence).
    z          : optional latent tensor. Its first dimension must equal
                 ``batch_size`` (the reshape of ``latent2embed(z)`` relies on
                 it). When ``None`` a standard-normal sample of shape
                 ``[batch_size, self.latent_size]`` is drawn.
    argmax     : ``True`` -> pick the most probable token at every step,
                 ``False`` -> draw the token from the predicted categorical
                 distribution.

    Returns
    -------
    (logp_opt, indices, z, energy, entropies_out)
        logp_opt      : log-probabilities of the chosen tokens, [Batch Size, max_length]
        indices       : chosen token indices, [Batch Size, max_length]
        z             : the latent vectors that were decoded
        energy        : output of ``self.mlp2energy(z)``
        entropies_out : ``[mean, max, std]`` over the decoding steps of the
                        per-step entropy, where every per-step entropy is
                        averaged over the batch.
    """
    if z is None:
        # sample from prior -> [Batch Size, Latent Space Size]
        z = torch.randn(
            [batch_size, self.latent_size],
            dtype = torch.float,
            device = self.device
        )

    # predicted energy for every latent vector
    energy = self.mlp2energy(z)

    # optionally scale z by the predicted energy before decoding
    z_tilda = z * energy if self.condition_on_energy else z

    # decoder memory -> [Batch Size, Seq Length, Embedding Size]
    enc_memory_stochastic = self.latent2embed(z_tilda).reshape(
        batch_size,
        self.max_seq_length,
        self.embedding_size
    )

    # every sequence starts with the start-of-sequence token -> [Batch Size, 1]
    tgt = self.sos_idx * torch.ones(
        [batch_size, 1],
        dtype = torch.long,
        device = self.device
    )

    chosen_indices = []     # one [Batch Size, 1] tensor per step
    chosen_logprobs = []    # one [Batch Size, 1] tensor per step
    step_entropies = []     # one float per step

    for _step in range(max_length):

        # logp over the whole (growing) target -> [Batch Size, ?, Vocab Size]
        _, logp_predicted = self.__get_logits_logp(
            enc_memory_stochastic,
            tgt
        )

        # only the distribution of the newest position matters -> [Batch Size, Vocab Size]
        logp_last = logp_predicted[:, -1, :]

        # entropy of that distribution for every sequence -> [Batch Size].
        # The batch average is recorded so that the statistics describe all
        # generated sequences and not only the first one; for a batch of one
        # this is exactly the single entropy value.
        entropy_per_sequence = -1.0 * torch.sum(
            logp_last * torch.exp(logp_last),
            dim = 1
        )
        step_entropies.append(entropy_per_sequence.mean().item())

        if argmax:
            # greedy choice -> both [Batch Size, 1]
            logp_all, next_all = torch.max(
                logp_last,
                dim = -1,
                keepdim = True
            )
        else:
            # categorical sampling from p = exp(logp)
            next_all = torch.multinomial(
                logp_last.exp(),
                1,
                replacement = False
            )
            # log-probability of the sampled tokens
            logp_all = logp_last.gather(
                1,
                next_all
            )

        chosen_indices.append(next_all)
        chosen_logprobs.append(logp_all)

        # extend the target with the new token -> [Batch Size, ?]
        tgt = torch.cat(
            [tgt, next_all],
            dim = 1
        )

    # [Batch Size, max_length]
    logp_opt = torch.cat(chosen_logprobs, dim = 1)
    indices = torch.cat(chosen_indices, dim = 1)

    # summary statistics of the per-step entropies
    entropies = np.array(step_entropies)
    entropies_out = [
        np.mean(entropies),     # mean
        np.max(entropies),      # max
        np.std(entropies)       # std
    ]

    return logp_opt, indices, z, energy, entropies_out
Length, Embedding Size] + enc_memory_stochastic = self.latent2embed(z_tilda).reshape(batch_size,self.max_seq_length,self.embedding_size) + + # create start tokens -> [Batch Size, 1] + tgt = self.sos_idx * torch.ones( + [batch_size,1], + dtype = torch.long, + device = self.device + ) + + # for loop: max_length + for step in range(max_length): + + # call _sample() -> obtain logp for predicted tokens + # size [Batch Size, Num of Elements in a Sequence , Vocab Size] (sequence grows) + logits_predicted,logp_predicted = self.__get_logits_logp( + enc_memory_stochastic, + tgt, + memory_pad_mask = memory_pad_mask_exp + ) + + # select last element + # size [Batch Size, Vocab Size] + logp_predicted_last = logp_predicted[:,-1,:] + + # need to select next token (and it's logprobability) + # if T == 0.0 or T>0.0 but first element is forced to be selected according to argmax + if (T == 0.0) or (step == 0 and T > 0.0 and skip_first_element == True): + # size [Batch Size, 1] + logp_all,next_all = torch.max( + logp_predicted_last, + dim = -1, + keepdim = True + ) + else: + # do proper categorical sampling + # convert logits to logp + logp_temp_annealed = nn.functional.log_softmax( + logits_predicted/T, + dim = -1 + ) + # select last element + # size [Batch Size,Vocab Size] + logp_temp_annealed_last = logp_temp_annealed[:,-1,:] + + # logp -> p + probs_temp_annealed_last = logp_temp_annealed_last.exp() + + # sample + next_all = torch.multinomial( + probs_temp_annealed_last, + 1, + replacement = False + ) + # gather sampled indices + logp_all = logp_temp_annealed_last.gather( + 1, + next_all + ) + + # record + INDICES.append(next_all) + LOGPROBS.append(logp_all) + Z.append(z) + + # need to concatenate tgt with next_token + tgt = torch.cat( + [tgt, next_all], + dim = 1 + ) + + # at this point need to concatenate INDICES and LOGPROBS and Z + # size: [Batch Size, Max Length] + logp_opt = torch.cat( + LOGPROBS, + dim = 1 + ) + + indices = torch.cat( + INDICES, + dim = 1 + ) + z = 
# GRU-to-property (we will assume here that sequences can be of variable length)
class PredictorGRU(nn.Module):
    '''
    Sequence-to-scalar regressor: embedding -> dropout -> GRU -> small MLP.

    INPUT:
        vocab_size      : number of tokens, int
        embedding_size  : number of features in the input, int
        hidden_size     : number of features in hidden dimension in RNN, int
        device          : device handle; stored on the instance, not used by this class itself
        pad_idx         : index of the padding token (passed to nn.Embedding as padding_idx), int
        p_dropout       : dropout probability applied to the embeddings, float, default: 0.2
        num_layers      : number of stacked RNNs, int, default: 1
        bidirectional   : whether to use bidirectional RNNs, boolean, default: False
    '''
    def __init__(   self,
                    vocab_size,
                    embedding_size,
                    hidden_size,
                    device,
                    pad_idx,
                    p_dropout       = 0.2,
                    num_layers      = 1,
                    bidirectional   = False
                ):
        super().__init__()

        self.vocab_size     = vocab_size
        self.embedding_size = embedding_size
        self.hidden_size    = hidden_size
        self.device         = device
        self.pad_idx        = pad_idx
        self.p_dropout      = p_dropout
        # historical misspelling, kept so that code reading `p_droput` keeps working
        self.p_droput       = p_dropout
        self.num_layers     = num_layers
        self.bidirectional  = bidirectional

        # number of final hidden vectors per sequence (directions * layers)
        self.hidden_factor = (2 if bidirectional else 1) * num_layers

        # embedding layer + dropout
        self.embedding         = nn.Embedding(vocab_size, embedding_size, padding_idx = pad_idx)
        self.dropout_embedding = nn.Dropout(p = p_dropout)

        # GRU
        self.gru = nn.GRU(
            embedding_size,
            hidden_size,
            num_layers    = num_layers,
            bidirectional = bidirectional,
            batch_first   = True
        )

        # 3-layer MLP: concatenated final hidden states -> scalar
        self.h2energy = nn.Sequential(
            nn.Linear(hidden_size * self.hidden_factor, 16),
            nn.ReLU(),
            nn.Linear(16, 4),   # project to 4-dim vector space
            nn.ReLU(),
            nn.Linear(4, 1)     # project to 1-dim vector space (no ReLU is used as target output is mostly negative)
        )

    def forward(self, batch_of_input_sequences, input_sequences_lengths, h0 = None):
        '''
        Predict one scalar per input sequence.

        INPUT:
            batch_of_input_sequences : padded token indices, [Batch Size, Seq Length]
            input_sequences_lengths  : 1-D tensor with the true (unpadded) length of every sequence
            h0                       : optional initial hidden state for the GRU,
                                       rows in the same order as the input batch
        OUTPUT:
            tensor [Batch Size, 1]; row i is the prediction for input row i
        '''
        batch_size = batch_of_input_sequences.size(0)

        # embed sequences
        X_embedded = self.dropout_embedding(
            self.embedding(batch_of_input_sequences)
        )

        # pack for efficient passing through the RNN.
        # enforce_sorted=False lets PyTorch do the length sorting internally and
        # hand the final hidden state back in the ORIGINAL batch order, so the
        # predictions stay aligned with the inputs (and with their targets).
        X_packed = rnn_utils.pack_padded_sequence(
            X_embedded,
            input_sequences_lengths.tolist(),
            batch_first    = True,
            enforce_sorted = False
        )

        # run through GRU -> we are only concerned about final h
        if h0 is None:
            _, hidden = self.gru(X_packed)
        else:
            _, hidden = self.gru(X_packed, h0)

        # hidden is [layers * directions, Batch Size, Hidden Size]; the batch axis
        # has to be moved to the front BEFORE flattening, otherwise features of
        # different sequences get mixed. This also keeps the batch axis when the
        # batch holds a single sequence.
        encoder_hidden_at_T = hidden.transpose(0, 1).reshape(
            batch_size,
            self.hidden_size * self.hidden_factor
        )

        # now pass through MLP
        output = self.h2energy(encoder_hidden_at_T)

        return output
def forward(self, src):
    """Predict one energy value per sequence in ``src``.

    ``src`` holds token indices with the batch as first dimension.
    NOTE(review): the flattening step only succeeds when the second dimension
    equals ``self.max_seq_length`` -- confirm with callers.

    Pipeline: pad mask -> embedding (+ positional) -> transformer encoder ->
    flatten -> ``seq2latent`` -> ``mlp2energy``.
    """
    n_sequences = src.size(0)

    # True wherever src holds the pad token; size [N, S]
    padding_mask = self.create_pad_mask(src, self.pad_idx)

    # dense embedding; the positional embedding is applied on the transposed
    # tensor and the result is transposed back to the original axis order
    token_embedding = self.embedding(src)
    positioned = self.positional_embedding(token_embedding.transpose(0, 1))
    encoder_input = positioned.transpose(0, 1)

    # transformer encoder, ignoring padded positions
    memory = self.transformer_encoder(
        encoder_input,
        src_key_padding_mask = padding_mask
    )

    # one flat vector per sequence: [Batch Size, Seq Length * Embedding Size]
    flat_memory = memory.reshape(
        n_sequences,
        self.max_seq_length * self.embedding_size
    )

    # flat encoder output -> latent (aka z) -> energy
    return self.mlp2energy(self.seq2latent(flat_memory))
def _training_snapshot(model, optimizer, epoch, reconstruction, kl, mse, elbo):
    """Bundle epoch metrics with deep copies of the model and optimizer state."""
    return {
        'epoch'                 : epoch,
        'reconstruction'        : reconstruction,
        'kl loss'               : kl,
        'mse'                   : mse,
        'elbo'                  : elbo,
        'model_state_dict'      : copy.deepcopy(model.state_dict()),
        'optimizer_state_dict'  : copy.deepcopy(optimizer.state_dict())
    }


def _best_results_summary(label, results):
    """Format the 'best model' summary (label is 'train' or 'validation')."""
    str_ = f"Best model parameters (based on {label} error)\n"
    str_ += f"\tAchieved at epoch : {results['epoch']}\n"
    str_ += f"\tReconstruction error : {results['reconstruction']:0.4f}\n"
    str_ += f"\tKL loss : {results['kl loss']:0.4f}\n"
    str_ += f"\tMSE loss : {results['mse']:0.4f}\n"
    str_ += f"\tELBO : {results['elbo']:0.4f}\n"
    return str_


######################################### VAE ############
@tf_app.command("gaussian")
def train_gaussian(
        training_fasta_file         : str,              # FASTA file with training sequences
        validation_fasta_file       : str,              # FASTA file with validation sequences
        log_name_batch              : str,              # logger for batch updates during training
        log_name_epoch              : str,              # logger for epoch updates during training
        log_name_val_epoch          : str,              # logger for epoch updates during validation
        log_name_seqs_batch         : str,              # logger for keeping track what sequences were in a batch update
        checkpoint_pattern          : str,              # checkpoint generic name
        csv_epoch_name              : str,              # filename for CSV with training losses results by epoch
        csv_validation_epoch_name   : str,              # filename for CSV with validation losses results by epoch
        pickle_name                 : str,              # filename for model input params (to instantiate correct object later)
        pt_name_train               : str,              # filename for model trained layers (corresponding to smallest training error)
        pt_name_val                 : str,              # filename for model trained layers (corresponding to smallest validation error)
        epochs                      : int   = 10,       # number of epochs to train NN
        learning_rate               : float = 0.0001,   # learning rate for gradient descent
        lambda_constant             : float = 0.001,    # L2 constant
        validation_freq_epoch       : int   = 2,        # how frequently compute validation loss
        checkpoint_freq_epoch       : int   = 2,        # how frequently save model snapshots
        max_sequence_length         : int   = 100,      # maximum sequence length
        batch_size                  : int   = 16,       # how many sequences in mini-batch
        embedding_size              : int   = 512,      # embedding size (must be divisible by number of heads)
        latent_size                 : int   = 64,       # dimensionality of the latent space
        condition_on_energy         : bool  = False,    # whether to scale z by energy when passed to sequence decoder
        weighted_sampling           : bool  = False,    # whether to use weighted sampling (right now using WeightedRandomSampler)
        dropout_prob                : float = 0.1,      # dropout probability (same for all the dropouts)
        masking_prob                : float = 0.1,      # probability of replacing AA with token for the input
        heads                       : int   = 8,        # number of heads in (self)attention
        num_layers_encoder          : int   = 6,        # number of transformer blocks in encoder
        num_layers_decoder          : int   = 4,        # number of transformer blocks in decoder
        seed                        : int   = 0,        # random seed
        pt_checkpoint               : str   = None      # checkpoint file (default is None)
    ) -> None:
    """Train a TransformerVAE on sequences with energies and persist the results.

    Side effects (all paths are taken from the arguments):
      * four log files (batch, epoch, validation epoch, sequences per batch);
      * ``pickle_name``: the keyword arguments used to build the model;
      * ``<checkpoint_pattern>-after-epoch-<n>.pytorch`` every
        ``checkpoint_freq_epoch`` epochs (never for epoch 0);
      * two CSV files with training / validation losses per epoch;
      * ``pt_name_train`` / ``pt_name_val``: snapshot with the smallest training /
        validation ELBO. A snapshot file is only written when such a snapshot
        exists, e.g. ``pt_name_val`` is skipped when no validation epoch ran.

    Validation runs every ``validation_freq_epoch`` epochs, never for epoch 0.
    """
    # set up loggers
    logger_batch     = setup_logger( 'logger_batch', log_name_batch, level = logging.INFO )
    logger_epoch     = setup_logger( 'logger_epoch', log_name_epoch, level = logging.INFO )
    logger_val_epoch = setup_logger( 'logger_val_epoch', log_name_val_epoch, level = logging.INFO )
    logger_sequences = setup_logger( 'logger_sequences', log_name_seqs_batch, level = logging.INFO )

    # set device
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

    # model info
    str_info = "Training details:\n"
    str_info += f"\tNeural Network core architecture : Transformer\n"
    str_info += f"\tPrior and variational distribution : standard multivariate Gaussian\n"
    str_info += f"\tTraining set file : {training_fasta_file}\n"
    str_info += f"\tValidation set file : {validation_fasta_file}\n"
    str_info += f"\tNumber of epochs : {epochs}\n"
    str_info += f"\tValidation frequency (in epochs) : {validation_freq_epoch}\n"
    str_info += f"\tCheckpoint frequency (in epochs) : {checkpoint_freq_epoch}\n"
    str_info += f"\tEmbedding size : {embedding_size}\n"
    str_info += f"\tDropout probability : {dropout_prob}\n"
    str_info += f"\tMasking probability (for replacing with ) : {masking_prob}\n"
    str_info += f"\tLatent size : {latent_size}\n"
    str_info += f"\tCondition latent z on predicted energy for sequence decoding : {condition_on_energy}\n"
    str_info += f"\tUse weighted sampling for mini-batches( using WeightedRandomSampler): {weighted_sampling}\n"
    str_info += f"\tLearning rate : {learning_rate}\n"
    str_info += f"\tL2 penalty constant : {lambda_constant}\n"
    str_info += f"\tBatch size : {batch_size}\n"
    str_info += f"\tMax sequence length : {max_sequence_length}\n"
    str_info += f"\tNumber of heads in (self)attention : {heads}\n"
    str_info += f"\tNumber of transformer blocks in encoder : {num_layers_encoder}\n"
    str_info += f"\tNumber of transformer blocks in decoder : {num_layers_decoder}\n"
    str_info += f"\tRandom seed : {seed}\n"
    str_info += f"\tCheckpoint to start a model : {pt_checkpoint}\n"
    str_info += f"\tDevice : {device}\n"

    # log
    logger_epoch.info(str_info)

    # set seed
    torch.manual_seed(seed)

    # create default w2i and i2w maps
    w2i,i2w = default_w2i_i2w()

    # create Datasets
    # TODO: provide sequence weights
    dataset = ProteinSequencesDataset(
        training_fasta_file,
        w2i,
        i2w,
        device,
        max_sequence_length = max_sequence_length,
        extract_energy = True
    )
    if weighted_sampling:
        train_sequence_weights = dataset.sequence_weights   # obtain sequence weights
        train_weighted_sampler = WeightedRandomSampler(
            weights = train_sequence_weights,
            num_samples = len(train_sequence_weights),
            replacement = True
        )   # create a weighted Random Sampler
        dataloader = DataLoader(dataset, batch_size = batch_size, shuffle = False, sampler = train_weighted_sampler)
        sampler_string = "Using WeightedRandomSampler."
    else:
        dataloader = DataLoader(dataset, batch_size = batch_size, shuffle = True)
        sampler_string = "Using default sampling scheme."

    ## log info
    str_ = f"Train dataset contains {len(dataset)} elements. "
    str_ += f"Batch size is {batch_size}. "
    str_ += f"Train dataloader length is {len(dataloader)}.\n"
    str_ += f"{sampler_string}"
    logger_epoch.info(str_)

    ### create validation dataset and dataloader
    dataset_val = ProteinSequencesDataset(
        validation_fasta_file,
        w2i,
        i2w,
        device,
        max_sequence_length = max_sequence_length,
        extract_energy = True
    )
    dataloader_val = DataLoader(dataset_val, batch_size = batch_size, shuffle = True)

    ### log info
    str_ = f"Validation dataset contains {len(dataset_val)} elements. "
    str_ += f"Batch size is {batch_size}. "
    str_ += f"Validation dataloader length is {len(dataloader_val)}.\n"
    logger_val_epoch.info(str_)

    #### compute basic model -> average as predictor
    mean_train, mse_train, mse_validation = simple_average_model(
        dataset.energies,
        dataset_val.energies
    )
    # write to both train and validation logger
    str_ = f"Average energy prediction: {mean_train:0.4f}. Training MSE using this estimator: {mse_train:0.4f}\n"
    logger_epoch.info(str_)

    str_ = f"Average energy prediction: {mean_train:0.4f}. Validation MSE using this estimator: {mse_validation:0.4f}\n"
    logger_val_epoch.info(str_)

    # keyword arguments of the model (named so that the builtin vars() is not shadowed)
    model_params = {
        "vocab_size"            : dataset.vocab_size,
        "max_seq_length"        : dataset.max_seq_len,
        "pad_idx"               : dataset.pad_idx,
        "sos_idx"               : dataset.sos_idx,
        "eos_idx"               : dataset.eos_idx,
        "unk_idx"               : dataset.unk_idx,
        "embedding_size"        : embedding_size,
        "latent_size"           : latent_size,
        "condition_on_energy"   : condition_on_energy,
        "num_layers_encoder"    : num_layers_encoder,
        "num_layers_decoder"    : num_layers_decoder,
        "heads"                 : heads,
        "dropout_prob"          : dropout_prob,
        "device"                : device
    }
    # model input params; the context manager guarantees the file is flushed and closed
    with open(pickle_name, "wb") as pickle_file:
        pickle.dump(model_params, pickle_file)

    # print GPU usage after datasets instatiation
    if torch.cuda.is_available():
        print("GPU resources after datasets creation...")
        print(torch.cuda.memory_summary())

    model = TransformerVAE(**model_params)
    logger_epoch.info("Model specification:")
    logger_epoch.info(model)

    # move the model (and its sub-modules(model.children()) to GPU)
    model = model.to(device)

    # instantiate optimizer
    optimizer = torch.optim.Adam(model.parameters(), lr = learning_rate, weight_decay = lambda_constant)

    # print GPU usage after model instatiation
    if torch.cuda.is_available():
        print("GPU resources after model creation...")
        print(torch.cuda.memory_summary())

    # try loading checkpoint (deliberately best-effort)
    # it may fail if there is no checkpoint or some mismatch in model params
    try:
        load_checkpoint(model,optimizer,pt_checkpoint)
    except Exception as e:
        print("Exception occured:",e)
    else:
        print("Checkpoint loaded successfully")
    finally:
        # for debugging: where does every parameter live
        for name, param in model.named_parameters(recurse=True):
            print(f"Param: {name}, device: {param.device}")

    # loss objects for reconstruction error
    NLL     = nn.NLLLoss(ignore_index=dataset.pad_idx)
    NLL_val = nn.NLLLoss(ignore_index=dataset_val.pad_idx)

    # loss objects for mse error
    MSE     = nn.MSELoss()
    MSE_val = nn.MSELoss()

    # losses by epoch
    nll_losses_by_epoch   = []
    kl_losses_by_epoch    = []
    mse_losses_by_epoch   = []
    total_losses_by_epoch = []

    # validation losses (by epoch only)
    epoch_val               = []
    nll_val_by_epoch        = []
    kl_val_by_epoch         = []
    mse_val_by_epoch        = []
    total_loss_val_by_epoch = []

    # to keep track of epoch with smallest loss: overall
    best_loss_train = float('inf')  # for train loss
    best_loss_val   = float('inf')  # for validation loss

    # best snapshots; they stay None when no epoch / no validation epoch
    # produced a loss below the initial infinity
    best_results_train = None
    best_results_val   = None

    # actual training part
    for epoch in range(epochs):
        # add a note to logger_batch
        logger_batch.info(f"Epoch: {epoch}")

        # do a full pass over training set
        train_elbo,train_reconstruction,train_kl,train_mse = train_step(
            model,
            dataloader,
            NLL,
            MSE,
            optimizer,
            logger_batch,
            logger_sequences,
            masking_prob = masking_prob
        )

        # append to epoch lists
        nll_losses_by_epoch.append(train_reconstruction)
        kl_losses_by_epoch.append(train_kl)
        mse_losses_by_epoch.append(train_mse)
        total_losses_by_epoch.append(train_elbo)

        # write to epoch logger
        str_epoch = f"Epoch: {epoch}\n\t\t"
        str_epoch += f"Reconstruction loss: {train_reconstruction:0.4f} \t"
        str_epoch += f"KL loss: {train_kl:0.4f} \t"
        str_epoch += f"MSE loss: {train_mse:0.4f}\t"
        str_epoch += f"ELBO: {train_elbo:0.4f} \t"
        logger_epoch.info(str_epoch)

        # do a snapshot
        if (epoch % checkpoint_freq_epoch == 0) and (epoch != 0):
            checkpoint_name = checkpoint_pattern + f"-after-epoch-{epoch}.pytorch"
            torch.save(
                _training_snapshot(model, optimizer, epoch, train_reconstruction, train_kl, train_mse, train_elbo),
                checkpoint_name
            )

        # check validation error
        if (epoch % validation_freq_epoch == 0) and (epoch != 0):

            # run validation
            val_elbo,val_reconstruction,val_kl,val_mse = validation_step(
                model,
                dataloader_val,
                NLL_val,
                MSE_val
            )

            # append to validation lists
            epoch_val.append(epoch)
            nll_val_by_epoch.append(val_reconstruction)
            kl_val_by_epoch.append(val_kl)
            mse_val_by_epoch.append(val_mse)
            total_loss_val_by_epoch.append(val_elbo)

            # write to val_epoch logger
            val_string_ = f"Validation after epoch: {epoch}\n\t\t"
            val_string_ += f"Reconstruction loss : {val_reconstruction:0.4f}\t"
            val_string_ += f"KL loss : {val_kl:0.4f}\t"
            val_string_ += f"MSE loss : {val_mse:0.4f}\t"
            val_string_ += f"ELBO : {val_elbo:0.4f}"
            logger_val_epoch.info(val_string_)

            # update best model params based on validation error
            if val_elbo < best_loss_val:
                best_results_val = _training_snapshot(
                    model, optimizer, epoch, val_reconstruction, val_kl, val_mse, val_elbo
                )
                best_loss_val = val_elbo

        # need to update best model params based on training error
        if train_elbo < best_loss_train:
            best_results_train = _training_snapshot(
                model, optimizer, epoch, train_reconstruction, train_kl, train_mse, train_elbo
            )
            best_loss_train = train_elbo

    # once training is over, save all results
    # training results
    save_data_to_csv(
        csv_epoch_name,
        [list(range(len(nll_losses_by_epoch))),nll_losses_by_epoch,kl_losses_by_epoch,mse_losses_by_epoch,total_losses_by_epoch],
        ["Epoch","NLL","KL","MSE","ELBO"]
    )

    # validation results
    save_data_to_csv(
        csv_validation_epoch_name,
        [epoch_val,nll_val_by_epoch,kl_val_by_epoch,mse_val_by_epoch,total_loss_val_by_epoch],
        ["Epoch","NLL","KL","MSE","ELBO"]
    )

    # save best results (TRAIN)
    if best_results_train is None:
        logger_epoch.warning(
            f"No best training snapshot was recorded; {pt_name_train} was not written."
        )
    else:
        logger_epoch.info(_best_results_summary("train", best_results_train))
        # save model
        torch.save(best_results_train, pt_name_train)

    # save best results (VALIDATION)
    if best_results_val is None:
        logger_val_epoch.warning(
            f"No best validation snapshot was recorded; {pt_name_val} was not written."
        )
    else:
        logger_val_epoch.info(_best_results_summary("validation", best_results_val))
        # save model
        torch.save(best_results_val, pt_name_val)
learning_rate : float = 0.0001, # learning rate for gradient descent + lambda_constant : float = 0.001, # L2 constant + validation_freq_epoch : int = 2, # how frequently compute validation loss + checkpoint_freq_epoch : int = 2, # how frequently save model snapshots + max_sequence_length : int = 100, # maximum sequence length + batch_size : int = 16, # how many sequences in mini-batch + embedding_size : int = 32, # embedding size (must be divisible by number of heads) + hidden_size : int = 32, # hidden size for h in GRU + num_layers : int = 1, # number of stacked GRUs + bidirectional : bool = False, # whether to use bidirectional GRU (default: no) + dropout_prob : float = 0.1, # dropout probability (same for all the dropouts) + seed : int = 0, # random seed + pt_checkpoint : str = None # checkpoint file (default is None) + ) -> None: + # set up loggers + logger_batch = setup_logger( 'logger_batch', log_name_batch, level = logging.INFO ) + logger_epoch = setup_logger( 'logger_epoch', log_name_epoch, level = logging.INFO ) + logger_val_epoch = setup_logger( 'logger_val_epoch', log_name_val_epoch, level = logging.INFO ) + + # set device + device = torch.device("cuda" if torch.cuda.is_available() else "cpu") + + # model info + str_info = "Training details:\n" + str_info += f"\tPredictive NN core architecture : GRU\n" + str_info += f"\tTraining set file : {training_fasta_file}\n" + str_info += f"\tValidation set file : {validation_fasta_file}\n" + str_info += f"\tNumber of epochs : {epochs}\n" + str_info += f"\tValidation frequency (in epochs) : {validation_freq_epoch}\n" + str_info += f"\tCheckpoint frequency (in epochs) : {checkpoint_freq_epoch}\n" + str_info += f"\tEmbedding size : {embedding_size}\n" + str_info += f"\tDropout probability : {dropout_prob}\n" + str_info += f"\tLearning rate : {learning_rate}\n" + str_info += f"\tL2 penalty constant : {lambda_constant}\n" + str_info += f"\tBatch size : {batch_size}\n" + str_info += f"\tMax sequence length : 
{max_sequence_length}\n" + str_info += f"\tRandom seed : {seed}\n" + str_info += f"\tCheckpoint to start a model : {pt_checkpoint}\n" + str_info += f"\tDevice : {device}\n" + + # log + logger_epoch.info(str_info) + + # set seed + torch.manual_seed(seed) + + # create default w2i and i2w maps + w2i,i2w = default_w2i_i2w() + + # create train set -> need ["input"] and ["energy"] + dataset = ProteinSequencesDataset( + training_fasta_file, + w2i, + i2w, + device, + max_sequence_length = max_sequence_length, + extract_energy = True + ) + dataloader = DataLoader(dataset, batch_size = batch_size, shuffle = True) + + ## log info + str_ = f"Train dataset contains {len(dataset)} elements. " + str_ += f"Batch size is {batch_size}. " + str_ += f"Train dataloader length is {len(dataloader)}.\n" + logger_epoch.info(str_) + + ### create validation set + dataset_val = ProteinSequencesDataset( + validation_fasta_file, + w2i, + i2w, + device, + max_sequence_length = max_sequence_length, + extract_energy = True + + ) + dataloader_val = DataLoader(dataset_val, batch_size = batch_size, shuffle = True) + + ### log info + str_ = f"Validation dataset contains {len(dataset_val)} elements. " + str_ += f"Batch size is {batch_size}. " + str_ += f"Validation dataloader length is {len(dataloader_val)}.\n" + logger_val_epoch.info(str_) + + #### compute basic model -> average as predictor + mean_train, mse_train, mse_validation = simple_average_model( + dataset.energies, + dataset_val.energies + ) + # write to both train and validation logger + str_ = f"Average energy prediction: {mean_train:0.4f}. Training MSE using this estimator: {mse_train:0.4f}\n" + logger_epoch.info(str_) + + str_ = f"Average energy prediction: {mean_train:0.4f}. 
Validation MSE using this estimator: {mse_validation:0.4f}\n" + logger_val_epoch.info(str_) + + # instantiate GRU model + vars = { + "vocab_size" : dataset.vocab_size, + "embedding_size" : embedding_size, + "hidden_size" : hidden_size, + "device" : device, + "pad_idx" : dataset.pad_idx, + "p_dropout" : dropout_prob, + "num_layers" : num_layers, + "bidirectional" : bidirectional + } + model = PredictorGRU(**vars) + + logger_epoch.info("Model specification:") + logger_epoch.info(model) + + # move the model (and its sub-modules(model.children()) to GPU) + model = model.to(device) + + # instantiate optimizer + optimizer = torch.optim.Adam(model.parameters(), lr = learning_rate, weight_decay = lambda_constant) + + # try loading checkpoint + # it may fail if there is no checkpoint or some mismatch in model params + try: + load_checkpoint(model,optimizer,pt_checkpoint) + except Exception as e: + print("Exception occured:",e) + else: + print("Checkpoint loaded successfully") + finally: + # for debugging + max_len = 0 + for name, param in model.named_parameters(recurse=True): + if len(name) > max_len: + max_len = len(name) + print(f"Param: {name}, device: {param.device}") + + # loss objects for mse error + MSE = nn.MSELoss() + MSE_val = nn.MSELoss() + + # loss by epoch + mse_losses_by_epoch = [] # train + mse_val_by_epoch = [] # validation + epoch_val = [] # epochs when validation loss is computed + + + # to keep track of epoch with smallest loss: overall + best_loss_train = float('inf') # for train loss + best_loss_val = float('inf') # for validation loss + + # actual training part + for epoch in range(epochs): + + # add a note to logger_batch + logger_batch.info(f"Epoch: {epoch}") + + # do a full pass over training set + train_mse = train_step_gru_tf( + model, + dataloader, + MSE, + optimizer, + logger_batch + ) + # append to epoch lists + mse_losses_by_epoch.append(train_mse) + + # write to epoch logger + str_epoch = f"Epoch: {epoch}\n\t\t" + str_epoch += f"MSE loss: 
{train_mse:0.4f}\t" + logger_epoch.info(str_epoch) + + # do a snapshot + if (epoch % checkpoint_freq_epoch == 0) and (epoch != 0): + + checkpoint_name = checkpoint_pattern + f"-after-epoch-{epoch}.pytorch" + + torch.save({ + 'epoch' : epoch, + 'mse' : train_mse, + 'model_state_dict' : copy.deepcopy(model.state_dict()), + 'optimizer_state_dict' : copy.deepcopy(optimizer.state_dict()) + }, checkpoint_name) + + # check validation error + if (epoch % validation_freq_epoch == 0) and (epoch != 0): + + # run validation + val_mse = validation_step_gru_tf( + model, + dataloader_val, + MSE_val + ) + + # append to validation lists + epoch_val.append(epoch) + mse_val_by_epoch.append(val_mse) + + # write to val_epoch logger + val_string_ = f"Validation after epoch: {epoch}\n\t\t" + val_string_ += f"MSE loss : {val_mse:0.4f}\t" + logger_val_epoch.info(val_string_) + + # update best model params based on validation error + if val_mse < best_loss_val: + # create/update dictionary + best_results_val = { + 'epoch' : epoch, + 'mse' : val_mse, + 'model_state_dict' : copy.deepcopy(model.state_dict()), + 'optimizer_state_dict' : copy.deepcopy(optimizer.state_dict()) + } + best_loss_val = val_mse + + # need to update best model params based on training error + if train_mse < best_loss_train: + # create/update dictionary + best_results_train = { + 'epoch' : epoch, + 'mse' : train_mse, + 'model_state_dict' : copy.deepcopy(model.state_dict()), + 'optimizer_state_dict' : copy.deepcopy(optimizer.state_dict()) + } + best_loss_train = train_mse + + # once training is over save all the results + # training results + save_data_to_csv( + csv_epoch_name, + [list(range(len(mse_losses_by_epoch))),mse_losses_by_epoch], + ["Epoch","MSE"] + ) + + # validation results + save_data_to_csv( + csv_validation_epoch_name, + [epoch_val,mse_val_by_epoch], + ["Epoch","MSE"] + ) + + # model input params + pickle.dump(vars,open(pickle_name,"wb")) + + # save best results (TRAIN) + str_ = "Best model parameters 
(based on train error)\n" + str_ += f"\tAchieved at epoch : {best_results_train['epoch']}\n" + str_ += f"\tMSE loss : {best_results_train['mse']:0.4f}\n" + logger_epoch.info(str_) + # save model + torch.save(best_results_train, pt_name_train) + + # save best results (VALIDATION) + str_ = "Best model parameters (based on validation error)\n" + str_ += f"\tAchieved at epoch : {best_results_val['epoch']}\n" + str_ += f"\tMSE loss : {best_results_val['mse']:0.4f}\n" + logger_val_epoch.info(str_) + # save model + torch.save(best_results_val, pt_name_val) + + +######################################### TF encoder predictive ############ +@predictor_app.command("tf") +def train_tf( + training_fasta_file : str, # FASTA file with training sequences + validation_fasta_file : str, # FASTA file with validation sequences + log_name_batch : str, # logger for batch updates during training + log_name_epoch : str, # logger for epoch updates during training + log_name_val_epoch : str, # logger for epoch updates during validation + checkpoint_pattern : str, # checkpoint generic name + csv_epoch_name : str, # filename for CSV with training losses results by epoch + csv_validation_epoch_name : str, # filename for CSV with validation losses results by epoch + pickle_name : str, # filename for model input params (to instantiate correct object later) + pt_name_train : str, # filename for model trained layers (corresponding to smallest training error) + pt_name_val : str, # filename for model trained layers (corresponding to smallest validation error) + epochs : int = 10, # number of epochs to train NN + learning_rate : float = 0.0001, # learning rate for gradient descent + lambda_constant : float = 0.001, # L2 constant + validation_freq_epoch : int = 2, # how frequently compute validation loss + checkpoint_freq_epoch : int = 2, # how frequently save model snapshots + max_sequence_length : int = 100, # maximum sequence length + batch_size : int = 16, # how many sequences in mini-batch + 
embedding_size : int = 512, # embedding size (must be divisible by number of heads) + latent_size : int = 64, # dimensionality of the latent space + weighted_sampling : bool = False, # whether to use weighted sampling (right now using WeightedRandomSampler) + dropout_prob : float = 0.1, # dropout probability (same for all the dropouts) + heads : int = 8, # number of heads in (self)attention + num_layers_encoder : int = 6, # number of transformer blocks in encoder + seed : int = 0, # random seed + pt_checkpoint : str = None # checkpoint file (default is None) + ) -> None: + + # set up loggers + logger_batch = setup_logger( 'logger_batch', log_name_batch, level = logging.INFO ) + logger_epoch = setup_logger( 'logger_epoch', log_name_epoch, level = logging.INFO ) + logger_val_epoch = setup_logger( 'logger_val_epoch', log_name_val_epoch, level = logging.INFO ) + + # set device + device = torch.device("cuda" if torch.cuda.is_available() else "cpu") + + # model info + str_info = "Training details:\n" + str_info += f"\tPredictive NN core architecture : Transformer Encoder\n" + str_info += f"\tTraining set file : {training_fasta_file}\n" + str_info += f"\tValidation set file : {validation_fasta_file}\n" + str_info += f"\tNumber of epochs : {epochs}\n" + str_info += f"\tValidation frequency (in epochs) : {validation_freq_epoch}\n" + str_info += f"\tCheckpoint frequency (in epochs) : {checkpoint_freq_epoch}\n" + str_info += f"\tEmbedding size : {embedding_size}\n" + str_info += f"\tLatent size : {latent_size}\n" + str_info += f"\tUse weighted sampling for mini-batches( using WeightedRandomSampler): {weighted_sampling}\n" + str_info += f"\tNumber of heads in self-attention : {heads}\n" + str_info += f"\tNumber of layers in TF encoder block : {num_layers_encoder}\n" + str_info += f"\tDropout probability : {dropout_prob}\n" + str_info += f"\tLearning rate : {learning_rate}\n" + str_info += f"\tL2 penalty constant : {lambda_constant}\n" + str_info += f"\tBatch size : 
{batch_size}\n" + str_info += f"\tMax sequence length : {max_sequence_length}\n" + str_info += f"\tRandom seed : {seed}\n" + str_info += f"\tCheckpoint to start a model : {pt_checkpoint}\n" + str_info += f"\tDevice : {device}\n" + + # log + logger_epoch.info(str_info) + + # set seed + torch.manual_seed(seed) + + # create default w2i and i2w maps + w2i,i2w = default_w2i_i2w() + + # create train set -> need ["input"] and ["energy"] + dataset = ProteinSequencesDataset( + training_fasta_file, + w2i, + i2w, + device, + max_sequence_length = max_sequence_length, + extract_energy = True + ) + if weighted_sampling: + train_sequence_weights = dataset.sequence_weights # obtain sequence weights + train_weighted_sampler = WeightedRandomSampler( + weights = train_sequence_weights, + num_samples = len(train_sequence_weights), + replacement = True + ) # create a weighted Random Sampler + dataloader = DataLoader(dataset, batch_size = batch_size, shuffle = False, sampler = train_weighted_sampler) + sampler_string = "Using WeightedRandomSampler." + + else: + dataloader = DataLoader(dataset, batch_size = batch_size, shuffle = True) + sampler_string = "Using default sampling scheme." + + ## log info + str_ = f"Train dataset contains {len(dataset)} elements. " + str_ += f"Batch size is {batch_size}. " + str_ += f"Train dataloader length is {len(dataloader)}.\n" + str_ += f"{sampler_string}" + logger_epoch.info(str_) + + + ### create validation set + dataset_val = ProteinSequencesDataset( + validation_fasta_file, + w2i, + i2w, + device, + max_sequence_length = max_sequence_length, + extract_energy = True + + ) + dataloader_val = DataLoader(dataset_val, batch_size = batch_size, shuffle = True) + + ### log info + str_ = f"Validation dataset contains {len(dataset_val)} elements. " + str_ += f"Batch size is {batch_size}. 
" + str_ += f"Validation dataloader length is {len(dataloader_val)}.\n" + logger_val_epoch.info(str_) + + #### compute basic model -> average as predictor + mean_train, mse_train, mse_validation = simple_average_model( + dataset.energies, + dataset_val.energies + ) + # write to both train and validation logger + str_ = f"Average energy prediction: {mean_train:0.4f}. Training MSE using this estimator: {mse_train:0.4f}\n" + logger_epoch.info(str_) + + str_ = f"Average energy prediction: {mean_train:0.4f}. Validation MSE using this estimator: {mse_validation:0.4f}\n" + logger_val_epoch.info(str_) + + # instantiate GRU model + vars = { + "vocab_size" : dataset.vocab_size, + "max_seq_length" : dataset.max_seq_len, + "pad_idx" : dataset.pad_idx, + "embedding_size" : embedding_size, + "latent_size" : latent_size, + "num_layers_encoder" : num_layers_encoder, + "heads" : heads, + "dropout_prob" : dropout_prob + } + model = PredictorTFEncoder(**vars) + + logger_epoch.info("Model specification:") + logger_epoch.info(model) + + # move the model (and its sub-modules(model.children()) to GPU) + model = model.to(device) + + # instantiate optimizer + optimizer = torch.optim.Adam(model.parameters(), lr = learning_rate, weight_decay = lambda_constant) + + # try loading checkpoint + # it may fail if there is no checkpoint or some mismatch in model params + try: + load_checkpoint(model,optimizer,pt_checkpoint) + except Exception as e: + print("Exception occured:",e) + else: + print("Checkpoint loaded successfully") + finally: + # for debugging + max_len = 0 + for name, param in model.named_parameters(recurse=True): + if len(name) > max_len: + max_len = len(name) + print(f"Param: {name}, device: {param.device}") + + # loss objects for mse error + MSE = nn.MSELoss() + MSE_val = nn.MSELoss() + + # loss by epoch + mse_losses_by_epoch = [] # train + mse_val_by_epoch = [] # validation + epoch_val = [] # epochs when validation loss is computed + + + # to keep track of epoch with smallest 
loss: overall + best_loss_train = float('inf') # for train loss + best_loss_val = float('inf') # for validation loss + + # actual training part + for epoch in range(epochs): + + # add a note to logger_batch + logger_batch.info(f"Epoch: {epoch}") + + # do a full pass over training set + train_mse = train_step_gru_tf( + model, + dataloader, + MSE, + optimizer, + logger_batch, + model_type = 2 + ) + # append to epoch lists + mse_losses_by_epoch.append(train_mse) + + # write to epoch logger + str_epoch = f"Epoch: {epoch}\n\t\t" + str_epoch += f"MSE loss: {train_mse:0.4f}\t" + logger_epoch.info(str_epoch) + + # do a snapshot + if (epoch % checkpoint_freq_epoch == 0) and (epoch != 0): + + checkpoint_name = checkpoint_pattern + f"-after-epoch-{epoch}.pytorch" + + torch.save({ + 'epoch' : epoch, + 'mse' : train_mse, + 'model_state_dict' : copy.deepcopy(model.state_dict()), + 'optimizer_state_dict' : copy.deepcopy(optimizer.state_dict()) + }, checkpoint_name) + + # check validation error + if (epoch % validation_freq_epoch == 0) and (epoch != 0): + + # run validation + val_mse = validation_step_gru_tf( + model, + dataloader_val, + MSE_val, + model_type = 2 + ) + + # append to validation lists + epoch_val.append(epoch) + mse_val_by_epoch.append(val_mse) + + # write to val_epoch logger + val_string_ = f"Validation after epoch: {epoch}\n\t\t" + val_string_ += f"MSE loss : {val_mse:0.4f}\t" + logger_val_epoch.info(val_string_) + + # update best model params based on validation error + if val_mse < best_loss_val: + # create/update dictionary + best_results_val = { + 'epoch' : epoch, + 'mse' : val_mse, + 'model_state_dict' : copy.deepcopy(model.state_dict()), + 'optimizer_state_dict' : copy.deepcopy(optimizer.state_dict()) + } + best_loss_val = val_mse + + # need to update best model params based on training error + if train_mse < best_loss_train: + # create/update dictionary + best_results_train = { + 'epoch' : epoch, + 'mse' : train_mse, + 'model_state_dict' : 
copy.deepcopy(model.state_dict()), + 'optimizer_state_dict' : copy.deepcopy(optimizer.state_dict()) + } + best_loss_train = train_mse + + # once training is over save all the results + # training results + save_data_to_csv( + csv_epoch_name, + [list(range(len(mse_losses_by_epoch))),mse_losses_by_epoch], + ["Epoch","MSE"] + ) + + # validation results + save_data_to_csv( + csv_validation_epoch_name, + [epoch_val,mse_val_by_epoch], + ["Epoch","MSE"] + ) + + # model input params + pickle.dump(vars,open(pickle_name,"wb")) + + # save best results (TRAIN) + str_ = "Best model parameters (based on train error)\n" + str_ += f"\tAchieved at epoch : {best_results_train['epoch']}\n" + str_ += f"\tMSE loss : {best_results_train['mse']:0.4f}\n" + logger_epoch.info(str_) + # save model + torch.save(best_results_train, pt_name_train) + + # save best results (VALIDATION) + str_ = "Best model parameters (based on validation error)\n" + str_ += f"\tAchieved at epoch : {best_results_val['epoch']}\n" + str_ += f"\tMSE loss : {best_results_val['mse']:0.4f}\n" + logger_val_epoch.info(str_) + # save model + torch.save(best_results_val, pt_name_val) + + + + +if __name__ == "__main__": + app() + + + + + + + diff --git a/bin/utilities.py b/bin/utilities.py new file mode 100755 index 0000000..978ec9c --- /dev/null +++ b/bin/utilities.py @@ -0,0 +1,2241 @@ +# PREVENT: PRotein Engineering by Variational frEe eNergy approximaTion +# Copyright (C) 2024 Giovanni Stracquadanio, Evgenii Lobzaev + +# This program is free software: you can redistribute it and/or modify +# it under the terms of the GNU Affero General Public License as published +# by the Free Software Foundation, either version 3 of the License, or +# (at your option) any later version. + +# This program is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU Affero General Public License for more details. 
+ +# You should have received a copy of the GNU Affero General Public License +# along with this program. If not, see . + +#!/usr/bin/env python3 +# -*- coding: utf-8 -*- +""" +Utility functions and classes. +""" + +import torch +import torch.nn as nn +from autograd_minimize import minimize +from models import ( + TransformerVAE, + PredictorTFEncoder + ) +from torch.utils.data import Dataset,DataLoader +from Bio import SeqIO +from Bio.Seq import Seq +from Bio.SeqRecord import SeqRecord +from Bio.SeqUtils.ProtParam import ProteinAnalysis +from collections import defaultdict +from typing import List,Tuple +from numpy.typing import ArrayLike +import logging +import pandas as pd +import numpy as np +import seaborn as sns +import tqdm +import re +from matplotlib import pyplot as plt +import pickle + +# class to store sequence data +class SequenceData(object): + """ + Stores information about sequence: + sequence as string, + list of energies, + list of logprobabilities, + list of z (as numpy arrays) + id (as string) + description (as string) + """ + def __init__(self,seq,id,first_energy,first_logp,first_z): + # instantiate object -> save id, create and add first element to energy/logp/z lists + self.id = id + self.energies = [first_energy] + self.logps = [first_logp] + self.zs = [first_z] + self.sequence = seq + self.description = "" + def update_info(self,next_energy,next_logp,next_z): + # update respective lists + self.energies.append(next_energy) + self.logps.append(next_logp) + self.zs.append(next_z) + def generate_description(self,seedID=None): + # generate description of the SequenceData + # print("List of all energies/zs:") + # for z,energy in zip(self.zs,self.energies): + # print("energy:",energy) + # print("z :",z) + # print("-"*10) + + # stats for energies + energies_stats = self.__compute_stats(self.energies) + # stats for logp + logps_stats = self.__compute_stats(self.logps) + # write energies + self.description = ( + f"Seed molecule: {seedID}||" + f"Number 
of datapoints: {energies_stats[0]}||" + f"Length: {len(self.sequence)}||" + f"Energy [avg,std,5%,95%]: [{energies_stats[1]:0.4f},{energies_stats[2]:0.4f},{energies_stats[3]:0.4f},{energies_stats[4]:0.4f}]||" + f"logp(x|z) [avg,std,5%,95%]: [{logps_stats[1]:0.4f},{logps_stats[2]:0.4f},{logps_stats[3]:0.4f},{logps_stats[4]:0.4f}]" + ) + + @property + def toTuple(self): + # return as tuple + tpl = ( + self.sequence, + self.energies, + self.logps, + self.zs, + self.id, + self.description + ) + return tpl + @property + def toSeqRecord(self): + # return as SeqRecord + record = SeqRecord( + Seq(self.sequence), + id = self.id, + description = self.description + ) + return record + def __compute_stats(self,somelist): + # compute stats for a list of numerical values: energies and logps + n_elements = len(somelist) # number of elements + as_np = np.array(somelist) # cast to np.array + avg = np.mean(as_np) # mean + std = np.std(as_np) + pct5 = np.percentile(as_np,5) + pct95 = np.percentile(as_np,95) + return n_elements,avg,std,pct5,pct95 + +#################################################### DATA PREPROCESSING ###################################### +# mappings: amino acids (+ tokens) <-> integers +def default_w2i_i2w() -> Tuple[dict,dict] : + ''' + Constructs default maps that can be passed to ProteinSequencesDataset. + If you want custom maps, you need to code them separately. You can reuse the code from here. 
+ ''' + w2i = dict() # maps word(amino-acids) into index + i2w = dict() # maps index into word(amino-acid) + + # may need to rearrange the order later + amino_acids = ['A','R','N','D','C','Q','E','G','H','I','L','K','M','F','P','S','T','W','Y','V'] + special_tokens = ['', '', '', ''] + + # first get the amino acids + for w in amino_acids: + i2w[len(w2i)] = w + w2i[w] = len(w2i) + + # then add special tokens + for st in special_tokens: + i2w[len(w2i)] = st + w2i[st] = len(w2i) + + return w2i,i2w + +# find a historgram frequency for an input value +def find_bin_value( + element: float, # element to find correpsonding bin frequency for. higher the frequency, lower should be the probability of sampling this value + n: List, # List of bin frequencies + bins: List # List of bin edges + )->float: + + import bisect + + # find min/max : leftmost/rightmost bin edges + min_, max_ = bins[0], bins[-1] + + # if element is outside min_, max_, throw an error + if (element < min_) or (element > max_): + raise Exception(f"Sorry, cannot find frequency for element outside of [{min_};{max_}] range") + + # if element is equal to max_, assign to last bin (other edge cases should be handled correclt in the main body of the function) + if element == max_: + ind = len(n)-1 + else: + ind = bisect.bisect(bins, element) - 1 + + return n[ind] + +# dataset class for processing sequence data +class ProteinSequencesDataset(Dataset): + ''' + Custom dataset class that works with protein sequences. 
+ fasta_file : FASTA file from Uniprot with protein sequences (needs to be prepared separately), string + w2i : map word-to-index, dictionary + i2w : map index-to-word, dictionary + max_sequence_length: maximum length of protein sequence to be considered for VAE, whatever is beyond is ignored, int + sequence_weights : dictionary with sequence weights + + ''' + def __init__( + self, + fasta_file : str, + w2i : dict, + i2w : dict, + device : torch.device, + max_sequence_length : int = 500, + sequence_weights : dict = None, + extract_energy : bool = False + ): + super().__init__() + + # save few variables + self.max_seq_length = max_sequence_length + 1 # to account for / + + # need to create w2i and i2w dictionaries + self.w2i, self.i2w = w2i, i2w + + # keep device + self.device = device + + # need to construct data object -> modified to exclude sequences with weird amino acids + self.data, self.list_of_energies = self.__construct_data( + fasta_file, + sequence_weights = sequence_weights, + extract_energy = extract_energy + ) + + def __len__(self) -> int: + return len(self.data) + + def __getitem__(self, idx) -> dict: + return self.data[idx] + + def __sym2num_conversion( + self, + input_ : List, + target_ : List + ) -> Tuple[torch.tensor,torch.tensor]: + ''' + Conversion of string array into numeric array. Needed if we use embedding layers. + Conversion is the SAME for input_ and target_ + EX.: ['','M','Q','H'] -> [2,4,7,10] + + INPUT: + input_ : Input array of strings, list of strings + target_: Next element predictions for the input_, list of strings + OUTPUT: + input_num, target_num : numpy numeric arrays. See EX. above. 
+ + ''' + #input_num = np.asarray([self.w2i.get(element,self.w2i['']) for element in input_]) + #target_num = np.asarray([self.w2i.get(element,self.w2i['']) for element in target_]) + input_num = torch.tensor( + [self.w2i.get(element,self.w2i['']) for element in input_], + dtype = torch.long, + device = self.device + ) + target_num = torch.tensor( + [self.w2i.get(element,self.w2i['']) for element in target_], + dtype = torch.long, + device = self.device + ) + + return input_num,target_num + + def __construct_data( + self, + fasta_file : str, + sequence_weights : dict = None, # sequence weights (as dictionary) + extract_energy : bool = False + ) -> defaultdict: + ''' + Explicit construction of data object that is used in __getitem__ method. + INPUT: + fasta_file : FASTA file from Uniprot with protein sequences (needs to be prepared separately), string + OUTPUT: + data : defaultdict that has a following format: + data[i] = {"input" : Input array for element i (EX: ABCD) + "target" : Target array for element i (it is input shifted by 1 position to the right) (EX: ABCD) + "energy" : Free Energy value + "length" : length of input or output (they'are the same length) that does not take padding into account) + "weight" : some weight assigned to a sequence, default 1.0 + "reference" : id of a sequence + } + ''' + # create a nested dictionary with default dictionary + data = defaultdict(dict) + + # create empty list + list_of_energies = [] + + # get list of sequences: now only sequences with ALL known amino acids are added + orginal_records = SeqIO.parse(fasta_file,"fasta") + records = [record for record in orginal_records] + + # add weights (if sequence_weights object is not None) + addweights = True if sequence_weights != None else False + + # populate data + # loop over seqeunces + for i,record in enumerate(records): + + # get reference id + reference_ = record.id + + if extract_energy: + # parse ID to obtain free energy + energy = float( + reference_.split(":")[1] + ) + 
+ # append to energies list + list_of_energies.append(energy) + + # cast to tensor + energy_ = torch.tensor( + [energy], + dtype = torch.float, + device = self.device + ) + + # convert to a list + sequence = list(record.seq) + sequence_plus_sos = [''] + sequence + + # obtain input and target as character arrays + input_ = sequence_plus_sos[:self.max_seq_length] + target_ = sequence[:self.max_seq_length-1] + [''] + assert len(input_) == len(target_), "Length mismatch" + len_ = len(input_) + + # cast to tensor + len_ = torch.tensor( + len_, + dtype=torch.long, + device=self.device + ) + + # need to append tokens if necessary + input_.extend([''] * (self.max_seq_length-len_)) + target_.extend([''] * (self.max_seq_length-len_)) + + # need to convert into numerical format + input_,target_ = self.__sym2num_conversion(input_,target_) + + # save to data: everything but reference_ is torch tensor (pushed to cpu or gpu, if available) + data[i]["input"] = input_ + data[i]["target"] = target_ + data[i]["length"] = len_ + data[i]["reference"] = reference_ + + # add weights + if addweights: + data[i]["weight"] = torch.tensor( + sequence_weights[reference_], + dtype = torch.float, + device = self.device + ) # add weights wrapped into tensor + print(data[i]["weight"]) + # add energy + if extract_energy: + data[i]["energy"] = energy_ + + return data,list_of_energies + + @property + def vocab_size(self) -> int: + return len(self.w2i) + + @property + def max_seq_len(self) -> int: + return self.max_seq_length + + @property + def pad_idx(self) -> int: + return self.w2i[''] + + @property + def sos_idx(self) -> int: + return self.w2i[''] + + @property + def eos_idx(self) -> int: + return self.w2i[''] + + @property + def unk_idx(self) -> int: + return self.w2i[''] + + @property + def energies(self) -> ArrayLike: + return np.array(self.list_of_energies) + + # new: return weights for each sequence/energy pair + @property + def sequence_weights(self) -> ArrayLike: + # run histrogram on 
self.list_of_energies + n, bins = np.histogram( + self.list_of_energies, + "auto" + ) + + # compute weights as inverse of frequencies + # higher the frequency, lower the probability of sampling + weights = [ 1.0/find_bin_value(energy,n,bins) for energy in self.list_of_energies ] + + return weights + + + +##################################################### RELATED TO TRAINING ######################################## +# computing loss for Gaussian-based VAE +# loss is composed of 3 terms: +# 1) Reconstruction loss +# 2) KL loss (in closed form) +# 3) MSE loss +# weights are not used here, if sequences have different weights, this function needs to be modified! +def compute_loss_gaussian( + reconstruction_loss_criterion, # function/class to compute Reconstruction loss -> here NLLLoss + true, # true sequnce tokens + predicted, # predicted tokens probability/logprobability/logits (depends on a function used) + mean, # mean of q(z|x) + logv, # log-variance of q(z|x) + mse_loss_criterion, # MSE loss class/function + energy_true, # true energy values + energy_predicted # predicted energy values + ): + # true: [Batch Sise, Seq Length] + # predicted: [Batch Size, Seq Length, Vocab Size] + B,S,E = predicted.size() + true = true.reshape(-1) + predicted = predicted.reshape(B*S,E) + + # reconstruction loss + reconstruction_loss = reconstruction_loss_criterion(predicted,true) + + # KL loss + kl_loss = -0.5 * torch.sum( + 1 + logv - mean.pow(2) - logv.exp() + ) + + # MSE loss + mse_energy = mse_loss_criterion(energy_predicted,energy_true) + + return reconstruction_loss,kl_loss,mse_energy + +# whole pass over dataloader +# optimization is performed +def train_step( + model, # VAE + dataloader, # dataloader + criterion, # NLL for reconstruction error + criterion_mse, # MSE for MSE loss + optimizer, + logger, + logger_sequences, # logger to check which sequences are in batch + masking_prob=0.0 + ): + # training mode + model.train() + + batch_loss = [] # all + batch_reconstruction = 
[] # reconstruction + batch_kl = [] # kl + batch_mse = [] # mse + + for idx,batch in enumerate(dataloader): + + src = batch["input"] # size [N,S] + tgt = batch["target"] # size [N,T] + energy_true = batch["energy"] # size [N,1] or maybe [N] as energy is a scalar + reference_ids = batch["reference"] + + # forward pass + output,mean,logv,predicted_energy = model( + src, # Src in Transformer architecture + src, # Tgt in Transformer architecture + masking_prob = masking_prob # masking probability to mask Tgt + ) + + # loss calculation (returns reconstruction, kl and mse losses individually) + reconstruction_loss, kl_loss, mse_loss = compute_loss_gaussian( + criterion, + tgt, + output, + mean, + logv, + criterion_mse, + energy_true, + predicted_energy + ) + + # overall loss + loss = reconstruction_loss + kl_loss + mse_loss + + if idx == 0: + # print resources + if torch.cuda.is_available(): + print(f"GPU resources just before gradient update:") + print(torch.cuda.memory_summary()) + + optimizer.zero_grad() + loss.backward() + optimizer.step() + + # Overall loss + batch_loss.append(loss.item()) + + # reconstruction + batch_reconstruction.append(reconstruction_loss.item()) + + # kl + batch_kl.append(kl_loss.item()) + + # mse + batch_mse.append(mse_loss.item()) + + # add to the logger + str_ = f"\t Batch {idx}\t" + str_ += f"Reconstruction error: {batch_reconstruction[-1]:0.4f}\t" + str_ += f"KL: {batch_kl[-1]:0.4f}\t" + str_ += f"MSE: {batch_mse[-1]:0.4f}\t" + str_ += f"ELBO: {batch_loss[-1]:0.4f}" + logger.info(str_) + + # add to logger_sequences + logger_sequences.info(reference_ids) + + + # compute average (for epoch) + avg_loss = sum(batch_loss)/len(batch_loss) + avg_reconstruction = sum(batch_reconstruction)/len(batch_reconstruction) + avg_kl = sum(batch_kl)/len(batch_kl) + avg_mse = sum(batch_mse)/len(batch_mse) + + return avg_loss,avg_reconstruction,avg_kl,avg_mse + +# whole pass over dataloader +# no optimization is performed +def 
# whole pass over dataloader
# no optimization is performed
def validation_step(model,dataloader,criterion,criterion_mse):
    """Evaluate `model` over `dataloader` without touching its parameters.

    Every batch is a mapping read through the keys "input", "target" and
    "energy". The model is called as `model(src, src)` and must return
    `(output, mean, logv, predicted_energy)`.

    Returns:
        (avg_loss, avg_reconstruction, avg_kl, avg_mse): plain means of the
        per-batch values.

    Raises:
        ValueError: if `dataloader` yields no batch (previously this
            surfaced as a bare ZeroDivisionError when averaging).
    """
    # evaluation mode
    model.eval()

    batch_loss = []             # all
    batch_reconstruction = []   # reconstruction
    batch_kl = []               # kl
    batch_mse = []              # mse

    # don't keep gradients
    with torch.no_grad():
        for batch in dataloader:
            src = batch["input"]            # size [N,S]
            tgt = batch["target"]           # size [N,T]
            energy_true = batch["energy"]   # size [N,1] or just [N]

            # forward pass
            output, mean, logv, predicted_energy = model(src, src)

            # loss calculation
            reconstruction_loss, kl_loss, mse_loss = compute_loss_gaussian(
                criterion,
                tgt,
                output,
                mean,
                logv,
                criterion_mse,
                energy_true,
                predicted_energy
            )

            # overall loss
            loss = reconstruction_loss + kl_loss + mse_loss

            batch_loss.append(loss.item())
            batch_reconstruction.append(reconstruction_loss.item())
            batch_kl.append(kl_loss.item())
            batch_mse.append(mse_loss.item())

    if not batch_loss:
        raise ValueError("validation_step: dataloader produced no batches, cannot average losses")

    # compute average
    n_batches = len(batch_loss)
    avg_loss = sum(batch_loss) / n_batches
    avg_reconstruction = sum(batch_reconstruction) / n_batches
    avg_kl = sum(batch_kl) / n_batches
    avg_mse = sum(batch_mse) / n_batches

    return avg_loss, avg_reconstruction, avg_kl, avg_mse
# shared forward pass of the GRU / Transformer energy predictors
def _predict_energy_gru_tf(model, batch, model_type):
    """Call the predictor with the arguments its architecture expects.

    model_type == 1 means GRU, which takes the sequences and their lengths;
    any other value is treated as the Transformer encoder, which takes the
    sequences only. "length" is read from the batch only on the GRU path.
    """
    sequences = batch["input"]      # size [N,S]
    if model_type == 1:
        return model(sequences, batch["length"])
    return model(sequences)


# GRU predict energy from sequence
# whole pass over dataloader
# optimization is performed
def train_step_gru_tf(
        model,
        dataloader,
        criterion_mse,
        optimizer,
        logger,
        model_type: int = 1     # 1: GRU, 2: TF
    ):
    """Train an energy predictor for one pass over `dataloader`.

    Every batch is a mapping with keys "input" and "energy" (plus "length"
    for the GRU). One optimiser step is taken per batch and the per-batch
    MSE is written to `logger`.

    Returns:
        The mean of the per-batch MSE values.

    Raises:
        ValueError: if `dataloader` yields no batch.
    """
    # training mode
    model.train()

    batch_mse = []

    for idx, batch in enumerate(dataloader):
        energy_true = batch["energy"]   # size [N,1]
        predicted_energy = _predict_energy_gru_tf(model, batch, model_type)

        # the MSE is the only loss term for these models
        mse_loss = criterion_mse(predicted_energy, energy_true)

        optimizer.zero_grad()
        mse_loss.backward()
        optimizer.step()

        batch_mse.append(mse_loss.item())

        # add to the logger
        str_ = f"\t Batch {idx}\t"
        str_ += f"MSE: {batch_mse[-1]:0.4f}\t"
        logger.info(str_)

    if not batch_mse:
        raise ValueError("train_step_gru_tf: dataloader produced no batches, cannot average losses")

    # compute average (for epoch)
    return sum(batch_mse) / len(batch_mse)


# GRU validation step
def validation_step_gru_tf(
        model,
        dataloader,
        criterion_mse,
        model_type: int = 1     # 1: GRU, 2: TF
    ):
    """Evaluate an energy predictor over `dataloader` without gradients.

    Returns:
        The mean of the per-batch MSE values.

    Raises:
        ValueError: if `dataloader` yields no batch.
    """
    # evaluation mode
    model.eval()

    batch_mse = []

    with torch.no_grad():
        for batch in dataloader:
            energy_true = batch["energy"]   # size [N,1]
            predicted_energy = _predict_energy_gru_tf(model, batch, model_type)
            batch_mse.append(criterion_mse(predicted_energy, energy_true).item())

    if not batch_mse:
        raise ValueError("validation_step_gru_tf: dataloader produced no batches, cannot average losses")

    # compute average (for epoch)
    return sum(batch_mse) / len(batch_mse)
# procedure to get means/stds of the latent space
def get_means_stds(
        output_filename_means : str,        # filename for means of q(z|x)
        output_filename_stds : str,         # filename for stds of q(z|x)
        pt_name : str,                      # pytorch file with pretrained layers
        pickle_name : str,                  # pickle file with model inputs
        fasta_file : str,                   # FASTA file with sequences
        batch_size : int = 4,               # how many sequences to process in a batch
        max_sequence_length : int = 500,    # max sequence length for Dataset construction
        seed : int = 0
    ):
    """Encode every sequence of `fasta_file` and write q(z|x) means/stds to CSV.

    Two CSV files are written, one row per sequence (indexed by the
    "reference" field of each batch) and one column per latent dimension
    ("dim-1" ... "dim-<latent_size>"). Nothing is returned.
    """
    # model constructor arguments
    # NOTE(review): pickle.load can execute arbitrary code; only point this at trusted files
    with open(pickle_name, "rb") as handle:
        model_kwargs = pickle.load(handle)

    # set device; override whatever device was pickled so cpu-only hosts work
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    model_kwargs["device"] = device

    # instantiate model and load trained parameters
    model = TransformerVAE(**model_kwargs)
    checkpoint = torch.load(pt_name, map_location = device)
    model.load_state_dict(checkpoint['model_state_dict'])
    model.eval()

    # move to the selected device
    model = model.to(device)
    print(f"Device: {device}")

    # token <-> index maps
    w2i, i2w = default_w2i_i2w()

    # set random seed
    torch.manual_seed(seed)

    # dataset and dataloader (order preserved so rows line up with sequence ids)
    dataset = ProteinSequencesDataset(
        fasta_file,
        w2i,
        i2w,
        device,
        max_sequence_length = max_sequence_length
    )
    dataloader = DataLoader(dataset, batch_size=batch_size, shuffle=False)

    # lists to store all means/stds
    means, stds, sequenceIDs = [], [], []

    with torch.no_grad():
        for batch in dataloader:
            src = batch['input']
            sequenceIDs.extend(batch["reference"])

            # forward pass, no masking probability here; only mean/log-variance are kept
            _, mean, logv, _ = model(
                src,    # Src in Transformer architecture
                src,    # Tgt in Transformer architecture
            )
            means.append(mean)
            stds.append(torch.exp(0.5 * logv))

    # concatenate and convert to numpy : size [# sequences, latent size]
    # (.cpu() is a no-op when the tensors already live on the cpu)
    means = torch.cat(means, dim=0).cpu().numpy()
    stds = torch.cat(stds, dim=0).cpu().numpy()

    # create column names
    latent_size = model_kwargs["latent_size"]
    column_names = [f"dim-{i+1}" for i in range(latent_size)]

    # write both tables
    pd.DataFrame(means, columns = column_names, index = sequenceIDs).to_csv(output_filename_means)
    pd.DataFrame(stds, columns = column_names, index = sequenceIDs).to_csv(output_filename_stds)
####################################################### RELATED TO SAMPLING ######################################
# convert indices to tokens
def decode(
        array_indices : ArrayLike,      # numpy array with indices
        array_logp : ArrayLike,         # numpy array with log-probabilities (must be same shape as indices)
        array_Z : ArrayLike,            # latent space value used in decoder to generate log-probabilities and indices
        array_energies : ArrayLike,     # energies obtained from z
        i2w : dict,                     # dictionary that maps index to a letter
        improper_token_list : List      # list of tokens that are not 20 valid AAs
    ) -> List:
    """Turn sampled token indices into (tokens, energy, logp, z) tuples.

    Each row of `array_indices` is read left to right until the first token
    found in `improper_token_list`; the tokens before it are mapped through
    `i2w` and their log-probabilities are summed. Rows whose very first
    token is improper produce no output, so the result may be shorter than
    the number of rows.

    Returns:
        A list of tuples
        (list of decoded tokens, array_energies[n][0], summed logp,
        array_Z[n] reshaped to (1, latent_size)).
    """
    # check that arrays are of the same length
    assert array_indices.shape == array_logp.shape, "Shape mismatch between indices and log-probabilities numpy arrays"

    # check that number of elements is the same in array_indices and array_Z
    assert array_indices.shape[0] == array_Z.shape[0], "Number of samples must be the same in indices and Z numpy arrays"

    # check that number of elements is the same between indices and energies
    assert array_indices.shape[0] == array_energies.shape[0], "Number of samples must be the same in indices and energies numpy arrays"

    # get number of sequences and number of elements per sequence
    n_samples = array_indices.shape[0]
    n_elements_per_sequence = array_indices.shape[1]

    print(f"Number of sequences to decode : {n_samples}")
    print(f"Number of elements in a sequence: {n_elements_per_sequence}")

    # built once: constant-time membership test inside the token loop
    improper_tokens = frozenset(improper_token_list)

    # list element is a (sequence,energy,logp,z) tuple: z is the latent vector used to create the sequence
    sequences = []

    for n in range(n_samples):
        # latent vector as (1, latent_size) and scalar energy of this sample
        associated_z = array_Z[n, :][np.newaxis, :]
        associated_energy = array_energies[n][0]

        temp_decoded = []
        cumulative_logp = 0.0

        for element, element_logp in zip(array_indices[n], array_logp[n]):
            # stop at the first token that is not a valid amino acid
            if element in improper_tokens:
                break
            temp_decoded.append(i2w[element])
            cumulative_logp += element_logp

        # keep the sample only if at least one valid token was decoded
        if temp_decoded:
            sequences.append(
                (
                    temp_decoded,
                    associated_energy,
                    cumulative_logp,
                    associated_z
                )
            )

    return sequences
# sample from gaussian prior
def sample_tf_using_prior(
        output_filename : str,
        pt_name : str,
        pickle_name : str,
        n_samples : int = 10000,
        seed : int = 0,
        max_number_of_steps : int = 100
    ) -> List:
    """Sample sequences from the prior, de-duplicate them and write a FASTA file.

    Sampling runs in chunks of 100. A final smaller chunk covers any
    remainder, so exactly `n_samples` latent vectors are drawn (previously
    `n_samples // 100 * 100` were drawn, i.e. none for n_samples < 100).
    Identical decoded sequences are merged into one SequenceData object.

    Returns:
        A list with one `toTuple` value per unique sequence; the matching
        `toSeqRecord` values are written to `output_filename`.
    """
    # model constructor arguments
    # NOTE(review): pickle.load can execute arbitrary code; only point this at trusted files
    with open(pickle_name, "rb") as handle:
        model_kwargs = pickle.load(handle)

    # set device; override whatever device was pickled so cpu-only hosts work
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    model_kwargs["device"] = device

    # instantiate model and load trained parameters
    model = TransformerVAE(**model_kwargs)
    checkpoint = torch.load(pt_name, map_location = device)
    model.load_state_dict(checkpoint['model_state_dict'])
    model.eval()

    # move to the selected device
    model = model.to(device)

    print(f"Device: {device}")

    # token <-> index maps
    w2i, i2w = default_w2i_i2w()

    # tokens that terminate decoding
    # NOTE(review): the four keys read as empty strings in this copy of the file;
    # they look like special-token names lost in extraction - confirm against default_w2i_i2w
    improper_token_list = [
        w2i[''],
        w2i[''],
        w2i[''],
        w2i['']
    ]

    # set seed
    torch.manual_seed(seed)

    # full chunks of 100 plus one chunk for the remainder (nothing for n_samples <= 0)
    chunk_size = 100
    n_full_chunks, remainder = divmod(max(n_samples, 0), chunk_size)
    chunk_sizes = [chunk_size] * n_full_chunks
    if remainder:
        chunk_sizes.append(remainder)

    # each element: (decoded tokens as list, energy, logp, z as numpy array)
    sequences = []

    with torch.no_grad():
        for n_in_chunk in chunk_sizes:
            logp, indices, z, energies, _ = model.sample_from_latent_space(
                n_in_chunk,
                max_length = max_number_of_steps
            )
            # .cpu() is a no-op when the tensors already live on the cpu
            sequences.extend(
                decode(
                    indices.cpu().numpy(),
                    logp.cpu().numpy(),
                    z.cpu().numpy(),
                    energies.cpu().numpy(),
                    i2w,
                    improper_token_list
                )
            )

    # sort by energy (2nd element of the tuple), lowest first; this fixes the order
    # in which ids are handed out and in which duplicates are merged
    sorted_sequences = sorted(sequences, key=lambda tup: tup[1], reverse = False)

    # lookup: sequence string -> SequenceData instance; also serves as the "already seen" set
    seq2obj = {}
    cnt = 1

    for decoded_tokens, associated_energy, logp_seq, associated_z in sorted_sequences:
        seq = "".join(decoded_tokens)   # string, so it can be used as a dict key

        if seq not in seq2obj:
            # first occurrence: create the record holder
            seq2obj[seq] = SequenceData(
                seq,
                f"seq-{cnt}-prior",
                associated_energy,
                logp_seq,
                associated_z
            )
            cnt += 1
        else:
            # repeated sample of a known sequence: accumulate its energy/logp/z
            seq2obj[seq].update_info(
                associated_energy,
                logp_seq,
                associated_z
            )

    # once data is combined: generate descriptions and collect outputs
    seq_tuple = []
    records = []
    for v in seq2obj.values():
        v.generate_description()        # to have a human readable description
        # toTuple / toSeqRecord are read without call parentheses, as in the
        # original - presumably properties of SequenceData; confirm
        seq_tuple.append(v.toTuple)
        records.append(v.toSeqRecord)

    # save records list as FASTA file
    SeqIO.write(records, output_filename, "fasta")

    return seq_tuple
# sample from gaussian variational posterior
def sample_tf_using_posterior(
        output_filename : str,
        pt_name : str,
        pickle_name : str,
        fasta_file : str,
        max_number_of_steps : int = 500,    # for how many steps to perform autoregressive sampling
        n_samples : int = 10,
        mini_batch_size : int = 10,
        seed : int = 0,
        T : float = 0.0,
        skip_first_element : bool = True
    ) -> List:
    """Sample variants around the single sequence of `fasta_file` and write a FASTA file.

    `fasta_file` must produce exactly one batch of size 1. Sampling runs in
    draws of `mini_batch_size`. A final smaller draw covers any remainder,
    so exactly `n_samples` samples are requested (previously
    `n_samples // mini_batch_size * mini_batch_size`). Identical decoded
    sequences are merged into one SequenceData object.

    Returns:
        A list with one `toTuple` value per unique sequence; the matching
        `toSeqRecord` values are written to `output_filename`.
    """
    # model constructor arguments
    # NOTE(review): pickle.load can execute arbitrary code; only point this at trusted files
    with open(pickle_name, "rb") as handle:
        model_kwargs = pickle.load(handle)

    # get max_seq_length from the model arguments (subtract 1 as 1 is added in dataset constructor)
    max_sequence_length = model_kwargs["max_seq_length"] - 1

    # set device; override whatever device was pickled so cpu-only hosts work
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    model_kwargs["device"] = device

    # instantiate model and load trained parameters
    model = TransformerVAE(**model_kwargs)
    checkpoint = torch.load(pt_name, map_location = device)
    model.load_state_dict(checkpoint['model_state_dict'])
    model.eval()

    # move to the selected device
    model = model.to(device)

    print(f"Device: {device}")

    # token <-> index maps
    w2i, i2w = default_w2i_i2w()

    # tokens that terminate decoding
    # NOTE(review): the four keys read as empty strings in this copy of the file;
    # they look like special-token names lost in extraction - confirm against default_w2i_i2w
    improper_token_list = [
        w2i[''],
        w2i[''],
        w2i[''],
        w2i['']
    ]

    # set seed
    torch.manual_seed(seed)

    # dataset and dataloader
    dataset = ProteinSequencesDataset(
        fasta_file,
        w2i,
        i2w,
        device,
        max_sequence_length = max_sequence_length
    )
    dataloader = DataLoader(dataset, batch_size=1, shuffle=False)

    # check that dataloader contains only 1 element
    assert len(dataloader) == 1, "Dataloader should contain a single batch of size 1. Check FASTA file with which you construct dataset."

    # full draws of mini_batch_size plus one draw for the remainder
    n_full_draws, remainder = divmod(max(n_samples, 0), mini_batch_size)
    draw_sizes = [mini_batch_size] * n_full_draws
    if remainder:
        draw_sizes.append(remainder)

    # lookup: sequence string -> SequenceData instance; also serves as the "already seen" set
    seq2obj = {}
    cnt = 1

    # loop over elements of dataset (exactly one, see the assertion above)
    for batch in dataloader:

        # get data (here: batch = 1 sequence)
        src = batch['input']
        reference_ = batch["reference"][0]

        print("Src size:",src.size())

        # each element: (decoded tokens as list, energy, logp, z as numpy array)
        sequences = []

        with torch.no_grad():
            for draw_size in draw_sizes:
                logp, indices, z, energies = model.sample_around_molecule(
                    src,
                    draw_size,
                    T = T,
                    max_length = max_number_of_steps,
                    skip_first_element = skip_first_element
                )
                # .cpu() is a no-op when the tensors already live on the cpu
                sequences.extend(
                    decode(
                        indices.cpu().numpy(),
                        logp.cpu().numpy(),
                        z.cpu().numpy(),
                        energies.cpu().numpy(),
                        i2w,
                        improper_token_list
                    )
                )

        # sort by energy (2nd element of the tuple), highest first; this fixes the order
        # in which ids are handed out and in which duplicates are merged
        sorted_sequences = sorted(sequences, key=lambda tup: tup[1], reverse = True)

        for decoded_tokens, associated_energy, logp_seq, associated_z in sorted_sequences:
            seq = "".join(decoded_tokens)   # as string

            if seq not in seq2obj:
                # first occurrence: create the record holder
                seq2obj[seq] = SequenceData(
                    seq,
                    f"seq-{cnt}-temperature-{T}",
                    associated_energy,
                    logp_seq,
                    associated_z
                )
                cnt += 1
            else:
                # repeated sample of a known sequence: accumulate its energy/logp/z
                seq2obj[seq].update_info(
                    associated_energy,
                    logp_seq,
                    associated_z
                )

    # once data is combined: generate descriptions and collect outputs
    seq_tuple = []
    records = []
    for v in seq2obj.values():
        v.generate_description(seedID=reference_)   # to have a human readable description
        # toTuple / toSeqRecord are read without call parentheses, as in the
        # original - presumably properties of SequenceData; confirm
        seq_tuple.append(v.toTuple)
        records.append(v.toSeqRecord)

    # write a file
    SeqIO.write(records, output_filename, "fasta")

    return seq_tuple
# sample seq2energy (same function will be used for prior and posterior samples)
# will estimate elbo (reconstruction+kl) and energy for sampled variants (prior and posterior)
def seq2_energy_tf(
        output_filename_intermediate : str,     # csv output template (reconstruction/kl/elbo/energy)
        pt_name : str,                          # pytorch file with pretrained layers
        pickle_name : str,                      # pickle file with model input parameters
        fasta_file : str,                       # fasta with sequences
        n_samples : int = 100,                  # how many times sample from latent
        batch_size : int = 10,                  # how many samples to process at once
        seed : int = 0                          # random seed for sampling
    ):
    """Estimate reconstruction, KL, ELBO and energy for every sequence of `fasta_file`.

    Each sequence is passed through the model `n_samples` times. The
    per-pass values are written to four CSV files named
    `<output_filename_intermediate>-{reconstruction,kl,elbo,energy}.csv`
    (rows: sequences, columns: "1".."n_samples").

    Returns:
        dict with keys "seq-id", "reconstruction", "kl", "elbo" and
        "energy"; the last four hold, per sequence, the average over the
        `n_samples` passes.
    """

    #### reconstruction loss and KL individually for each batch element
    def _per_sequence_nll_and_kl(nll_criterion, logp, target, mean, logv):
        # logp: [N,S,Vocab Size], target: [N,S], mean/logv: [N,latent size]
        n_seq, seq_len, vocab_size = logp.size()

        # token-level NLL (criterion built with reduction='none'), then summed per sequence
        token_nll = nll_criterion(logp.reshape(-1, vocab_size), target.reshape(-1))
        nll_per_sequence = token_nll.reshape(n_seq, seq_len).sum(dim=-1)

        # KL divergence summed over the latent dimension only -> one value per sequence
        kl_per_sequence = -0.5 * torch.sum(
            1 + logv - mean.pow(2) - logv.exp(),
            dim = -1
        )
        # both are tensors of size [N]
        return nll_per_sequence, kl_per_sequence

    #### save intermediate results into a csv file
    def _save_csv(np_array, indices, columns, filename) -> None:
        pd.DataFrame(np_array, columns = columns, index = indices).to_csv(filename)

    ################################################################# MAIN BODY #################################
    # model constructor arguments
    # NOTE(review): pickle.load can execute arbitrary code; only point this at trusted files
    with open(pickle_name, "rb") as handle:
        model_kwargs = pickle.load(handle)

    # get the max_seq_length (for dataset construction, adjust by subtracting 1)
    max_sequence_length = model_kwargs["max_seq_length"] - 1

    # set device; override whatever device was pickled so cpu-only hosts work
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    model_kwargs["device"] = device

    # instantiate model and load trained parameters
    model = TransformerVAE(**model_kwargs)
    checkpoint = torch.load(pt_name, map_location = device)
    model.load_state_dict(checkpoint['model_state_dict'])
    model.eval()

    # move to the selected device
    model = model.to(device)

    print(f"Device: {device}")

    # token <-> index maps
    w2i, i2w = default_w2i_i2w()

    # set seed
    torch.manual_seed(seed)

    # dataset and dataloader (order preserved so rows line up with sequence ids)
    dataset = ProteinSequencesDataset(
        fasta_file,
        w2i,
        i2w,
        device,
        max_sequence_length = max_sequence_length
    )
    dataloader = DataLoader(dataset, batch_size=batch_size, shuffle=False)

    # one [# sequences, # samples] matrix per metric, allocated on the cpu
    metric_names = ("reconstruction", "kl", "elbo", "energy")
    matrices = {
        name: torch.zeros((len(dataset), n_samples))
        for name in metric_names
    }

    # list for sequenceIDs
    sequenceIDs = []

    # token-level NLL that ignores padding positions
    NLL = nn.NLLLoss(ignore_index=dataset.pad_idx, reduction='none')

    with torch.no_grad():
        # run over batches
        for i, batch in enumerate(tqdm.tqdm(dataloader, 'Looping through mutation batches')):
            src = batch["input"]    # size [N,S]
            tgt = batch["target"]   # size [N,T]
            sequenceIDs.extend(batch["reference"])

            # rows of the matrices that belong to this batch (last batch may be shorter)
            first_row = i * batch_size
            rows = slice(first_row, first_row + len(src))

            # run over number of samples
            for j in tqdm.tqdm(range(n_samples), 'Looping through number of samples for batch #: '+str(i+1)):

                # forward pass; predicted energy: [Batch Size, 1]
                logp, mean, logv, predicted_energy = model(
                    src,    # Src in Transformer architecture
                    src,    # Tgt in Transformer architecture
                )

                # per-sequence reconstruction/KL, dimensionality [Batch Size]
                NLL_loss, KL_loss = _per_sequence_nll_and_kl(NLL, logp, tgt, mean, logv)

                matrices["reconstruction"][rows, j] = NLL_loss
                matrices["kl"][rows, j] = KL_loss
                matrices["elbo"][rows, j] = NLL_loss + KL_loss
                # flatten [N,1] -> [N]; unlike squeeze() this stays 1-D for N == 1
                matrices["energy"][rows, j] = predicted_energy.reshape(-1)

    # averages across samples : [# of sequences]
    averages = {
        name: matrix.mean(dim=1, keepdim=False)
        for name, matrix in matrices.items()
    }

    ################################################################# intermediate results ########################
    # column names: integers representing sample
    columns = [f"{i+1}" for i in range(n_samples)]

    # one csv per metric: -reconstruction.csv, -kl.csv, -elbo.csv, -energy.csv
    for name in metric_names:
        _save_csv(
            matrices[name].cpu().numpy(),
            sequenceIDs,
            columns,
            output_filename_intermediate + f"-{name}.csv"
        )

    ################################################################# final results ########################
    final_data = {
        "seq-id" : sequenceIDs,
        "reconstruction" : averages["reconstruction"].tolist(),
        "kl" : averages["kl"].tolist(),
        "elbo" : averages["elbo"].tolist(),
        "energy" : averages["energy"].tolist()
    }

    return final_data
# single optimisation run -> running SGD on prior sample
def sgd_optimisation(
        pt_name : str,
        pickle_name : str,
        logger : logging.Logger,
        learning_rate : float,
        delta_f_tol : float,
        max_opt_steps : int
    ):
    """Minimise the predicted energy over a single latent vector z with SGD.

    z starts from a standard-normal draw. After every step a sequence is
    sampled from the current z and stored as a SeqRecord. The run stops
    when the energy changes by less than `delta_f_tol` between two
    consecutive steps, or after `max_opt_steps` steps.

    Returns:
        (opt_z, opt_loss, records_progressive): z after the last update
        and the last evaluated loss, both as numpy values, plus the list
        of SeqRecords. Note that the loss of a step is evaluated before
        that step's update of z.

    Raises:
        ValueError: if `max_opt_steps` is smaller than 1 (previously a
            NameError on the undefined loss).
    """
    if max_opt_steps < 1:
        raise ValueError("sgd_optimisation: max_opt_steps must be at least 1")

    # model constructor arguments
    # NOTE(review): pickle.load can execute arbitrary code; only point this at trusted files
    with open(pickle_name, "rb") as handle:
        model_kwargs = pickle.load(handle)

    # set device; override whatever device was pickled so cpu-only hosts work
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    model_kwargs["device"] = device
    logger.info(f"Device used: {device}")

    # instantiate model and load trained parameters
    model = TransformerVAE(**model_kwargs)
    checkpoint = torch.load(pt_name, map_location = device)
    model.load_state_dict(checkpoint['model_state_dict'])
    model.eval()

    # extract the energy head (z -> energy)
    f_z = model.get_submodule("mlp2energy")

    # move to the selected device
    f_z = f_z.to(device)
    model = model.to(device)

    f_z.eval()

    # freeze the energy head: only z is optimised
    for param in f_z.parameters():
        param.requires_grad_(False)

    # we will be working with a single z, so set batch_size to 1
    batch_size = 1
    latent_size = model_kwargs["latent_size"]

    # number of autoregressive sampling steps
    max_sequence_length = model_kwargs["max_seq_length"]

    # token <-> index maps
    w2i, i2w = default_w2i_i2w()

    # tokens that terminate decoding
    # NOTE(review): the four keys read as empty strings in this copy of the file;
    # they look like special-token names lost in extraction - confirm against default_w2i_i2w
    improper_token_list = [
        w2i[''],
        w2i[''],
        w2i[''],
        w2i['']
    ]

    # create an input and require gradients
    z = torch.nn.Parameter(
        # our initial guess of vector z
        torch.randn(
            [batch_size, latent_size],  # (1,latent size)
            dtype = torch.float,
            device = device
        ),
        requires_grad = True
    )
    str_ = "Initial value:\n"
    str_ += f"{z}"
    logger.info(str_)

    # optimizer for z
    optim = torch.optim.SGD([z], lr = learning_rate)

    # assume starting loss is infinity
    prev_loss = float('inf')

    ### loop over steps and keep track of progress
    records_progressive = []

    for step in range(max_opt_steps):

        # copy of z before the update, detached from the computational graph
        z_prev = z.clone().detach()

        # predict energy; it is a [1,1] tensor, so sum it to get a scalar for backprop
        energy = f_z(z)
        loss = energy.sum()

        # gradient step
        optim.zero_grad()
        loss.backward()
        optim.step()

        # L2 norm of the change in z
        dz = z - z_prev
        l2_dz = torch.linalg.vector_norm(dz, ord=2)

        # change in function value
        df = abs(loss.item() - prev_loss)

        # log results
        step_results_str = f"Iteration:{step+1}:\n"
        step_results_str += f"Previous loss:{prev_loss:0.7f}, current loss:{loss.item():0.7f}, delta:{df:0.7f}\n"
        step_results_str += f"L2-norm of change in z: {l2_dz.item()}\n"
        step_results_str += f"Current z: \n {z.tolist()}\n"
        logger.info(step_results_str)

        # reassign prev_loss variable
        prev_loss = loss.item()

        # obtain a sequence from the current z (batch size 1, sampled rather than argmax)
        with torch.no_grad():
            logp, indices, current_z, current_energy, entropies = model.sample_from_latent_space(
                batch_size,
                max_length = max_sequence_length,
                z = z,
                argmax = False
            )

        # detach() guards against a returned tensor that still requires grad;
        # .cpu() is a no-op when the tensors already live on the cpu
        out = decode(
            indices.detach().cpu().numpy(),
            logp.detach().cpu().numpy(),
            current_z.detach().cpu().numpy(),
            current_energy.detach().cpu().numpy(),
            i2w,
            improper_token_list
        )
        # out: [(decoded tokens, associated_energy, cumulative_logp, associated_z)]
        assert len(out) == 1, "Something is wrong with decoding step."
        seq = "".join(out[0][0])
        associated_energy = out[0][1]
        logp_seq = out[0][2]

        # append to records
        records_progressive.append(
            SeqRecord(
                Seq(seq),
                id = f"optimization-step-{step+1}",
                description = f"Step:{step+1}/{max_opt_steps}||Logp:{logp_seq:0.7f}||Energy:{associated_energy:0.7f}|| Entropy (mean,max,std):[{entropies[0]:0.7f},{entropies[1]:0.7f},{entropies[2]:0.7f}]"
            )
        )

        # converged: stop early
        if df < delta_f_tol:
            final_str = f"Stopped after iteration {step+1} due to {df:0.10f} difference between energy values at two consecutive steps. Optimal function value: {loss.item():0.7f}"
            final_str += f"\tOptimal argument value (z): {z}"
            logger.info(final_str)
            break
    else:
        # reached only when the loop ran out of steps without breaking
        final_str = f"Stopped because maximum number of optimisation steps ({max_opt_steps}) have been reached. Optimal function value: {loss.item():0.7f}"
        final_str += f"\tOptimal argument value (z): {z}"
        logger.info(final_str)

    # detach and convert to numpy (.cpu() is a no-op on the cpu)
    opt_z = z.detach().cpu().numpy()
    opt_loss = loss.detach().cpu().numpy()

    # the last element of records_progressive belongs to the final step
    return opt_z, opt_loss, records_progressive
# constrained optimisation of energy NN (z -> E(z))
# optimal z will lie in mean(seq)+-3*sigma(seq)
def trust_region_optimisation(
        f_energy: nn.Module,        # NN to predict energy
        x0 : np.ndarray,            # starting point (x0,x1,x2...)
        bounds : List,              # list of (min,max) tuples per coordinate, or a scipy Bounds object
        logger : logging.Logger,    # logger
        device : torch.device       # cpu/cuda
    ):
    """Minimise `f_energy` from `x0` inside `bounds` with the 'trust-constr' method.

    The solver outcome (success flag, message, optimum value and argument)
    is written to `logger`.

    Returns:
        (x_opt, f(x_opt)) as reported by the solver result.
    """
    # solver configuration, passed through to minimize unchanged
    solver_settings = {
        "bounds": bounds,
        "method": 'trust-constr',
        "backend": 'torch',
        "precision": 'float64',
        "tol": 1e-8,
        "torch_device": device,
        "options": {'disp': True},
    }
    result = minimize(f_energy, x0, **solver_settings)

    # result.x       <- solution (x_opt)
    # result.fun     <- F(x_opt)
    # result.success <- whether optimisation is successful
    # result.message <- optimisation msg
    report_lines = [
        f"Optimisation successful: {result.success}.\n",
        f"Optimisation message : {result.message}.\n",
        f"F(x_opt) : {result.fun}.\n",
        f"x_opt : {result.x}.\n",
    ]
    logger.info("".join(report_lines))

    return result.x, result.fun
####################################################### RELATED TO PREDICTIVE MODELS:GRU/TF encoder ######################################
def predict_energies_using_tf_encoder(
        output_filename : str,  # output (FASTA) filename
        pt_name : str,          # pytorch file with pretrained layers
        pickle_name : str,      # pickle file with model input parameters
        fasta_file : str,       # fasta with sequences
        seed : int = 0          # random seed for sampling
    ):
    """Predict an energy for every sequence of `fasta_file` with the TF encoder.

    The input records are written to `output_filename` sorted by predicted
    energy (lowest first), with "||Model predicted energy:<value>" appended
    to each description.

    Returns:
        dict with keys 'reference-id' and 'estimated-energy', both lists in
        the original (unsorted) dataset order.
    """
    # map id (the "reference" field in the dataset) -> (sequence, description)
    id2seq = {
        record.id: (record.seq, record.description)
        for record in SeqIO.parse(fasta_file, "fasta")
    }

    # model constructor arguments
    # NOTE(review): pickle.load can execute arbitrary code; only point this at trusted files
    with open(pickle_name, "rb") as handle:
        model_kwargs = pickle.load(handle)

    # get the max_seq_length (for dataset construction, adjust by subtracting 1)
    max_sequence_length = model_kwargs["max_seq_length"] - 1

    # set device (the pickled arguments are passed to the model untouched here)
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

    # instantiate model -> TF predictive, and load trained parameters
    model = PredictorTFEncoder(**model_kwargs)
    checkpoint = torch.load(pt_name, map_location = device)
    model.load_state_dict(checkpoint['model_state_dict'])
    model.eval()

    # move to the selected device
    model = model.to(device)

    print(f"Device: {device}")

    # token <-> index maps
    w2i, i2w = default_w2i_i2w()

    # set seed
    torch.manual_seed(seed)

    # dataset and dataloader, one sequence per batch
    dataset = ProteinSequencesDataset(
        fasta_file,
        w2i,
        i2w,
        device,
        max_sequence_length = max_sequence_length
    )
    dataloader = DataLoader(dataset, batch_size=1, shuffle=False)

    # (reference, energy, extra description) per sequence, sorted later
    to_sort = []

    # energies data, returned to the caller
    predicted_energies, references = [], []

    for batch in dataloader:

        # get data (here: batch = 1 sequence)
        src = batch['input']
        reference_ = batch["reference"][0]

        print("Src size:",src.size())

        # forward pass to obtain a predicted energy
        with torch.no_grad():
            predicted_energy = model(src)

        # scalar value of the [1,1] output (.cpu() is a no-op on the cpu)
        predicted_energy = predicted_energy.cpu().numpy()[0][0]

        print("predicted energy: ", predicted_energy )

        # add to lists
        references.append(reference_)
        predicted_energies.append(predicted_energy)

        # the reference is kept to retrieve the sequence after sorting
        to_sort.append(
            (reference_, predicted_energy, f"||Model predicted energy:{predicted_energy}")
        )

    # sort on predicted energy, lowest first, and build the output records
    records = []
    for id_, _, additional_description_ in sorted(to_sort, key=lambda tup: tup[1], reverse = False):
        reference_seq_, original_description_ = id2seq[id_]
        records.append(
            SeqRecord(
                reference_seq_,
                id = id_,
                description = original_description_ + additional_description_
            )
        )

    # save
    SeqIO.write(records, output_filename, "fasta")

    # construct energies_data
    energies_data = {
        'reference-id': references,
        'estimated-energy': predicted_energies,
    }

    return energies_data


######################################################## RELATED TO PROTEIN ANALYSIS ################################

# creates default dictionary to be populated in protein_analysis function
# keys should be changed accordingly (!)
+def get_accumulator( + amino_acid_list:list + ) -> defaultdict: + # create default dictionary specifying keys explicitly + standard_keys = [ + "MW", + "aromaticity", + "instability", + "flexibility", + "gravy", + "isoelectric", + "helix", + "turn", + "sheet", + "reduced", + "oxidized" + ] + # extend with AAs + standard_keys.extend(amino_acid_list) + + accumulator = defaultdict( + list, + { k:[] for k in standard_keys } + ) + return accumulator + +# compute sequence params using ProteinAnalysis +def protein_analysis( + sequence : str, # input is a sequence but as a string + sequence_id : str, # sequence id + amino_acid_list : list, # list of strings (change to list if it complains!) + results_accumulator : defaultdict, # we will keep accumulating results + logger : logging.Logger # logger to keep log info + ) -> None: + + # instantiate ProteinAnalysis object for a given sequence + sequence_analysis = ProteinAnalysis(sequence) + + # analysis of AA % + aa_pct_d = sequence_analysis.get_amino_acids_percent() + + # loop over AA % (if not found,set to 0.0) + for key_aa in amino_acid_list: + aa_value = aa_pct_d.get(key_aa,0.0) + # add to accumulator + results_accumulator[key_aa].append(aa_value) + + # molecular weight + results_accumulator["MW"].append( + sequence_analysis.molecular_weight() + ) + + # aromaticity + results_accumulator["aromaticity"].append( + sequence_analysis.aromaticity() + ) + + # instability index + results_accumulator["instability"].append( + sequence_analysis.instability_index() + ) + + # flexibility -> is a list + # we take average (not sure it is correct) + flexibility_list = sequence_analysis.flexibility() + if len(flexibility_list) > 0: + avg_flexibility = sum(flexibility_list)/len(flexibility_list) + else: + # log if flexibility is not computed as expected + avg_flexibility = 0.0 + str_ = f"Issue with sequence ID : {sequence_id}\n" + str_ += f"Sequence : {sequence}\n" + str_ += f"Flexibility list : {flexibility_list}\n" + str_ += f"Avg 
flexibility set to : {avg_flexibility}\n" + logger.info(str_) + + results_accumulator["flexibility"].append( + avg_flexibility + ) + + # gravy + results_accumulator["gravy"].append( + sequence_analysis.gravy() + ) + + # isoelectric point + results_accumulator["isoelectric"].append( + sequence_analysis.isoelectric_point() + ) + + # secondary structure fraction + secondary_structure_fraction = sequence_analysis.secondary_structure_fraction() + results_accumulator["helix"].append(secondary_structure_fraction[0]) + results_accumulator["turn"].append(secondary_structure_fraction[1]) + results_accumulator["sheet"].append(secondary_structure_fraction[2]) + + # molar extinction coefficient + epsilon_prot = sequence_analysis.molar_extinction_coefficient() + results_accumulator["reduced"].append(epsilon_prot[0]) + results_accumulator["oxidized"].append(epsilon_prot[1]) + +# call protein_analysis for all sequences +def complete_protein_analysis( + sequences : List, + sequence_ids : List, + amino_acid_list : List, + logger : logging.Logger + ) -> pd.DataFrame: + # get accumulator + data_accumulator = get_accumulator(amino_acid_list) + + # call protein analysis on each sequence in a list + for id_,sequence_ in zip(sequence_ids,sequences): + protein_analysis( + sequence_, + id_, + amino_acid_list, + data_accumulator, + logger + ) + + # generate dataframe out of data_accumulator + data = pd.DataFrame.from_dict(data_accumulator) + + return data + +# compute correlations of two dataframes with identical number of rows +def correlate( + df1 : pd.DataFrame, + df2 : pd.DataFrame + ) -> pd.DataFrame: + assert df1.shape[0] == df2.shape[0], "Dataframes must have identical number of rows" + return pd.concat([df1, df2], axis=1, keys=['df1', 'df2']).corr(method="spearman").loc['df2', 'df1'] + +# computes all correlations and saves all intermediate results +def present_results_of_protein_analysis( + seq_tuple : Tuple, + amino_acids : List, + logger : logging.Logger, + filename_template : str 
+ ) -> pd.DataFrame: + # need to extract first and third element from a tuple + string_seqs = [] + Z = [] + seq_ids = [] + for element in seq_tuple: + # create a string + string_seqs.append( + "".join(element[0]) + ) + # append to Z + Z.append( + element[2] + ) + + # append to seq ids + seq_ids.append(element[3]) + + # redefine Z to be numpy array + Z = np.concatenate( + Z, + axis = 0 + ) + + # check that number of elements in string_seqs matches number of elements in Z + assert len(string_seqs) == Z.shape[0], "Number of generated strings must match number of vectors from latent space" + + # need to create a dataframe from Z + # create a list of column names: [dim-1,dim-2,...,dim-N] + z_columns = [f"dim-{dim+1}" for dim in range(Z.shape[1])] + + ########## create dataframes + + # for Z + df_z = pd.DataFrame( + data = Z, + columns = z_columns, + index = seq_ids + ) + # for amino-acid properties + df_seq_properties = complete_protein_analysis( + string_seqs, + seq_ids, + amino_acids, + logger + ) + # reset index + df_seq_properties.index = seq_ids + #df_seq_properties.set_axis(seq_ids,axis="index") + + # check they have the same number of rows + assert df_z.shape[0] == df_seq_properties.shape[0], "Number of rows in dataframes must be identical" + + # compute correlation df + df_corr_latent = correlate( + df_z, + df_seq_properties + ) + + # visualize as heatmap + fig,ax = plt.subplots(nrows=1, ncols=1, figsize=df_corr_latent.shape) + sns.heatmap( + df_corr_latent, + ax = ax, + linewidths = 0.5 # add small separating line between squares in heatmap + ) + + ################## save everything + # 1. dataframe for z + df_z.to_csv(f"{filename_template}-dataframe-z.csv") + + # 2. dataframe sequence properties + df_seq_properties.to_csv(f"{filename_template}-dataframe-sequence-properties.csv") + + # 3. correlation dataframe + df_corr_latent.to_csv(f"{filename_template}-dataframe-correlations.csv") + + # 4. 
heatmap + fig.savefig(f"{filename_template}-correlations-as-heatmap.pdf") + + return df_seq_properties + + +#################################################### MISCELLANEOUS #################################### +# get a logger +def setup_logger( + logger_name : str, + log_file : str, + level : int =logging.INFO + ) -> logging.Logger: + l = logging.getLogger(logger_name) + formatter = logging.Formatter('%(name)s - %(levelname)s - %(message)s') + fileHandler = logging.FileHandler(log_file, mode='w') + fileHandler.setFormatter(formatter) + streamHandler = logging.StreamHandler() + streamHandler.setFormatter(formatter) + + l.setLevel(level) + l.addHandler(fileHandler) + l.addHandler(streamHandler) + + return l + +# load checkpoint +def load_checkpoint(model,optimizer,pt_checkpoint): + checkpoint = torch.load(pt_checkpoint) + model.load_state_dict(checkpoint['model_state_dict']) + optimizer.load_state_dict(checkpoint['optimizer_state_dict']) + +# create and save dataframe as csv file +def save_data_to_csv( + filename : str, + list_vals : List, + list_ids : List + ) -> None: + ''' + INPUT: + filename : filename of csv file, string + list_vals : list of lists. Each element(list) should contain numeric information, list + list_ids : list of strings. Each element(string) contains a name for a list in the same position from list_vals variable, list + OUTPUT: + None. 
Saves a csv file + ''' + assert len(list_vals) == len(list_ids), "Length mismatch between list_vals and list_ids" + # construct dictionary + data = {} + for key,val in zip(list_ids,list_vals): + data[key] = val + + # create a dataframe from it + df = pd.DataFrame.from_dict(data) + + # save df + df.to_csv(filename,index=False) + +# compute statistics for a set of FASTA records +def compute_stats( + records: list, + filename: str + ) -> None: + + # create a list of sequences + seq_list = [ record.seq for record in records ] + + # total number of sequences + n_total = len(seq_list) + + # length: numpy array + lengths = np.array( [ len(seq) for seq in seq_list ] ) + + # different stats -> can be expanded later if needed + ave_length = np.mean(lengths) + std_length = np.std(lengths) + max_length = np.max(lengths) + min_length = np.min(lengths) + pct10 = np.percentile(lengths,10) + pct25 = np.percentile(lengths,25) + pct50 = np.percentile(lengths,50) + pct75 = np.percentile(lengths,75) + pct90 = np.percentile(lengths,90) + + # create string + str_ = "FASTA file statistics\n" + str_ += f"\t Number of sequences : {n_total}\n" + str_ += f"\t Average length : {ave_length: 0.4f}\n" + str_ += f"\t Std of length : {std_length: 0.4f}\n" + str_ += f"\t Max length : {max_length: 0.4f}\n" + str_ += f"\t Min length : {min_length: 0.4f}\n" + str_ += f"\t 10th percentile : {pct10: 0.4f}\n" + str_ += f"\t 25th percentile : {pct25: 0.4f}\n" + str_ += f"\t 50th percentile : {pct50: 0.4f}\n" + str_ += f"\t 75th percentile : {pct75: 0.4f}\n" + str_ += f"\t 90th percentile : {pct90: 0.4f}\n" + + # save in file + f = open(filename,"w") + f.write(str_) + f.close() + +# pass basic filtering criteria: presence of non-canonical AAs +def pass_filter( + record: SeqRecord, + w2i : dict + ) -> bool: + """ + INPUT: + record: record object of BioPython module + OUTPUT: + True if no weird amino acids are found. else, False. 
+ """ + # obtain amino acids as a set + set_amino_acids = set(w2i.keys()) + + # obtain set of amino acids in a given record + unique_set_of_amino_acids_in_ID = set(list(str(record.seq))) + + # do set difference + set_diff = unique_set_of_amino_acids_in_ID - set_amino_acids + + # if set is empty, filtering criteri passed, else not + if len(set_diff)==0: + return True + else: + return False + +# obtain best results from dataframe +def obtain_best_results( + file_ : str, + columns_ : list + ) -> Tuple[List,List,List]: + + # read csv, explicitly saying no header + try: + df = pd.read_csv(file_,header=None) + except Exception as e: + print("Exception occured:",e) + # create empty dataframe + df = pd.DataFrame() + + # if dataframe is empty + if df.empty: + return None,None,None + + # add columns + df.columns = columns_ + + # indices of max values (seperate for identity and similarity and bitscore) + indices_identity = df.groupby('qseqid').idxmax()['pident'].values + indices_similarity = df.groupby('qseqid').idxmax()['ppos'].values + indices_bitscore = df.groupby('qseqid').idxmax()['bitscore'].values + + # obtain max values + best_identities = df['pident'].values[indices_identity] + best_similarities = df['ppos'].values[indices_similarity] + best_bitscores = df['bitscore'].values[indices_bitscore] + + # resave csv file with columns + df.to_csv( + file_, + index = False # do not write row names + ) + + # we will return lists because they are easy to extend + return list(best_identities), list(best_similarities), list(best_bitscores) + +# compute (percentile) stats of an array +def stats_compute( + items : list, + identifier : str + ) -> str: + # number of elements + n_total = len(items) + + # convert to numpy + items = np.array(items) + + # different stats -> can be expanded later if needed + ave_ = np.mean(items) + std_ = np.std(items) + max_ = np.max(items) + min_ = np.min(items) + pct10 = np.percentile(items,5) + pct25 = np.percentile(items,25) + pct50 = 
np.percentile(items,50) + pct75 = np.percentile(items,75) + pct90 = np.percentile(items,95) + + # create string + str_ = f"{identifier} statistics \n" + str_ += f"\t Number of elements : {n_total}\n" + str_ += f"\t Average : {ave_: 0.4f}\n" + str_ += f"\t Std : {std_: 0.4f}\n" + str_ += f"\t Max : {max_: 0.4f}\n" + str_ += f"\t Min : {min_: 0.4f}\n" + str_ += f"\t 5th percentile : {pct10: 0.4f}\n" + str_ += f"\t 25th percentile : {pct25: 0.4f}\n" + str_ += f"\t 50th percentile : {pct50: 0.4f}\n" + str_ += f"\t 75th percentile : {pct75: 0.4f}\n" + str_ += f"\t 95th percentile : {pct90: 0.4f}\n" + + return str_ + +# do mutations for FoldX +def mutate( + wt : list, # WT sequence as list + pos_mutate : list, # list of positions to mutate + chainA_only : bool = True # whether to add to chain B + ) -> Tuple[str,List]: + + # empty FoldX representation + representation = "" + + # loop over sampled positions + for pos in pos_mutate: + original_aa = wt[pos] # original AA in WT + new_aa = np.random.choice( + [aa for aa in 'ARNDCEQGHILKMFPSTWYV' if aa != original_aa] + ) # new AA + # mutate sequence + wt[pos] = new_aa + + # add to representation (keep in mind +1 here!) 
+ representation += f"{original_aa}A{pos+1}{new_aa}," + + # add chain B if asked + if chainA_only == False: + representation += f"{original_aa}B{pos+1}{new_aa}," + + + # at the end we have all necessary representations + # just need to replace final , with ; + representation = re.sub(r".$", ";", representation) + + return representation,wt \ No newline at end of file diff --git a/conf/base.config b/conf/base.config new file mode 100644 index 0000000..8fe5643 --- /dev/null +++ b/conf/base.config @@ -0,0 +1,214 @@ +// basic information about the workflow +manifest { + name = 'prevent-nf' + description = 'PREVENT: PRotein Engineering by Variational frEe eNergy approximaTion' + version = '0.0.0' + homePage = 'https://github.com/stracquadaniolab/prevent-nf.git' + author = 'Evgenii Lobzaev' + nextflowVersion = '>=20.07.1' +} + +// default configuration +executor { + name = 'local' + cpus = 4 + memory = 8.GB + queueSize = 5 +} + +process { + executor = 'local' + cpus = 2 + memory = 4.GB + shell = ['/bin/bash', '-euo', 'pipefail'] +} + +// Export this variable to prevent local Python libraries +// from conflicting with those in the container +env { + PYTHONNOUSERSITE = 1 +} + +// profiles to setup runtimes, executors, and process resources +profiles { + + docker { + docker.enabled = true + docker.userEmulation = true + singularity.enabled = false + podman.enabled = false + shifter.enabled = false + charliecloud.enabled = false + + process.container = "ghcr.io/stracquadaniolab/prevent-nf:0.0.0" + } + + singularity { + singularity.enabled = true + singularity.autoMounts = true + docker.enabled = false + podman.enabled = false + shifter.enabled = false + charliecloud.enabled = false + + process.container = "docker://ghcr.io/stracquadaniolab/prevent-nf:0.0.0" + } + + slurm { + process.executor='slurm' + process.queue='compute' + } + + apple { + docker.runOptions = '--platform linux/amd64' + } + + ci { + executor.name = 'local' + executor.cpus = 2 + executor.memory = 6.GB + 
executor.queueSize = 5 + + process.executor = 'local' + process.cpus = 1 + process.memory = 2.GB + process.shell = ['/bin/bash', '-euo', 'pipefail'] + } + + // profile containing dummy data to test the workflow + test { + params{ + // global, used in more than one subworkflow (Preprocessing,Training,Prior,Posterior) + resultsDir = "./results/test-run/" // master directory where all output is stored + seed = 0 // seed value used in: + + // free energy calculation + energy.fasta_file = "./testdata/argB.fasta" + energy.pdb_file = "./testdata/1gs5.pdb" + + // mutagenesis + mutagenesis.os = "macOS" //else: "linux" + mutagenesis.n_mutation_sites = [1] // how many mutations in a sequence + mutagenesis.n_mutants = 5 // how many mutants to produce + mutagenesis.seeds = [11] // seeds for random sampling + mutagenesis.foldx_runs = 2 // don't do more than 5 + + + // preprocessing: + preprocessing.lmin = 0 // minimum sequence length to filter sequences from file lists + preprocessing.lmax = 60 // maximum sequence length to filter sequences from file lists; was 260 + preprocessing.val_pct = 0.1 // relative size of validation set (here 10%) + preprocessing.mmseq_clustering = "--min-seq-id 0.8" // mmseqs2 clustering options + preprocessing.training_list = [ + "./testdata/dataset-with-energies-short-sequences.fasta" + ] // list of FASTA files to be cleaned and used for NN training + preprocessing.seed_list = [ + "./testdata/argB-short.fasta" + ] // list of FASTA files to be cleaned and used as seed molecules (to obtain novel variants) + preprocessing.weight_sequences = false // add weights to sequences + + // training VAE: + training.epochs = 100 // number of training epochs + training.val_freq = 3 // frequency of validation error calculation + training.checkpoint_freq = 50 // frequency of model checkpoints + training.batch_size = 10 // batch size + training.learning_rate = 0.0001 // learning rate + training.L2 = 0.0 // L2 constant for normalisation + training.latent_size = 32 //
dimensionality of latent distribution (Gaussian or Dirichlet) + training.condition_on_energy = false // whether we will condition on energy when decoding sequence from z + training.weighted_sampling = false // whether we will use WeightedRandomSampling for batch sampling + training.entry_checkpoint = "None" // model checkpoint to start training from + training.embedding_size = 32 // embedding size of AAs (and special tokens) + training.dropout_prob = 0.2 // AAs embedding dropout probability + training.masking_prob = 0.0 // input masking probability + training.heads = 8 + training.num_layers_encoder = 6 + training.num_layers_decoder = 4 + + // sampling: + sampling.seed = 0 // random seed for sampling (prior and posterior) + sampling.n_samples = 200 // how many samples to request (should be a multiple of 100!) + sampling.mini_batch_size = 100 // divide n_samples into X number of mini batches + sampling.max_length = 150 // max number of steps in sampling + sampling.e_value = 1000.0 // e-value cutoff + sampling.query_coverage = 2.0 // query coverage cutoff + sampling.temperature = [1.0] // list of temperatures for seeded sampling + sampling.argmax_first_element = true // argmax selection of the first element of seeded samples (should force "M" for high temperatures) + sampling.mmseq_clustering = "--cluster-reassign --min-seq-id 0.7" // clustering to get representative samples + sampling.pytorch_file = "None" // pytorch file : relevant for VAE_SAMPLE + sampling.pickle_file = "None" // pickle file : relevant for VAE_SAMPLE + sampling.seeds_file = "None" // seeds file : relevant for VAE_SAMPLE + sampling.databases = ["None"] // train/val sets : relevant for VAE_SAMPLE + + // training GRU (supervised learning) + training_gru.epochs = 10 // number of training epochs + training_gru.val_freq = 3 // frequency of validation error calculation + training_gru.checkpoint_freq = 5 // frequency of model checkpoints + training_gru.batch_size = 10 // batch size + 
training_gru.learning_rate = 0.0001 // learning rate + training_gru.L2 = 0.0 // L2 constant for normalisation + training_gru.hidden_size = 32 // dimensionality of h for GRU + training_gru.num_layers = 1 // number of stacked GRUs + training_gru.bidirectional = false // uni- or bi-directional GRU + training_gru.entry_checkpoint = "None" // model checkpoint to start training_gru from + training_gru.embedding_size = 32 // embedding size of AAs (and special tokens) + training_gru.dropout_prob = 0.2 // AAs embedding dropout probability + + // training TF encoder (supervised learning) + training_tf.epochs = 10 // number of training epochs + training_tf.val_freq = 3 // frequency of validation error calculation + training_tf.checkpoint_freq = 5 // frequency of model checkpoints + training_tf.batch_size = 10 // batch size + training_tf.learning_rate = 0.0001 // learning rate + training_tf.L2 = 0.0 // L2 constant for normalisation + training_tf.latent_size = 64 // dimensionality of latent space + training_tf.weighted_sampling = false // whether we will use WeightedRandomSampling for batch sampling + training_tf.embedding_size = 512 // embedding size of AAs (and special tokens), will be split across heads + training_tf.heads = 8 // number of heads + training_tf.num_layers_encoder = 6 // number of stacked TF encoders + training_tf.entry_checkpoint = "None" // model checkpoint to start training_tf from + training_tf.dropout_prob = 0.2 // AAs embedding dropout probability + + // using TF encoder to predict energies for sequences in a FASTA file + predicting_tf.pickle_file = "None" + predicting_tf.pytorch_file = "None" + predicting_tf.fasta_file = "None" + + // optimisation: + optimisation.pickle_file = "./results/test-run/training/best-models/model-input.pickle" + optimisation.pytorch_file = "./results/test-run/training/best-models/best-train-error.pytorch" + optimisation.learning_rate = 0.1 // learning rate for SGD + optimisation.n_restarts = 3 // number of restart in a single 
process + optimisation.delta_f_tol = 0.0 // absolute tolerance for function (energy change) + optimisation.max_opt_steps = 10 // maximum allowed number of optimisation steps + optimisation.seeds = [0] // different initial random seeds (each seed corresponds to an individual process) + optimisation.seeds_file = "None" + optimisation.databases = ["None"] + + // energy estimate + energy_estimate.pickle_file = "None" + energy_estimate.pytorch_file = "None" + energy_estimate.fasta_file = "None" + + // estimating latent space (get mu/sigma for datasets of interest) + latent.pickle_file = "./results/test-run/training/best-models/model-input.pickle" + latent.pytorch_file = "./results/test-run/training/best-models/best-train-error.pytorch" + latent.fasta_files = [ + "./results/test-run/preprocessing/train-set.fasta", + "./results/test-run/preprocessing/validation-set.fasta", + ] + } + } +} + +// configuring log information +report { + enabled = true + file = "logs/execution_report.html" +} + +// monitor progress on Tower +tower { + accessToken = 'eyJ0aWQiOiAzMzMzfS5iYjkxYjI5ZTg3ZGY3ZGE2NzhlNjUyNTU1OTI1NzNhMDYxYzdiODRi' + enabled = true +} \ No newline at end of file diff --git a/containers/Dockerfile b/containers/Dockerfile new file mode 100644 index 0000000..d328265 --- /dev/null +++ b/containers/Dockerfile @@ -0,0 +1,39 @@ +## base container +FROM pytorch/pytorch:1.9.0-cuda11.1-cudnn8-devel + +# adding opencontainer labels to link registry to github repository +LABEL org.opencontainers.image.title="prevent-nf" +LABEL org.opencontainers.image.description="PREVENT: PRotein Engineering by Variational frEe eNergy approximaTion" +LABEL org.opencontainers.image.url="https://github.com/stracquadaniolab/prevent-nf" +LABEL org.opencontainers.image.documentation="https://github.com/stracquadaniolab/prevent-nf" +LABEL org.opencontainers.image.source="https://github.com/stracquadaniolab/prevent-nf" +LABEL org.opencontainers.image.vendor="stracquadaniolab" +LABEL 
org.opencontainers.image.authors="Evgenii Lobzaev" +LABEL org.opencontainers.image.revision="v1.0.0" + +# new line (from https://forums.developer.nvidia.com/t/invalid-public-key-for-cuda-apt-repository/212901/13) +# new pubkey +RUN apt-key adv --fetch-keys https://developer.download.nvidia.com/compute/cuda/repos/ubuntu1804/x86_64/3bf863cc.pub + +# added wget, git, gcc, cmake +RUN apt-get update \ + && apt-get install --yes rename procps curl wget git \ + && apt-get install gcc \ + && apt-get -y install cmake protobuf-compiler \ + && apt-get autoremove \ + && apt-get clean \ + && rm -rf /var/lib/apt/lists/* + +# copy environment.yml file +WORKDIR / +COPY containers/environment.yml / +RUN conda env update -n base --file environment.yml && conda clean --all --yes + +# install tini (and add to the PATH) +ENV TINI_VERSION v0.19.0 +ADD https://github.com/krallin/tini/releases/download/${TINI_VERSION}/tini /tini +RUN chmod +x /tini +ENV PATH="/tini:${PATH}" + +ENTRYPOINT ["/tini","-s","--"] +CMD ["/bin/bash"] diff --git a/containers/environment.yml b/containers/environment.yml new file mode 100644 index 0000000..bcb7dff --- /dev/null +++ b/containers/environment.yml @@ -0,0 +1,27 @@ +name: prevent-nf +channels: + - defaults + - bioconda + - conda-forge +dependencies: + - python=3.7.7 + - typer=0.4.0 + - black=19.10b0 + - pylint=2.7.4 + - pandas=1.3.5 + - seaborn=0.11.2 + - matplotlib=3.2.0 + - numpy=1.20.2 + - scipy=1.6.2 + - biopython=1.79 + - mmseqs2=13.45111 + - blast=2.10.1 + - clustalo=1.2.4 + - seqtk=1.3 + - seqkit=2.1.0 + - scikit-learn=0.24.1 + - hhsuite=3.3.0 + - pip=22.2.2 + - pip: + - fair-esm==1.0.2 + - autograd_minimize==0.2.2 \ No newline at end of file diff --git a/main.nf b/main.nf new file mode 100644 index 0000000..453921c --- /dev/null +++ b/main.nf @@ -0,0 +1,1744 @@ +// # PREVENT: PRotein Engineering by Variational frEe eNergy approximaTion +// # Copyright (C) 2024 Giovanni Stracquadanio, Evgenii Lobzaev + +// # This program is free software: you can 
redistribute it and/or modify +// # it under the terms of the GNU Affero General Public License as published +// # by the Free Software Foundation, either version 3 of the License, or +// # (at your option) any later version. + +// # This program is distributed in the hope that it will be useful, +// # but WITHOUT ANY WARRANTY; without even the implied warranty of +// # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +// # GNU Affero General Public License for more details. + +// # You should have received a copy of the GNU Affero General Public License +// # along with this program. If not, see <https://www.gnu.org/licenses/>. +// enabling nextflow DSL v2 +nextflow.enable.dsl=2 + +// (re)define variables: use user-inputs, otherwise use default values +// global : used in various subworkflows +resultsDir = params.resultsDir ? params.resultsDir : "${workflow.launchDir}/results" // default: "results" +seed = params.seed ? params.seed : 0 // default: 0 + +// preprocessing +preprocessing_lmin = params.preprocessing.lmin ? params.preprocessing.lmin : 0 // default: 0 +preprocessing_lmax = params.preprocessing.lmax ? params.preprocessing.lmax : 1000 // default: 1000 +max_sequence_length = preprocessing_lmax // set to lmax +preprocessing_val_pct = params.preprocessing.val_pct ? params.preprocessing.val_pct : 0.2 // default: 0.2 (20%) +preprocessing_mmseq_mmseq_clustering = params.preprocessing.mmseq_clustering ? params.preprocessing.mmseq_clustering : "--min-seq-id 0.8" // default: --min-seq-id 0.8 +preprocessing_weight_sequences = params.preprocessing.weight_sequences ? params.preprocessing.weight_sequences : true // default: true + + +// training VAE +training_epochs = params.training.epochs ? params.training.epochs : 100 // default : 100 +training_val_freq = params.training.val_freq ? params.training.val_freq : 1 // default : 1 +training_checkpoint_freq = params.training.checkpoint_freq ?
params.training.checkpoint_freq : 50 // default : 50 (just to have 1 checkpoint) +training_batch_size = params.training.batch_size ? params.training.batch_size : 32 // default : 32 +training_learning_rate = params.training.learning_rate ? params.training.learning_rate : 0.0001 // default : 0.0001 +training_L2 = params.training.L2 ? params.training.L2 : 0.0 // default : 0.0 (no L2 regularisation) +training_latent_size = params.training.latent_size ? params.training.latent_size : 32 // default : 32 +training_entry_checkpoint = params.training.entry_checkpoint ? params.training.entry_checkpoint : "None" // default : "None" +training_embedding_size = params.training.embedding_size ? params.training.embedding_size : 512 // default : 512 +training_dropout_prob = params.training.dropout_prob ? params.training.dropout_prob : 0.2 // default : 0.2 +training_masking_prob = params.training.masking_prob ? params.training.masking_prob : 0.0 // default : 0.0 +training_heads = params.training.heads ? params.training.heads : 8 +training_num_layers_encoder = params.training.num_layers_encoder ? params.training.num_layers_encoder : 6 +training_num_layers_decoder = params.training.num_layers_decoder ? params.training.num_layers_decoder : 4 + +// training GRU (supervised learning) +gru_training_epochs = params.training_gru.epochs ? params.training_gru.epochs : 100 +gru_training_val_freq = params.training_gru.val_freq ? params.training_gru.val_freq : 1 +gru_training_checkpoint_freq = params.training_gru.checkpoint_freq ? params.training_gru.checkpoint_freq : 50 +gru_training_batch_size = params.training_gru.batch_size ? params.training_gru.batch_size : 32 +gru_training_learning_rate = params.training_gru.learning_rate ? params.training_gru.learning_rate : 0.0001 +gru_training_L2 = params.training_gru.L2 ? params.training_gru.L2 : 0.0 +gru_training_hidden_size = params.training_gru.hidden_size ?
params.training_gru.hidden_size : 32 +gru_training_num_layers = params.training_gru.num_layers ? params.training_gru.num_layers : 1 +gru_training_embedding_size = params.training_gru.embedding_size ? params.training_gru.embedding_size : 32 +gru_training_dropout_prob = params.training_gru.dropout_prob ? params.training_gru.dropout_prob : 0.2 + +// you sure this is correct ? +if (params.training_gru.bidirectional == true) + gru_training_directionality = "--no-bidirectional" +else + gru_training_directionality = "--bidirectional" + +if (params.training.condition_on_energy == true) + training_condition_on_energy = "--condition-on-energy" +else + training_condition_on_energy = "--no-condition-on-energy" + +if (params.training.weighted_sampling == true) + training_weighted_sampling = "--weighted-sampling" +else + training_weighted_sampling = "--no-weighted-sampling" + +//sampling +sampling_seed = params.sampling.seed ? params.sampling.seed : 0 // default : 0 +sampling_n_samples = params.sampling.n_samples ? params.sampling.n_samples : 100 // default : 100 +samling_mini_batch_size = params.sampling.mini_batch_size ? params.sampling.mini_batch_size : 100 // default : 100 +sampling_max_length = params.sampling.max_length ? params.sampling.max_length : 200 // default : 200 +sampling_e_value = params.sampling.e_value ? params.sampling.e_value : 0.0001 // default : 0.0001 +samplng_query_coverage = params.sampling.query_coverage ? params.sampling.query_coverage : 70.0 // default : 70.0 +sampling_argmax_first_element = params.sampling.argmax_first_element ? params.sampling.argmax_first_element : true // default : true +sampling_temperature = params.sampling.temperature ? params.sampling.temperature : [1.0] // default : [1.0] +sampling_mmseq_clustering = params.sampling.mmseq_clustering ? 
params.sampling.mmseq_clustering : "--min-seq-id 0.8" // default: "--min-seq-id 0.8" + + +// message of the day: start-up banner that records the workflow metadata and every resolved +// preprocessing / training / sampling / GRU parameter; it is logged right after its definition +// and is also written to model.info.txt by the Info process +motd = """ +-------------------------------------------------------------------------- +prevent-nf (${workflow.manifest.version}) +-------------------------------------------------------------------------- +Name : ${params.name} +Session ID : ${workflow.sessionId} +-------------------------------------------------------------------------- +Environment information +-------------------------------------------------------------------------- +Container : ${workflow.container} +Config files : ${workflow.configFiles} +Project directory : ${workflow.projectDir} +Work directory : ${workflow.workDir} +Launch directory : ${workflow.launchDir} +Results directory : ${resultsDir} +Command line : ${workflow.commandLine} +Repository : ${workflow.repository} +CommitID : ${workflow.commitId} +Revision : ${workflow.revision} +-------------------------------------------------------------------------- +Preprocessing +-------------------------------------------------------------------------- +Minimum allowed sequence length : ${preprocessing_lmin} +Maximum allowed sequence length : ${preprocessing_lmax} +MMSEQS clustering options : ${preprocessing_mmseq_mmseq_clustering} +Validation set proportion : ${preprocessing_val_pct} +Add MSA-related weights to sequences : ${preprocessing_weight_sequences} +Random seed : ${seed} +-------------------------------------------------------------------------- +Training (Transformver VAE) +-------------------------------------------------------------------------- +Number of training epochs : ${training_epochs} +Validation error frequency estimation : ${training_val_freq} +Model checkpoint frequency : ${training_checkpoint_freq} +Batch size : ${training_batch_size} +Learning rate : ${training_learning_rate} +L2 normalisation constant : ${training_L2} +Latent distribution dimensionality : ${training_latent_size} +Conditioning on 
energy for decoding sequence : ${training_condition_on_energy} +Weighted sampling : ${training_weighted_sampling} +Embeddings dimensionality : ${training_embedding_size} +Dropout probability : ${training_dropout_prob} +Input masking probability : ${training_masking_prob} +Number of heads in (self)-attention : ${training_heads} +Number of layers in encoder : ${training_num_layers_encoder} +Number of layers in decoder : ${training_num_layers_decoder} +-------------------------------------------------------------------------- +Sampling (Prior & Posterior Transformver VAE) +-------------------------------------------------------------------------- +Random seed : ${sampling_seed} +Number of samples : ${sampling_n_samples} +Number of samples in mini batch : ${samling_mini_batch_size} +E-Value : ${sampling_e_value} +Query coverage : ${samplng_query_coverage} +Argmax selection of first AA (posterior only) : ${sampling_argmax_first_element} +Sampling temperatures (posterior only) : ${sampling_temperature} +Number of autoregressive steps in sampling : ${sampling_max_length} +MMSEQS clustering options : ${sampling_mmseq_clustering} +-------------------------------------------------------------------------- +Training (GRU supervised) +-------------------------------------------------------------------------- +Number of training epochs : ${gru_training_epochs} +Validation error frequency estimation : ${gru_training_val_freq} +Model checkpoint frequency : ${gru_training_checkpoint_freq} +Batch size : ${gru_training_batch_size} +Learning rate : ${gru_training_learning_rate} +L2 normalisation constant : ${gru_training_L2} +Hidden size : ${gru_training_hidden_size} +Embeddings dimensionality : ${gru_training_embedding_size} +Dropout probability : ${gru_training_dropout_prob} +Number of layers : ${gru_training_num_layers} +GRU directionalify flag : ${gru_training_directionality} +-------------------------------------------------------------------------- +""" + +// print the banner to the Nextflow log +log.info motd 
+//////////////////////////////////////////////// FOLDX /////////////////////////////////////////// + +// repair WT PDB file and estimate its free energy with FoldX +process RepairWT{ + tag "WT-repair" + + publishDir "${resultsDir}/preprocessing/energy-estimates", pattern: "${pdb_file.baseName}_Repair.pdb", mode: 'copy' + publishDir "${resultsDir}/preprocessing/energy-estimates", pattern: "${pdb_file.baseName}_Repair_0_ST.fxout", mode: 'copy' + + input: + path pdb_file // WT PDB file + + output: + path("${pdb_file.baseName}_Repair.pdb"), emit: repaired_pdb + path("${pdb_file.baseName}_Repair_0_ST.fxout"), emit: energy_estimate_file + /* + Set of commands: + 1. FoldX: RepairPDB -> adjust some stuff in PDB, necessary for downstream analysis. + Need repaired PDB file for downstream analysis. + 2. FoldX: Stability -> compute free energy estimate for WT structure + */ + script: + // choose the platform-specific FoldX executable once; any value other than "macOS" selects the Linux binary + def foldx = params.mutagenesis.os == "macOS" ? "FoldX_macOS" : "FoldX_linux" + """ + ${foldx} --command=RepairPDB --pdb=${pdb_file} + + ${foldx} --command=Stability --pdb=${pdb_file.baseName}_Repair.pdb + """ +} +// extract Free Energy from Repaired WT PDB file: prints the 2nd tab-separated column of the fxout file to stdout +process ExtractEnergyWT{ + tag "extract-WT-Free-Energy" + + input: + path wt_energy_file // fxout file that is output of FoldX Stability subcommand + + output: + stdout emit: energy_wt + + script: + """ + energy=\$(awk -F"\t" '{print \$2}' ${wt_energy_file}) + echo \$energy + """ +} +// append Free Energy to WT Fasta file +process AddFreeEnergyWT{ + + tag "add-free-energy-to-WT" + + publishDir "${resultsDir}/preprocessing/energy-estimates", pattern: "${fasta_wt.baseName}-with-energy.fasta", mode:'copy' + + input: + path fasta_wt // WT fasta file + val energy // Free energy estimated for WT structure + + output: + path("${fasta_wt.baseName}-with-energy.fasta"), emit: wt_with_energy + + script: + """ + miscellaneous.py foldx add-energy-wt ${fasta_wt} 
${fasta_wt.baseName}-with-energy.fasta --free-energy-wt ${energy} + """ +} + +// main process to generate mutants: one task per (seed, n_mutation_sites) combination +process Mutagenesis{ + tag "mutagenesis:seed-${seed};num-of-mutations-${n_mutation_sites}" + + // raw output + publishDir "${resultsDir}/preprocessing/energy-estimates/seed-${seed}/num-of-mutations-${n_mutation_sites}", pattern: "Raw_${pdb_repaired.baseName}.fxout", saveAs: { filename -> "Raw-Energy-Estimates-${pdb_repaired.baseName}.txt" }, mode:'copy' + // avg output + publishDir "${resultsDir}/preprocessing/energy-estimates/seed-${seed}/num-of-mutations-${n_mutation_sites}", pattern: "mutants-energy*.csv", saveAs: { filename -> "mutants-energy.csv" }, mode:'copy' + // mutants fasta file + publishDir "${resultsDir}/preprocessing/energy-estimates/seed-${seed}/num-of-mutations-${n_mutation_sites}", pattern: "mutants*.fasta",saveAs: { filename -> "mutants.fasta" }, mode:'copy' + + input: + path fasta_wt // WT FASTA file + path pdb_repaired // PDB file (repaired) + each seed // list of user provided seeds: for each seed there will be a run + each n_mutation_sites // list of user provided number of mutation sites: for each number there will be a run + + output: + path("Raw_${pdb_repaired.baseName}.fxout"), emit: raw_energy_estimates + path("mutants-energy*.csv"), emit: avg_energy_estimate + path("mutants*.fasta"), emit: mutants_fasta + + /* + Procedure: + 1. Generate mutants (mutants FASTA file and individual_list.txt) + 2. Run FoldX BuildModel on the mutant list + 3. Compute average FreeEnergy for mutants (line by line): + - keep only mutant names: 1gs5_Repair_1_0.pdb -> 1gs5_Repair_1 by removing trailing 6 characters + - group rows by mutant name and average the values of the second column: (1gs5_Repair_1,avg energy) + - sort by 1st column and save into csv file + 4. 
Update mutants FASTA file with free energy estimates + + */ + script: + // the command sequence is identical on every platform; only the FoldX executable name differs + // (any value other than "macOS" selects the Linux binary) + def foldx = params.mutagenesis.os == "macOS" ? "FoldX_macOS" : "FoldX_linux" + """ + miscellaneous.py foldx generate-mutants ${fasta_wt}\ + ${pdb_repaired.baseName}\ + mutants-${seed}-${n_mutation_sites}.fasta\ + --n-mutation-sites ${n_mutation_sites}\ + --n-mutants ${params.mutagenesis.n_mutants}\ + --seed ${seed} + + ${foldx} --command=BuildModel --pdb=${pdb_repaired} --mutant-file=individual_list.txt --numberOfRuns=${params.mutagenesis.foldx_runs} + + cat Raw_${pdb_repaired.baseName}.fxout |\ + awk -F "\t" '/^${pdb_repaired.baseName}/ {print substr(\$1,1,length(\$1)-6) "\t" \$2}' |\ + awk '{v[\$1]+=\$2;n[\$1]++} END{for (i in n) print i","v[i]/n[i]}' |\ + sort -V -k1,1 > mutants-energy-${seed}-${n_mutation_sites}.csv + + miscellaneous.py foldx add-energy-mutant mutants-${seed}-${n_mutation_sites}.fasta\ + mutants-energy-${seed}-${n_mutation_sites}.csv + """ +} + +// process to combine all mutants and WT FASTA files with energies +process CombineFASTA{ + tag "combine-FASTA-files" + + publishDir "${resultsDir}/preprocessing/energy-estimates", pattern: "dataset-with-energies.fasta", mode:'copy' + + input: + path wt_fasta // WT FASTA file with 
energy + path mutants_fasta // Mutants FASTA files with energies + + output: + path("dataset-with-energies.fasta"), emit: final_fasta + + script: + """ + cat ${wt_fasta} ${mutants_fasta} > dataset-with-energies.fasta + """ +} + +// FreeEnergy entry workflow: repairs the WT PDB, attaches the estimated free energy to the WT FASTA file, +// generates mutants for every (seed, number of mutation sites) combination and concatenates WT + mutants +// into dataset-with-energies.fasta +// run: nextflow main.nf -profile test -entry FreeEnergy +workflow FreeEnergy{ + // construct channels for FASTA file and PDB file + ch_fasta = Channel.fromPath( params.energy.fasta_file ) + ch_pdb = Channel.fromPath( params.energy.pdb_file ) + + // call RepairWT + // output: .repaired_pdb -> to be used for mutagenesis + // . energy_estimate_file -> to be used to extract Free Energy from file + out_repair = RepairWT( + ch_pdb + ) + + // extract energy through ExtractEnergyWT + // output: .energy_wt -> WT energy value + out_energy = ExtractEnergyWT( + + out_repair.energy_estimate_file + ) + + // add energy to FASTA file + // output: .wt_with_energy -> FASTA file with WT sequence and its Free Energy + out_add_free_energy = AddFreeEnergyWT( + ch_fasta, + out_energy.energy_wt + ) + + // user-provided lists: Mutagenesis declares both as `each` inputs + ch_seeds = Channel.fromList( params.mutagenesis.seeds ) + ch_n_mutation_sites = Channel.fromList( params.mutagenesis.n_mutation_sites ) + + // mutagenesis + out_mutagenesis = Mutagenesis( + ch_fasta, + out_repair.repaired_pdb, + ch_seeds, + ch_n_mutation_sites + ) + + // combine output: all mutants FASTA files are collected into a single list before concatenation + out_combine_fasta = CombineFASTA( + out_add_free_energy.wt_with_energy, + out_mutagenesis.mutants_fasta.collect() + ) + +} + +///////////////////////////////////////////////// PREPROCESSING ////////////////////////////////// +// info about pipeline: writes the start-up banner (motd) to model.info.txt and the conda package list +// to model.environment.txt; both files are published to params.resultsDir +process Info { + tag "experiment-info" + + publishDir "${params.resultsDir}", mode: 'copy', overwrite: 'yes' + + output: + tuple path('model.info.txt'), path('model.environment.txt') + + """ + echo '${motd}' > model.info.txt + conda list --export > model.environment.txt + """ +} +// merge and clean user-provided FASTA files +process DataFiltering { + tag "data-filtering" + + // publish log file + publishDir 
"${resultsDir}/preprocessing/data-filtering", pattern: "logger-filtering.log", mode: 'copy' + // filtered FASTA files (for training/validation) + publishDir "${resultsDir}/preprocessing/data-filtering", pattern: "filtered-sequences.fasta", mode: 'copy' + // seed FASTA file + publishDir "${resultsDir}/preprocessing", pattern: "seeds.fasta", mode: 'copy' + + + input: + path fasta_files // 1.list of FASTA files to concatenate (the result will be used for generating train and validation sets) + path seed_fasta_files // 2.list of FASTA files that will be used as seed molecules + + output: + path("filtered-sequences.fasta"), emit: clean_file // file that will be split into train and validation set (full file) + path("seeds.fasta"), emit: seed_file // filtered seed sequences + path("logger-filtering.log"), emit: log_file // log + + script: + // 1st command: obtain unique (and clean) fasta file from ${fasta_files}, applying the lmin/lmax length limits + // 2nd command: same as 1st but for seed sequences + // 3rd command: join logs of the two preprocessing runs into logger-filtering.log + """ + miscellaneous.py various preprocess-input ${fasta_files}\ + filtered-sequences.fasta\ + logger-inputs.log\ + --lmin ${preprocessing_lmin}\ + --lmax ${preprocessing_lmax} + + miscellaneous.py various preprocess-input ${seed_fasta_files}\ + seeds.fasta\ + logger-seeds.log\ + --lmin ${preprocessing_lmin}\ + --lmax ${preprocessing_lmax} + + cat logger-inputs.log logger-seeds.log > logger-filtering.log + """ +} +// generate train and validation sets +process GenerateTrainValidationSet { + + tag "train-and-validation-sets-generation" + + // log file + publishDir "${resultsDir}/preprocessing/data-split", pattern: "logger-data-split.log", mode: 'copy' + // fasta files + publishDir "${resultsDir}/preprocessing", pattern: "train-set.fasta", mode: 'copy' + publishDir "${resultsDir}/preprocessing", pattern: "validation-set.fasta", mode: 'copy' + // sets stats + publishDir 
"${resultsDir}/preprocessing", pattern: "train-set-stats.txt", mode: 'copy' + publishDir "${resultsDir}/preprocessing", pattern: "validation-set-stats.txt", mode: 'copy' + // representative sequences (for DEBUGGING) + publishDir "${resultsDir}/preprocessing/data-split", pattern: "pre-validation-set.fasta", mode: 'copy' + + + input: + path(clean_fasta_file) // FASTA file + + output: + path("train-set.fasta"), emit: train_set_fasta_file + path("validation-set.fasta"), emit: validation_set_fasta_file + path("train-set-stats.txt"), emit: train_set_stats + path("validation-set-stats.txt"), emit: validation_set_stats + path("logger-data-split.log"), emit: log_file + path("pre-validation-set.fasta"), emit: representative_sequences_fasta_file + + // train and validation sets are created by applying mmseqs2 clustering to clean fasta file + // representative sequences are considered to be (pre)validation set + // mmseqs2 output may be tweaked (rebalanced) in order to maintain 80-20 (as an example; defined by user) ratio for train-validation set sizes + // NOTE(review): the two *-stats.txt outputs are not named in the script below; presumably rebalance-sets writes them - confirm + script: + """ + mmseqs easy-cluster ${preprocessing_mmseq_mmseq_clustering} ${clean_fasta_file} clustered-train tmp + + mv clustered-train_rep_seq.fasta pre-validation-set.fasta + + miscellaneous.py various rebalance-sets ${clean_fasta_file}\ + pre-validation-set.fasta\ + train-set.fasta\ + validation-set.fasta\ + logger-data-split.log\ + --val-pct ${preprocessing_val_pct}\ + --seed ${seed} + + """ +} +// generate weights for training and validation +process CalculateSequenceWeights{ + tag "sequence-weights-calculation" + + // publish csv,pickle + publishDir "${resultsDir}/preprocessing/sequence-weights", pattern: "*.{pickle,csv}", mode: 'copy' + + input: + path(train_set) // FASTA file with train set + path(validation_set) // FASTA file with validation set + + output: + path("${train_set.baseName}-weights.pickle"), emit: train_weights_pickle + path("${train_set.baseName}-weights.csv"), emit: train_weights_csv + 
path("${validation_set.baseName}-weights.pickle"), emit: validation_weights_pickle + path("${validation_set.baseName}-weights.csv"), emit: validation_weights_csv + + + // we will compute sequence weights for train set optionally, but leave weights for validation set as 1.0 + // when weighting is enabled: clustalo produces the distance matrix that distmat-weights converts into weights; + // otherwise default-weights is used for both sets + script: + if (preprocessing_weight_sequences) + """ + clustalo -i ${train_set}\ + -o ${train_set.baseName}-msa.aln\ + --distmat-out ${train_set.baseName}-distmat.csv\ + --full\ + --percent-id + miscellaneous.py various distmat-weights ${train_set.baseName}-distmat.csv\ + ${train_set.baseName}-weights.pickle\ + ${train_set.baseName}-weights.csv + + miscellaneous.py various default-weights ${validation_set}\ + ${validation_set.baseName}-weights.pickle\ + ${validation_set.baseName}-weights.csv + """ + else + """ + miscellaneous.py various default-weights ${train_set}\ + ${train_set.baseName}-weights.pickle\ + ${train_set.baseName}-weights.csv + + miscellaneous.py various default-weights ${validation_set}\ + ${validation_set.baseName}-weights.pickle\ + ${validation_set.baseName}-weights.csv + """ + +} +// combine sequences into single FASTA file +process MergeFasta{ + tag "merging-FASTA-files" + + input: + path(fasta_files_to_merge) // [list of FASTA files] + + output: + path("merged-files.fasta"), emit: merged_file + + script: + """ + cat ${fasta_files_to_merge} > merged-files.fasta + """ +} + +// MAIN PREPROCESSING WORKFLOW +workflow Preprocessing{ + take: + fasta_files_to_join // raw FASTA files + seed_fasta_files_to_join // raw FASTA files with seeds + main: + // clean data -> remove duplicates/non-canonical AAs + out_data_filtering = DataFiltering( + fasta_files_to_join.collect(), + seed_fasta_files_to_join.collect() + ) + + // generate train and validation sets + out_generate_train_validation_set = GenerateTrainValidationSet( + out_data_filtering.clean_file + ) + + + // NOTE: the sequence-weight step is currently disabled (its call and emits are commented out) + // compute weights for sequences: weights are computed for training set, for validation set they are set to 1.0 + // 
out_sequence_weights = CalculateSequenceWeights( + // out_generate_train_validation_set.train_set_fasta_file, + // out_generate_train_validation_set.validation_set_fasta_file + // ) + emit: + train_file = out_generate_train_validation_set.train_set_fasta_file // clean train set file + val_file = out_generate_train_validation_set.validation_set_fasta_file // clean validation set file + seed_file = out_data_filtering.seed_file // clean seed file + //train_weights = out_sequence_weights.train_weights_pickle // training weights + //val_weights = out_sequence_weights.validation_weights_pickle // validation weights +} + +//////////////////////////////////////////////// TRAINING //////////////////////////////////////// +// TransformerVAE model training process +process TrainModel{ + tag "model-training" + + // NOTE: directives (tag, publishDir) are declared before the input/output blocks, as the Nextflow process syntax requires + // csv files with losses: train by batch and by epoch; validation by epoch + publishDir "${resultsDir}/training/losses/csv", pattern: "loss-*.csv", mode: 'copy' + // log files with losses and gradients + publishDir "${resultsDir}/training/losses/log", pattern: "*.log", mode: 'copy' + + // publish pytorch files (best model): will have 2 pytorch files and 1 pickle file + publishDir "${resultsDir}/training/best-models", pattern: "best-*.pytorch", mode: 'copy' + publishDir "${resultsDir}/training/best-models", pattern: "model-input.pickle", mode: 'copy' + + // publish intermediate model results + pickle file + publishDir "${resultsDir}/training/model-checkpoints", pattern: "model-checkpoint-*.pytorch", mode: 'copy' + publishDir "${resultsDir}/training/model-checkpoints", pattern: "model-input.pickle", mode: 'copy' + + // embedding weights + //publishDir "${resultsDir}/training/embeddings", pattern: "embedding-weights-best-*.csv", mode: 'copy' + + // no sequence weights; the checkpoint file is forwarded to train.py via --pt-checkpoint + input: + path(trainFile) // train set + path(validationFile) // validation set + path(checkpoint) // model checkpoint + + output: + path trainFile, emit: train_set_fasta_file + path 
validationFile, emit: validation_set_fasta_file + // pickle (input parameters to the model) + path("model-input.pickle"), emit: pickle_file + // best models + path("best-train-error.pytorch"), emit:best_train_pytorch + path("best-validation-error.pytorch"), emit: best_validation_pytorch + // logs + path("loss-batch-train.log"), emit: train_batch_log + path("loss-epoch-train.log"), emit: train_loss_log + path("loss-epoch-validation.log"), emit: validation_loss_log + path("sequence-batch-update.log"), emit: sequence_batch_log + // checkpoints + path("model-checkpoint-*.pytorch"), emit: model_chekpoints + // embedding weights (for best models) + //path("embedding-weights-best-*.csv"), emit: embedding_weights + // csv files with losses -> needs to be separate + //path("loss-batch-train.csv"), emit: csv_file_batch + path("loss-epoch-train.csv"), emit: csv_file_epoch + path("loss-epoch-validation.csv"), emit: csv_file_val_epoch + + // positional arguments: train/validation sets followed by the output file names declared above; + // "model-checkpoint" is presumably the prefix of the model-checkpoint-*.pytorch files - confirm against train.py + script: + """ + train.py transformer gaussian ${trainFile}\ + ${validationFile}\ + loss-batch-train.log\ + loss-epoch-train.log\ + loss-epoch-validation.log\ + sequence-batch-update.log\ + model-checkpoint\ + loss-epoch-train.csv\ + loss-epoch-validation.csv\ + model-input.pickle\ + best-train-error.pytorch\ + best-validation-error.pytorch\ + --epochs ${training_epochs}\ + --learning-rate ${training_learning_rate}\ + --lambda-constant ${training_L2}\ + --validation-freq-epoch ${training_val_freq}\ + --checkpoint-freq-epoch ${training_checkpoint_freq}\ + --max-sequence-length ${max_sequence_length}\ + --batch-size ${training_batch_size}\ + --embedding-size ${training_embedding_size}\ + --latent-size ${training_latent_size}\ + ${training_condition_on_energy}\ + ${training_weighted_sampling}\ + --dropout-prob ${training_dropout_prob}\ + --masking-prob ${training_masking_prob}\ + --heads ${training_heads}\ + --num-layers-encoder ${training_num_layers_encoder}\ + --num-layers-decoder ${training_num_layers_decoder}\ + --seed 
${seed}\ + --pt-checkpoint ${checkpoint} + """ +} + +// TransformerVAE model: get params of latent space +process EstimateLatentSpace{ + tag "latent-space-estimation:${model_identifier};${fasta_file.baseName}" + + + // store csv file in the training folder + publishDir "${resultsDir}/training/latent-space-estimation/${model_identifier}/${fasta_file.baseName}", pattern: "*.csv", mode: 'copy' + + input: + tuple path(pickle_file), path(pytorch_file), val(model_identifier), path(fasta_file) // [pickle, pytorch, model identifier, FASTA file with sequences] + + output: + path("${fasta_file.baseName}-means.csv"), emit: means + path("${fasta_file.baseName}-stds.csv"), emit: stds + + // NOTE: the seed is fixed to 12345 here and does not follow the pipeline-wide ${seed} + script: + """ + downstream.py transformer estimate-latent-space ${fasta_file.baseName}-means.csv\ + ${fasta_file.baseName}-stds.csv\ + ${pytorch_file}\ + ${pickle_file}\ + ${fasta_file}\ + --batch-size ${training_batch_size}\ + --max-sequence-length ${max_sequence_length}\ + --seed 12345 + """ +} + +// supervised GRU model training process: sequence -> energy +process TrainModelPredictiveGRU{ + tag "model-training-supervised-GRU" + + // NOTE: directives (tag, publishDir) are declared before the input/output blocks, as the Nextflow process syntax requires + // csv files with losses: train by batch and by epoch; validation by epoch + publishDir "${resultsDir}/supervised-model-gru/training/losses/csv", pattern: "loss-*.csv", mode: 'copy' + // log files with losses and gradients + publishDir "${resultsDir}/supervised-model-gru/training/losses/log", pattern: "*.log", mode: 'copy' + + // publish pytorch files (best model): will have 2 pytorch files and 1 pickle file + publishDir "${resultsDir}/supervised-model-gru/training/best-models", pattern: "best-*.pytorch", mode: 'copy' + publishDir "${resultsDir}/supervised-model-gru/training/best-models", pattern: "model-input.pickle", mode: 'copy' + + // publish intermediate model results + pickle file + publishDir 
"${resultsDir}/supervised-model-gru/training/model-checkpoints", pattern: "model-checkpoint-*.pytorch", mode: 'copy' + publishDir "${resultsDir}/supervised-model-gru/training/model-checkpoints", pattern: "model-input.pickle", mode: 'copy' + + input: + path(trainFile) // train set + path(validationFile) // validation set + path(checkpoint) // model checkpoint + + output: + path trainFile, emit: train_set_fasta_file + path validationFile, emit: validation_set_fasta_file + // pickle (input parameters to the model) + path("model-input.pickle"), emit: pickle_file + // best models + path("best-train-error.pytorch"), emit:best_train_pytorch + path("best-validation-error.pytorch"), emit: best_validation_pytorch + // logs + path("loss-batch-train.log"), emit: train_batch_log + path("loss-epoch-train.log"), emit: train_loss_log + path("loss-epoch-validation.log"), emit: validation_loss_log + // checkpoints + path("model-checkpoint-*.pytorch"), emit: model_chekpoints + path("loss-epoch-train.csv"), emit: csv_file_epoch + path("loss-epoch-validation.csv"), emit: csv_file_val_epoch + + // max_sequence_length is the same as for VAE + // seed is the same as for VAE + script: + """ + train.py predictor gru ${trainFile}\ + ${validationFile}\ + loss-batch-train.log\ + loss-epoch-train.log\ + loss-epoch-validation.log\ + model-checkpoint\ + loss-epoch-train.csv\ + loss-epoch-validation.csv\ + model-input.pickle\ + best-train-error.pytorch\ + best-validation-error.pytorch\ + --epochs ${gru_training_epochs}\ + --learning-rate ${gru_training_learning_rate}\ + --lambda-constant ${gru_training_L2}\ + --validation-freq-epoch ${gru_training_val_freq}\ + --checkpoint-freq-epoch ${gru_training_checkpoint_freq}\ + --max-sequence-length ${max_sequence_length}\ + --batch-size ${gru_training_batch_size}\ + --embedding-size ${gru_training_embedding_size}\ + --hidden-size ${gru_training_hidden_size}\ + --num-layers ${gru_training_num_layers}\ + ${gru_training_directionality}\ + --dropout-prob ${gru_training_dropout_prob}\ + --seed ${seed}\ + --pt-checkpoint ${checkpoint} + """ + + + +} + +// supervised TF encoder 
model training process : sequence -> energy +process TrainModelPredictiveTFEncoder{ + tag "model-training-supervised-TF" + + // NOTE: directives (tag, publishDir) are declared before the input/output blocks, as the Nextflow process syntax requires + // csv files with losses: train by batch and by epoch; validation by epoch + publishDir "${resultsDir}/supervised-model-tf/training/losses/csv", pattern: "loss-*.csv", mode: 'copy' + // log files with losses and gradients + publishDir "${resultsDir}/supervised-model-tf/training/losses/log", pattern: "*.log", mode: 'copy' + + // publish pytorch files (best model): will have 2 pytorch files and 1 pickle file + publishDir "${resultsDir}/supervised-model-tf/training/best-models", pattern: "best-*.pytorch", mode: 'copy' + publishDir "${resultsDir}/supervised-model-tf/training/best-models", pattern: "model-input.pickle", mode: 'copy' + + // publish intermediate model results + pickle file + publishDir "${resultsDir}/supervised-model-tf/training/model-checkpoints", pattern: "model-checkpoint-*.pytorch", mode: 'copy' + publishDir "${resultsDir}/supervised-model-tf/training/model-checkpoints", pattern: "model-input.pickle", mode: 'copy' + + input: + path(trainFile) // train set + path(validationFile) // validation set + path(checkpoint) // model checkpoint + val(useWeightedSampling) // command line flag inserted verbatim into the train.py call: whether to use weighted random sampling or not + + output: + path trainFile, emit: train_set_fasta_file + path validationFile, emit: validation_set_fasta_file + // pickle (input parameters to the model) + path("model-input.pickle"), emit: pickle_file + // best models + path("best-train-error.pytorch"), emit:best_train_pytorch + path("best-validation-error.pytorch"), emit: best_validation_pytorch + // logs + path("loss-batch-train.log"), emit: train_batch_log + path("loss-epoch-train.log"), emit: train_loss_log + path("loss-epoch-validation.log"), emit: validation_loss_log + // checkpoints + path("model-checkpoint-*.pytorch"), emit: model_chekpoints + path("loss-epoch-train.csv"), emit: csv_file_epoch + path("loss-epoch-validation.csv"), emit: csv_file_val_epoch + + // 
max_sequence_length is the same as for VAE + // seed is the same as for VAE + // all other hyper-parameters are read directly from params.training_tf (no defaults are applied here) + script: + """ + train.py predictor tf ${trainFile}\ + ${validationFile}\ + loss-batch-train.log\ + loss-epoch-train.log\ + loss-epoch-validation.log\ + model-checkpoint\ + loss-epoch-train.csv\ + loss-epoch-validation.csv\ + model-input.pickle\ + best-train-error.pytorch\ + best-validation-error.pytorch\ + --epochs ${params.training_tf.epochs}\ + --learning-rate ${params.training_tf.learning_rate}\ + --lambda-constant ${params.training_tf.L2}\ + --validation-freq-epoch ${params.training_tf.val_freq}\ + --checkpoint-freq-epoch ${params.training_tf.checkpoint_freq}\ + --max-sequence-length ${max_sequence_length}\ + --batch-size ${params.training_tf.batch_size}\ + --embedding-size ${params.training_tf.embedding_size}\ + --latent-size ${params.training_tf.latent_size}\ + ${useWeightedSampling}\ + --dropout-prob ${params.training_tf.dropout_prob}\ + --heads ${params.training_tf.heads }\ + --num-layers-encoder ${params.training_tf.num_layers_encoder}\ + --seed ${seed}\ + --pt-checkpoint ${checkpoint} + """ +} + + +//////////////////////////////////////////////// PRIOR SAMPLING ///////////////////////////////////////// +// sample from prior: at each sampling step we obtain (seq, energy), which is later merged into (seq, {energies}) +process PriorSampling{ + + tag "prior-sampling,model-params:${model_identifier}" + + // publish VAE samples FASTA files: all-prior-samples-* holds every sample, prior-samples-* holds the samples left after removing known sequences + publishDir "${resultsDir}/prior/sampling-results/${model_identifier}", pattern: "all-prior-samples-all-${model_identifier}.fasta", mode: 'copy' + publishDir "${resultsDir}/prior/sampling-results/${model_identifier}", pattern: "prior-samples-all-${model_identifier}.fasta", mode: 'copy' + // publish pickle file + publishDir "${resultsDir}/prior/sampling-results/${model_identifier}", pattern: "all-prior-results-${model_identifier}.pickle", mode: 'copy' + // publish txt file with duplicates + publishDir 
"${resultsDir}/prior/sampling-results/${model_identifier}", pattern: "duplicated.detail.txt", mode: 'copy' + + + input: + tuple path(pickle_file), path(pytorch_file), val(model_identifier), path(fasta_files_clean_against) //[pickle, pytorch, modelID, list of FASTA files that contain sequences that should be removed from samples file] + + output: + tuple path("all-prior-results-${model_identifier}.pickle"), val(model_identifier), emit: output_for_protein_analysis_prior // tuple [pickle, modelID] + tuple path(pickle_file), path(pytorch_file), path("prior-samples-all-${model_identifier}.fasta"), val(model_identifier), emit: output_for_filtering // tuple [pickle, pytorch, cleaned samples FASTA file, modelID] + path("duplicated.detail.txt"), emit: duplicates_details + path("all-prior-samples-all-${model_identifier}.fasta"), emit: initial_samples + + // command description: + // 1st : sample from the prior distribution. if identical sequences are sampled, they will be collapsed and the statistics will be aggregated + // 2nd - 6th: from the output of 1st command remove sequences that can be found in ${fasta_files_clean_against} + // 2nd : join all FASTA file together + // 3rd : remove duplicated sequences from this joint file (called joint.fasta) + // 4th : if there are no duplicates, need to create duplicated.detail.txt, otherwise the code will break + // 5th : take duplicated.detail.txt file, remove first column then flatten it -> output.duplicated.detail.txt + // 6th : take output.duplicated.detail.txt and remove all sequences listed there from all-prior-samples* file + script: + """ + downstream.py transformer sample-prior ${pytorch_file}\ + ${pickle_file}\ + all-prior-results-${model_identifier}.pickle\ + all-prior-samples-all-${model_identifier}.fasta\ + --n-samples ${sampling_n_samples}\ + --seed ${sampling_seed}\ + --max-number-of-steps ${sampling_max_length} + + cat ${fasta_files_clean_against} all-prior-samples-all-${model_identifier}.fasta > joint.fasta + + cat joint.fasta | seqkit rmdup 
-s -o unduplicated-joint.fasta -d duplicated.fasta -D duplicated.detail.txt + + [ -f duplicated.detail.txt ] && echo "duplicated.detail.txt file exist." || touch duplicated.detail.txt + + cut -f2- duplicated.detail.txt | tr ',' '\n' | tr -d "[:blank:]" > output.duplicated.detail.txt + + miscellaneous.py various remove-sequences output.duplicated.detail.txt all-prior-samples-all-${model_identifier}.fasta prior-samples-all-${model_identifier}.fasta + """ +} +// filter prior samples obtained from PriorSampling process +process PriorFiltering{ + tag "prior-filtering,model-params:${modelID},database:${database.baseName}" + + // publish filtered VAE samples FASTA file + publishDir "${resultsDir}/prior/sampling-results/${modelID}/${database.baseName}", pattern: "filtered-${vae_samples_fasta_file.baseName}.fasta", mode: 'copy' + + // publish csv file with filtered results (we will need it for statistics calculation) + publishDir "${resultsDir}/prior/sampling-results/${modelID}/${database.baseName}", pattern: "${vae_samples_fasta_file.baseName}.csv", mode: 'copy' + + //publish log file + publishDir "${resultsDir}/prior/sampling-results/${modelID}/${database.baseName}", pattern: "${vae_samples_fasta_file.baseName}-logger.log", mode: 'copy' + + input: + tuple path(pickle_file),path(pytorch_file), path(vae_samples_fasta_file), val(modelID) // tuple: [pickle file, pytorch file, raw FASTA file, modelID] : pickle and pytorch are not used here but will be carried over to the next process + each path(database) // train or validation set + output: + path("${vae_samples_fasta_file.baseName}.csv"), emit: csv_file + path("filtered-${vae_samples_fasta_file.baseName}.fasta"), emit: filtered_fasta_file + path("${vae_samples_fasta_file.baseName}-logger.log"), emit: log_file + tuple path(pickle_file), path(pytorch_file), val(modelID), path(database), path("filtered-${vae_samples_fasta_file.baseName}.fasta"), emit: output_for_energy_reestimation // [pickle, pytorch, modelID, database, clean 
FASTA] + + /* + 1st command: create protein BLAST DB out of the ${database} FASTA file (train or validation set) + 2nd command: run blastp of ${vae_samples_fasta_file} against newly created DB -> receive csv file where filtering is done only by e-value: temp.csv! + 3rd command: keep rows whose query ID starts with "seq" and whose qcovs (last column) exceeds the query coverage threshold + 4th command: obtain list of seqIDs + 5th command: obtain filtered FASTA file + 6th command: compute statistics and save them to log file (csv headers added) + */ + script: + """ + makeblastdb -dbtype prot -in ${database} + + blastp -out temp.csv -outfmt '10 qseqid sseqid score bitscore evalue pident ppos qcovs' -query ${vae_samples_fasta_file} -db ${database} -evalue ${sampling_e_value} + + cat temp.csv | awk -F "," '/^seq/ { if (\$NF > ${samplng_query_coverage}) print \$0 }' > ${vae_samples_fasta_file.baseName}.csv + + cat ${vae_samples_fasta_file.baseName}.csv | cut -d ',' -f1 | uniq > seq-list.txt + + seqtk subseq ${vae_samples_fasta_file} seq-list.txt > filtered-${vae_samples_fasta_file.baseName}.fasta + + downstream.py transformer csv-stats ${vae_samples_fasta_file.baseName}.csv\ + ${vae_samples_fasta_file.baseName}-logger.log\ + ${sampling_n_samples} + """ + +} +// re-estimate (by running encoder) energies for (clean) sequences from PriorFiltering process +process ReestimateEnergiesPrior{ + errorStrategy 'ignore' // in case no sequences + + tag "energy-reestimation-prior,model-params:${model_identifier},database:${database.baseName}" + + // publish reestimated energies + publishDir "${resultsDir}/prior/sampling-results/${model_identifier}/${database.baseName}/reestimated-energies", pattern: "*.csv", mode: 'copy' + + input: + tuple path(pickle_file), path(pytorch_file), val(model_identifier), path(database), path(fasta_file) // [pickle file, pt file, model ID, database_name, FASTA with clean sequences]: database is relevant b/c FASTA was cleaned against that DB, so we want to output files in the correct folder + + output: + path("*.csv"), emit: all_csv // all csv files + + // NOTE: the number of samples per sequence is fixed to 300 here; batch size and seed reuse the training/sampling settings + script: + 
""" + downstream.py transformer seq2energy ${fasta_file.baseName}-estimated-average-values.csv\ + ${fasta_file.baseName}-individual\ + ${pytorch_file}\ + ${pickle_file}\ + ${fasta_file}\ + --n-samples 300\ + --batch-size ${training_batch_size}\ + --seed ${sampling_seed} + """ +} + +// protein analysis of prior samples +process ProteinAnalysisPrior { + tag "prior-protein-analysis-${model_identifier}" + errorStrategy 'ignore' // a failed analysis does not stop the pipeline + + // for now save all files + publishDir "${resultsDir}/prior/protein-analysis-results/${model_identifier}", pattern: "*.{pdf,csv,log}", mode: "copy" + + input: + tuple path(pickle_file), val(model_identifier) // pickle file with sequence information and model identifier + + output: + path("*.csv"), emit: csv_files + path("*.pdf"), emit: pdf_files + path("*.log"), emit: log_files + + script: + """ + downstream.py protanalysis prior ${pickle_file}\ + protein-analysis-prior.log\ + ${model_identifier} + + """ + + +} +// subworkflow to do prior sampling + analysis +workflow Prior{ + take: + input_prior_sampling // input for prior sampling: tuple[pickle_file,pytorch_file,modelID] + databases // list of FASTA files to query against (either train or validation set) + fasta_seq_to_exclude // FASTA file with sequences that should be excluded + main: + + // modify ${input_prior_sampling}, extend each element with ${databases} + input_prior_sampling_extended = input_prior_sampling.combine(fasta_seq_to_exclude) // [pickle, pytorch, modelID, FASTA file with sequences to exclude] + + // run prior sampling + out_downstream_prior_sampling = PriorSampling(input_prior_sampling_extended) + + // filter prior samples (against DB) + out_prior_filtering = PriorFiltering( + out_downstream_prior_sampling.output_for_filtering, // [[pickle file, pytorch file, raw FASTA file, modelID] + databases + ) + // reestimate energies by running filtered sequences through encoder + ReestimateEnergiesPrior( + out_prior_filtering.output_for_energy_reestimation + ) + + // run protein 
analysis on prior results NOT NEEDED NOW
+    // ProteinAnalysisPrior(
+    //     out_downstream_prior_sampling.output_for_protein_analysis_prior
+    // )
+}
+
+////////////////////////////////////////////////// POSTERIOR SAMPLING ////////////////////////////////////////
+// sample from variational (seeded) posterior: at each sampling step we obtain (seq, energy), which is later merged into (seq, {energies})
+//
+// One task is run per (input tuple, temperature) combination. Each task
+//   * samples sequences with `downstream.py transformer sample-seeded`,
+//   * concatenates the samples with ${fasta_files_clean_against} and lets `seqkit rmdup -s` report sequence-level duplicates,
+//   * passes the reported IDs to `miscellaneous.py various remove-sequences` to produce the cleaned samples file.
+// Every published file goes to the same per-model/temperature/seed directory, so parallel tasks do not overwrite each other.
+process SeededSampling{
+    tag "seeded-sampling:${seed_fasta_file.baseName},model-params:${model_identifier},temperature:${temperature}"
+
+    // publish seed FASTA file
+    publishDir "${resultsDir}/seeded/sampling-results/${model_identifier}/temperature-${temperature}/${seed_fasta_file.baseName}", pattern: "${seed_fasta_file}", mode: 'copy'
+
+    // publish duplicated/unduplicated VAE samples FASTA file
+    publishDir "${resultsDir}/seeded/sampling-results/${model_identifier}/temperature-${temperature}/${seed_fasta_file.baseName}", pattern: "all-seeded-samples-all-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.fasta", mode: 'copy'
+    publishDir "${resultsDir}/seeded/sampling-results/${model_identifier}/temperature-${temperature}/${seed_fasta_file.baseName}", pattern: "seeded-samples-all-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.fasta", mode: 'copy'
+    // publish txt file with duplicates
+    // NOTE: this used to point at "${resultsDir}/prior/sampling-results/${model_identifier}", i.e. the prior-sampling tree,
+    // where the reports of all seeds and temperatures of a model ended up in one file path and overwrote each other.
+    publishDir "${resultsDir}/seeded/sampling-results/${model_identifier}/temperature-${temperature}/${seed_fasta_file.baseName}", pattern: "duplicated.detail.txt", mode: 'copy'
+
+    // publish pickle file
+    publishDir "${resultsDir}/seeded/sampling-results/${model_identifier}/temperature-${temperature}/${seed_fasta_file.baseName}", pattern: "all-seeded-results-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.pickle", mode: 'copy'
+
+    input:
+        // ${model_identifier} labels the model checkpoint; the workflows in this file pass "best-train-error", "best-validation-error" or "user-provided-model"
+        // ${first_element} is a command-line flag appended verbatim to the sampling command; the workflows pass "--skip-first-element" or "--no-skip-first-element"
+        tuple path(pickle_file), path(pytorch_file), val(model_identifier), path(seed_fasta_file), val(first_element), path(fasta_files_clean_against) //[pickle, pytorch, modelID, seed FASTA, whether to do argmax for the first sample, list of FASTA files that contain sequences that should be removed from samples file]
+        each temperature
+
+    output:
+        tuple val("${seed_fasta_file.baseName}"), val(model_identifier), val(temperature), path("seeded-samples-all-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.fasta"), path(seed_fasta_file), path(pickle_file), path(pytorch_file), emit: raw_to_filter // tuple [seedID,modelID,temperature,raw FASTA file with VAE samples, seed FASTA file, pickle, pytorch]
+        tuple path("all-seeded-results-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.pickle"), val("${seed_fasta_file.baseName}"), val(model_identifier), val(temperature), emit: output_for_protein_analysis_posterior //tuple [pickle file, seedID, modelID, temperature]
+        path("duplicated.detail.txt"), emit: duplicates_details
+        path("all-seeded-samples-all-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.fasta"), emit: initial_samples
+
+    // command description:
+    // 1st : sample from the seeded (variational posterior) distribution. if identical sequences are sampled, they will be collapsed and the statistics will be aggregated
+    // 2nd - 6th: from the output of 1st command remove sequences that can be found in ${fasta_files_clean_against}
+    // 2nd : join all FASTA file together
+    // 3rd : remove duplicated sequences from this joint file (called joint.fasta)
+    // 4th : if there are no duplicates, need to create duplicated.detail.txt, otherwise the code will break
+    // 5th : take duplicated.detail.txt file, remove first column then flatten it -> output.duplicated.detail.txt
+    // 6th : take output.duplicated.detail.txt and remove all sequences listed there from all-seeded-samples* file
+    script:
+    """
+    downstream.py transformer sample-seeded ${pytorch_file}\
+        ${pickle_file}\
+        all-seeded-results-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.pickle\
+        ${seed_fasta_file}\
+        all-seeded-samples-all-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.fasta\
+        --max-number-of-steps ${sampling_max_length}\
+        --n-samples ${sampling_n_samples}\
+        --mini-batch-size ${samling_mini_batch_size}\
+        --seed ${sampling_seed}\
+        --t ${temperature}\
+        ${first_element}
+
+    cat ${fasta_files_clean_against} all-seeded-samples-all-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.fasta > joint.fasta
+
+    cat joint.fasta | seqkit rmdup -s -o unduplicated-joint.fasta -d duplicated.fasta -D duplicated.detail.txt
+
+    [ -f duplicated.detail.txt ] && echo "duplicated.detail.txt file exist." || touch duplicated.detail.txt
+
+    cut -f2- duplicated.detail.txt | tr ',' '\n' | tr -d "[:blank:]" > output.duplicated.detail.txt
+
+    miscellaneous.py various remove-sequences output.duplicated.detail.txt all-seeded-samples-all-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.fasta seeded-samples-all-${seed_fasta_file.baseName}-${model_identifier}-temperature-${temperature}.fasta
+    """
+}
+// filter posterior samples
+process SeededFiltering{
+    tag "seeded-filtering:${seedID},model-params:${modelID},temperature:${temperature}"
+
+    // publish filtered VAE samples FASTA file
+    publishDir "${resultsDir}/seeded/sampling-results/${modelID}/temperature-${temperature}/${seedID}", pattern: "filtered-${vae_samples_fasta_file.baseName}.fasta", mode: 'copy'
+
+    // publish csv file with filtered results (we will need it for statistics calculation)
+    publishDir "${resultsDir}/seeded/sampling-results/${modelID}/temperature-${temperature}/${seedID}", pattern: "${vae_samples_fasta_file.baseName}.csv", mode: 'copy'
+
+    //publish log file
+    publishDir "${resultsDir}/seeded/sampling-results/${modelID}/temperature-${temperature}/${seedID}", pattern: "${vae_samples_fasta_file.baseName}-logger.log", mode: 'copy'
+
+
+    input:
+        tuple val(seedID), val(modelID), val(temperature), path(vae_samples_fasta_file), path(seed_fasta_file), path(pickle_file), path(pytorch_file) // tuple [seedID,modelID,temperature,raw FASTA file with VAE samples, seed FASTA file, pickle, pytorch ]: pickle and pytorch are not needed, just carry over!
+ output: + tuple val(seedID), val(modelID), path("filtered-${vae_samples_fasta_file.baseName}.fasta"), emit: seed_id_clean_fasta_tuple // tuple [seed ID, model identifier, clean fasta file] + path("${vae_samples_fasta_file.baseName}.csv"), emit: csv_file + path("filtered-${vae_samples_fasta_file.baseName}.fasta"), emit: filtered_fasta + path("${vae_samples_fasta_file.baseName}-logger.log"), emit: log_file + tuple val(seedID), val(modelID), val(temperature), path(pickle_file), path(pytorch_file), path("filtered-${vae_samples_fasta_file.baseName}.fasta"), emit: output_for_energy_reestimation // [seedID, modelID, temperature, pickle, pytorch, clean FASTA] + + /* + 1st command: create protein DB out of FASTA file with single seed + 2nd command: run blastp of ${vae_samples_fasta_file} against newly created DB -> receive csv file where filtering is done only by e-value: temp.csv! + 3rd command: filter by qcovs (last column) + 4th command: obtain list of seqIDs + 5th command: obtain filtered FASTA file + 6th command: compute statistics and save them to log file (csv headers added) + */ + script: + """ + makeblastdb -dbtype prot -in ${seed_fasta_file} + + blastp -out temp.csv -outfmt '10 qseqid sseqid score bitscore evalue pident ppos qcovs' -query ${vae_samples_fasta_file} -db ${seed_fasta_file} -evalue ${sampling_e_value} + + cat temp.csv | awk -F "," '/^seq/ { if (\$NF > ${samplng_query_coverage}) print \$0 }' > ${vae_samples_fasta_file.baseName}.csv + + cat ${vae_samples_fasta_file.baseName}.csv | cut -d ',' -f1 | uniq > seq-list.txt + + seqtk subseq ${vae_samples_fasta_file} seq-list.txt > filtered-${vae_samples_fasta_file.baseName}.fasta + + downstream.py transformer csv-stats ${vae_samples_fasta_file.baseName}.csv\ + ${vae_samples_fasta_file.baseName}-logger.log\ + ${sampling_n_samples} + """ +} +// re-estimate (by running encoder) energies for (clean) sequences from SeededFiltering process +process ReestimateEnergiesPosterior{ + errorStrategy 'ignore' // in case 
no sequences + + tag "energy-reestimation,seed:${seedID},model-params:${modelID},temperature:${temperature}" + + // publish reestimated energies + publishDir "${resultsDir}/seeded/sampling-results/${modelID}/temperature-${temperature}/${seedID}/reestimated-energies", pattern: "*.csv", mode: 'copy' + + input: + tuple val(seedID), val(modelID), val(temperature), path(pickle_file), path(pytorch_file), path(fasta_file) // [seedID, modelID, temperature, pickle file, pytorch file, FASTA with clean sequences] + + output: + path("*.csv"), emit: all_csv // all csv files + + script: + """ + downstream.py transformer seq2energy ${fasta_file.baseName}-estimated-average-values.csv\ + ${fasta_file.baseName}-individual\ + ${pytorch_file}\ + ${pickle_file}\ + ${fasta_file}\ + --n-samples 300\ + --batch-size ${training_batch_size}\ + --seed ${sampling_seed} + """ +} + +// nextflow run ... -profile ... -entry ENERGY_ESTIMATE +workflow ENERGY_ESTIMATE{ + // calling process ReestimateEnergiesPosterior + + // some placeholders, they dont really mean anything + seedID = Channel.of("my-seed-id") + modelID = Channel.of("my-model") + temperature = Channel.of("my-temperature") + + pickle_file = Channel.fromPath( params.energy_estimate.pickle_file ) + pytorch_file = Channel.fromPath( params.energy_estimate.pytorch_file ) + fasta_file = Channel.fromPath( params.energy_estimate.fasta_file ) + + input = seedID.combine( + modelID.combine( + temperature.combine( + pickle_file.combine( + pytorch_file.combine( + fasta_file + ) + ) + ) + ) + ) + + ReestimateEnergiesPosterior(input) + + + +} + +// subworkflow to do posterior sampling + analysiss +workflow Posterior{ + take: + input_posterior_sampling // input for posterior sampling: tuple [pickle_file, pytorch_file, model_identifier, seed_fasta_file, first_element] + temperatures // temperatures for sampling + fasta_seq_to_exclude // FASTA file with sequences that should be excluded + + main: + + // modify input_posterior_sampling + 
input_posterior_sampling_extended = input_posterior_sampling.combine(fasta_seq_to_exclude) + + // run posterior sampling + out_seeded_sampling = SeededSampling( + input_posterior_sampling_extended, + temperatures + ) + // filter sequences + out_filtering = SeededFiltering( + out_seeded_sampling.raw_to_filter + ) + // reestimate energy by running through encoder + ReestimateEnergiesPosterior( + out_filtering.output_for_energy_reestimation + ) +} + +//////////////////////////////////////////////////// PROCESSES RELATED TO PREDICTIVE MODELS ////////////////// +process PredictEnergies{ + errorStrategy 'ignore' // in case no sequences + + tag "energy-prediction-using-predictive-model" + + // publish reestimated energies + publishDir "${resultsDir}/supervised-model-tf/predicted-energies/${modelID}", pattern: "*.{csv,fasta}", mode: 'copy' + + input: + tuple val(modelID), path(pickle_file), path(pytorch_file), path(fasta_file) // [modelID, pickle file, pytorch file, FASTA with clean sequences] + + output: + path("${fasta_file.baseName}-predicted-energies.fasta"), emit: fasta_with_predicted_energies // FASTA file with reestimated energies, sequences are the same here + path("${fasta_file.baseName}-predicted-energies.csv"), emit: csv_predicted_energies // CSV with reestimated energies + + script: + """ + downstream.py predictor tf-predict-energy ${fasta_file.baseName}-predicted-energies.fasta\ + ${fasta_file.baseName}-predicted-energies.csv\ + ${pytorch_file}\ + ${pickle_file}\ + ${fasta_file}\ + --seed ${sampling_seed} + """ +} + + +////////////////////////////////////////////////////// LATENT SPACE OPTIMIZATION //////////////////// +// SGD optimisation, no constraints +process SGDOptimisation { + tag "SGD-optimisation-in-latent-space;seed-${opt_seed}" + + // publish results + publishDir "${resultsDir}/latent-space-sgd-optimisation/seed-${opt_seed}", pattern: "*.{log}", mode: 'copy' + publishDir "${resultsDir}/latent-space-sgd-optimisation/seed-${opt_seed}", pattern: 
"best-results.fasta", mode: 'copy' + publishDir "${resultsDir}/latent-space-sgd-optimisation/seed-${opt_seed}/restarts", pattern: "optimisation-results-*.fasta", mode: 'copy' + + input: + path(pickle_file) + path(pytorch_file) + each opt_seed + + + output: + path("logger-${opt_seed}.log"), emit: optimisation_logger + path("optimisation-results-*.fasta"), emit: intermediate_results + path("best-results.fasta"), emit: best_results + + script: + """ + downstream.py transformer sgd-optimization ${pytorch_file}\ + ${pickle_file}\ + logger-${opt_seed}.log\ + optimisation-results\ + best-results.fasta\ + --seed ${opt_seed}\ + --learning-rate ${params.optimisation.learning_rate}\ + --n-restarts ${params.optimisation.n_restarts}\ + --delta-f-tol ${params.optimisation.delta_f_tol}\ + --max-opt-steps ${params.optimisation.max_opt_steps} + """ +} + +// Trust Region optimisation, constraints to lie within Gaussian ball N(0,I) +process TrustRegionOptimisationPrior{ + errorStrategy 'ignore' + + tag "trust-region-optimisation-in-latent-space;seed-${opt_seed}" + + // publish results + publishDir "${resultsDir}/latent-space-trust-region-optimisation/prior/seed-${opt_seed}", pattern: "*.{log,fasta,csv,pickle}", mode: 'copy' + publishDir "${resultsDir}/latent-space-trust-region-optimisation/prior/seed-${opt_seed}", pattern: "duplicated.detail.txt", mode: 'copy' + + input: + path(pickle_file) + path(pytorch_file) + path(fasta_files_clean_against) + each opt_seed + + output: + path("logger-${opt_seed}.log"), emit: optimisation_logger // logger file + path("all-samples.fasta"), emit: fasta_output_raw // generated output from trust-region-optimization + path("samples.fasta"), emit: fasta_output_clean // unduplicated output from trust-region-optimization + path("all-samples.pickle"), emit: pickle_output_raw // generated output from trust-region-optimization + path("duplicated.detail.txt"), emit: duplicates_info // txt file with information on duplicated sequences + path("*.csv"), emit: 
all_csv // output with reestimated energies [MAIN OUTPUT]
+
+
+    // 1: downstream.py transformer trust-region-optimization: runs trust region optimisation and then samples 2000 (categorical) + 1 (argmax) samples using optimal z, that corresponds to lowest energy
+
+    // 2: remove sequences found in ${fasta_files_clean_against}:
+    //    the samples are concatenated with those files, `seqkit rmdup -s` writes the sequence-level duplicates to duplicated.detail.txt
+    //    (created empty when seqkit reports none), and the listed IDs are passed to `miscellaneous.py various remove-sequences`
+
+    // WE SKIP FILTERING STEP HERE AND RUN ENERGY REESTIMATION DIRECTLY
+    // 3: downstream.py transformer seq2energy: runs energy reestimation on samples.fasta (the command below passes --n-samples 300)
+
+    script:
+    """
+    downstream.py transformer trust-region-optimization ${pytorch_file}\
+        ${pickle_file}\
+        logger-${opt_seed}.log\
+        all-samples.fasta\
+        all-samples.pickle\
+        --max-number-of-steps ${sampling_max_length}\
+        --n-samples 2000\
+        --seed ${opt_seed}
+
+    cat ${fasta_files_clean_against} all-samples.fasta > joint.fasta
+
+    cat joint.fasta | seqkit rmdup -s -o unduplicated-joint.fasta -d duplicated.fasta -D duplicated.detail.txt
+
+    [ -f duplicated.detail.txt ] && echo "duplicated.detail.txt file exist."
|| touch duplicated.detail.txt
+
+    cut -f2- duplicated.detail.txt | tr ',' '\n' | tr -d "[:blank:]" > output.duplicated.detail.txt
+
+    miscellaneous.py various remove-sequences output.duplicated.detail.txt all-samples.fasta samples.fasta
+
+    downstream.py transformer seq2energy samples-estimated-average-values.csv\
+        samples-individual\
+        ${pytorch_file}\
+        ${pickle_file}\
+        samples.fasta\
+        --n-samples 300\
+        --batch-size ${training_batch_size}\
+        --seed ${opt_seed}
+    """
+
+}
+
+// Trust Region optimisation, constraints to lie within Gaussian ball N(mu(seed),diag(seed))
+//
+// One task is run per (seed FASTA file, optimisation seed) combination. Each task runs the optimisation with
+// `--seed-fasta-file`, removes samples reported as sequence-level duplicates by `seqkit rmdup -s`, and re-estimates
+// energies for the remaining samples. All published files go to one directory per seed sequence and optimisation seed.
+process TrustRegionOptimisationSeeded{
+
+    errorStrategy 'ignore'
+
+    tag "trust-region-optimisation-in-latent-space;seed-sequence:${seed_fasta_file.baseName};seed-${opt_seed}"
+
+    // publish results
+    publishDir "${resultsDir}/latent-space-trust-region-optimisation/seeded/${seed_fasta_file.baseName}/seed-${opt_seed}", pattern: "*.{log,fasta,csv,pickle}", mode: 'copy'
+    // NOTE: the duplicate report used to be published to ".../seeded/seed-${opt_seed}" (no seed-sequence level),
+    // so tasks for different seed sequences sharing an optimisation seed overwrote each other's report.
+    publishDir "${resultsDir}/latent-space-trust-region-optimisation/seeded/${seed_fasta_file.baseName}/seed-${opt_seed}", pattern: "duplicated.detail.txt", mode: 'copy'
+
+    input:
+        path(pickle_file)
+        path(pytorch_file)
+        path(fasta_files_clean_against)
+        // declared as path so the seed file is staged into the task directory like the other file inputs
+        each path(seed_fasta_file) // FASTA file with a seed sequence
+        each opt_seed
+
+    output:
+        path("logger-${opt_seed}.log"), emit: optimisation_logger // logger file
+        path("all-samples.fasta"), emit: fasta_output_raw // generated output from trust-region-optimization
+        path("samples.fasta"), emit: fasta_output_clean // unduplicated output from trust-region-optimization
+        path("all-samples.pickle"), emit: pickle_output_raw // generated output from trust-region-optimization
+        path("duplicated.detail.txt"), emit: duplicates_info // txt file with information on duplicated sequences
+        path("*.csv"), emit: all_csv // output with reestimated energies [MAIN OUTPUT]
+
+
+    // 1: downstream.py transformer trust-region-optimization: runs trust region optimisation and then samples 2000 (categorical) + 1 (argmax) samples using optimal z, that corresponds to lowest energy
+
+    // 2: remove sequences found in ${fasta_files_clean_against}
+
+
+    // WE SKIP FILTERING STEP HERE AND RUN ENERGY REESTIMATION DIRECTLY
+    // 3: downstream.py transformer seq2energy: runs energy reestimation on samples.fasta (the command below passes --n-samples 300)
+
+    script:
+    """
+    downstream.py transformer trust-region-optimization ${pytorch_file}\
+        ${pickle_file}\
+        logger-${opt_seed}.log\
+        all-samples.fasta\
+        all-samples.pickle\
+        --seed-fasta-file ${seed_fasta_file}\
+        --max-number-of-steps ${sampling_max_length}\
+        --n-samples 2000\
+        --seed ${opt_seed}
+
+    cat ${fasta_files_clean_against} all-samples.fasta > joint.fasta
+
+    cat joint.fasta | seqkit rmdup -s -o unduplicated-joint.fasta -d duplicated.fasta -D duplicated.detail.txt
+
+    [ -f duplicated.detail.txt ] && echo "duplicated.detail.txt file exist." || touch duplicated.detail.txt
+
+    cut -f2- duplicated.detail.txt | tr ',' '\n' | tr -d "[:blank:]" > output.duplicated.detail.txt
+
+    miscellaneous.py various remove-sequences output.duplicated.detail.txt all-samples.fasta samples.fasta
+
+    downstream.py transformer seq2energy samples-estimated-average-values.csv\
+        samples-individual\
+        ${pytorch_file}\
+        ${pickle_file}\
+        samples.fasta\
+        --n-samples 300\
+        --batch-size ${training_batch_size}\
+        --seed ${opt_seed}
+    """
+
+}
+
+
+// workflow that serves as entrypoint
+// nextflow run main.nf -profile test -entry OPTIMISATION
+workflow OPTIMISATION{
+    // input channels
+    pickle_file = Channel.fromPath( params.optimisation.pickle_file )
+    pytorch_file = Channel.fromPath( params.optimisation.pytorch_file )
+    optimisation_seeds = Channel.fromList( params.optimisation.seeds )
+
+    ch_seeds_fasta_file = Channel.fromPath( params.optimisation.seeds_file )
+    ch_individual_fasta_files = ch_seeds_fasta_file
+        .splitFasta( record: [id: true, text: true ]) // obtain a map with keys: id and text, basically each map is a single entry of original FASTA file
+        .collectFile() { item -> [
"${item.id.replaceAll("[._|]","-")}.fasta", item.text ] } // save single entry in respective FASTA files (using ID as filename) + + // load databases, aka FASTA files with sequences that you want to exclude (if they are found!) from the samples set + ch_databases = Channel.fromPath( params.optimisation.databases ) + + // merge databases + out_merge_fasta = MergeFasta(ch_databases.collect()) + ch_fasta_seq_to_exclude = out_merge_fasta.merged_file + + // Trust Region Optimisation for prior + TrustRegionOptimisationPrior( + pickle_file, + pytorch_file, + ch_fasta_seq_to_exclude, + optimisation_seeds + ) + + // Trust Region Optimisation for posterior + TrustRegionOptimisationSeeded( + pickle_file, + pytorch_file, + ch_fasta_seq_to_exclude, + ch_individual_fasta_files, + optimisation_seeds + ) + + +} + +// workflow for TransformerVAE model: training + sampling +workflow MAIN{ + + /////////////////////////////////////////////// INFORMATION ABOUT PROCESS //////////////// + Info() + ////////////////////////////////////////////// PREPROCESSING //////////////////////////////////////// + // fasta files: both are lists + ch_fasta_files_to_join = Channel.fromPath( params.preprocessing.training_list ) + ch_seed_fasta_files_to_join = Channel.fromPath( params.preprocessing.seed_list ) + + // run preprocessing step (STEP I) + out_preprocessing = Preprocessing( + ch_fasta_files_to_join, + ch_seed_fasta_files_to_join + ) + + ////////////////////////////////////////////////////// MODEL TRAINING ////////////////////////////// + // TODO: add checkpoints and sequence weights (need to change python code) + ch_checkpointfile = Channel.fromPath( training_entry_checkpoint ) + + // STEP II: model training + out_train_model_process = TrainModel( + out_preprocessing.train_file, + out_preprocessing.val_file, + ch_checkpointfile + ) + + ////////////////////////////////////////////////////// PRIOR ANALYSIS (SAMPLING + PROTEIN ANALYSIS) ////////// + // get necessary outputs from training + 
ch_pickle_file = out_train_model_process.pickle_file + ch_best_train_pytorch = out_train_model_process.best_train_pytorch + ch_best_validation_pytorch = out_train_model_process.best_validation_pytorch + ch_seeds_fasta_file = out_preprocessing.seed_file + + // generate identifiers manually + ch_train_identifier = Channel.of( "best-train-error" ) + ch_validation_identifier = Channel.of( "best-validation-error" ) + + + // create input for prior sampling (part of Prior workflow) + ch_input_train_prior_sampling = ch_pickle_file.combine( + ch_best_train_pytorch.combine( + ch_train_identifier + ) + ) + + + + ch_input_validation_prior_sampling = ch_pickle_file.combine( + ch_best_validation_pytorch.combine( + ch_validation_identifier + ) + ) + ch_input_prior_sampling = ch_input_train_prior_sampling + .mix( + ch_input_validation_prior_sampling + ) + // databases: [train-set, validation-set] + // also will serve as list of FASTA files, which sequences should be removed from any samples! + ch_databases = out_preprocessing.train_file + .mix(out_preprocessing.val_file) + .collect() + + // pass through MergeFasta to get merged file + out_merge_fasta = MergeFasta(ch_databases) + ch_fasta_seq_to_exclude = out_merge_fasta.merged_file + + // STEP III: prior sampling and analysis + Prior( + ch_input_prior_sampling, + ch_databases, + ch_fasta_seq_to_exclude + ) + + ///////////////////////////////////////////////////////////// SEEDED ANALYSIS //////////////////////////////////// + // skip or not argmax sampling of first element + if (sampling_argmax_first_element == true) + ch_first_element = Channel.of( "--skip-first-element" ) + else + ch_first_element = Channel.of( "--no-skip-first-element" ) + + // get multiple fasta files from one + // fasta file with sequence ID + ch_individual_fasta_files = ch_seeds_fasta_file + .splitFasta( record: [id: true, text: true ]) // obtain a map with keys: id and text, basically each map is a single entry of original FASTA file + .collectFile() { item 
-> [ "${item.id.replaceAll("[._|]","-")}.fasta", item.text ] } // save single entry in respective FASTA files (using ID as filename) + + // create input for seeded sampling + ch_input_train_seeded_sampling = ch_pickle_file.combine( + ch_best_train_pytorch.combine( + ch_train_identifier.combine( + ch_individual_fasta_files.combine( + ch_first_element + ) + ) + ) + ) + ch_input_validation_seeded_sampling = ch_pickle_file.combine( + ch_best_validation_pytorch.combine( + ch_validation_identifier.combine( + ch_individual_fasta_files.combine( + ch_first_element + ) + ) + ) + ) + ch_input_seeded_sampling = ch_input_train_seeded_sampling + .mix( + ch_input_validation_seeded_sampling + ) + + // temperature input + ch_temperatures = Channel.fromList( sampling_temperature ) + + //call Posterior workflow + Posterior( + ch_input_seeded_sampling, + ch_temperatures, + ch_fasta_seq_to_exclude + ) +} + +// workflow for TransformerVAE model: sampling +// nextflow run main.nf -profile test -entry VAE_SAMPLE +workflow VAE_SAMPLE{ + // create inputs + ch_pickle_file = Channel.fromPath( params.sampling.pickle_file ) + ch_best_model_pytorch = Channel.fromPath( params.sampling.pytorch_file ) + ch_seeds_fasta_file = Channel.fromPath( params.sampling.seeds_file ) + ch_model_identifier = Channel.of( "user-provided-model" ) + ch_databases = Channel.fromPath( params.sampling.databases ) + ch_temperatures = Channel.fromList( sampling_temperature ) + + if (sampling_argmax_first_element == true) + ch_first_element = Channel.of( "--skip-first-element" ) + else + ch_first_element = Channel.of( "--no-skip-first-element" ) + + + // Prior workflow + ch_input_prior_sampling = ch_pickle_file.combine( + ch_best_model_pytorch.combine( + ch_model_identifier + ) + ) + + // pass through MergeFasta to get merged file + out_merge_fasta = MergeFasta(ch_databases.collect()) + ch_fasta_seq_to_exclude = out_merge_fasta.merged_file + + Prior( + ch_input_prior_sampling, + ch_databases.collect(), + 
ch_fasta_seq_to_exclude + ) + + + // Posterior workflow + + // get multiple fasta files from one + // fasta file with sequence ID + ch_individual_fasta_files = ch_seeds_fasta_file + .splitFasta( record: [id: true, text: true ]) // obtain a map with keys: id and text, basically each map is a single entry of original FASTA file + .collectFile() { item -> [ "${item.id.replaceAll("[._|]","-")}.fasta", item.text ] } // save single entry in respective FASTA files (using ID as filename) + + // single input here + ch_input_seeded_sampling = ch_pickle_file.combine( + ch_best_model_pytorch.combine( + ch_model_identifier.combine( + ch_individual_fasta_files.combine( + ch_first_element + ) + ) + ) + ) + + //call Posterior workflow + Posterior( + ch_input_seeded_sampling, + ch_temperatures, + ch_fasta_seq_to_exclude + ) + + +} + + +// workflow for supervised learning: sequence -> energy (using GRU) +// nextflow run main.nf -profile test -entry GRU_SUPERVISED_TRAIN +workflow GRU_SUPERVISED_TRAIN{ + /////////////////////////////////////// PREPROCESSING (same as for TransformerVAE) /////////////////////////////////// + // fasta files: both are lists + ch_fasta_files_to_join = Channel.fromPath( params.preprocessing.training_list ) + ch_seed_fasta_files_to_join = Channel.fromPath( params.preprocessing.seed_list ) + + // run preprocessing step (STEP I) + out_preprocessing = Preprocessing( + ch_fasta_files_to_join, + ch_seed_fasta_files_to_join + ) + /////////////////////////////////////// SUPERVISED MODEL TRAINING ///////////////////////////////////////////////////// + ch_checkpointfile = Channel.fromPath( params.training_gru.entry_checkpoint ) + out_model_training = TrainModelPredictiveGRU( + out_preprocessing.train_file, + out_preprocessing.val_file, + ch_checkpointfile + ) +} + +// workflow for supervised learning: sequence -> energy (using TF encoder) +// nextflow run main.nf -profile test -entry TF_SUPERVISED_TRAIN +workflow TF_SUPERVISED_TRAIN{ + 
/////////////////////////////////////// PREPROCESSING (same as for TransformerVAE) /////////////////////////////////// + // fasta files: both are lists + ch_fasta_files_to_join = Channel.fromPath( params.preprocessing.training_list ) + ch_seed_fasta_files_to_join = Channel.fromPath( params.preprocessing.seed_list ) + + // run preprocessing step (STEP I) + out_preprocessing = Preprocessing( + ch_fasta_files_to_join, + ch_seed_fasta_files_to_join + ) + /////////////////////////////////////// SUPERVISED MODEL TRAINING ///////////////////////////////////////////////////// + ch_checkpointfile = Channel.fromPath( params.training_tf.entry_checkpoint ) + + if (params.training_tf.weighted_sampling == true) + ch_training_weighted_sampling = Channel.value("--weighted-sampling") + else + ch_training_weighted_sampling = Channel.value("--no-weighted-sampling") + + + out_model_training = TrainModelPredictiveTFEncoder( + out_preprocessing.train_file, + out_preprocessing.val_file, + ch_checkpointfile, + ch_training_weighted_sampling + ) +} + + +// workflow for predicting energy from sequence (using TF encoder) +// nextflow run main.nf -profile test -entry TF_SUPERVISED_PREDICT +workflow TF_SUPERVISED_PREDICT{ + // calling process PredictEnergies, inputs: [modelID, pickle file, pytorch file, FASTA with clean sequences] + + // some placeholders, they dont really mean anything + modelID = Channel.of("my-model") + pickle_file = Channel.fromPath( params.predicting_tf.pickle_file ) + pytorch_file = Channel.fromPath( params.predicting_tf.pytorch_file ) + fasta_file = Channel.fromPath( params.predicting_tf.fasta_file ) + + input = modelID.combine( + pickle_file.combine( + pytorch_file.combine( + fasta_file + ) + ) + ) + + PredictEnergies(input) +} + +// workflow for TransformerVAE model: latent space parameters +// nextflow run main.nf -profile test -entry LATENTVARIABILITY +workflow LATENTVARIABILITY{ + // create channels + ch_pickle_file = Channel.fromPath( params.latent.pickle_file ) + 
ch_pytorch_file = Channel.fromPath( params.latent.pytorch_file ) + ch_model_identifier = Channel.of( "user-provided-model" ) + ch_fasta_files = Channel.fromPath( params.latent.fasta_files ) + + // cross-product them + ch_input = ch_pickle_file.combine( + ch_pytorch_file.combine( + ch_model_identifier.combine( + ch_fasta_files + ) + ) + ) + + // call EstimateLatentSpaceVariability + EstimateLatentSpace(ch_input) +} + +// main entry point +// call as follows: nextflow run main.nf -profile test +workflow{ + MAIN() +} \ No newline at end of file diff --git a/nextflow.config b/nextflow.config new file mode 100644 index 0000000..981b686 --- /dev/null +++ b/nextflow.config @@ -0,0 +1,8 @@ +// your workflow parameters +params { + inputFile = "./testdata/mydata.txt" + resultsDir = "./results/" +} + +// include basic process configuration options +includeConfig 'conf/base.config' diff --git a/readme.md b/readme.md new file mode 100644 index 0000000..4b8d194 --- /dev/null +++ b/readme.md @@ -0,0 +1,161 @@ +# prevent-nf + +![](https://img.shields.io/badge/current_version-1.0.0-blue) + +## Overview + +PREVENT: PRotein Engineering by Variational frEe eNergy approximaTion + +## Configuration + +A user needs to specify a number of parameters in the configuration file under **params** scope to run `prevent` pipeline. +In addition to that, profile(s) describing the system where `prevent` is run need(s) to be provided in the same configuration file. 
+ +- **resultsDir**: directory name where all the results of the current run will be saved +- **seed**: random seed used in set rebalancing and model training (default: 0) + +- **preprocessing.lmin**: minimum sequence length to consider sequence suitable for training (default: 0) +- **preprocessing.lmax**: maximum sequence length to consider sequence suitable for training (default: 1,000) +- **preprocessing.val_pct**: relative size of validation set, should be between 0.0 and 0.5 (default: 0.2) +- **preprocessing.mmseq_clustering**: `MMseqs2` clustering options to obtain cluster representative sequences (default: ''--min-seq-id 0.8'') +- **preprocessing.weight_sequences**: weight sequences by inverse of the average sequence identity within the train set (default: true) [NOT USED] +- **preprocessing.training_list**: list of FASTA files that will be used to generate train and validation sets (compulsory parameter) +- **preprocessing.seed_list**: list of FASTA files with seed sequences to generate novel variants (compulsory parameter) +- **training.epochs**: number of training epochs (default: 100) +- **training.val_freq**: epoch frequency of validation error calculation (default: 1) +- **training.checkpoint_freq**: frequency of model checkpoints, there must be at least one checkpoint, set the value accordingly (default: 50) +- **training.batch_size**: batch size for the gradient update step (default: 32) +- **training.learning_rate**: learning rate for the gradient update step (default: 0.0001) +- **training.L2**: **L2** regularisation constant (default: 0.0) +- **training.clipping_type**: gradient clipping technique, either ''norm'' or ''value'', see pytorch documentation for more details (default: ''value'') +- **training.hidden_size**: hidden units dimensionality for intermediate layers for temporal convolution layers (default: 128) +- **training.latent_size**: dimensionality of latent distribution (default: 32) +- **training.condition_on_energy**: whether to scale
latent variable z by predicted energy value, when obtaining p(sequence|z) (compulsory parameter). Start with setting it to "false". +- **training.entry_checkpoint**: pytorch model checkpoint to start training from (default: ''None'') +- **training.embedding_size**: embedding dimensionality for amino acids and special tokens (default: 32). Must be divisible by **training.heads** +- **training.dropout_prob**: embedding dropout probability (default: 0.2) +- **training.masking_prob**: input masking probability for transformer decoder (default: 0.0). Non-zero values are recommended to force latent space to learn more +- **training.heads**: number of heads in (self)attention layers of transformer. Default pytorch transformer class is used, see pytorch docs for more information +- **training.num_layers_encoder**: number of TransformerEncoderLayer in Transformer (default: 6) +- **training.num_layers_decoder**: number of TransformerDecoderLayer in Transformer (default: 4) + +- **sampling.seed**: random seed used for sampling (default: 0) +- **sampling.n_samples**: number of requested samples, must be a multiple of 100 (default: 100) +- **sampling.mini_batch_size**: number of samples per mini-batch in seeded sampling procedure only. Must be a divisor of **sampling.n_samples**, not sure why this was implemented. +- **sampling.max_length**: maximum number of sampling steps (default: 200) +- **sampling.e_value**: e-value threshold for `BLASTP` (default: 0.0001) +- **sampling.query_coverage**: minimum allowed query coverage (default: 70.0) +- **sampling.temperature**: list of temperatures for temperature annealing, temperature 0.0 corresponds to argmax operation; the higher the temperature the more uniform amino acid sampling becomes (default: [1.0]) +- **sampling.argmax_first_element**: force argmax selection of the first amino acid; relevant for posterior sampling for temperatures greater than 0.0 (default: true). This is done to avoid sampling an amino acid other than methionine at the first position.
+- **sampling.mmseq_clustering**: `MMseqs2` clustering options to obtain cluster representative sequences (best candidates) for subsequent downstream analysis; relevant for seeded sampling only (default: ''--min-seq-id 0.8'') [NOT USED] + +There are other functionalities included in the `prevent` workflow. The most important is generating a set of mutants for further NN training. There are certain parameters that need to be specified in order to run this particular branch (entrypoint) of the workflow: + +- **energy.fasta_file**: FASTA file with a single (wild-type; WT) sequence, for which mutants will be generated and free energy estimated. Free energy is also estimated for the WT itself. +- **energy.pdb_file**: PDB file for WT sequence provided in **energy.fasta_file**. Needed for energy estimation using FoldX. + +- **mutagenesis.os**: OS where code is run. Supported options are "macOS" and "linux" as they will determine which FoldX binary to use. +- **mutagenesis.n_mutation_sites**: list with number of mutation sites in a sequence, for example [1,2,3] means 1,2,3 positions in WT sequence will be mutated independently. First position in WT is not mutated (compulsory parameter) +- **mutagenesis.n_mutants**: how many mutants to produce (compulsory parameter) +- **mutagenesis.seeds**: list of seeds for random mutagenesis. +- **mutagenesis.foldx_runs**: number of random restarts for FoldX (code won't work with 1 restart yet). Recommend to have between 2 and 5. + +In the end you will have |**mutagenesis.n_mutation_sites**| × **mutagenesis.n_mutants** × |**mutagenesis.seeds**| mutants. Each mutant will be run **mutagenesis.foldx_runs** times and the average free energy value will be taken. + +There are a few more entrypoints in `prevent` that can be useful. Each of them has a specific set of parameters that need to be specified in **params** scope. +The first entrypoint is called **GRU_SUPERVISED_TRAIN** and it allows training a supervised model to predict free energy from a sequence.
The special parameters are: + +- **training_gru.epochs**: number of training epochs for GRU supervised model +- **training_gru.val_freq**: frequency of validation error calculation +- **training_gru.checkpoint_freq**: frequency of model checkpoints +- **training_gru.batch_size**: batch size +- **training_gru.learning_rate**: learning rate for the gradient update step +- **training_gru.L2**: L2 regularisation constant +- **training_gru.hidden_size**: hidden units dimensionality in GRU +- **training_gru.num_layers**: number of stacked GRUs +- **training_gru.bidirectional**: whether to use bidirectional GRU (true/false) +- **training_gru.entry_checkpoint**: model checkpoint to start training from (if no checkpoint, provide "None") +- **training_gru.embedding_size**: embedding size for AAs and special tokens +- **training_gru.dropout_prob**: dropout probability for embeddings + +Another entrypoint is called **TF_SUPERVISED_TRAIN** and it allows training a different supervised model to predict free energy from a sequence. The related parameters are: + +- **training_tf.epochs**: number of training epochs for Transformer (encoder) supervised model +- **training_tf.val_freq**: frequency of validation error calculation +- **training_tf.checkpoint_freq**: frequency of model checkpoints +- **training_tf.batch_size**: batch size +- **training_tf.learning_rate**: learning rate for the gradient update step +- **training_tf.L2**: L2 regularisation constant +- **training_tf.latent_size**: dimensionality of a latent space (a size of a space we project to following transformer encoder forward pass). From this latent space an MLP predicts energy.
Unlike VAE, here latent space is a deterministic object +- **training_tf.embedding_size**: embedding size for AAs and special tokens; will be split across attention heads, so this number must be divisible by the number of heads +- **training_tf.heads**: number of attention heads +- **training_tf.num_layers_encoder**: number of Transformer encoder layers to be used +- **training_tf.entry_checkpoint**: model checkpoint to start training from (if no checkpoint, provide "None") +- **training_tf.dropout_prob**: embedding dropout probability + +The next entrypoint is called **ENERGY_ESTIMATE** and it allows running energy estimation (using 500 random samples) for a list of sequences from a FASTA file. May be useful for evaluating model performance on a test set. The related parameters are: + +- **energy_estimate.pickle_file**: pickle file with model params (often an output of a main entrypoint) +- **energy_estimate.pytorch_file**: pytorch file with pretrained model layers (often an output of a main entrypoint) +- **energy_estimate.fasta_file**: FASTA file with sequences for which energy needs to be estimated (for example, test set) + +Finally, the entrypoint called **OPTIMISATION** allows running an optimisation procedure in latent space to find proteins with the smallest free energy (not complete!).
The related parameters are: + +- **optimisation.pickle_file**: pickle file with model params (often an output of a main entrypoint) +- **optimisation.pytorch_file**: pytorch file with pretrained model layers (often an output of a main entrypoint) +- **optimisation.learning_rate**: learning rate for SGD +- **optimisation.n_restarts**: number of restarts for a run (to achieve a better result) +- **optimisation.delta_f_tol**: absolute tolerance for change in predicted energy (if absolute change is smaller than this number, procedure stops) +- **optimisation.max_opt_steps**: maximum allowed number of optimisation steps for a single restart +- **optimisation.seeds**: list of random seeds (for example, [1,2,3]); each seed corresponds to an individual process with **optimisation.n_restarts** restarts + +## Running the workflow (example) + +There are multiple entry points to the pipeline, depending on the desired outcome: `ENERGY_ESTIMATE`, `OPTIMISATION`, `LATENTVARIABILITY` and others. This README will focus on the main entry point that is called by default and trains a model and does sampling. + +### Install the workflow + +1. Install [Nextflow](https://www.nextflow.io/docs/latest/getstarted.html). + +2. Download `prevent` as follows: + + ```bash + git clone https://github.com/stracquadaniolab/prevent-nf.git + ``` + +3. Install [Docker](https://docs.docker.com/get-docker/) or + [Singularity](https://sylabs.io/guides/3.7/user-guide/installation.html), + depending on what container engine you want to use. You can find the software + used in either `containers/environment.yml` file or `model.environment.txt` + file, which is the output of the pipeline. + +4. Since we cannot redistribute FoldX, you have to build your docker/singularity image using the file in `containers/Dockerfile` with: + + ```bash + docker buildx build .
-f containers/Dockerfile -t ghcr.io/stracquadaniolab/prevent-nf:1.0.0 + ``` +and put the `FoldX` executables and its required files in the `${HOME}/.nextflow/assets/stracquadaniolab/prevent-nf/bin` folder. + +5. A example of configuration files is attached to the release: + + - `reviewer-1-q3-latent-size-16-smaller-NN.conf` - a configuration file with + all the necessary parameters to run the pipeline with a small transformer + and latent size of 16. The results of this model were used to address the + reviewer's question about hyperparameter tuning. + +6. Inspect and modify the configuration file to be able to run the pipeline on + your machine. Sensitive information, such as personal tokens or account names + are deliberately masked. + +```bash +nextflow run main.nf -profile singularity,singularitynv,cell -c conf/reviewer-1-q3-latent-size-16-smaller-NN.conf +``` + +```bash +nextflow run main.nf -profile singularity,singularitynv,cell -entry ENERGY_ESTIMATE -c conf/reviewer-1-q3-latent-size-16-smaller-NN.conf +``` + +## Authors + +- Evgenii Lobzaev (maintainer and main developer) +- Giovanni Stracquadanio (Principal Investigator) diff --git a/testdata/1gs5.pdb b/testdata/1gs5.pdb new file mode 100644 index 0000000..4752512 --- /dev/null +++ b/testdata/1gs5.pdb @@ -0,0 +1,2701 @@ +HEADER TRANSFERASE 28-DEC-01 1GS5 +TITLE N-ACETYL-L-GLUTAMATE KINASE FROM ESCHERICHIA COLI COMPLEXED +TITLE 2 WITH ITS SUBSTRATE N-ACETYLGLUTAMATE AND ITS SUBSTRATE +TITLE 3 ANALOG AMPPNP +COMPND MOL_ID: 1; +COMPND 2 MOLECULE: ACETYLGLUTAMATE KINASE; +COMPND 3 CHAIN: A; +COMPND 4 SYNONYM: NAG KINASE, AGK, N-ACETYL-L-GLUTAMATE +COMPND 5 5-PHOSPHOTRANSFERASE; +COMPND 6 EC: 2.7.2.8; +COMPND 7 ENGINEERED: YES +SOURCE MOL_ID: 1; +SOURCE 2 ORGANISM_SCIENTIFIC: ESCHERICHIA COLI; +SOURCE 3 ORGANISM_TAXID: 469008; +SOURCE 4 STRAIN: BL21(DE3); +SOURCE 5 EXPRESSION_SYSTEM: ESCHERICHIA COLI; +SOURCE 6 EXPRESSION_SYSTEM_TAXID: 469008; +SOURCE 7 EXPRESSION_SYSTEM_STRAIN: BL21(DE3); +SOURCE 8 
EXPRESSION_SYSTEM_PLASMID: PET-15B; +SOURCE 9 OTHER_DETAILS: NOVAGEN +KEYWDS CARBAMATE KINASE, AMINO ACID KINASE, ARGININE BIOSYNTHESIS, +KEYWDS 2 PHOSPHORYL GROUP TRANSFER, TRANSFERASE +EXPDTA X-RAY DIFFRACTION +AUTHOR S.RAMON-MAIQUES,A.MARINA,F.GIL-ORTIZ,I.FITA,V.RUBIO +REVDAT 3 05-FEB-14 1GS5 1 HEADER SOURCE KEYWDS REMARK +REVDAT 3 2 VERSN FORMUL SITE +REVDAT 2 24-FEB-09 1GS5 1 VERSN +REVDAT 1 16-MAY-02 1GS5 0 +JRNL AUTH S.RAMON-MAIQUES,A.MARINA,F.GIL-ORTIZ,I.FITA,V.RUBIO +JRNL TITL STRUCTURE OF ACETYLGLUTAMATE KINASE, A KEY ENZYME +JRNL TITL 2 FOR ARGININE BIOSYNTHESIS AND A PROTOTYPE FOR THE +JRNL TITL 3 AMINO ACID KINASE ENZYME FAMILY, DURING CATALYSIS +JRNL REF STRUCTURE V. 10 329 2002 +JRNL REFN ISSN 0969-2126 +JRNL PMID 12005432 +JRNL DOI 10.1016/S0969-2126(02)00721-9 +REMARK 2 +REMARK 2 RESOLUTION. 1.5 ANGSTROMS. +REMARK 3 +REMARK 3 REFINEMENT. +REMARK 3 PROGRAM : REFMAC +REMARK 3 AUTHORS : MURSHUDOV,VAGIN,DODSON +REMARK 3 +REMARK 3 DATA USED IN REFINEMENT. +REMARK 3 RESOLUTION RANGE HIGH (ANGSTROMS) : 1.5 +REMARK 3 RESOLUTION RANGE LOW (ANGSTROMS) : 50 +REMARK 3 DATA CUTOFF (SIGMA(F)) : 0.0 +REMARK 3 COMPLETENESS FOR RANGE (%) : 99.9 +REMARK 3 NUMBER OF REFLECTIONS : 35599 +REMARK 3 +REMARK 3 FIT TO DATA USED IN REFINEMENT. +REMARK 3 CROSS-VALIDATION METHOD : THROUGHOUT +REMARK 3 FREE R VALUE TEST SET SELECTION : RANDOM +REMARK 3 R VALUE (WORKING + TEST SET) : NULL +REMARK 3 R VALUE (WORKING SET) : 0.2088 +REMARK 3 FREE R VALUE : 0.2128 +REMARK 3 FREE R VALUE TEST SET SIZE (%) : 5.0 +REMARK 3 FREE R VALUE TEST SET COUNT : 1883 +REMARK 3 +REMARK 3 NUMBER OF NON-HYDROGEN ATOMS USED IN REFINEMENT. +REMARK 3 PROTEIN ATOMS : 1904 +REMARK 3 NUCLEIC ACID ATOMS : 0 +REMARK 3 HETEROGEN ATOMS : 45 +REMARK 3 SOLVENT ATOMS : 198 +REMARK 3 +REMARK 3 B VALUES. +REMARK 3 FROM WILSON PLOT (A**2) : NULL +REMARK 3 MEAN B VALUE (OVERALL, A**2) : NULL +REMARK 3 OVERALL ANISOTROPIC B VALUE. 
+REMARK 3 B11 (A**2) : NULL +REMARK 3 B22 (A**2) : NULL +REMARK 3 B33 (A**2) : NULL +REMARK 3 B12 (A**2) : NULL +REMARK 3 B13 (A**2) : NULL +REMARK 3 B23 (A**2) : NULL +REMARK 3 +REMARK 3 ESTIMATED OVERALL COORDINATE ERROR. +REMARK 3 ESU BASED ON R VALUE (A): NULL +REMARK 3 ESU BASED ON FREE R VALUE (A): 0.09127 +REMARK 3 ESU BASED ON MAXIMUM LIKELIHOOD (A): 0.06101 +REMARK 3 ESU FOR B VALUES BASED ON MAXIMUM LIKELIHOOD (A**2): 1.60017 +REMARK 3 +REMARK 3 RMS DEVIATIONS FROM IDEAL VALUES. +REMARK 3 DISTANCE RESTRAINTS. RMS SIGMA +REMARK 3 BOND LENGTH (A) : NULL ; NULL +REMARK 3 ANGLE DISTANCE (A) : NULL ; NULL +REMARK 3 INTRAPLANAR 1-4 DISTANCE (A) : NULL ; NULL +REMARK 3 H-BOND OR METAL COORDINATION (A) : NULL ; NULL +REMARK 3 +REMARK 3 PLANE RESTRAINT (A) : NULL ; NULL +REMARK 3 CHIRAL-CENTER RESTRAINT (A**3) : NULL ; NULL +REMARK 3 +REMARK 3 NON-BONDED CONTACT RESTRAINTS. +REMARK 3 SINGLE TORSION (A) : NULL ; NULL +REMARK 3 MULTIPLE TORSION (A) : NULL ; NULL +REMARK 3 H-BOND (X...Y) (A) : NULL ; NULL +REMARK 3 H-BOND (X-H...Y) (A) : NULL ; NULL +REMARK 3 +REMARK 3 CONFORMATIONAL TORSION ANGLE RESTRAINTS. +REMARK 3 SPECIFIED (DEGREES) : NULL ; NULL +REMARK 3 PLANAR (DEGREES) : NULL ; NULL +REMARK 3 STAGGERED (DEGREES) : NULL ; NULL +REMARK 3 TRANSVERSE (DEGREES) : NULL ; NULL +REMARK 3 +REMARK 3 ISOTROPIC THERMAL FACTOR RESTRAINTS. RMS SIGMA +REMARK 3 MAIN-CHAIN BOND (A**2) : NULL ; NULL +REMARK 3 MAIN-CHAIN ANGLE (A**2) : NULL ; NULL +REMARK 3 SIDE-CHAIN BOND (A**2) : NULL ; NULL +REMARK 3 SIDE-CHAIN ANGLE (A**2) : NULL ; NULL +REMARK 3 +REMARK 3 OTHER REFINEMENT REMARKS: NONE +REMARK 4 +REMARK 4 1GS5 COMPLIES WITH FORMAT V. 3.30, 13-JUL-11 +REMARK 100 +REMARK 100 THIS ENTRY HAS BEEN PROCESSED BY PDBE ON 15-JAN-02. +REMARK 100 THE PDBE ID CODE IS EBI-9174. 
+REMARK 200 +REMARK 200 EXPERIMENTAL DETAILS +REMARK 200 EXPERIMENT TYPE : X-RAY DIFFRACTION +REMARK 200 DATE OF DATA COLLECTION : 15-MAY-00 +REMARK 200 TEMPERATURE (KELVIN) : 100.0 +REMARK 200 PH : 4.60 +REMARK 200 NUMBER OF CRYSTALS USED : 1 +REMARK 200 +REMARK 200 SYNCHROTRON (Y/N) : Y +REMARK 200 RADIATION SOURCE : ESRF +REMARK 200 BEAMLINE : ID14-1 +REMARK 200 X-RAY GENERATOR MODEL : NULL +REMARK 200 MONOCHROMATIC OR LAUE (M/L) : M +REMARK 200 WAVELENGTH OR RANGE (A) : 1 +REMARK 200 MONOCHROMATOR : NULL +REMARK 200 OPTICS : NULL +REMARK 200 +REMARK 200 DETECTOR TYPE : CCD +REMARK 200 DETECTOR MANUFACTURER : MARRESEARCH +REMARK 200 INTENSITY-INTEGRATION SOFTWARE : MOSFLM +REMARK 200 DATA SCALING SOFTWARE : CCP4 (SCALA) +REMARK 200 +REMARK 200 NUMBER OF UNIQUE REFLECTIONS : 37460 +REMARK 200 RESOLUTION RANGE HIGH (A) : 1.500 +REMARK 200 RESOLUTION RANGE LOW (A) : 53.710 +REMARK 200 REJECTION CRITERIA (SIGMA(I)) : 0.000 +REMARK 200 +REMARK 200 OVERALL. +REMARK 200 COMPLETENESS FOR RANGE (%) : 99.9 +REMARK 200 DATA REDUNDANCY : 5.200 +REMARK 200 R MERGE (I) : NULL +REMARK 200 R SYM (I) : 0.04200 +REMARK 200 FOR THE DATA SET : 9.2000 +REMARK 200 +REMARK 200 IN THE HIGHEST RESOLUTION SHELL. 
+REMARK 200 HIGHEST RESOLUTION SHELL, RANGE HIGH (A) : 1.50 +REMARK 200 HIGHEST RESOLUTION SHELL, RANGE LOW (A) : 1.58 +REMARK 200 COMPLETENESS FOR SHELL (%) : 99.8 +REMARK 200 DATA REDUNDANCY IN SHELL : 4.70 +REMARK 200 R MERGE FOR SHELL (I) : NULL +REMARK 200 R SYM FOR SHELL (I) : 0.34900 +REMARK 200 FOR SHELL : 2.100 +REMARK 200 +REMARK 200 DIFFRACTION PROTOCOL: SINGLE WAVELENGTH +REMARK 200 METHOD USED TO DETERMINE THE STRUCTURE: MOLECULAR REPLACEMENT +REMARK 200 SOFTWARE USED: AMORE +REMARK 200 STARTING MODEL: PDB ENTRY 1GSJ +REMARK 200 +REMARK 200 REMARK: NULL +REMARK 280 +REMARK 280 CRYSTAL +REMARK 280 SOLVENT CONTENT, VS (%): 42 +REMARK 280 MATTHEWS COEFFICIENT, VM (ANGSTROMS**3/DA): 2.1 +REMARK 280 +REMARK 280 CRYSTALLIZATION CONDITIONS: 27-32% PEG MONOMETHYLETHER 2000, +REMARK 280 0.1-0.3M AMMONIUM SULFATE, 5% ETHYLENE GLYCOL, +REMARK 280 0.1M SODIUM ACETATE PH 4.6 +REMARK 290 +REMARK 290 CRYSTALLOGRAPHIC SYMMETRY +REMARK 290 SYMMETRY OPERATORS FOR SPACE GROUP: C 2 2 21 +REMARK 290 +REMARK 290 SYMOP SYMMETRY +REMARK 290 NNNMMM OPERATOR +REMARK 290 1555 X,Y,Z +REMARK 290 2555 -X,-Y,Z+1/2 +REMARK 290 3555 -X,Y,-Z+1/2 +REMARK 290 4555 X,-Y,-Z +REMARK 290 5555 X+1/2,Y+1/2,Z +REMARK 290 6555 -X+1/2,-Y+1/2,Z+1/2 +REMARK 290 7555 -X+1/2,Y+1/2,-Z+1/2 +REMARK 290 8555 X+1/2,-Y+1/2,-Z +REMARK 290 +REMARK 290 WHERE NNN -> OPERATOR NUMBER +REMARK 290 MMM -> TRANSLATION VECTOR +REMARK 290 +REMARK 290 CRYSTALLOGRAPHIC SYMMETRY TRANSFORMATIONS +REMARK 290 THE FOLLOWING TRANSFORMATIONS OPERATE ON THE ATOM/HETATM +REMARK 290 RECORDS IN THIS ENTRY TO PRODUCE CRYSTALLOGRAPHICALLY +REMARK 290 RELATED MOLECULES. 
+REMARK 290 SMTRY1 1 1.000000 0.000000 0.000000 0.00000 +REMARK 290 SMTRY2 1 0.000000 1.000000 0.000000 0.00000 +REMARK 290 SMTRY3 1 0.000000 0.000000 1.000000 0.00000 +REMARK 290 SMTRY1 2 -1.000000 0.000000 0.000000 0.00000 +REMARK 290 SMTRY2 2 0.000000 -1.000000 0.000000 0.00000 +REMARK 290 SMTRY3 2 0.000000 0.000000 1.000000 53.70900 +REMARK 290 SMTRY1 3 -1.000000 0.000000 0.000000 0.00000 +REMARK 290 SMTRY2 3 0.000000 1.000000 0.000000 0.00000 +REMARK 290 SMTRY3 3 0.000000 0.000000 -1.000000 53.70900 +REMARK 290 SMTRY1 4 1.000000 0.000000 0.000000 0.00000 +REMARK 290 SMTRY2 4 0.000000 -1.000000 0.000000 0.00000 +REMARK 290 SMTRY3 4 0.000000 0.000000 -1.000000 0.00000 +REMARK 290 SMTRY1 5 1.000000 0.000000 0.000000 29.78200 +REMARK 290 SMTRY2 5 0.000000 1.000000 0.000000 36.16600 +REMARK 290 SMTRY3 5 0.000000 0.000000 1.000000 0.00000 +REMARK 290 SMTRY1 6 -1.000000 0.000000 0.000000 29.78200 +REMARK 290 SMTRY2 6 0.000000 -1.000000 0.000000 36.16600 +REMARK 290 SMTRY3 6 0.000000 0.000000 1.000000 53.70900 +REMARK 290 SMTRY1 7 -1.000000 0.000000 0.000000 29.78200 +REMARK 290 SMTRY2 7 0.000000 1.000000 0.000000 36.16600 +REMARK 290 SMTRY3 7 0.000000 0.000000 -1.000000 53.70900 +REMARK 290 SMTRY1 8 1.000000 0.000000 0.000000 29.78200 +REMARK 290 SMTRY2 8 0.000000 -1.000000 0.000000 36.16600 +REMARK 290 SMTRY3 8 0.000000 0.000000 -1.000000 0.00000 +REMARK 290 +REMARK 290 REMARK: NULL +REMARK 300 +REMARK 300 BIOMOLECULE: 1 +REMARK 300 SEE REMARK 350 FOR THE AUTHOR PROVIDED AND/OR PROGRAM +REMARK 300 GENERATED ASSEMBLY INFORMATION FOR THE STRUCTURE IN +REMARK 300 THIS ENTRY. THE REMARK MAY ALSO PROVIDE INFORMATION ON +REMARK 300 BURIED SURFACE AREA. +REMARK 350 +REMARK 350 COORDINATES FOR A COMPLETE MULTIMER REPRESENTING THE KNOWN +REMARK 350 BIOLOGICALLY SIGNIFICANT OLIGOMERIZATION STATE OF THE +REMARK 350 MOLECULE CAN BE GENERATED BY APPLYING BIOMT TRANSFORMATIONS +REMARK 350 GIVEN BELOW. 
BOTH NON-CRYSTALLOGRAPHIC AND +REMARK 350 CRYSTALLOGRAPHIC OPERATIONS ARE GIVEN. +REMARK 350 +REMARK 350 BIOMOLECULE: 1 +REMARK 350 AUTHOR DETERMINED BIOLOGICAL UNIT: DIMERIC +REMARK 350 SOFTWARE DETERMINED QUATERNARY STRUCTURE: DIMERIC +REMARK 350 SOFTWARE USED: PQS +REMARK 350 APPLY THE FOLLOWING TO CHAINS: A +REMARK 350 BIOMT1 1 1.000000 0.000000 0.000000 0.00000 +REMARK 350 BIOMT2 1 0.000000 1.000000 0.000000 0.00000 +REMARK 350 BIOMT3 1 0.000000 0.000000 1.000000 0.00000 +REMARK 350 BIOMT1 2 -1.000000 0.000000 0.000000 59.56400 +REMARK 350 BIOMT2 2 0.000000 1.000000 0.000000 0.00000 +REMARK 350 BIOMT3 2 0.000000 0.000000 -1.000000 53.70900 +REMARK 500 +REMARK 500 GEOMETRY AND STEREOCHEMISTRY +REMARK 500 SUBTOPIC: CLOSE CONTACTS IN SAME ASYMMETRIC UNIT +REMARK 500 +REMARK 500 THE FOLLOWING ATOMS ARE IN CLOSE CONTACT. +REMARK 500 +REMARK 500 ATM1 RES C SSEQI ATM2 RES C SSEQI DISTANCE +REMARK 500 O ILE A 75 O HOH A 2064 1.96 +REMARK 500 OE1B GLU A 138 O HOH A 2117 2.08 +REMARK 500 OE1B GLU A 138 O HOH A 2118 1.81 +REMARK 500 O HOH A 2018 O HOH A 2062 2.17 +REMARK 500 O HOH A 2061 O HOH A 2062 2.16 +REMARK 500 O HOH A 2162 O HOH A 2163 2.00 +REMARK 500 O HOH A 2179 O HOH A 2180 1.92 +REMARK 500 O HOH A 2189 O HOH A 2191 1.51 +REMARK 500 +REMARK 500 REMARK: NULL +REMARK 500 +REMARK 500 GEOMETRY AND STEREOCHEMISTRY +REMARK 500 SUBTOPIC: CLOSE CONTACTS +REMARK 500 +REMARK 500 THE FOLLOWING ATOMS THAT ARE RELATED BY CRYSTALLOGRAPHIC +REMARK 500 SYMMETRY ARE IN CLOSE CONTACT. AN ATOM LOCATED WITHIN 0.15 +REMARK 500 ANGSTROMS OF A SYMMETRY RELATED ATOM IS ASSUMED TO BE ON A +REMARK 500 SPECIAL POSITION AND IS, THEREFORE, LISTED IN REMARK 375 +REMARK 500 INSTEAD OF REMARK 500. ATOMS WITH NON-BLANK ALTERNATE +REMARK 500 LOCATION INDICATORS ARE NOT INCLUDED IN THE CALCULATIONS. 
+REMARK 500 +REMARK 500 DISTANCE CUTOFF: +REMARK 500 2.2 ANGSTROMS FOR CONTACTS NOT INVOLVING HYDROGEN ATOMS +REMARK 500 1.6 ANGSTROMS FOR CONTACTS INVOLVING HYDROGEN ATOMS +REMARK 500 +REMARK 500 ATM1 RES C SSEQI ATM2 RES C SSEQI SSYMOP DISTANCE +REMARK 500 CA MET A 1 OE2B GLU A 117 5455 2.18 +REMARK 500 O A HOH A 2066 O A HOH A 2066 3655 0.44 +REMARK 500 +REMARK 500 REMARK: NULL +REMARK 500 +REMARK 500 GEOMETRY AND STEREOCHEMISTRY +REMARK 500 SUBTOPIC: COVALENT BOND LENGTHS +REMARK 500 +REMARK 500 THE STEREOCHEMICAL PARAMETERS OF THE FOLLOWING RESIDUES +REMARK 500 HAVE VALUES WHICH DEVIATE FROM EXPECTED VALUES BY MORE +REMARK 500 THAN 6*RMSD (M=MODEL NUMBER; RES=RESIDUE NAME; C=CHAIN +REMARK 500 IDENTIFIER; SSEQ=SEQUENCE NUMBER; I=INSERTION CODE). +REMARK 500 +REMARK 500 STANDARD TABLE: +REMARK 500 FORMAT: (10X,I3,1X,2(A3,1X,A1,I4,A1,1X,A4,3X),1X,F6.3) +REMARK 500 +REMARK 500 EXPECTED VALUES PROTEIN: ENGH AND HUBER, 1999 +REMARK 500 EXPECTED VALUES NUCLEIC ACID: CLOWNEY ET AL 1996 +REMARK 500 +REMARK 500 M RES CSSEQI ATM1 RES CSSEQI ATM2 DEVIATION +REMARK 500 MET A 1 CG A MET A 1 SD A 0.160 +REMARK 500 +REMARK 500 REMARK: NULL +REMARK 500 +REMARK 500 GEOMETRY AND STEREOCHEMISTRY +REMARK 500 SUBTOPIC: COVALENT BOND ANGLES +REMARK 500 +REMARK 500 THE STEREOCHEMICAL PARAMETERS OF THE FOLLOWING RESIDUES +REMARK 500 HAVE VALUES WHICH DEVIATE FROM EXPECTED VALUES BY MORE +REMARK 500 THAN 6*RMSD (M=MODEL NUMBER; RES=RESIDUE NAME; C=CHAIN +REMARK 500 IDENTIFIER; SSEQ=SEQUENCE NUMBER; I=INSERTION CODE). +REMARK 500 +REMARK 500 STANDARD TABLE: +REMARK 500 FORMAT: (10X,I3,1X,A3,1X,A1,I4,A1,3(1X,A4,2X),12X,F5.1) +REMARK 500 +REMARK 500 EXPECTED VALUES PROTEIN: ENGH AND HUBER, 1999 +REMARK 500 EXPECTED VALUES NUCLEIC ACID: CLOWNEY ET AL 1996 +REMARK 500 +REMARK 500 M RES CSSEQI ATM1 ATM2 ATM3 +REMARK 500 ARG A 22 CD - NE - CZ ANGL. DEV. = 11.5 DEGREES +REMARK 500 ARG A 36 NE - CZ - NH1 ANGL. DEV. = 6.1 DEGREES +REMARK 500 ARG A 66 NE - CZ - NH1 ANGL. DEV. 
= 3.0 DEGREES +REMARK 500 ASP A 74 CB - CG - OD2 ANGL. DEV. = 7.0 DEGREES +REMARK 500 HIS A 95 CE1 - NE2 - CD2 ANGL. DEV. = 6.6 DEGREES +REMARK 500 PHE A 103 CB - CG - CD1 ANGL. DEV. = -5.1 DEGREES +REMARK 500 ASP A 152 CB - CG - OD1 ANGL. DEV. = 5.5 DEGREES +REMARK 500 ARG A 192 CD - NE - CZ ANGL. DEV. = 9.3 DEGREES +REMARK 500 ARG A 192 NE - CZ - NH1 ANGL. DEV. = -6.7 DEGREES +REMARK 500 ARG A 192 NE - CZ - NH2 ANGL. DEV. = 3.7 DEGREES +REMARK 500 GLU A 202 CG - CD - OE1 ANGL. DEV. = 12.0 DEGREES +REMARK 500 VAL A 218 O - C - N ANGL. DEV. = -9.8 DEGREES +REMARK 500 ASP A 233 O - C - N ANGL. DEV. = 11.0 DEGREES +REMARK 500 ILE A 234 O - C - N ANGL. DEV. = -10.0 DEGREES +REMARK 500 GLU A 241 OE1 - CD - OE2 ANGL. DEV. = -9.7 DEGREES +REMARK 500 MET A 250 CG - SD - CE ANGL. DEV. = 10.5 DEGREES +REMARK 500 +REMARK 500 REMARK: NULL +REMARK 500 +REMARK 500 GEOMETRY AND STEREOCHEMISTRY +REMARK 500 SUBTOPIC: TORSION ANGLES +REMARK 500 +REMARK 500 TORSION ANGLES OUTSIDE THE EXPECTED RAMACHANDRAN REGIONS: +REMARK 500 (M=MODEL NUMBER; RES=RESIDUE NAME; C=CHAIN IDENTIFIER; +REMARK 500 SSEQ=SEQUENCE NUMBER; I=INSERTION CODE). +REMARK 500 +REMARK 500 STANDARD TABLE: +REMARK 500 FORMAT:(10X,I3,1X,A3,1X,A1,I4,A1,4X,F7.2,3X,F7.2) +REMARK 500 +REMARK 500 EXPECTED VALUES: GJ KLEYWEGT AND TA JONES (1996). PHI/PSI- +REMARK 500 CHOLOGY: RAMACHANDRAN REVISITED. 
STRUCTURE 4, 1395 - 1400 +REMARK 500 +REMARK 500 M RES CSSEQI PSI PHI +REMARK 500 ASN A 56 38.28 70.36 +REMARK 500 ASP A 212 -129.56 53.62 +REMARK 500 +REMARK 500 REMARK: NULL +REMARK 620 +REMARK 620 METAL COORDINATION +REMARK 620 (M=MODEL NUMBER; RES=RESIDUE NAME; C=CHAIN IDENTIFIER; +REMARK 620 SSEQ=SEQUENCE NUMBER; I=INSERTION CODE): +REMARK 620 +REMARK 620 COORDINATION ANGLES FOR: M RES CSSEQI METAL +REMARK 620 MG A1261 MG +REMARK 620 N RES CSSEQI ATOM +REMARK 620 1 ANP A1260 O2G +REMARK 620 2 ANP A1260 O2A 94.0 +REMARK 620 3 ANP A1260 O1B 80.5 89.0 +REMARK 620 4 HOH A2195 O 82.5 175.0 86.9 +REMARK 620 5 HOH A2135 O 166.7 97.3 106.4 86.6 +REMARK 620 N 1 2 3 4 +REMARK 800 +REMARK 800 SITE +REMARK 800 SITE_IDENTIFIER: AC1 +REMARK 800 EVIDENCE_CODE: SOFTWARE +REMARK 800 SITE_DESCRIPTION: BINDING SITE FOR RESIDUE MG A1261 +REMARK 800 +REMARK 800 SITE_IDENTIFIER: AC2 +REMARK 800 EVIDENCE_CODE: SOFTWARE +REMARK 800 SITE_DESCRIPTION: BINDING SITE FOR RESIDUE NLG A1259 +REMARK 800 +REMARK 800 SITE_IDENTIFIER: AC3 +REMARK 800 EVIDENCE_CODE: SOFTWARE +REMARK 800 SITE_DESCRIPTION: BINDING SITE FOR RESIDUE ANP A1260 +DBREF 1GS5 A 1 258 UNP P11445 ARGB_ECOLI 1 258 +SEQRES 1 A 258 MET MET ASN PRO LEU ILE ILE LYS LEU GLY GLY VAL LEU +SEQRES 2 A 258 LEU ASP SER GLU GLU ALA LEU GLU ARG LEU PHE SER ALA +SEQRES 3 A 258 LEU VAL ASN TYR ARG GLU SER HIS GLN ARG PRO LEU VAL +SEQRES 4 A 258 ILE VAL HIS GLY GLY GLY CYS VAL VAL ASP GLU LEU MET +SEQRES 5 A 258 LYS GLY LEU ASN LEU PRO VAL LYS LYS LYS ASN GLY LEU +SEQRES 6 A 258 ARG VAL THR PRO ALA ASP GLN ILE ASP ILE ILE THR GLY +SEQRES 7 A 258 ALA LEU ALA GLY THR ALA ASN LYS THR LEU LEU ALA TRP +SEQRES 8 A 258 ALA LYS LYS HIS GLN ILE ALA ALA VAL GLY LEU PHE LEU +SEQRES 9 A 258 GLY ASP GLY ASP SER VAL LYS VAL THR GLN LEU ASP GLU +SEQRES 10 A 258 GLU LEU GLY HIS VAL GLY LEU ALA GLN PRO GLY SER PRO +SEQRES 11 A 258 LYS LEU ILE ASN SER LEU LEU GLU ASN GLY TYR LEU PRO +SEQRES 12 A 258 VAL VAL SER SER ILE GLY VAL THR ASP GLU GLY GLN LEU 
+SEQRES 13 A 258 MET ASN VAL ASN ALA ASP GLN ALA ALA THR ALA LEU ALA +SEQRES 14 A 258 ALA THR LEU GLY ALA ASP LEU ILE LEU LEU SER ASP VAL +SEQRES 15 A 258 SER GLY ILE LEU ASP GLY LYS GLY GLN ARG ILE ALA GLU +SEQRES 16 A 258 MET THR ALA ALA LYS ALA GLU GLN LEU ILE GLU GLN GLY +SEQRES 17 A 258 ILE ILE THR ASP GLY MET ILE VAL LYS VAL ASN ALA ALA +SEQRES 18 A 258 LEU ASP ALA ALA ARG THR LEU GLY ARG PRO VAL ASP ILE +SEQRES 19 A 258 ALA SER TRP ARG HIS ALA GLU GLN LEU PRO ALA LEU PHE +SEQRES 20 A 258 ASN GLY MET PRO MET GLY THR ARG ILE LEU ALA +HET MG A1261 1 +HET NLG A1259 13 +HET ANP A1260 31 +HETNAM MG MAGNESIUM ION +HETNAM NLG N-ACETYL-L-GLUTAMATE +HETNAM ANP PHOSPHOAMINOPHOSPHONIC ACID-ADENYLATE ESTER +FORMUL 2 MG MG 2+ +FORMUL 3 NLG C7 H11 N O5 +FORMUL 4 ANP C10 H17 N6 O12 P3 +FORMUL 5 HOH *198(H2 O) +HELIX 1 1 GLY A 11 ASP A 15 5 5 +HELIX 2 2 SER A 16 GLU A 32 1 17 +HELIX 3 3 GLY A 44 ASN A 56 1 13 +HELIX 4 4 PRO A 69 GLY A 82 1 14 +HELIX 5 5 GLY A 82 HIS A 95 1 14 +HELIX 6 6 GLY A 105 ASP A 108 5 4 +HELIX 7 7 ASP A 116 LEU A 119 5 4 +HELIX 8 8 PRO A 130 ASN A 139 1 10 +HELIX 9 9 ASN A 160 GLY A 173 1 14 +HELIX 10 10 THR A 197 GLN A 207 1 11 +HELIX 11 11 ASP A 212 GLY A 229 1 18 +HELIX 12 12 HIS A 239 GLU A 241 5 3 +HELIX 13 13 GLN A 242 ASN A 248 1 7 +SHEET 1 AA 8 ALA A 99 LEU A 102 0 +SHEET 2 AA 8 LEU A 142 VAL A 145 1 O LEU A 142 N VAL A 100 +SHEET 3 AA 8 LEU A 38 HIS A 42 1 O ILE A 40 N VAL A 145 +SHEET 4 AA 8 LEU A 5 LEU A 9 1 O LEU A 5 N VAL A 39 +SHEET 5 AA 8 ASP A 175 SER A 180 1 O ASP A 175 N ILE A 6 +SHEET 6 AA 8 VAL A 232 SER A 236 1 O ASP A 233 N LEU A 178 +SHEET 7 AA 8 THR A 254 ILE A 256 -1 O THR A 254 N ILE A 234 +SHEET 8 AA 8 GLU A 195 MET A 196 1 N MET A 196 O ARG A 255 +SHEET 1 AB 2 LYS A 61 LYS A 62 0 +SHEET 2 AB 2 LEU A 65 ARG A 66 -1 O LEU A 65 N LYS A 62 +SHEET 1 AC 2 VAL A 110 GLN A 114 0 +SHEET 2 AC 2 GLY A 123 PRO A 127 -1 O LEU A 124 N THR A 113 +SHEET 1 AD 2 ILE A 148 VAL A 150 0 +SHEET 2 AD 2 LEU A 156 ASN A 158 -1 O MET A 157 N GLY A 
149 +LINK MG MG A1261 O2G ANP A1260 1555 1555 2.77 +LINK MG MG A1261 O2A ANP A1260 1555 1555 2.13 +LINK MG MG A1261 O1B ANP A1260 1555 1555 2.18 +LINK MG MG A1261 O HOH A2195 1555 1555 2.51 +LINK MG MG A1261 O HOH A2135 1555 1555 2.65 +SITE 1 AC1 3 ANP A1260 HOH A2135 HOH A2195 +SITE 1 AC2 14 GLY A 43 GLY A 44 GLY A 45 LEU A 65 +SITE 2 AC2 14 ARG A 66 LEU A 80 ASN A 158 VAL A 159 +SITE 3 AC2 14 ASN A 160 ALA A 161 ANP A1260 HOH A2194 +SITE 4 AC2 14 HOH A2195 HOH A2196 +SITE 1 AC3 18 LYS A 8 GLY A 10 GLY A 11 GLY A 43 +SITE 2 AC3 18 GLY A 44 GLY A 45 SER A 180 VAL A 182 +SITE 3 AC3 18 LEU A 186 ILE A 209 ILE A 210 THR A 211 +SITE 4 AC3 18 MET A 214 LYS A 217 NLG A1259 MG A1261 +SITE 5 AC3 18 HOH A2197 HOH A2198 +CRYST1 59.564 72.332 107.418 90.00 90.00 90.00 C 2 2 21 8 +ORIGX1 1.000000 0.000000 0.000000 0.00000 +ORIGX2 0.000000 1.000000 0.000000 0.00000 +ORIGX3 0.000000 0.000000 1.000000 0.00000 +SCALE1 0.016789 0.000000 0.000000 0.00000 +SCALE2 0.000000 0.013825 0.000000 0.00000 +SCALE3 0.000000 0.000000 0.009309 0.00000 +ATOM 1 N MET A 1 24.253 42.093 39.424 0.80 37.50 N +ATOM 2 CA MET A 1 23.934 40.679 39.655 0.80 43.15 C +ATOM 3 C MET A 1 24.107 40.294 41.120 0.80 24.96 C +ATOM 4 O MET A 1 25.075 40.676 41.786 0.80 28.17 O +ATOM 5 CB MET A 1 24.818 39.772 38.781 0.80 31.53 C +ATOM 6 CG AMET A 1 24.292 38.366 38.581 0.40 29.84 C +ATOM 7 SD AMET A 1 24.778 37.899 36.733 0.40 27.07 S +ATOM 8 CE AMET A 1 23.236 37.515 35.913 0.40 16.85 C +ATOM 9 CG BMET A 1 24.165 38.481 38.333 0.40 29.84 C +ATOM 10 SD BMET A 1 25.130 37.601 37.081 0.40 27.07 S +ATOM 11 CE BMET A 1 26.787 37.868 37.699 0.40 16.85 C +ATOM 12 N MET A 2 22.989 39.586 41.607 1.00 30.55 N +ATOM 13 CA MET A 2 23.062 38.897 42.951 1.00 28.36 C +ATOM 14 C MET A 2 24.073 37.739 42.978 1.00 31.79 C +ATOM 15 O MET A 2 24.506 37.338 41.905 1.00 32.49 O +ATOM 16 CB MET A 2 21.681 38.351 43.319 1.00 29.60 C +ATOM 17 CG MET A 2 20.594 39.436 43.403 1.00 38.10 C +ATOM 18 SD MET A 2 18.988 38.752 43.793 1.00 31.47 S 
+ATOM 19 CE MET A 2 19.305 37.947 45.377 1.00 35.42 C +ATOM 20 N ASN A 3 24.447 37.287 44.182 1.00 29.54 N +ATOM 21 CA ASN A 3 25.336 36.087 44.249 1.00 24.06 C +ATOM 22 C ASN A 3 24.464 35.025 43.632 1.00 25.04 C +ATOM 23 O ASN A 3 23.330 34.850 43.983 1.00 26.15 O +ATOM 24 CB ASN A 3 25.612 35.734 45.711 1.00 27.62 C +ATOM 25 CG ASN A 3 26.550 36.708 46.402 1.00 25.05 C +ATOM 26 OD1 ASN A 3 26.421 36.918 47.625 1.00 38.75 O +ATOM 27 ND2 ASN A 3 27.446 37.342 45.705 1.00 26.17 N +ATOM 28 N PRO A 4 25.095 34.110 42.829 1.00 19.86 N +ATOM 29 CA PRO A 4 24.259 33.092 42.262 1.00 19.79 C +ATOM 30 C PRO A 4 23.906 32.006 43.282 1.00 17.56 C +ATOM 31 O PRO A 4 24.511 31.965 44.390 1.00 20.62 O +ATOM 32 CB PRO A 4 25.207 32.403 41.231 1.00 19.65 C +ATOM 33 CG PRO A 4 26.327 33.332 41.045 1.00 21.41 C +ATOM 34 CD PRO A 4 26.446 34.227 42.242 1.00 22.15 C +ATOM 35 N LEU A 5 22.980 31.173 42.921 1.00 17.70 N +ATOM 36 CA LEU A 5 22.707 29.926 43.672 1.00 18.00 C +ATOM 37 C LEU A 5 23.099 28.712 42.823 1.00 19.49 C +ATOM 38 O LEU A 5 22.599 28.595 41.699 1.00 20.68 O +ATOM 39 CB LEU A 5 21.200 29.774 43.958 1.00 22.46 C +ATOM 40 CG LEU A 5 20.718 28.483 44.572 1.00 20.27 C +ATOM 41 CD1 LEU A 5 21.321 28.204 45.956 1.00 21.37 C +ATOM 42 CD2 LEU A 5 19.176 28.495 44.714 1.00 24.43 C +ATOM 43 N ILE A 6 24.007 27.871 43.350 1.00 17.73 N +ATOM 44 CA ILE A 6 24.301 26.613 42.663 1.00 19.08 C +ATOM 45 C ILE A 6 23.374 25.530 43.208 1.00 15.73 C +ATOM 46 O ILE A 6 23.317 25.351 44.467 1.00 18.35 O +ATOM 47 CB ILE A 6 25.781 26.203 42.875 1.00 16.06 C +ATOM 48 CG1 ILE A 6 26.692 27.226 42.153 1.00 17.17 C +ATOM 49 CG2 ILE A 6 25.926 24.769 42.432 1.00 16.70 C +ATOM 50 CD1 ILE A 6 28.166 27.062 42.568 1.00 19.33 C +ATOM 51 N ILE A 7 22.689 24.801 42.421 1.00 16.57 N +ATOM 52 CA ILE A 7 21.918 23.641 42.756 1.00 16.51 C +ATOM 53 C ILE A 7 22.724 22.457 42.262 1.00 20.31 C +ATOM 54 O ILE A 7 22.893 22.379 41.020 1.00 19.00 O +ATOM 55 CB ILE A 7 20.491 23.680 42.219 1.00 18.84 C +ATOM 56 
CG1 ILE A 7 19.772 24.945 42.727 1.00 23.22 C +ATOM 57 CG2 ILE A 7 19.753 22.447 42.673 1.00 21.76 C +ATOM 58 CD1 ILE A 7 18.333 25.195 42.336 1.00 30.01 C +ATOM 59 N LYS A 8 23.215 21.573 43.104 1.00 18.43 N +ATOM 60 CA LYS A 8 23.906 20.378 42.658 1.00 16.51 C +ATOM 61 C LYS A 8 23.002 19.188 42.550 1.00 16.18 C +ATOM 62 O LYS A 8 22.235 18.963 43.557 1.00 19.00 O +ATOM 63 CB LYS A 8 25.077 20.137 43.607 1.00 16.92 C +ATOM 64 CG LYS A 8 25.933 18.936 43.229 1.00 19.51 C +ATOM 65 CD LYS A 8 25.470 17.640 43.859 1.00 21.01 C +ATOM 66 CE LYS A 8 26.293 16.485 43.267 1.00 19.12 C +ATOM 67 NZ LYS A 8 26.049 15.239 44.090 1.00 20.93 N +ATOM 68 N LEU A 9 22.942 18.504 41.463 1.00 18.78 N +ATOM 69 CA LEU A 9 22.079 17.380 41.237 1.00 18.42 C +ATOM 70 C LEU A 9 22.775 16.065 41.091 1.00 21.03 C +ATOM 71 O LEU A 9 23.868 16.010 40.535 1.00 22.99 O +ATOM 72 CB LEU A 9 21.322 17.606 39.875 1.00 20.19 C +ATOM 73 CG LEU A 9 20.510 18.877 39.848 1.00 22.66 C +ATOM 74 CD1 LEU A 9 19.843 18.962 38.458 1.00 22.37 C +ATOM 75 CD2 LEU A 9 19.404 18.874 40.888 1.00 23.49 C +ATOM 76 N GLY A 10 22.368 15.041 41.828 1.00 29.61 N +ATOM 77 CA GLY A 10 23.021 13.733 41.577 1.00 26.76 C +ATOM 78 C GLY A 10 22.067 12.643 42.097 1.00 36.89 C +ATOM 79 O GLY A 10 20.878 12.907 42.292 1.00 39.46 O +ATOM 80 N GLY A 11 22.630 11.462 42.280 1.00 46.11 N +ATOM 81 CA GLY A 11 21.827 10.332 42.793 1.00 40.51 C +ATOM 82 C GLY A 11 21.087 9.712 41.611 1.00 36.38 C +ATOM 83 O GLY A 11 21.511 9.865 40.468 1.00 40.83 O +ATOM 84 N VAL A 12 20.047 8.944 41.909 1.00 32.05 N +ATOM 85 CA VAL A 12 19.290 8.300 40.864 1.00 32.20 C +ATOM 86 C VAL A 12 18.294 9.233 40.176 1.00 32.88 C +ATOM 87 O VAL A 12 17.548 8.753 39.337 1.00 33.75 O +ATOM 88 CB VAL A 12 18.516 7.101 41.477 1.00 39.90 C +ATOM 89 CG1 VAL A 12 17.687 6.361 40.445 1.00 53.00 C +ATOM 90 CG2 VAL A 12 19.522 6.157 42.115 1.00 41.73 C +ATOM 91 N LEU A 13 18.419 10.555 40.354 1.00 32.14 N +ATOM 92 CA LEU A 13 17.473 11.490 39.754 1.00 31.41 C +ATOM 93 C 
LEU A 13 17.361 11.345 38.256 1.00 35.13 C +ATOM 94 O LEU A 13 16.254 11.459 37.756 1.00 33.66 O +ATOM 95 CB LEU A 13 17.875 12.945 40.029 1.00 29.40 C +ATOM 96 CG LEU A 13 17.276 14.058 39.168 1.00 35.80 C +ATOM 97 CD1 LEU A 13 15.840 14.364 39.558 1.00 29.16 C +ATOM 98 CD2 LEU A 13 18.125 15.331 39.286 1.00 36.69 C +ATOM 99 N LEU A 14 18.473 11.195 37.543 1.00 33.13 N +ATOM 100 CA LEU A 14 18.498 11.070 36.086 1.00 31.27 C +ATOM 101 C LEU A 14 17.787 9.850 35.573 1.00 38.82 C +ATOM 102 O LEU A 14 17.333 9.803 34.420 1.00 56.83 O +ATOM 103 CB LEU A 14 19.970 11.091 35.601 1.00 49.13 C +ATOM 104 CG LEU A 14 20.774 12.283 36.218 1.00 55.18 C +ATOM 105 CD1 LEU A 14 22.264 12.216 35.800 1.00 61.69 C +ATOM 106 CD2 LEU A 14 20.183 13.574 35.569 1.00 50.05 C +ATOM 107 N ASP A 15 17.595 8.867 36.450 1.00 43.35 N +ATOM 108 CA ASP A 15 16.872 7.672 35.990 1.00 50.65 C +ATOM 109 C ASP A 15 15.374 7.875 36.166 1.00 51.88 C +ATOM 110 O ASP A 15 14.598 6.978 35.829 1.00 41.77 O +ATOM 111 CB ASP A 15 17.390 6.424 36.699 1.00 58.73 C +ATOM 112 CG ASP A 15 18.815 6.118 36.247 1.00 62.03 C +ATOM 113 OD1 ASP A 15 19.069 6.218 35.029 1.00 66.55 O +ATOM 114 OD2 ASP A 15 19.656 5.804 37.107 1.00 67.92 O +ATOM 115 N SER A 16 14.971 9.083 36.602 1.00 37.80 N +ATOM 116 CA SER A 16 13.537 9.266 36.835 1.00 32.01 C +ATOM 117 C SER A 16 12.928 10.407 36.047 1.00 33.54 C +ATOM 118 O SER A 16 13.113 11.568 36.411 1.00 30.12 O +ATOM 119 CB SER A 16 13.252 9.476 38.314 1.00 37.85 C +ATOM 120 OG SER A 16 11.863 9.711 38.469 1.00 37.52 O +ATOM 121 N GLU A 17 12.265 10.089 34.937 1.00 32.24 N +ATOM 122 CA GLU A 17 11.565 11.098 34.149 1.00 30.10 C +ATOM 123 C GLU A 17 10.605 11.930 34.983 1.00 28.78 C +ATOM 124 O GLU A 17 10.501 13.131 34.839 1.00 29.81 O +ATOM 125 CB AGLU A 17 10.650 10.395 33.115 0.50 28.68 C +ATOM 126 CG AGLU A 17 11.475 9.439 32.268 0.50 30.16 C +ATOM 127 CD AGLU A 17 12.517 10.180 31.451 0.50 38.24 C +ATOM 128 OE1AGLU A 17 13.629 10.390 31.974 0.50 40.25 O +ATOM 129 OE2AGLU A 
17 12.253 10.556 30.290 0.50 48.25 O +ATOM 130 CB BGLU A 17 10.775 10.414 33.006 0.50 28.68 C +ATOM 131 CG BGLU A 17 10.043 11.404 32.096 0.50 30.16 C +ATOM 132 CD BGLU A 17 9.247 10.718 30.984 0.50 38.24 C +ATOM 133 OE1BGLU A 17 9.251 9.432 30.887 0.50 40.25 O +ATOM 134 OE2BGLU A 17 8.571 11.426 30.144 0.50 48.25 O +ATOM 135 N GLU A 18 9.789 11.246 35.801 1.00 28.02 N +ATOM 136 CA GLU A 18 8.854 11.962 36.647 1.00 28.30 C +ATOM 137 C GLU A 18 9.587 12.936 37.562 1.00 27.48 C +ATOM 138 O GLU A 18 9.174 14.088 37.661 1.00 28.75 O +ATOM 139 CB GLU A 18 7.997 10.989 37.465 1.00 37.22 C +ATOM 140 CG GLU A 18 6.787 11.630 38.122 1.00 48.35 C +ATOM 141 CD GLU A 18 5.894 10.566 38.755 1.00 64.19 C +ATOM 142 OE1 GLU A 18 5.702 9.469 38.182 1.00 63.38 O +ATOM 143 OE2 GLU A 18 5.377 10.840 39.865 1.00 69.84 O +ATOM 144 N ALA A 19 10.682 12.512 38.223 1.00 25.43 N +ATOM 145 CA ALA A 19 11.411 13.402 39.127 1.00 25.70 C +ATOM 146 C ALA A 19 12.057 14.575 38.375 1.00 21.88 C +ATOM 147 O ALA A 19 12.029 15.683 38.850 1.00 21.67 O +ATOM 148 CB ALA A 19 12.473 12.555 39.832 1.00 25.77 C +ATOM 149 N LEU A 20 12.529 14.335 37.173 1.00 21.78 N +ATOM 150 CA LEU A 20 13.124 15.396 36.348 1.00 23.84 C +ATOM 151 C LEU A 20 12.076 16.419 35.981 1.00 23.00 C +ATOM 152 O LEU A 20 12.300 17.615 36.007 1.00 24.46 O +ATOM 153 CB LEU A 20 13.726 14.795 35.059 1.00 26.78 C +ATOM 154 CG LEU A 20 15.072 14.111 35.296 1.00 27.34 C +ATOM 155 CD1 LEU A 20 15.439 13.148 34.169 1.00 30.62 C +ATOM 156 CD2 LEU A 20 16.212 15.089 35.532 1.00 26.74 C +ATOM 157 N GLU A 21 10.872 15.923 35.570 1.00 22.91 N +ATOM 158 CA GLU A 21 9.805 16.875 35.239 1.00 25.09 C +ATOM 159 C GLU A 21 9.443 17.712 36.426 1.00 22.15 C +ATOM 160 O GLU A 21 9.260 18.948 36.338 1.00 24.22 O +ATOM 161 CB GLU A 21 8.589 16.116 34.655 1.00 27.09 C +ATOM 162 CG GLU A 21 7.445 17.031 34.361 1.00 26.82 C +ATOM 163 CD GLU A 21 7.773 18.090 33.316 1.00 31.77 C +ATOM 164 OE1 GLU A 21 7.301 19.230 33.487 1.00 37.48 O +ATOM 165 OE2 GLU A 21 
8.554 17.840 32.367 1.00 34.69 O +ATOM 166 N ARG A 22 9.241 17.067 37.610 1.00 23.76 N +ATOM 167 CA ARG A 22 8.900 17.866 38.775 1.00 22.93 C +ATOM 168 C ARG A 22 9.987 18.847 39.181 1.00 26.25 C +ATOM 169 O ARG A 22 9.767 19.951 39.622 1.00 22.08 O +ATOM 170 CB ARG A 22 8.510 17.045 40.004 1.00 25.42 C +ATOM 171 CG ARG A 22 7.291 16.159 39.863 1.00 33.19 C +ATOM 172 CD ARG A 22 5.976 16.914 39.773 1.00 40.18 C +ATOM 173 NE ARG A 22 5.824 17.742 38.612 1.00 43.69 N +ATOM 174 CZ ARG A 22 5.031 18.740 38.273 1.00 43.06 C +ATOM 175 NH1 ARG A 22 4.074 19.198 39.090 1.00 47.69 N +ATOM 176 NH2 ARG A 22 5.202 19.298 37.083 1.00 47.92 N +ATOM 177 N LEU A 23 11.271 18.467 39.003 1.00 20.08 N +ATOM 178 CA LEU A 23 12.349 19.382 39.311 1.00 20.33 C +ATOM 179 C LEU A 23 12.393 20.558 38.344 1.00 18.38 C +ATOM 180 O LEU A 23 12.515 21.678 38.783 1.00 19.95 O +ATOM 181 CB LEU A 23 13.651 18.546 39.212 1.00 20.30 C +ATOM 182 CG LEU A 23 14.891 19.429 39.327 1.00 21.55 C +ATOM 183 CD1 LEU A 23 15.100 19.970 40.729 1.00 25.63 C +ATOM 184 CD2 LEU A 23 16.114 18.623 38.856 1.00 31.43 C +ATOM 185 N PHE A 24 12.344 20.255 37.040 1.00 20.79 N +ATOM 186 CA PHE A 24 12.400 21.353 36.048 1.00 20.85 C +ATOM 187 C PHE A 24 11.193 22.283 36.218 1.00 20.69 C +ATOM 188 O PHE A 24 11.333 23.477 36.007 1.00 21.73 O +ATOM 189 CB PHE A 24 12.645 20.834 34.613 1.00 20.82 C +ATOM 190 CG PHE A 24 14.145 20.622 34.404 1.00 21.05 C +ATOM 191 CD1 PHE A 24 14.779 19.446 34.819 1.00 19.80 C +ATOM 192 CD2 PHE A 24 14.902 21.643 33.812 1.00 24.61 C +ATOM 193 CE1 PHE A 24 16.141 19.331 34.671 1.00 21.64 C +ATOM 194 CE2 PHE A 24 16.271 21.507 33.635 1.00 20.95 C +ATOM 195 CZ PHE A 24 16.886 20.347 34.066 1.00 20.90 C +ATOM 196 N SER A 25 10.023 21.707 36.575 1.00 22.37 N +ATOM 197 CA SER A 25 8.907 22.629 36.868 1.00 27.50 C +ATOM 198 C SER A 25 9.284 23.632 37.920 1.00 21.07 C +ATOM 199 O SER A 25 9.008 24.860 37.879 1.00 23.47 O +ATOM 200 CB SER A 25 7.723 21.773 37.369 1.00 27.15 C +ATOM 201 OG SER A 25 
6.688 22.638 37.875 1.00 32.64 O +ATOM 202 N ALA A 26 9.885 23.154 39.011 1.00 21.22 N +ATOM 203 CA ALA A 26 10.242 23.990 40.119 1.00 19.80 C +ATOM 204 C ALA A 26 11.382 24.992 39.830 1.00 21.37 C +ATOM 205 O ALA A 26 11.460 26.101 40.322 1.00 24.49 O +ATOM 206 CB ALA A 26 10.719 23.061 41.260 1.00 24.08 C +ATOM 207 N LEU A 27 12.274 24.590 38.898 1.00 22.41 N +ATOM 208 CA LEU A 27 13.387 25.473 38.528 1.00 21.99 C +ATOM 209 C LEU A 27 12.827 26.613 37.683 1.00 22.00 C +ATOM 210 O LEU A 27 13.260 27.736 37.801 1.00 22.06 O +ATOM 211 CB LEU A 27 14.391 24.708 37.638 1.00 23.96 C +ATOM 212 CG LEU A 27 15.200 23.658 38.376 1.00 25.48 C +ATOM 213 CD1 LEU A 27 16.172 22.930 37.435 1.00 25.52 C +ATOM 214 CD2 LEU A 27 16.002 24.390 39.451 1.00 31.77 C +ATOM 215 N VAL A 28 11.927 26.314 36.754 1.00 19.60 N +ATOM 216 CA VAL A 28 11.351 27.368 35.928 1.00 23.25 C +ATOM 217 C VAL A 28 10.586 28.333 36.829 1.00 23.51 C +ATOM 218 O VAL A 28 10.685 29.539 36.673 1.00 24.98 O +ATOM 219 CB VAL A 28 10.407 26.811 34.878 1.00 24.41 C +ATOM 220 CG1 VAL A 28 9.532 27.918 34.261 1.00 28.86 C +ATOM 221 CG2 VAL A 28 11.119 26.170 33.695 1.00 24.12 C +ATOM 222 N ASN A 29 9.816 27.771 37.807 1.00 22.46 N +ATOM 223 CA ASN A 29 9.088 28.696 38.698 1.00 22.44 C +ATOM 224 C ASN A 29 10.062 29.501 39.523 1.00 24.94 C +ATOM 225 O ASN A 29 9.817 30.709 39.746 1.00 26.08 O +ATOM 226 CB ASN A 29 8.207 27.794 39.598 1.00 26.32 C +ATOM 227 CG ASN A 29 7.569 28.637 40.685 1.00 28.46 C +ATOM 228 OD1 ASN A 29 6.575 29.321 40.411 1.00 30.04 O +ATOM 229 ND2 ASN A 29 8.117 28.630 41.874 1.00 30.43 N +ATOM 230 N TYR A 30 11.158 28.931 39.996 1.00 23.79 N +ATOM 231 CA TYR A 30 12.110 29.721 40.775 1.00 22.93 C +ATOM 232 C TYR A 30 12.726 30.819 39.868 1.00 28.14 C +ATOM 233 O TYR A 30 12.721 31.989 40.243 1.00 26.84 O +ATOM 234 CB TYR A 30 13.295 28.869 41.198 1.00 24.79 C +ATOM 235 CG TYR A 30 14.360 29.645 41.935 1.00 26.66 C +ATOM 236 CD1 TYR A 30 14.342 29.697 43.326 1.00 33.16 C +ATOM 237 CD2 TYR A 30 
15.406 30.267 41.287 1.00 27.95 C +ATOM 238 CE1 TYR A 30 15.313 30.385 44.033 1.00 29.76 C +ATOM 239 CE2 TYR A 30 16.386 30.990 41.993 1.00 31.17 C +ATOM 240 CZ TYR A 30 16.321 31.030 43.364 1.00 35.43 C +ATOM 241 OH TYR A 30 17.319 31.722 44.032 1.00 34.51 O +ATOM 242 N ARG A 31 13.184 30.451 38.677 1.00 25.93 N +ATOM 243 CA ARG A 31 13.791 31.421 37.777 1.00 29.94 C +ATOM 244 C ARG A 31 12.907 32.572 37.387 1.00 30.76 C +ATOM 245 O ARG A 31 13.361 33.688 37.274 1.00 32.12 O +ATOM 246 CB ARG A 31 14.193 30.740 36.464 1.00 26.96 C +ATOM 247 CG ARG A 31 15.517 30.058 36.499 1.00 31.11 C +ATOM 248 CD ARG A 31 15.705 29.170 35.284 1.00 41.58 C +ATOM 249 NE ARG A 31 15.328 29.770 34.014 1.00 34.62 N +ATOM 250 CZ ARG A 31 16.206 30.409 33.213 1.00 27.74 C +ATOM 251 NH1 ARG A 31 15.766 30.902 32.068 1.00 37.77 N +ATOM 252 NH2 ARG A 31 17.438 30.590 33.646 1.00 28.80 N +ATOM 253 N GLU A 32 11.620 32.325 37.181 1.00 28.78 N +ATOM 254 CA GLU A 32 10.699 33.380 36.781 1.00 29.44 C +ATOM 255 C GLU A 32 10.202 34.205 37.939 1.00 27.51 C +ATOM 256 O GLU A 32 9.447 35.188 37.810 1.00 35.11 O +ATOM 257 CB GLU A 32 9.538 32.718 36.034 1.00 36.98 C +ATOM 258 CG GLU A 32 10.117 32.006 34.808 1.00 31.54 C +ATOM 259 CD GLU A 32 10.844 32.917 33.862 1.00 39.68 C +ATOM 260 OE1 GLU A 32 10.490 34.121 33.795 1.00 43.38 O +ATOM 261 OE2 GLU A 32 11.783 32.481 33.160 1.00 45.30 O +ATOM 262 N SER A 33 10.659 33.819 39.153 1.00 30.19 N +ATOM 263 CA SER A 33 10.227 34.575 40.337 1.00 32.12 C +ATOM 264 C SER A 33 11.322 35.066 41.233 1.00 28.63 C +ATOM 265 O SER A 33 11.094 35.541 42.382 1.00 30.90 O +ATOM 266 CB SER A 33 9.256 33.684 41.163 1.00 33.13 C +ATOM 267 OG SER A 33 9.923 32.580 41.707 1.00 30.16 O +ATOM 268 N HIS A 34 12.558 35.009 40.785 1.00 27.30 N +ATOM 269 CA HIS A 34 13.741 35.339 41.555 1.00 30.98 C +ATOM 270 C HIS A 34 14.817 35.941 40.627 1.00 25.65 C +ATOM 271 O HIS A 34 15.082 35.539 39.475 1.00 26.39 O +ATOM 272 CB HIS A 34 14.388 34.097 42.146 1.00 32.37 C +ATOM 273 CG 
HIS A 34 13.667 33.467 43.292 1.00 26.83 C +ATOM 274 ND1 HIS A 34 12.547 32.715 43.203 1.00 38.29 N +ATOM 275 CD2 HIS A 34 14.079 33.498 44.620 1.00 23.42 C +ATOM 276 CE1 HIS A 34 12.218 32.302 44.423 1.00 34.10 C +ATOM 277 NE2 HIS A 34 13.100 32.758 45.279 1.00 31.74 N +ATOM 278 N GLN A 35 15.403 37.002 41.122 1.00 21.37 N +ATOM 279 CA GLN A 35 16.465 37.691 40.388 1.00 22.70 C +ATOM 280 C GLN A 35 17.789 36.942 40.541 1.00 20.95 C +ATOM 281 O GLN A 35 18.677 37.204 39.740 1.00 25.48 O +ATOM 282 CB GLN A 35 16.522 39.159 40.864 1.00 18.90 C +ATOM 283 CG GLN A 35 15.263 39.924 40.334 1.00 22.57 C +ATOM 284 CD GLN A 35 15.135 39.713 38.839 1.00 29.42 C +ATOM 285 OE1 GLN A 35 15.844 40.403 38.100 1.00 28.51 O +ATOM 286 NE2 GLN A 35 14.260 38.789 38.429 1.00 23.18 N +ATOM 287 N ARG A 36 17.874 36.168 41.612 1.00 25.64 N +ATOM 288 CA ARG A 36 19.145 35.426 41.825 1.00 25.34 C +ATOM 289 C ARG A 36 19.370 34.414 40.633 1.00 18.95 C +ATOM 290 O ARG A 36 18.549 33.543 40.519 1.00 24.10 O +ATOM 291 CB ARG A 36 18.997 34.663 43.172 1.00 27.23 C +ATOM 292 CG ARG A 36 20.337 34.033 43.552 1.00 32.62 C +ATOM 293 CD ARG A 36 20.132 33.250 44.844 1.00 38.28 C +ATOM 294 NE ARG A 36 19.851 34.090 45.984 1.00 46.08 N +ATOM 295 CZ ARG A 36 20.612 34.928 46.658 1.00 42.34 C +ATOM 296 NH1 ARG A 36 21.888 35.214 46.405 1.00 43.67 N +ATOM 297 NH2 ARG A 36 20.127 35.575 47.737 1.00 45.81 N +ATOM 298 N PRO A 37 20.556 34.535 40.109 1.00 24.13 N +ATOM 299 CA PRO A 37 20.844 33.656 38.944 1.00 25.95 C +ATOM 300 C PRO A 37 21.239 32.249 39.366 1.00 20.94 C +ATOM 301 O PRO A 37 21.867 32.118 40.410 1.00 23.18 O +ATOM 302 CB PRO A 37 21.990 34.323 38.186 1.00 31.00 C +ATOM 303 CG PRO A 37 22.727 35.028 39.246 1.00 29.01 C +ATOM 304 CD PRO A 37 21.602 35.515 40.228 1.00 21.82 C +ATOM 305 N LEU A 38 20.674 31.287 38.678 1.00 19.69 N +ATOM 306 CA LEU A 38 20.859 29.870 38.914 1.00 18.40 C +ATOM 307 C LEU A 38 22.016 29.261 38.075 1.00 19.09 C +ATOM 308 O LEU A 38 22.334 29.706 36.977 1.00 20.25 O 
+ATOM 309 CB LEU A 38 19.678 28.961 38.637 1.00 20.66 C +ATOM 310 CG LEU A 38 18.465 29.120 39.538 1.00 30.65 C +ATOM 311 CD1 LEU A 38 17.426 28.123 39.092 1.00 28.00 C +ATOM 312 CD2 LEU A 38 18.987 28.880 40.966 1.00 32.63 C +ATOM 313 N VAL A 39 22.753 28.392 38.780 1.00 18.13 N +ATOM 314 CA VAL A 39 23.756 27.540 38.120 1.00 20.54 C +ATOM 315 C VAL A 39 23.510 26.100 38.511 1.00 15.61 C +ATOM 316 O VAL A 39 23.189 25.890 39.741 1.00 17.98 O +ATOM 317 CB VAL A 39 25.180 27.944 38.551 1.00 18.22 C +ATOM 318 CG1 VAL A 39 26.254 26.970 38.079 1.00 18.09 C +ATOM 319 CG2 VAL A 39 25.523 29.369 38.102 1.00 19.45 C +ATOM 320 N ILE A 40 23.555 25.125 37.643 1.00 16.32 N +ATOM 321 CA ILE A 40 23.419 23.756 38.022 1.00 14.57 C +ATOM 322 C ILE A 40 24.781 23.056 37.921 1.00 16.63 C +ATOM 323 O ILE A 40 25.517 23.334 36.944 1.00 16.62 O +ATOM 324 CB AILE A 40 22.452 22.962 37.112 0.50 9.82 C +ATOM 325 CG1AILE A 40 21.049 23.503 37.276 0.50 12.13 C +ATOM 326 CG2AILE A 40 22.523 21.488 37.301 0.50 12.02 C +ATOM 327 CD1AILE A 40 19.999 22.895 36.367 0.50 15.73 C +ATOM 328 CB BILE A 40 22.429 23.022 37.100 0.50 9.82 C +ATOM 329 CG1BILE A 40 21.031 23.644 37.130 0.50 12.13 C +ATOM 330 CG2BILE A 40 22.234 21.546 37.453 0.50 12.02 C +ATOM 331 CD1BILE A 40 20.395 23.623 38.522 0.50 15.73 C +ATOM 332 N VAL A 41 25.173 22.334 38.901 1.00 16.09 N +ATOM 333 CA VAL A 41 26.326 21.398 38.830 1.00 15.65 C +ATOM 334 C VAL A 41 25.736 20.036 38.983 1.00 17.55 C +ATOM 335 O VAL A 41 24.805 19.814 39.785 1.00 18.89 O +ATOM 336 CB VAL A 41 27.345 21.662 39.910 1.00 14.54 C +ATOM 337 CG1 VAL A 41 28.440 20.570 39.965 1.00 16.97 C +ATOM 338 CG2 VAL A 41 27.944 23.034 39.770 1.00 17.08 C +ATOM 339 N HIS A 42 26.231 18.987 38.308 1.00 16.24 N +ATOM 340 CA HIS A 42 25.679 17.657 38.383 1.00 15.57 C +ATOM 341 C HIS A 42 26.754 16.560 38.447 1.00 17.33 C +ATOM 342 O HIS A 42 27.843 16.716 37.944 1.00 17.68 O +ATOM 343 CB HIS A 42 24.737 17.348 37.219 1.00 17.05 C +ATOM 344 CG HIS A 42 25.432 17.292 
35.898 1.00 16.35 C +ATOM 345 ND1 HIS A 42 25.986 16.115 35.499 1.00 16.43 N +ATOM 346 CD2 HIS A 42 25.639 18.285 34.968 1.00 16.06 C +ATOM 347 CE1 HIS A 42 26.563 16.369 34.286 1.00 19.33 C +ATOM 348 NE2 HIS A 42 26.391 17.640 33.959 1.00 16.89 N +ATOM 349 N GLY A 43 26.256 15.485 39.119 1.00 20.25 N +ATOM 350 CA GLY A 43 27.108 14.257 39.075 1.00 23.29 C +ATOM 351 C GLY A 43 26.441 13.330 38.070 1.00 21.61 C +ATOM 352 O GLY A 43 26.111 13.618 36.960 1.00 20.30 O +ATOM 353 N GLY A 44 26.265 12.061 38.514 1.00 28.36 N +ATOM 354 CA GLY A 44 25.739 11.051 37.563 1.00 27.98 C +ATOM 355 C GLY A 44 26.375 9.678 37.776 1.00 27.19 C +ATOM 356 O GLY A 44 26.528 8.941 36.800 1.00 27.80 O +ATOM 357 N GLY A 45 26.850 9.471 38.986 1.00 25.83 N +ATOM 358 CA GLY A 45 27.465 8.145 39.296 1.00 28.98 C +ATOM 359 C GLY A 45 26.639 6.989 38.757 1.00 36.62 C +ATOM 360 O GLY A 45 27.172 6.010 38.234 1.00 35.15 O +ATOM 361 N CYS A 46 25.317 7.082 38.813 1.00 33.99 N +ATOM 362 CA CYS A 46 24.467 5.964 38.377 1.00 40.00 C +ATOM 363 C CYS A 46 24.588 5.723 36.883 1.00 45.29 C +ATOM 364 O CYS A 46 24.559 4.570 36.411 1.00 37.52 O +ATOM 365 CB CYS A 46 23.020 6.183 38.825 1.00 42.40 C +ATOM 366 SG CYS A 46 22.258 7.682 38.186 1.00 40.14 S +ATOM 367 N VAL A 47 24.693 6.812 36.110 1.00 32.75 N +ATOM 368 CA VAL A 47 24.890 6.683 34.666 1.00 29.26 C +ATOM 369 C VAL A 47 26.210 5.950 34.399 1.00 36.72 C +ATOM 370 O VAL A 47 26.281 5.122 33.486 1.00 35.04 O +ATOM 371 CB VAL A 47 24.923 8.025 33.926 1.00 27.19 C +ATOM 372 CG1 VAL A 47 24.966 7.846 32.416 1.00 27.48 C +ATOM 373 CG2 VAL A 47 23.683 8.835 34.310 1.00 35.14 C +ATOM 374 N VAL A 48 27.289 6.319 35.097 1.00 29.15 N +ATOM 375 CA VAL A 48 28.549 5.607 34.980 1.00 30.20 C +ATOM 376 C VAL A 48 28.400 4.127 35.376 1.00 26.65 C +ATOM 377 O VAL A 48 28.916 3.310 34.599 1.00 32.34 O +ATOM 378 CB VAL A 48 29.630 6.260 35.896 1.00 27.78 C +ATOM 379 CG1 VAL A 48 30.919 5.470 35.759 1.00 30.35 C +ATOM 380 CG2 VAL A 48 29.745 7.712 35.463 1.00 31.56 C 
+ATOM 381 N ASP A 49 27.791 3.859 36.526 1.00 29.84 N +ATOM 382 CA ASP A 49 27.709 2.473 36.973 1.00 42.09 C +ATOM 383 C ASP A 49 26.941 1.585 35.997 1.00 34.57 C +ATOM 384 O ASP A 49 27.304 0.403 35.850 1.00 42.29 O +ATOM 385 CB ASP A 49 27.037 2.346 38.321 1.00 36.30 C +ATOM 386 CG ASP A 49 27.716 3.000 39.473 1.00 45.15 C +ATOM 387 OD1 ASP A 49 27.053 3.278 40.490 1.00 46.27 O +ATOM 388 OD2 ASP A 49 28.939 3.278 39.353 1.00 44.81 O +ATOM 389 N GLU A 50 25.943 2.170 35.329 1.00 36.20 N +ATOM 390 CA GLU A 50 25.198 1.421 34.367 1.00 31.88 C +ATOM 391 C GLU A 50 25.999 1.113 33.122 1.00 37.38 C +ATOM 392 O GLU A 50 25.862 -0.008 32.571 1.00 36.85 O +ATOM 393 CB GLU A 50 23.893 2.125 33.944 1.00 37.37 C +ATOM 394 CG GLU A 50 22.923 2.178 35.124 1.00 43.39 C +ATOM 395 CD GLU A 50 21.695 3.023 34.756 1.00 55.20 C +ATOM 396 OE1 GLU A 50 21.466 3.153 33.523 1.00 59.97 O +ATOM 397 OE2 GLU A 50 21.050 3.500 35.708 1.00 50.20 O +ATOM 398 N LEU A 51 26.848 2.015 32.667 1.00 33.22 N +ATOM 399 CA LEU A 51 27.641 1.848 31.454 1.00 36.63 C +ATOM 400 C LEU A 51 28.810 0.908 31.855 1.00 30.05 C +ATOM 401 O LEU A 51 29.149 0.088 31.002 1.00 41.21 O +ATOM 402 CB LEU A 51 28.142 3.172 30.922 1.00 35.85 C +ATOM 403 CG LEU A 51 29.022 3.331 29.705 1.00 40.98 C +ATOM 404 CD1 LEU A 51 28.461 2.811 28.370 1.00 33.00 C +ATOM 405 CD2 LEU A 51 29.432 4.801 29.482 1.00 32.37 C +ATOM 406 N MET A 52 29.280 1.050 33.100 1.00 43.39 N +ATOM 407 CA MET A 52 30.307 0.099 33.549 1.00 48.70 C +ATOM 408 C MET A 52 29.699 -1.308 33.677 1.00 50.44 C +ATOM 409 O MET A 52 30.375 -2.271 33.335 1.00 44.83 O +ATOM 410 CB MET A 52 31.008 0.439 34.846 1.00 49.84 C +ATOM 411 CG MET A 52 31.876 1.690 34.865 1.00 45.23 C +ATOM 412 SD MET A 52 33.188 1.705 33.628 1.00 43.58 S +ATOM 413 CE MET A 52 32.233 1.695 32.116 1.00 60.83 C +ATOM 414 N LYS A 53 28.469 -1.368 34.172 1.00 60.50 N +ATOM 415 CA LYS A 53 27.770 -2.650 34.294 1.00 59.89 C +ATOM 416 C LYS A 53 27.655 -3.322 32.933 1.00 50.58 C +ATOM 417 O LYS A 53 
27.989 -4.493 32.755 1.00 56.11 O +ATOM 418 CB LYS A 53 26.392 -2.445 34.914 1.00 67.82 C +ATOM 419 CG LYS A 53 25.550 -3.684 35.162 1.00 79.20 C +ATOM 420 CD LYS A 53 24.138 -3.325 35.608 1.00 84.45 C +ATOM 421 CE LYS A 53 23.499 -4.379 36.490 1.00 86.54 C +ATOM 422 NZ LYS A 53 23.054 -5.585 35.747 1.00 85.70 N +ATOM 423 N GLY A 54 27.232 -2.581 31.916 1.00 40.38 N +ATOM 424 CA GLY A 54 27.069 -3.091 30.567 1.00 44.62 C +ATOM 425 C GLY A 54 28.397 -3.473 29.910 1.00 43.33 C +ATOM 426 O GLY A 54 28.458 -4.169 28.883 1.00 43.32 O +ATOM 427 N LEU A 55 29.490 -2.984 30.511 1.00 46.99 N +ATOM 428 CA LEU A 55 30.814 -3.288 30.000 1.00 45.45 C +ATOM 429 C LEU A 55 31.518 -4.369 30.812 1.00 46.21 C +ATOM 430 O LEU A 55 32.607 -4.783 30.409 1.00 50.15 O +ATOM 431 CB LEU A 55 31.678 -2.012 29.946 1.00 41.07 C +ATOM 432 CG LEU A 55 31.175 -0.940 28.970 1.00 38.07 C +ATOM 433 CD1 LEU A 55 31.894 0.367 29.230 1.00 43.49 C +ATOM 434 CD2 LEU A 55 31.432 -1.391 27.533 1.00 43.13 C +ATOM 435 N ASN A 56 30.958 -4.802 31.913 1.00 41.25 N +ATOM 436 CA ASN A 56 31.511 -5.817 32.788 1.00 52.20 C +ATOM 437 C ASN A 56 32.740 -5.295 33.531 1.00 59.93 C +ATOM 438 O ASN A 56 33.698 -6.021 33.806 1.00 57.54 O +ATOM 439 CB AASN A 56 31.832 -7.108 32.029 0.50 54.69 C +ATOM 440 CG AASN A 56 32.359 -8.202 32.938 0.50 51.05 C +ATOM 441 OD1AASN A 56 31.732 -8.521 33.949 0.50 59.69 O +ATOM 442 ND2AASN A 56 33.508 -8.760 32.580 0.50 53.29 N +ATOM 443 CB BASN A 56 31.912 -7.056 31.972 0.50 54.69 C +ATOM 444 CG BASN A 56 30.738 -7.681 31.219 0.50 51.05 C +ATOM 445 OD1BASN A 56 29.768 -8.110 31.841 0.50 59.69 O +ATOM 446 ND2BASN A 56 30.767 -7.761 29.902 0.50 53.29 N +ATOM 447 N LEU A 57 32.697 -4.034 33.939 1.00 51.46 N +ATOM 448 CA LEU A 57 33.798 -3.394 34.658 1.00 49.13 C +ATOM 449 C LEU A 57 33.405 -3.164 36.107 1.00 50.73 C +ATOM 450 O LEU A 57 32.255 -2.847 36.419 1.00 44.99 O +ATOM 451 CB LEU A 57 34.180 -2.057 34.001 1.00 46.92 C +ATOM 452 CG LEU A 57 34.700 -2.190 32.558 1.00 40.73 C +ATOM 
453 CD1 LEU A 57 34.673 -0.845 31.821 1.00 55.79 C +ATOM 454 CD2 LEU A 57 36.155 -2.683 32.639 1.00 51.06 C +ATOM 455 N PRO A 58 34.328 -3.400 37.032 1.00 39.83 N +ATOM 456 CA PRO A 58 34.129 -3.228 38.441 1.00 47.95 C +ATOM 457 C PRO A 58 34.073 -1.768 38.869 1.00 47.99 C +ATOM 458 O PRO A 58 34.674 -0.872 38.278 1.00 46.93 O +ATOM 459 CB PRO A 58 35.376 -3.870 39.084 1.00 52.83 C +ATOM 460 CG PRO A 58 36.411 -3.663 38.017 1.00 44.03 C +ATOM 461 CD PRO A 58 35.687 -3.966 36.732 1.00 49.34 C +ATOM 462 N VAL A 59 33.393 -1.565 39.987 1.00 46.61 N +ATOM 463 CA VAL A 59 33.262 -0.238 40.558 1.00 47.63 C +ATOM 464 C VAL A 59 33.919 -0.227 41.915 1.00 47.27 C +ATOM 465 O VAL A 59 33.380 -0.780 42.880 1.00 63.95 O +ATOM 466 CB VAL A 59 31.789 0.185 40.682 1.00 38.02 C +ATOM 467 CG1 VAL A 59 31.721 1.411 41.599 1.00 47.82 C +ATOM 468 CG2 VAL A 59 31.317 0.436 39.265 1.00 36.63 C +ATOM 469 N LYS A 60 35.060 0.374 42.053 1.00 38.39 N +ATOM 470 CA LYS A 60 35.848 0.458 43.256 1.00 36.97 C +ATOM 471 C LYS A 60 35.832 1.941 43.686 1.00 40.29 C +ATOM 472 O LYS A 60 36.299 2.760 42.888 1.00 33.18 O +ATOM 473 CB LYS A 60 37.332 0.151 42.997 1.00 41.28 C +ATOM 474 CG LYS A 60 38.128 -0.486 44.102 1.00 56.00 C +ATOM 475 CD LYS A 60 37.679 -0.318 45.525 1.00 59.70 C +ATOM 476 CE LYS A 60 37.866 -1.588 46.345 1.00 61.43 C +ATOM 477 NZ LYS A 60 39.239 -1.748 46.893 1.00 63.89 N +ATOM 478 N LYS A 61 35.300 2.163 44.872 1.00 36.59 N +ATOM 479 CA LYS A 61 35.362 3.485 45.476 1.00 39.13 C +ATOM 480 C LYS A 61 36.297 3.419 46.659 1.00 36.00 C +ATOM 481 O LYS A 61 36.242 2.537 47.528 1.00 46.21 O +ATOM 482 CB LYS A 61 33.943 3.958 45.802 1.00 39.06 C +ATOM 483 CG LYS A 61 33.238 4.368 44.508 1.00 35.61 C +ATOM 484 CD LYS A 61 31.874 4.979 44.762 1.00 43.75 C +ATOM 485 CE LYS A 61 31.156 5.304 43.453 1.00 44.28 C +ATOM 486 NZ LYS A 61 29.854 5.976 43.720 1.00 42.91 N +ATOM 487 N LYS A 62 37.269 4.320 46.697 1.00 42.31 N +ATOM 488 CA LYS A 62 38.271 4.334 47.763 1.00 45.45 C +ATOM 489 C LYS A 
62 38.064 5.609 48.556 1.00 47.34 C +ATOM 490 O LYS A 62 38.354 6.725 48.112 1.00 45.58 O +ATOM 491 CB LYS A 62 39.642 4.166 47.136 1.00 45.74 C +ATOM 492 CG LYS A 62 40.822 3.938 48.044 1.00 53.16 C +ATOM 493 CD LYS A 62 41.959 3.283 47.269 1.00 56.84 C +ATOM 494 CE LYS A 62 43.240 3.238 48.090 1.00 57.74 C +ATOM 495 NZ LYS A 62 44.422 3.025 47.193 1.00 68.40 N +ATOM 496 N ASN A 63 37.419 5.429 49.711 1.00 53.87 N +ATOM 497 CA ASN A 63 37.117 6.552 50.593 1.00 52.57 C +ATOM 498 C ASN A 63 36.069 7.478 49.956 1.00 45.32 C +ATOM 499 O ASN A 63 36.222 8.694 49.986 1.00 50.64 O +ATOM 500 CB ASN A 63 38.378 7.318 50.965 1.00 54.12 C +ATOM 501 CG ASN A 63 39.525 6.507 51.524 1.00 65.09 C +ATOM 502 OD1 ASN A 63 40.660 6.984 51.719 1.00 62.13 O +ATOM 503 ND2 ASN A 63 39.296 5.228 51.805 1.00 66.86 N +ATOM 504 N GLY A 64 35.051 6.893 49.345 1.00 44.37 N +ATOM 505 CA GLY A 64 33.951 7.579 48.717 1.00 38.38 C +ATOM 506 C GLY A 64 34.227 8.112 47.321 1.00 38.89 C +ATOM 507 O GLY A 64 33.303 8.586 46.682 1.00 31.11 O +ATOM 508 N LEU A 65 35.440 7.986 46.809 1.00 30.78 N +ATOM 509 CA LEU A 65 35.797 8.456 45.470 1.00 27.15 C +ATOM 510 C LEU A 65 36.016 7.248 44.567 1.00 27.79 C +ATOM 511 O LEU A 65 36.638 6.235 44.965 1.00 31.26 O +ATOM 512 CB LEU A 65 37.061 9.312 45.519 1.00 26.74 C +ATOM 513 CG LEU A 65 37.042 10.511 46.460 1.00 22.14 C +ATOM 514 CD1 LEU A 65 38.367 11.217 46.465 1.00 27.03 C +ATOM 515 CD2 LEU A 65 35.946 11.461 45.907 1.00 20.96 C +ATOM 516 N ARG A 66 35.540 7.339 43.344 1.00 25.44 N +ATOM 517 CA ARG A 66 35.658 6.264 42.387 1.00 25.63 C +ATOM 518 C ARG A 66 37.073 6.160 41.808 1.00 26.66 C +ATOM 519 O ARG A 66 37.594 7.119 41.185 1.00 25.22 O +ATOM 520 CB ARG A 66 34.740 6.468 41.186 1.00 26.19 C +ATOM 521 CG ARG A 66 34.782 5.357 40.140 1.00 29.60 C +ATOM 522 CD ARG A 66 34.088 5.703 38.834 1.00 31.26 C +ATOM 523 NE ARG A 66 32.731 6.204 39.125 1.00 31.11 N +ATOM 524 CZ ARG A 66 31.704 5.389 39.326 1.00 34.91 C +ATOM 525 NH1 ARG A 66 31.793 4.073 39.239 
1.00 36.77 N +ATOM 526 NH2 ARG A 66 30.511 5.920 39.643 1.00 27.08 N +ATOM 527 N VAL A 67 37.769 5.027 42.036 1.00 26.53 N +ATOM 528 CA VAL A 67 39.058 4.785 41.359 1.00 25.55 C +ATOM 529 C VAL A 67 38.789 4.844 39.867 1.00 20.78 C +ATOM 530 O VAL A 67 37.927 4.147 39.273 1.00 25.12 O +ATOM 531 CB VAL A 67 39.662 3.426 41.759 1.00 26.76 C +ATOM 532 CG1 VAL A 67 40.958 3.091 41.014 1.00 28.01 C +ATOM 533 CG2 VAL A 67 39.871 3.408 43.262 1.00 31.47 C +ATOM 534 N THR A 68 39.628 5.633 39.174 1.00 21.26 N +ATOM 535 CA THR A 68 39.445 5.933 37.777 1.00 20.06 C +ATOM 536 C THR A 68 40.729 5.669 37.008 1.00 21.51 C +ATOM 537 O THR A 68 41.497 6.561 36.752 1.00 21.78 O +ATOM 538 CB THR A 68 38.967 7.416 37.639 1.00 24.25 C +ATOM 539 OG1 THR A 68 37.756 7.564 38.439 1.00 21.92 O +ATOM 540 CG2 THR A 68 38.587 7.772 36.200 1.00 23.06 C +ATOM 541 N PRO A 69 40.872 4.411 36.552 1.00 26.47 N +ATOM 542 CA PRO A 69 42.068 4.070 35.759 1.00 25.73 C +ATOM 543 C PRO A 69 42.117 4.818 34.472 1.00 22.87 C +ATOM 544 O PRO A 69 41.082 5.286 33.912 1.00 23.09 O +ATOM 545 CB PRO A 69 41.933 2.575 35.590 1.00 27.77 C +ATOM 546 CG PRO A 69 41.101 2.101 36.752 1.00 24.21 C +ATOM 547 CD PRO A 69 40.061 3.242 36.917 1.00 24.28 C +ATOM 548 N ALA A 70 43.266 4.880 33.809 1.00 24.23 N +ATOM 549 CA ALA A 70 43.502 5.557 32.553 1.00 24.44 C +ATOM 550 C ALA A 70 42.653 4.878 31.491 1.00 25.51 C +ATOM 551 O ALA A 70 42.086 5.546 30.609 1.00 28.56 O +ATOM 552 CB ALA A 70 44.976 5.565 32.143 1.00 28.38 C +ATOM 553 N ASP A 71 42.361 3.601 31.646 1.00 30.21 N +ATOM 554 CA ASP A 71 41.557 2.896 30.658 1.00 33.33 C +ATOM 555 C ASP A 71 40.062 3.065 30.872 1.00 28.04 C +ATOM 556 O ASP A 71 39.306 2.505 30.072 1.00 31.25 O +ATOM 557 CB ASP A 71 41.976 1.413 30.563 1.00 34.12 C +ATOM 558 CG ASP A 71 41.409 0.599 31.673 1.00 38.13 C +ATOM 559 OD1 ASP A 71 40.952 1.131 32.712 1.00 38.06 O +ATOM 560 OD2 ASP A 71 41.380 -0.670 31.591 1.00 46.25 O +ATOM 561 N GLN A 72 39.611 3.886 31.813 1.00 26.26 N +ATOM 562 CA 
GLN A 72 38.194 4.082 32.130 1.00 21.89 C +ATOM 563 C GLN A 72 37.843 5.610 32.044 1.00 22.87 C +ATOM 564 O GLN A 72 36.662 5.961 32.039 1.00 23.21 O +ATOM 565 CB GLN A 72 37.911 3.500 33.502 1.00 29.07 C +ATOM 566 CG GLN A 72 37.637 1.985 33.541 1.00 29.21 C +ATOM 567 CD GLN A 72 37.604 1.305 34.842 1.00 32.83 C +ATOM 568 OE1 GLN A 72 36.740 1.608 35.693 1.00 39.21 O +ATOM 569 NE2 GLN A 72 38.505 0.282 35.092 1.00 31.83 N +ATOM 570 N ILE A 73 38.819 6.510 32.012 1.00 21.63 N +ATOM 571 CA ILE A 73 38.522 7.964 32.087 1.00 23.84 C +ATOM 572 C ILE A 73 37.725 8.373 30.854 1.00 20.61 C +ATOM 573 O ILE A 73 36.796 9.214 31.011 1.00 20.76 O +ATOM 574 CB ILE A 73 39.735 8.861 32.306 1.00 21.11 C +ATOM 575 CG1 ILE A 73 39.353 10.351 32.446 1.00 20.15 C +ATOM 576 CG2 ILE A 73 40.753 8.740 31.161 1.00 23.59 C +ATOM 577 CD1 ILE A 73 38.527 10.653 33.660 1.00 21.09 C +ATOM 578 N ASP A 74 37.968 7.854 29.661 1.00 19.55 N +ATOM 579 CA ASP A 74 37.239 8.262 28.464 1.00 20.21 C +ATOM 580 C ASP A 74 35.783 7.828 28.580 1.00 20.36 C +ATOM 581 O ASP A 74 34.854 8.623 28.258 1.00 20.55 O +ATOM 582 CB ASP A 74 37.931 7.714 27.203 1.00 23.04 C +ATOM 583 CG ASP A 74 39.262 8.416 27.001 1.00 39.67 C +ATOM 584 OD1 ASP A 74 39.470 9.577 27.416 1.00 27.87 O +ATOM 585 OD2 ASP A 74 40.273 7.911 26.460 1.00 48.07 O +ATOM 586 N ILE A 75 35.509 6.636 29.057 1.00 21.45 N +ATOM 587 CA ILE A 75 34.122 6.161 29.176 1.00 21.99 C +ATOM 588 C ILE A 75 33.407 6.951 30.252 1.00 20.12 C +ATOM 589 O ILE A 75 32.197 7.296 30.136 1.00 22.33 O +ATOM 590 CB ILE A 75 34.081 4.634 29.391 1.00 31.22 C +ATOM 591 CG1 ILE A 75 32.659 4.093 29.511 1.00 30.44 C +ATOM 592 CG2 ILE A 75 34.827 4.225 30.648 1.00 45.66 C +ATOM 593 CD1 ILE A 75 31.843 4.129 28.239 1.00 48.06 C +ATOM 594 N ILE A 76 34.029 7.217 31.393 1.00 18.77 N +ATOM 595 CA ILE A 76 33.419 7.981 32.477 1.00 20.43 C +ATOM 596 C ILE A 76 33.158 9.391 32.002 1.00 21.45 C +ATOM 597 O ILE A 76 32.082 9.950 32.257 1.00 20.46 O +ATOM 598 CB ILE A 76 34.333 7.951 
33.716 1.00 22.37 C +ATOM 599 CG1 ILE A 76 34.234 6.492 34.217 1.00 24.27 C +ATOM 600 CG2 ILE A 76 33.943 8.880 34.871 1.00 24.06 C +ATOM 601 CD1 ILE A 76 35.221 6.155 35.308 1.00 28.12 C +ATOM 602 N THR A 77 34.116 9.942 31.247 1.00 18.60 N +ATOM 603 CA THR A 77 33.867 11.308 30.725 1.00 17.38 C +ATOM 604 C THR A 77 32.642 11.297 29.841 1.00 18.17 C +ATOM 605 O THR A 77 31.835 12.262 29.845 1.00 17.69 O +ATOM 606 CB THR A 77 35.138 11.749 29.951 1.00 17.75 C +ATOM 607 OG1 THR A 77 36.209 11.992 30.914 1.00 19.73 O +ATOM 608 CG2 THR A 77 34.907 13.057 29.230 1.00 19.94 C +ATOM 609 N GLY A 78 32.511 10.273 28.993 1.00 17.56 N +ATOM 610 CA GLY A 78 31.369 10.217 28.055 1.00 18.16 C +ATOM 611 C GLY A 78 30.056 10.189 28.827 1.00 16.44 C +ATOM 612 O GLY A 78 29.120 10.955 28.576 1.00 17.53 O +ATOM 613 N ALA A 79 30.000 9.385 29.899 1.00 18.31 N +ATOM 614 CA ALA A 79 28.772 9.250 30.672 1.00 19.08 C +ATOM 615 C ALA A 79 28.444 10.527 31.461 1.00 16.44 C +ATOM 616 O ALA A 79 27.275 10.908 31.529 1.00 18.00 O +ATOM 617 CB ALA A 79 28.840 8.133 31.716 1.00 21.39 C +ATOM 618 N LEU A 80 29.447 11.164 32.038 1.00 18.50 N +ATOM 619 CA LEU A 80 29.186 12.321 32.895 1.00 20.14 C +ATOM 620 C LEU A 80 29.193 13.630 32.107 1.00 17.14 C +ATOM 621 O LEU A 80 28.199 14.403 32.139 1.00 18.85 O +ATOM 622 CB LEU A 80 30.261 12.462 33.962 1.00 22.16 C +ATOM 623 CG LEU A 80 30.192 11.396 35.040 1.00 21.93 C +ATOM 624 CD1 LEU A 80 31.234 11.668 36.134 1.00 22.86 C +ATOM 625 CD2 LEU A 80 28.841 11.249 35.676 1.00 20.86 C +ATOM 626 N ALA A 81 30.304 13.927 31.406 1.00 16.67 N +ATOM 627 CA ALA A 81 30.331 15.170 30.640 1.00 18.33 C +ATOM 628 C ALA A 81 29.419 15.120 29.387 1.00 19.38 C +ATOM 629 O ALA A 81 29.065 16.186 28.911 1.00 18.40 O +ATOM 630 CB ALA A 81 31.754 15.503 30.156 1.00 17.67 C +ATOM 631 N GLY A 82 29.138 13.916 28.903 1.00 17.83 N +ATOM 632 CA GLY A 82 28.276 13.807 27.694 1.00 16.97 C +ATOM 633 C GLY A 82 26.822 13.476 28.072 1.00 14.66 C +ATOM 634 O GLY A 82 25.959 14.317 
27.993 1.00 18.16 O +ATOM 635 N THR A 83 26.562 12.250 28.440 1.00 17.32 N +ATOM 636 CA THR A 83 25.160 11.773 28.599 1.00 16.06 C +ATOM 637 C THR A 83 24.482 12.527 29.724 1.00 15.96 C +ATOM 638 O THR A 83 23.373 13.087 29.516 1.00 17.48 O +ATOM 639 CB THR A 83 25.146 10.281 28.870 1.00 18.30 C +ATOM 640 OG1 THR A 83 25.808 9.540 27.851 1.00 17.77 O +ATOM 641 CG2 THR A 83 23.697 9.803 28.976 1.00 19.22 C +ATOM 642 N ALA A 84 25.090 12.597 30.905 1.00 16.41 N +ATOM 643 CA ALA A 84 24.334 13.275 31.971 1.00 16.67 C +ATOM 644 C ALA A 84 24.157 14.741 31.725 1.00 16.59 C +ATOM 645 O ALA A 84 23.080 15.373 31.905 1.00 18.12 O +ATOM 646 CB ALA A 84 25.047 12.999 33.295 1.00 19.59 C +ATOM 647 N ASN A 85 25.208 15.443 31.241 1.00 16.41 N +ATOM 648 CA ASN A 85 25.098 16.880 30.986 1.00 16.65 C +ATOM 649 C ASN A 85 24.097 17.137 29.859 1.00 14.93 C +ATOM 650 O ASN A 85 23.267 18.063 30.092 1.00 16.64 O +ATOM 651 CB ASN A 85 26.506 17.387 30.500 1.00 14.56 C +ATOM 652 CG ASN A 85 26.627 18.900 30.494 1.00 18.09 C +ATOM 653 OD1 ASN A 85 26.649 19.536 29.416 1.00 17.03 O +ATOM 654 ND2 ASN A 85 26.715 19.546 31.674 1.00 15.68 N +ATOM 655 N LYS A 86 24.092 16.378 28.794 1.00 16.92 N +ATOM 656 CA LYS A 86 23.187 16.670 27.680 1.00 17.80 C +ATOM 657 C LYS A 86 21.786 16.240 27.959 1.00 16.15 C +ATOM 658 O LYS A 86 20.867 16.893 27.455 1.00 16.88 O +ATOM 659 CB LYS A 86 23.770 16.037 26.383 1.00 17.33 C +ATOM 660 CG LYS A 86 24.558 17.182 25.694 1.00 18.12 C +ATOM 661 CD LYS A 86 25.693 17.631 26.611 1.00 19.86 C +ATOM 662 CE LYS A 86 26.490 18.736 25.914 1.00 17.96 C +ATOM 663 NZ LYS A 86 27.585 19.389 26.686 1.00 17.98 N +ATOM 664 N THR A 87 21.577 15.295 28.871 1.00 17.06 N +ATOM 665 CA THR A 87 20.196 14.939 29.257 1.00 16.88 C +ATOM 666 C THR A 87 19.671 16.138 30.011 1.00 15.79 C +ATOM 667 O THR A 87 18.516 16.553 29.775 1.00 17.46 O +ATOM 668 CB THR A 87 20.274 13.692 30.137 1.00 17.17 C +ATOM 669 OG1 THR A 87 20.626 12.579 29.359 1.00 21.15 O +ATOM 670 CG2 THR A 87 18.894 
13.462 30.766 1.00 19.29 C +ATOM 671 N LEU A 88 20.426 16.788 30.874 1.00 18.21 N +ATOM 672 CA LEU A 88 19.956 17.958 31.589 1.00 15.14 C +ATOM 673 C LEU A 88 19.711 19.144 30.680 1.00 16.49 C +ATOM 674 O LEU A 88 18.764 19.919 30.884 1.00 17.98 O +ATOM 675 CB LEU A 88 20.862 18.329 32.759 1.00 16.13 C +ATOM 676 CG LEU A 88 20.855 17.360 33.909 1.00 18.63 C +ATOM 677 CD1 LEU A 88 21.968 17.674 34.877 1.00 21.21 C +ATOM 678 CD2 LEU A 88 19.520 17.402 34.633 1.00 19.65 C +ATOM 679 N LEU A 89 20.595 19.325 29.686 1.00 16.64 N +ATOM 680 CA LEU A 89 20.367 20.428 28.730 1.00 15.83 C +ATOM 681 C LEU A 89 19.109 20.147 27.907 1.00 15.90 C +ATOM 682 O LEU A 89 18.424 21.166 27.559 1.00 18.79 O +ATOM 683 CB LEU A 89 21.558 20.515 27.730 1.00 15.50 C +ATOM 684 CG LEU A 89 22.906 20.868 28.403 1.00 16.60 C +ATOM 685 CD1 LEU A 89 24.033 20.843 27.368 1.00 16.46 C +ATOM 686 CD2 LEU A 89 22.841 22.236 29.054 1.00 17.83 C +ATOM 687 N ALA A 90 18.767 18.888 27.660 1.00 15.58 N +ATOM 688 CA ALA A 90 17.535 18.627 26.911 1.00 17.08 C +ATOM 689 C ALA A 90 16.312 18.915 27.783 1.00 18.50 C +ATOM 690 O ALA A 90 15.314 19.486 27.236 1.00 19.18 O +ATOM 691 CB ALA A 90 17.524 17.158 26.461 1.00 17.80 C +ATOM 692 N TRP A 91 16.335 18.548 29.072 1.00 17.02 N +ATOM 693 CA TRP A 91 15.210 18.955 29.921 1.00 16.54 C +ATOM 694 C TRP A 91 15.087 20.424 30.024 1.00 17.67 C +ATOM 695 O TRP A 91 13.973 21.071 30.034 1.00 19.49 O +ATOM 696 CB TRP A 91 15.462 18.349 31.305 1.00 18.30 C +ATOM 697 CG TRP A 91 14.993 16.928 31.293 1.00 21.76 C +ATOM 698 CD1 TRP A 91 15.758 15.839 30.975 1.00 24.92 C +ATOM 699 CD2 TRP A 91 13.669 16.432 31.511 1.00 23.13 C +ATOM 700 NE1 TRP A 91 15.006 14.677 31.020 1.00 27.28 N +ATOM 701 CE2 TRP A 91 13.725 15.051 31.343 1.00 23.97 C +ATOM 702 CE3 TRP A 91 12.471 17.055 31.875 1.00 22.45 C +ATOM 703 CZ2 TRP A 91 12.610 14.238 31.498 1.00 23.92 C +ATOM 704 CZ3 TRP A 91 11.358 16.213 32.045 1.00 24.47 C +ATOM 705 CH2 TRP A 91 11.413 14.823 31.821 1.00 24.32 C +ATOM 706 N 
ALA A 92 16.188 21.173 30.066 1.00 16.67 N +ATOM 707 CA ALA A 92 16.140 22.664 30.091 1.00 16.36 C +ATOM 708 C ALA A 92 15.541 23.129 28.784 1.00 16.89 C +ATOM 709 O ALA A 92 14.598 23.943 28.869 1.00 18.18 O +ATOM 710 CB ALA A 92 17.510 23.297 30.251 1.00 20.17 C +ATOM 711 N LYS A 93 15.902 22.602 27.640 1.00 18.62 N +ATOM 712 CA LYS A 93 15.306 23.118 26.396 1.00 20.28 C +ATOM 713 C LYS A 93 13.805 22.775 26.483 1.00 20.37 C +ATOM 714 O LYS A 93 13.102 23.784 26.202 1.00 21.37 O +ATOM 715 CB LYS A 93 15.948 22.441 25.190 1.00 21.09 C +ATOM 716 CG LYS A 93 15.492 22.971 23.841 1.00 20.00 C +ATOM 717 CD LYS A 93 15.832 24.431 23.638 1.00 25.55 C +ATOM 718 CE LYS A 93 15.320 24.847 22.267 1.00 28.15 C +ATOM 719 NZ LYS A 93 15.226 26.307 22.027 1.00 34.54 N +ATOM 720 N LYS A 94 13.411 21.616 26.877 1.00 18.02 N +ATOM 721 CA LYS A 94 11.978 21.304 26.871 1.00 20.75 C +ATOM 722 C LYS A 94 11.171 22.339 27.635 1.00 20.97 C +ATOM 723 O LYS A 94 9.947 22.529 27.371 1.00 22.89 O +ATOM 724 CB LYS A 94 11.853 19.981 27.639 1.00 20.64 C +ATOM 725 CG LYS A 94 10.397 19.499 27.655 1.00 27.82 C +ATOM 726 CD LYS A 94 10.448 18.062 28.169 1.00 29.19 C +ATOM 727 CE LYS A 94 9.036 17.526 28.349 1.00 39.22 C +ATOM 728 NZ LYS A 94 8.291 18.345 29.353 1.00 51.47 N +ATOM 729 N HIS A 95 11.706 22.882 28.704 1.00 18.57 N +ATOM 730 CA HIS A 95 11.136 23.887 29.567 1.00 20.76 C +ATOM 731 C HIS A 95 11.477 25.322 29.195 1.00 19.00 C +ATOM 732 O HIS A 95 11.302 26.233 30.011 1.00 20.81 O +ATOM 733 CB HIS A 95 11.551 23.613 31.051 1.00 20.43 C +ATOM 734 CG HIS A 95 10.814 22.462 31.620 1.00 19.57 C +ATOM 735 ND1 HIS A 95 11.080 21.139 31.392 1.00 26.24 N +ATOM 736 CD2 HIS A 95 9.618 22.490 32.338 1.00 21.18 C +ATOM 737 CE1 HIS A 95 10.176 20.359 31.979 1.00 25.03 C +ATOM 738 NE2 HIS A 95 9.310 21.171 32.509 1.00 27.77 N +ATOM 739 N GLN A 96 11.960 25.515 27.973 1.00 20.47 N +ATOM 740 CA GLN A 96 12.211 26.841 27.450 1.00 19.97 C +ATOM 741 C GLN A 96 13.240 27.698 28.139 1.00 20.63 C +ATOM 742 
O GLN A 96 13.287 28.911 28.200 1.00 24.22 O +ATOM 743 CB AGLN A 96 10.864 27.650 27.437 0.50 18.74 C +ATOM 744 CG AGLN A 96 9.637 26.909 26.920 0.50 24.21 C +ATOM 745 CD AGLN A 96 8.427 27.822 26.793 0.50 30.98 C +ATOM 746 OE1AGLN A 96 7.880 28.264 27.806 0.50 32.65 O +ATOM 747 NE2AGLN A 96 7.990 28.058 25.562 0.50 42.08 N +ATOM 748 CB BGLN A 96 10.834 27.617 27.419 0.50 18.74 C +ATOM 749 CG BGLN A 96 9.891 27.226 26.280 0.50 24.21 C +ATOM 750 CD BGLN A 96 9.092 25.955 26.581 0.50 30.98 C +ATOM 751 OE1BGLN A 96 9.214 24.967 25.859 0.50 32.65 O +ATOM 752 NE2BGLN A 96 8.272 25.921 27.615 0.50 42.08 N +ATOM 753 N ILE A 97 14.158 26.917 28.817 1.00 20.21 N +ATOM 754 CA ILE A 97 15.291 27.561 29.499 1.00 20.26 C +ATOM 755 C ILE A 97 16.516 27.648 28.582 1.00 18.62 C +ATOM 756 O ILE A 97 16.782 26.637 27.961 1.00 21.53 O +ATOM 757 CB ILE A 97 15.701 26.668 30.721 1.00 18.29 C +ATOM 758 CG1 ILE A 97 14.581 26.701 31.767 1.00 20.21 C +ATOM 759 CG2 ILE A 97 17.042 27.147 31.255 1.00 22.22 C +ATOM 760 CD1 ILE A 97 14.823 25.783 32.976 1.00 24.96 C +ATOM 761 N ALA A 98 17.099 28.830 28.418 1.00 20.29 N +ATOM 762 CA ALA A 98 18.328 28.862 27.613 1.00 18.35 C +ATOM 763 C ALA A 98 19.507 28.462 28.528 1.00 19.12 C +ATOM 764 O ALA A 98 19.883 29.225 29.372 1.00 20.61 O +ATOM 765 CB ALA A 98 18.632 30.272 27.082 1.00 19.50 C +ATOM 766 N ALA A 99 19.980 27.257 28.315 1.00 17.55 N +ATOM 767 CA ALA A 99 21.068 26.712 29.157 1.00 16.02 C +ATOM 768 C ALA A 99 22.302 26.630 28.304 1.00 18.47 C +ATOM 769 O ALA A 99 22.195 26.530 27.060 1.00 18.56 O +ATOM 770 CB ALA A 99 20.657 25.336 29.641 1.00 17.19 C +ATOM 771 N VAL A 100 23.454 26.565 28.999 1.00 16.97 N +ATOM 772 CA VAL A 100 24.731 26.335 28.281 1.00 15.69 C +ATOM 773 C VAL A 100 25.467 25.207 29.054 1.00 16.57 C +ATOM 774 O VAL A 100 25.662 25.402 30.261 1.00 14.98 O +ATOM 775 CB VAL A 100 25.625 27.562 28.157 1.00 16.61 C +ATOM 776 CG1 VAL A 100 26.967 27.231 27.537 1.00 19.60 C +ATOM 777 CG2 VAL A 100 24.921 28.587 27.257 1.00 
17.66 C +ATOM 778 N GLY A 101 25.822 24.112 28.400 1.00 16.46 N +ATOM 779 CA GLY A 101 26.529 23.064 29.095 1.00 15.25 C +ATOM 780 C GLY A 101 28.024 23.344 29.196 1.00 15.81 C +ATOM 781 O GLY A 101 28.681 23.784 28.232 1.00 17.43 O +ATOM 782 N LEU A 102 28.659 23.127 30.341 1.00 14.79 N +ATOM 783 CA LEU A 102 30.100 23.332 30.531 1.00 15.11 C +ATOM 784 C LEU A 102 30.674 22.140 31.301 1.00 16.51 C +ATOM 785 O LEU A 102 29.893 21.383 31.942 1.00 15.06 O +ATOM 786 CB LEU A 102 30.303 24.578 31.414 1.00 16.60 C +ATOM 787 CG LEU A 102 29.783 25.897 30.850 1.00 16.76 C +ATOM 788 CD1 LEU A 102 29.978 27.033 31.888 1.00 18.94 C +ATOM 789 CD2 LEU A 102 30.449 26.313 29.540 1.00 17.08 C +ATOM 790 N PHE A 103 31.999 21.974 31.231 1.00 14.89 N +ATOM 791 CA PHE A 103 32.693 21.123 32.269 1.00 17.79 C +ATOM 792 C PHE A 103 33.612 22.112 32.966 1.00 14.48 C +ATOM 793 O PHE A 103 33.728 23.326 32.754 1.00 16.02 O +ATOM 794 CB PHE A 103 33.390 19.906 31.625 1.00 15.23 C +ATOM 795 CG PHE A 103 34.768 20.108 30.996 1.00 15.53 C +ATOM 796 CD1 PHE A 103 35.680 19.069 31.190 1.00 15.14 C +ATOM 797 CD2 PHE A 103 35.148 21.231 30.303 1.00 16.24 C +ATOM 798 CE1 PHE A 103 37.000 19.189 30.679 1.00 17.33 C +ATOM 799 CE2 PHE A 103 36.449 21.340 29.770 1.00 16.57 C +ATOM 800 CZ PHE A 103 37.339 20.293 30.004 1.00 15.85 C +ATOM 801 N LEU A 104 34.339 21.524 33.973 1.00 15.28 N +ATOM 802 CA LEU A 104 35.091 22.359 34.910 1.00 16.20 C +ATOM 803 C LEU A 104 36.215 23.156 34.306 1.00 14.90 C +ATOM 804 O LEU A 104 36.599 24.253 34.708 1.00 17.20 O +ATOM 805 CB LEU A 104 35.694 21.562 36.050 1.00 16.95 C +ATOM 806 CG LEU A 104 34.665 20.763 36.849 1.00 14.96 C +ATOM 807 CD1 LEU A 104 35.364 19.812 37.855 1.00 18.08 C +ATOM 808 CD2 LEU A 104 33.671 21.638 37.628 1.00 19.20 C +ATOM 809 N GLY A 105 36.696 22.645 33.132 1.00 16.04 N +ATOM 810 CA GLY A 105 37.822 23.316 32.450 1.00 17.11 C +ATOM 811 C GLY A 105 37.429 24.507 31.575 1.00 16.22 C +ATOM 812 O GLY A 105 38.268 25.319 31.185 1.00 17.17 O 
+ATOM 813 N ASP A 106 36.131 24.646 31.254 1.00 15.56 N +ATOM 814 CA ASP A 106 35.740 25.790 30.413 1.00 15.79 C +ATOM 815 C ASP A 106 35.891 27.121 31.117 1.00 17.01 C +ATOM 816 O ASP A 106 35.435 27.245 32.285 1.00 16.36 O +ATOM 817 CB ASP A 106 34.269 25.631 29.986 1.00 15.40 C +ATOM 818 CG ASP A 106 33.974 24.496 29.052 1.00 17.38 C +ATOM 819 OD1 ASP A 106 34.733 24.320 28.053 1.00 17.74 O +ATOM 820 OD2 ASP A 106 33.008 23.695 29.262 1.00 16.04 O +ATOM 821 N GLY A 107 36.626 28.081 30.554 1.00 16.75 N +ATOM 822 CA GLY A 107 36.923 29.315 31.286 1.00 17.67 C +ATOM 823 C GLY A 107 37.793 29.054 32.517 1.00 19.13 C +ATOM 824 O GLY A 107 37.846 29.985 33.354 1.00 19.43 O +ATOM 825 N ASP A 108 38.453 27.930 32.605 1.00 17.01 N +ATOM 826 CA ASP A 108 39.232 27.643 33.823 1.00 18.51 C +ATOM 827 C ASP A 108 38.347 27.897 35.033 1.00 19.28 C +ATOM 828 O ASP A 108 38.819 28.411 36.060 1.00 19.03 O +ATOM 829 CB ASP A 108 40.476 28.581 33.888 1.00 20.31 C +ATOM 830 CG ASP A 108 41.512 28.141 32.879 1.00 31.95 C +ATOM 831 OD1 ASP A 108 41.524 27.002 32.378 1.00 27.50 O +ATOM 832 OD2 ASP A 108 42.417 28.949 32.562 1.00 37.06 O +ATOM 833 N SER A 109 37.106 27.475 35.005 1.00 16.42 N +ATOM 834 CA SER A 109 36.157 27.813 36.085 1.00 15.76 C +ATOM 835 C SER A 109 36.533 27.163 37.401 1.00 23.18 C +ATOM 836 O SER A 109 36.375 27.748 38.443 1.00 20.19 O +ATOM 837 CB SER A 109 34.769 27.300 35.699 1.00 17.64 C +ATOM 838 OG SER A 109 34.258 28.056 34.592 1.00 16.69 O +ATOM 839 N VAL A 110 37.054 25.943 37.346 1.00 17.60 N +ATOM 840 CA VAL A 110 37.518 25.190 38.540 1.00 17.81 C +ATOM 841 C VAL A 110 38.849 24.546 38.127 1.00 18.62 C +ATOM 842 O VAL A 110 38.871 23.854 37.078 1.00 21.11 O +ATOM 843 CB VAL A 110 36.497 24.108 38.922 1.00 16.72 C +ATOM 844 CG1 VAL A 110 37.134 23.154 39.923 1.00 19.86 C +ATOM 845 CG2 VAL A 110 35.261 24.760 39.594 1.00 18.79 C +ATOM 846 N LYS A 111 39.874 24.803 38.922 1.00 19.30 N +ATOM 847 CA LYS A 111 41.195 24.251 38.709 1.00 22.20 C +ATOM 848 C 
LYS A 111 41.259 22.816 39.226 1.00 19.19 C +ATOM 849 O LYS A 111 40.748 22.513 40.299 1.00 19.66 O +ATOM 850 CB LYS A 111 42.259 25.129 39.349 1.00 23.71 C +ATOM 851 CG LYS A 111 42.415 26.490 38.690 1.00 31.49 C +ATOM 852 CD LYS A 111 43.410 27.362 39.463 1.00 40.98 C +ATOM 853 CE LYS A 111 44.019 28.405 38.532 1.00 53.83 C +ATOM 854 NZ LYS A 111 44.793 29.408 39.330 1.00 65.47 N +ATOM 855 N VAL A 112 41.812 21.916 38.421 1.00 17.94 N +ATOM 856 CA VAL A 112 41.903 20.519 38.806 1.00 16.78 C +ATOM 857 C VAL A 112 43.299 19.989 38.616 1.00 17.36 C +ATOM 858 O VAL A 112 44.029 20.276 37.662 1.00 18.90 O +ATOM 859 CB VAL A 112 40.897 19.671 38.014 1.00 20.69 C +ATOM 860 CG1 VAL A 112 40.919 18.212 38.402 1.00 23.90 C +ATOM 861 CG2 VAL A 112 39.465 20.207 38.216 1.00 19.70 C +ATOM 862 N THR A 113 43.736 19.230 39.637 1.00 17.62 N +ATOM 863 CA THR A 113 45.012 18.527 39.621 1.00 18.42 C +ATOM 864 C THR A 113 44.752 17.093 40.065 1.00 18.50 C +ATOM 865 O THR A 113 43.732 16.722 40.600 1.00 18.80 O +ATOM 866 CB THR A 113 46.041 19.172 40.568 1.00 17.20 C +ATOM 867 OG1 THR A 113 45.528 19.160 41.895 1.00 21.36 O +ATOM 868 CG2 THR A 113 46.514 20.528 40.137 1.00 18.33 C +ATOM 869 N GLN A 114 45.723 16.181 39.817 1.00 18.49 N +ATOM 870 CA GLN A 114 45.621 14.808 40.236 1.00 19.81 C +ATOM 871 C GLN A 114 45.623 14.682 41.747 1.00 21.42 C +ATOM 872 O GLN A 114 46.592 15.147 42.370 1.00 21.73 O +ATOM 873 CB GLN A 114 46.736 13.900 39.619 1.00 19.74 C +ATOM 874 CG GLN A 114 46.519 12.460 40.066 1.00 23.36 C +ATOM 875 CD GLN A 114 47.675 11.590 39.522 1.00 30.04 C +ATOM 876 OE1 GLN A 114 47.522 11.129 38.385 1.00 34.95 O +ATOM 877 NE2 GLN A 114 48.709 11.348 40.312 1.00 30.98 N +ATOM 878 N LEU A 115 44.551 14.157 42.323 1.00 17.79 N +ATOM 879 CA LEU A 115 44.540 14.054 43.775 1.00 18.98 C +ATOM 880 C LEU A 115 45.470 12.999 44.352 1.00 20.71 C +ATOM 881 O LEU A 115 46.105 13.312 45.375 1.00 22.95 O +ATOM 882 CB LEU A 115 43.102 13.781 44.193 1.00 20.52 C +ATOM 883 CG LEU A 115 
42.856 13.451 45.674 1.00 21.76 C +ATOM 884 CD1 LEU A 115 43.230 14.622 46.565 1.00 22.92 C +ATOM 885 CD2 LEU A 115 41.373 13.096 45.876 1.00 23.98 C +ATOM 886 N ASP A 116 45.554 11.834 43.778 1.00 22.36 N +ATOM 887 CA ASP A 116 46.322 10.717 44.382 1.00 21.96 C +ATOM 888 C ASP A 116 46.612 9.665 43.353 1.00 22.42 C +ATOM 889 O ASP A 116 45.667 9.190 42.720 1.00 22.26 O +ATOM 890 CB ASP A 116 45.444 10.169 45.492 1.00 22.03 C +ATOM 891 CG ASP A 116 45.935 8.970 46.258 1.00 37.61 C +ATOM 892 OD1 ASP A 116 47.036 8.486 46.017 1.00 31.82 O +ATOM 893 OD2 ASP A 116 45.104 8.546 47.100 1.00 34.08 O +ATOM 894 N GLU A 117 47.885 9.260 43.248 1.00 21.97 N +ATOM 895 CA GLU A 117 48.150 8.227 42.242 1.00 22.57 C +ATOM 896 C GLU A 117 47.382 6.926 42.539 1.00 19.69 C +ATOM 897 O GLU A 117 47.075 6.273 41.523 1.00 23.76 O +ATOM 898 CB AGLU A 117 49.667 8.024 42.207 0.50 20.33 C +ATOM 899 CG AGLU A 117 50.145 7.395 43.502 0.50 22.54 C +ATOM 900 CD AGLU A 117 51.678 7.244 43.451 0.50 27.38 C +ATOM 901 OE1AGLU A 117 52.111 6.693 44.477 0.50 27.76 O +ATOM 902 OE2AGLU A 117 52.280 7.663 42.445 0.50 24.34 O +ATOM 903 CB BGLU A 117 49.659 7.913 42.193 0.50 20.33 C +ATOM 904 CG BGLU A 117 50.029 6.865 41.140 0.50 22.54 C +ATOM 905 CD BGLU A 117 51.525 6.550 41.108 0.50 27.38 C +ATOM 906 OE1BGLU A 117 52.329 7.156 41.914 0.50 27.76 O +ATOM 907 OE2BGLU A 117 51.983 5.679 40.274 0.50 24.34 O +ATOM 908 N GLU A 118 46.942 6.606 43.744 1.00 22.75 N +ATOM 909 CA GLU A 118 46.207 5.418 44.079 1.00 23.33 C +ATOM 910 C GLU A 118 44.777 5.458 43.540 1.00 20.88 C +ATOM 911 O GLU A 118 44.105 4.445 43.363 1.00 24.03 O +ATOM 912 CB GLU A 118 46.086 5.149 45.602 1.00 26.55 C +ATOM 913 CG GLU A 118 47.470 5.119 46.251 1.00 34.49 C +ATOM 914 CD GLU A 118 47.549 4.286 47.506 1.00 50.08 C +ATOM 915 OE1 GLU A 118 46.523 4.150 48.199 1.00 46.71 O +ATOM 916 OE2 GLU A 118 48.672 3.783 47.746 1.00 52.37 O +ATOM 917 N LEU A 119 44.346 6.697 43.184 1.00 19.99 N +ATOM 918 CA LEU A 119 43.009 6.859 42.612 1.00 
23.30 C +ATOM 919 C LEU A 119 42.981 6.977 41.086 1.00 20.36 C +ATOM 920 O LEU A 119 41.892 6.932 40.478 1.00 21.08 O +ATOM 921 CB LEU A 119 42.352 8.150 43.180 1.00 22.88 C +ATOM 922 CG LEU A 119 42.095 8.077 44.694 1.00 23.27 C +ATOM 923 CD1 LEU A 119 41.515 9.438 45.156 1.00 23.63 C +ATOM 924 CD2 LEU A 119 41.057 6.998 44.988 1.00 28.21 C +ATOM 925 N GLY A 120 44.122 7.172 40.488 1.00 20.92 N +ATOM 926 CA GLY A 120 44.136 7.306 39.016 1.00 19.98 C +ATOM 927 C GLY A 120 43.724 8.759 38.692 1.00 18.06 C +ATOM 928 O GLY A 120 44.182 9.750 39.242 1.00 19.89 O +ATOM 929 N HIS A 121 42.912 8.809 37.614 1.00 19.35 N +ATOM 930 CA HIS A 121 42.480 10.090 37.076 1.00 19.51 C +ATOM 931 C HIS A 121 41.331 10.723 37.832 1.00 18.13 C +ATOM 932 O HIS A 121 40.251 10.957 37.270 1.00 20.20 O +ATOM 933 CB HIS A 121 42.025 9.835 35.633 1.00 20.10 C +ATOM 934 CG HIS A 121 43.157 9.769 34.665 1.00 22.97 C +ATOM 935 ND1 HIS A 121 43.423 10.650 33.662 1.00 21.90 N +ATOM 936 CD2 HIS A 121 44.177 8.871 34.630 1.00 28.00 C +ATOM 937 CE1 HIS A 121 44.511 10.297 32.993 1.00 25.73 C +ATOM 938 NE2 HIS A 121 44.961 9.191 33.549 1.00 26.49 N +ATOM 939 N VAL A 122 41.477 10.828 39.153 1.00 16.81 N +ATOM 940 CA VAL A 122 40.545 11.560 40.040 1.00 17.41 C +ATOM 941 C VAL A 122 41.152 12.896 40.348 1.00 18.40 C +ATOM 942 O VAL A 122 42.333 13.070 40.696 1.00 19.02 O +ATOM 943 CB VAL A 122 40.299 10.774 41.319 1.00 19.66 C +ATOM 944 CG1 VAL A 122 39.546 11.593 42.365 1.00 19.82 C +ATOM 945 CG2 VAL A 122 39.567 9.458 41.001 1.00 19.14 C +ATOM 946 N GLY A 123 40.324 13.964 40.151 1.00 18.39 N +ATOM 947 CA GLY A 123 40.842 15.291 40.410 1.00 18.58 C +ATOM 948 C GLY A 123 40.553 15.880 41.782 1.00 15.78 C +ATOM 949 O GLY A 123 39.528 15.584 42.347 1.00 18.28 O +ATOM 950 N LEU A 124 41.456 16.735 42.189 1.00 17.60 N +ATOM 951 CA LEU A 124 41.250 17.610 43.345 1.00 18.16 C +ATOM 952 C LEU A 124 40.830 18.923 42.711 1.00 17.27 C +ATOM 953 O LEU A 124 41.560 19.573 41.915 1.00 16.98 O +ATOM 954 CB LEU A 
124 42.619 17.795 44.034 1.00 21.14 C +ATOM 955 CG LEU A 124 42.676 18.870 45.121 1.00 21.46 C +ATOM 956 CD1 LEU A 124 41.631 18.685 46.242 1.00 20.89 C +ATOM 957 CD2 LEU A 124 44.098 18.949 45.704 1.00 20.48 C +ATOM 958 N ALA A 125 39.631 19.372 43.086 1.00 17.16 N +ATOM 959 CA ALA A 125 39.057 20.603 42.583 1.00 19.86 C +ATOM 960 C ALA A 125 39.394 21.770 43.514 1.00 20.06 C +ATOM 961 O ALA A 125 39.081 21.692 44.708 1.00 22.93 O +ATOM 962 CB ALA A 125 37.561 20.401 42.407 1.00 19.91 C +ATOM 963 N GLN A 126 39.757 22.896 42.955 1.00 17.57 N +ATOM 964 CA GLN A 126 40.018 24.117 43.725 1.00 18.19 C +ATOM 965 C GLN A 126 39.423 25.297 42.947 1.00 19.57 C +ATOM 966 O GLN A 126 39.184 25.193 41.713 1.00 19.29 O +ATOM 967 CB GLN A 126 41.495 24.293 44.071 1.00 20.63 C +ATOM 968 CG GLN A 126 41.871 23.107 45.008 1.00 25.04 C +ATOM 969 CD GLN A 126 43.252 23.313 45.595 1.00 22.21 C +ATOM 970 OE1 GLN A 126 43.429 24.049 46.573 1.00 25.89 O +ATOM 971 NE2 GLN A 126 44.216 22.528 45.074 1.00 21.53 N +ATOM 972 N PRO A 127 39.213 26.452 43.541 1.00 18.85 N +ATOM 973 CA PRO A 127 38.546 27.557 42.862 1.00 20.24 C +ATOM 974 C PRO A 127 39.338 28.001 41.654 1.00 20.60 C +ATOM 975 O PRO A 127 40.549 28.036 41.659 1.00 21.32 O +ATOM 976 CB PRO A 127 38.475 28.679 43.916 1.00 20.14 C +ATOM 977 CG PRO A 127 38.522 27.915 45.222 1.00 22.93 C +ATOM 978 CD PRO A 127 39.389 26.691 45.001 1.00 19.51 C +ATOM 979 N GLY A 128 38.596 28.441 40.625 1.00 19.42 N +ATOM 980 CA GLY A 128 39.224 28.984 39.429 1.00 18.28 C +ATOM 981 C GLY A 128 38.748 30.392 39.105 1.00 19.90 C +ATOM 982 O GLY A 128 38.613 31.224 40.008 1.00 20.93 O +ATOM 983 N SER A 129 38.503 30.655 37.826 1.00 16.97 N +ATOM 984 CA SER A 129 38.053 32.006 37.421 1.00 20.17 C +ATOM 985 C SER A 129 36.579 32.134 37.187 1.00 18.96 C +ATOM 986 O SER A 129 36.085 31.269 36.450 1.00 19.10 O +ATOM 987 CB SER A 129 38.729 32.335 36.093 1.00 19.49 C +ATOM 988 OG SER A 129 38.127 33.509 35.533 1.00 20.70 O +ATOM 989 N PRO A 130 35.846 
33.098 37.696 1.00 17.15 N +ATOM 990 CA PRO A 130 34.445 33.269 37.512 1.00 18.23 C +ATOM 991 C PRO A 130 34.093 34.020 36.222 1.00 17.68 C +ATOM 992 O PRO A 130 32.882 34.181 36.033 1.00 18.98 O +ATOM 993 CB PRO A 130 33.989 34.043 38.779 1.00 18.97 C +ATOM 994 CG PRO A 130 35.164 34.993 38.904 1.00 20.12 C +ATOM 995 CD PRO A 130 36.446 34.172 38.601 1.00 20.65 C +ATOM 996 N LYS A 131 35.114 34.380 35.459 1.00 18.39 N +ATOM 997 CA LYS A 131 34.749 35.352 34.331 1.00 18.79 C +ATOM 998 C LYS A 131 33.785 34.743 33.318 1.00 19.06 C +ATOM 999 O LYS A 131 32.836 35.413 32.959 1.00 19.72 O +ATOM 1000 CB LYS A 131 36.036 35.866 33.646 1.00 20.11 C +ATOM 1001 CG LYS A 131 36.666 36.926 34.562 1.00 31.64 C +ATOM 1002 CD LYS A 131 37.892 37.559 33.929 1.00 34.50 C +ATOM 1003 CE LYS A 131 38.755 38.253 34.984 1.00 50.38 C +ATOM 1004 NZ LYS A 131 39.939 38.954 34.412 1.00 51.68 N +ATOM 1005 N LEU A 132 34.070 33.536 32.847 1.00 18.37 N +ATOM 1006 CA LEU A 132 33.172 32.976 31.841 1.00 16.75 C +ATOM 1007 C LEU A 132 31.773 32.777 32.330 1.00 16.90 C +ATOM 1008 O LEU A 132 30.762 33.234 31.757 1.00 18.46 O +ATOM 1009 CB LEU A 132 33.724 31.637 31.314 1.00 17.66 C +ATOM 1010 CG LEU A 132 32.760 30.863 30.387 1.00 19.89 C +ATOM 1011 CD1 LEU A 132 32.512 31.630 29.067 1.00 19.55 C +ATOM 1012 CD2 LEU A 132 33.337 29.477 30.091 1.00 22.04 C +ATOM 1013 N ILE A 133 31.593 32.149 33.526 1.00 17.16 N +ATOM 1014 CA ILE A 133 30.236 31.920 34.028 1.00 18.53 C +ATOM 1015 C ILE A 133 29.514 33.216 34.408 1.00 16.16 C +ATOM 1016 O ILE A 133 28.324 33.281 34.092 1.00 18.92 O +ATOM 1017 CB ILE A 133 30.297 30.904 35.187 1.00 18.42 C +ATOM 1018 CG1 ILE A 133 30.565 29.518 34.575 1.00 16.82 C +ATOM 1019 CG2 ILE A 133 29.035 30.898 36.030 1.00 17.89 C +ATOM 1020 CD1 ILE A 133 30.931 28.512 35.682 1.00 19.15 C +ATOM 1021 N ASN A 134 30.267 34.157 34.983 1.00 16.89 N +ATOM 1022 CA ASN A 134 29.589 35.479 35.254 1.00 20.08 C +ATOM 1023 C ASN A 134 29.071 36.099 33.952 1.00 18.98 C +ATOM 1024 O ASN A 
134 27.989 36.683 33.992 1.00 20.74 O +ATOM 1025 CB ASN A 134 30.513 36.434 35.980 1.00 21.26 C +ATOM 1026 CG ASN A 134 30.637 36.077 37.480 1.00 19.05 C +ATOM 1027 OD1 ASN A 134 29.936 35.268 38.011 1.00 23.62 O +ATOM 1028 ND2 ASN A 134 31.624 36.772 38.009 1.00 25.64 N +ATOM 1029 N SER A 135 29.877 36.005 32.916 1.00 20.09 N +ATOM 1030 CA SER A 135 29.432 36.538 31.608 1.00 21.19 C +ATOM 1031 C SER A 135 28.203 35.805 31.123 1.00 23.28 C +ATOM 1032 O SER A 135 27.275 36.459 30.614 1.00 22.91 O +ATOM 1033 CB SER A 135 30.537 36.373 30.565 1.00 22.99 C +ATOM 1034 OG SER A 135 30.031 36.957 29.339 1.00 28.84 O +ATOM 1035 N LEU A 136 28.080 34.482 31.193 1.00 17.47 N +ATOM 1036 CA LEU A 136 26.941 33.720 30.758 1.00 18.91 C +ATOM 1037 C LEU A 136 25.789 34.123 31.576 1.00 19.41 C +ATOM 1038 O LEU A 136 24.655 34.323 31.108 1.00 20.72 O +ATOM 1039 CB LEU A 136 27.178 32.207 30.934 1.00 20.22 C +ATOM 1040 CG LEU A 136 28.199 31.731 29.888 1.00 18.06 C +ATOM 1041 CD1 LEU A 136 28.665 30.342 30.319 1.00 19.84 C +ATOM 1042 CD2 LEU A 136 27.653 31.726 28.462 1.00 20.16 C +ATOM 1043 N LEU A 137 25.941 34.286 32.935 1.00 18.74 N +ATOM 1044 CA LEU A 137 24.842 34.670 33.822 1.00 20.50 C +ATOM 1045 C LEU A 137 24.294 36.087 33.465 1.00 19.17 C +ATOM 1046 O LEU A 137 23.043 36.231 33.464 1.00 21.84 O +ATOM 1047 CB LEU A 137 25.251 34.589 35.317 1.00 21.04 C +ATOM 1048 CG LEU A 137 25.541 33.169 35.818 1.00 19.31 C +ATOM 1049 CD1 LEU A 137 26.078 33.228 37.256 1.00 19.98 C +ATOM 1050 CD2 LEU A 137 24.325 32.284 35.832 1.00 18.67 C +ATOM 1051 N GLU A 138 25.241 36.973 33.259 1.00 20.77 N +ATOM 1052 CA GLU A 138 24.759 38.346 32.940 1.00 25.11 C +ATOM 1053 C GLU A 138 24.035 38.377 31.618 1.00 24.64 C +ATOM 1054 O GLU A 138 23.204 39.278 31.426 1.00 27.43 O +ATOM 1055 CB AGLU A 138 25.966 39.235 32.903 0.50 16.72 C +ATOM 1056 CG AGLU A 138 26.649 39.458 34.244 0.50 14.07 C +ATOM 1057 CD AGLU A 138 26.045 40.694 34.905 0.50 30.77 C +ATOM 1058 OE1AGLU A 138 24.980 41.193 34.490 0.50 
36.40 O +ATOM 1059 OE2AGLU A 138 26.711 41.137 35.861 0.50 37.97 O +ATOM 1060 CB BGLU A 138 25.958 39.303 32.895 0.50 16.72 C +ATOM 1061 CG BGLU A 138 26.396 39.799 34.273 0.50 14.07 C +ATOM 1062 CD BGLU A 138 27.914 39.781 34.460 0.50 30.77 C +ATOM 1063 OE1BGLU A 138 28.687 40.105 33.479 0.50 36.40 O +ATOM 1064 OE2BGLU A 138 28.420 39.443 35.597 0.50 37.97 O +ATOM 1065 N ASN A 139 24.281 37.429 30.746 1.00 22.95 N +ATOM 1066 CA ASN A 139 23.623 37.407 29.424 1.00 21.05 C +ATOM 1067 C ASN A 139 22.377 36.551 29.482 1.00 25.33 C +ATOM 1068 O ASN A 139 21.812 36.300 28.389 1.00 30.00 O +ATOM 1069 CB ASN A 139 24.545 36.944 28.340 1.00 22.94 C +ATOM 1070 CG ASN A 139 25.598 37.827 27.767 1.00 33.22 C +ATOM 1071 OD1 ASN A 139 26.724 37.398 27.518 1.00 43.44 O +ATOM 1072 ND2 ASN A 139 25.184 39.053 27.450 1.00 34.44 N +ATOM 1073 N GLY A 140 21.966 36.018 30.605 1.00 22.58 N +ATOM 1074 CA GLY A 140 20.723 35.310 30.833 1.00 26.72 C +ATOM 1075 C GLY A 140 20.736 33.816 30.573 1.00 26.89 C +ATOM 1076 O GLY A 140 19.660 33.196 30.534 1.00 30.47 O +ATOM 1077 N TYR A 141 21.883 33.173 30.538 1.00 21.40 N +ATOM 1078 CA TYR A 141 21.928 31.723 30.357 1.00 19.54 C +ATOM 1079 C TYR A 141 22.007 30.962 31.703 1.00 19.64 C +ATOM 1080 O TYR A 141 22.500 31.617 32.660 1.00 22.31 O +ATOM 1081 CB TYR A 141 23.267 31.466 29.594 1.00 18.24 C +ATOM 1082 CG TYR A 141 23.318 31.993 28.184 1.00 18.32 C +ATOM 1083 CD1 TYR A 141 24.084 33.089 27.850 1.00 21.35 C +ATOM 1084 CD2 TYR A 141 22.555 31.376 27.173 1.00 18.86 C +ATOM 1085 CE1 TYR A 141 24.125 33.642 26.566 1.00 18.44 C +ATOM 1086 CE2 TYR A 141 22.619 31.873 25.882 1.00 20.75 C +ATOM 1087 CZ TYR A 141 23.375 33.011 25.583 1.00 20.47 C +ATOM 1088 OH TYR A 141 23.385 33.457 24.266 1.00 25.00 O +ATOM 1089 N LEU A 142 21.490 29.756 31.685 1.00 18.25 N +ATOM 1090 CA LEU A 142 21.695 28.862 32.840 1.00 18.84 C +ATOM 1091 C LEU A 142 22.883 27.912 32.546 1.00 16.76 C +ATOM 1092 O LEU A 142 22.733 27.008 31.753 1.00 17.14 O +ATOM 1093 CB LEU A 
142 20.383 28.042 32.960 1.00 18.94 C +ATOM 1094 CG LEU A 142 20.438 26.916 34.000 1.00 33.32 C +ATOM 1095 CD1 LEU A 142 20.637 27.627 35.327 1.00 28.42 C +ATOM 1096 CD2 LEU A 142 19.259 25.945 34.067 1.00 25.81 C +ATOM 1097 N PRO A 143 23.983 28.114 33.269 1.00 15.95 N +ATOM 1098 CA PRO A 143 25.122 27.197 33.086 1.00 14.85 C +ATOM 1099 C PRO A 143 24.764 25.837 33.682 1.00 16.66 C +ATOM 1100 O PRO A 143 24.282 25.830 34.863 1.00 18.52 O +ATOM 1101 CB PRO A 143 26.283 27.905 33.761 1.00 17.00 C +ATOM 1102 CG PRO A 143 25.865 29.340 33.887 1.00 18.22 C +ATOM 1103 CD PRO A 143 24.358 29.261 34.124 1.00 19.09 C +ATOM 1104 N VAL A 144 25.109 24.757 33.053 1.00 15.61 N +ATOM 1105 CA VAL A 144 24.865 23.383 33.565 1.00 15.38 C +ATOM 1106 C VAL A 144 26.233 22.685 33.490 1.00 14.88 C +ATOM 1107 O VAL A 144 26.681 22.406 32.359 1.00 14.95 O +ATOM 1108 CB VAL A 144 23.755 22.660 32.785 1.00 14.24 C +ATOM 1109 CG1 VAL A 144 23.623 21.215 33.237 1.00 18.72 C +ATOM 1110 CG2 VAL A 144 22.421 23.454 32.828 1.00 16.72 C +ATOM 1111 N VAL A 145 26.875 22.466 34.648 1.00 16.06 N +ATOM 1112 CA VAL A 145 28.289 22.141 34.679 1.00 15.07 C +ATOM 1113 C VAL A 145 28.519 20.734 35.205 1.00 15.43 C +ATOM 1114 O VAL A 145 28.057 20.342 36.284 1.00 15.96 O +ATOM 1115 CB VAL A 145 28.988 23.150 35.628 1.00 15.33 C +ATOM 1116 CG1 VAL A 145 30.483 22.984 35.587 1.00 17.93 C +ATOM 1117 CG2 VAL A 145 28.617 24.596 35.315 1.00 17.57 C +ATOM 1118 N SER A 146 29.181 19.908 34.397 1.00 15.38 N +ATOM 1119 CA SER A 146 29.575 18.572 34.813 1.00 15.53 C +ATOM 1120 C SER A 146 30.824 18.597 35.649 1.00 14.99 C +ATOM 1121 O SER A 146 31.514 19.579 35.829 1.00 17.62 O +ATOM 1122 CB SER A 146 29.827 17.700 33.541 1.00 15.84 C +ATOM 1123 OG SER A 146 31.050 18.103 32.947 1.00 17.10 O +ATOM 1124 N SER A 147 31.111 17.396 36.248 1.00 17.34 N +ATOM 1125 CA SER A 147 32.199 17.322 37.216 1.00 16.20 C +ATOM 1126 C SER A 147 33.438 16.682 36.642 1.00 19.72 C +ATOM 1127 O SER A 147 34.342 16.199 37.410 1.00 19.25 
O +ATOM 1128 CB SER A 147 31.737 16.617 38.499 1.00 19.79 C +ATOM 1129 OG SER A 147 31.525 15.249 38.304 1.00 20.35 O +ATOM 1130 N ILE A 148 33.558 16.703 35.301 1.00 15.11 N +ATOM 1131 CA ILE A 148 34.843 16.327 34.681 1.00 15.13 C +ATOM 1132 C ILE A 148 35.666 17.625 34.572 1.00 15.94 C +ATOM 1133 O ILE A 148 35.111 18.677 34.282 1.00 16.72 O +ATOM 1134 CB ILE A 148 34.629 15.798 33.254 1.00 15.64 C +ATOM 1135 CG1 ILE A 148 33.796 14.499 33.314 1.00 17.45 C +ATOM 1136 CG2 ILE A 148 35.912 15.431 32.513 1.00 18.56 C +ATOM 1137 CD1 ILE A 148 34.418 13.394 34.194 1.00 18.35 C +ATOM 1138 N GLY A 149 37.009 17.558 34.817 1.00 16.99 N +ATOM 1139 CA GLY A 149 37.859 18.703 34.616 1.00 17.15 C +ATOM 1140 C GLY A 149 39.066 18.222 33.785 1.00 17.07 C +ATOM 1141 O GLY A 149 39.097 17.078 33.298 1.00 18.12 O +ATOM 1142 N VAL A 150 40.055 19.126 33.766 1.00 16.09 N +ATOM 1143 CA VAL A 150 41.267 18.783 33.007 1.00 17.51 C +ATOM 1144 C VAL A 150 42.439 19.570 33.666 1.00 18.83 C +ATOM 1145 O VAL A 150 42.312 20.650 34.152 1.00 20.84 O +ATOM 1146 CB VAL A 150 41.102 19.148 31.524 1.00 18.07 C +ATOM 1147 CG1 VAL A 150 40.886 20.657 31.299 1.00 19.07 C +ATOM 1148 CG2 VAL A 150 42.277 18.674 30.676 1.00 21.91 C +ATOM 1149 N THR A 151 43.550 18.799 33.708 1.00 17.37 N +ATOM 1150 CA THR A 151 44.759 19.428 34.266 1.00 22.13 C +ATOM 1151 C THR A 151 45.428 20.307 33.214 1.00 22.89 C +ATOM 1152 O THR A 151 45.164 20.252 31.997 1.00 20.16 O +ATOM 1153 CB THR A 151 45.812 18.372 34.700 1.00 17.76 C +ATOM 1154 OG1 THR A 151 46.312 17.798 33.463 1.00 21.16 O +ATOM 1155 CG2 THR A 151 45.267 17.284 35.584 1.00 18.01 C +ATOM 1156 N ASP A 152 46.325 21.157 33.686 1.00 21.72 N +ATOM 1157 CA ASP A 152 47.069 22.034 32.810 1.00 19.31 C +ATOM 1158 C ASP A 152 47.880 21.244 31.795 1.00 22.62 C +ATOM 1159 O ASP A 152 48.147 21.788 30.703 1.00 26.08 O +ATOM 1160 CB ASP A 152 48.084 22.856 33.650 1.00 28.17 C +ATOM 1161 CG ASP A 152 47.370 23.951 34.411 1.00 33.25 C +ATOM 1162 OD1 ASP A 152 46.251 
24.391 34.101 1.00 34.58 O +ATOM 1163 OD2 ASP A 152 48.018 24.434 35.379 1.00 43.27 O +ATOM 1164 N GLU A 153 48.178 19.991 32.050 1.00 22.54 N +ATOM 1165 CA GLU A 153 48.943 19.212 31.104 1.00 24.72 C +ATOM 1166 C GLU A 153 48.094 18.472 30.101 1.00 26.38 C +ATOM 1167 O GLU A 153 48.515 17.732 29.190 1.00 26.57 O +ATOM 1168 CB GLU A 153 49.876 18.236 31.834 1.00 26.98 C +ATOM 1169 CG GLU A 153 50.951 18.975 32.642 1.00 31.49 C +ATOM 1170 CD GLU A 153 50.407 19.494 33.957 1.00 34.83 C +ATOM 1171 OE1 GLU A 153 50.990 20.472 34.490 1.00 39.32 O +ATOM 1172 OE2 GLU A 153 49.419 18.970 34.540 1.00 28.93 O +ATOM 1173 N GLY A 154 46.773 18.691 30.270 1.00 22.47 N +ATOM 1174 CA GLY A 154 45.858 18.060 29.326 1.00 22.04 C +ATOM 1175 C GLY A 154 45.266 16.729 29.708 1.00 18.10 C +ATOM 1176 O GLY A 154 44.835 16.018 28.797 1.00 21.16 O +ATOM 1177 N GLN A 155 45.309 16.262 30.975 1.00 18.20 N +ATOM 1178 CA GLN A 155 44.726 14.985 31.327 1.00 17.93 C +ATOM 1179 C GLN A 155 43.309 15.228 31.950 1.00 17.93 C +ATOM 1180 O GLN A 155 43.132 16.069 32.841 1.00 19.17 O +ATOM 1181 CB GLN A 155 45.593 14.317 32.425 1.00 21.63 C +ATOM 1182 CG GLN A 155 46.964 13.868 31.829 1.00 24.32 C +ATOM 1183 CD GLN A 155 46.736 12.854 30.747 1.00 29.86 C +ATOM 1184 OE1 GLN A 155 45.991 11.856 30.837 1.00 34.41 O +ATOM 1185 NE2 GLN A 155 47.414 13.046 29.607 1.00 34.32 N +ATOM 1186 N LEU A 156 42.391 14.465 31.379 1.00 19.18 N +ATOM 1187 CA LEU A 156 41.013 14.552 31.893 1.00 18.32 C +ATOM 1188 C LEU A 156 41.018 13.962 33.277 1.00 20.20 C +ATOM 1189 O LEU A 156 41.679 12.989 33.643 1.00 20.22 O +ATOM 1190 CB LEU A 156 40.053 13.771 30.978 1.00 17.71 C +ATOM 1191 CG LEU A 156 39.888 14.494 29.640 1.00 19.37 C +ATOM 1192 CD1 LEU A 156 39.128 13.607 28.653 1.00 19.41 C +ATOM 1193 CD2 LEU A 156 39.096 15.818 29.752 1.00 19.86 C +ATOM 1194 N MET A 157 40.121 14.535 34.140 1.00 18.73 N +ATOM 1195 CA MET A 157 40.022 14.138 35.551 1.00 17.77 C +ATOM 1196 C MET A 157 38.554 13.990 35.921 1.00 16.93 C +ATOM 
1197 O MET A 157 37.697 14.874 35.669 1.00 20.49 O +ATOM 1198 CB MET A 157 40.638 15.250 36.437 1.00 19.23 C +ATOM 1199 CG MET A 157 42.170 15.247 36.361 1.00 23.61 C +ATOM 1200 SD MET A 157 42.955 13.816 37.252 1.00 22.97 S +ATOM 1201 CE MET A 157 44.293 13.487 36.102 1.00 33.32 C +ATOM 1202 N ASN A 158 38.275 12.973 36.686 1.00 17.01 N +ATOM 1203 CA ASN A 158 36.951 12.724 37.251 1.00 16.18 C +ATOM 1204 C ASN A 158 36.966 13.348 38.626 1.00 18.66 C +ATOM 1205 O ASN A 158 37.732 12.971 39.518 1.00 18.46 O +ATOM 1206 CB ASN A 158 36.739 11.209 37.326 1.00 18.94 C +ATOM 1207 CG ASN A 158 35.444 10.769 37.912 1.00 21.14 C +ATOM 1208 OD1 ASN A 158 34.542 11.654 38.074 1.00 20.53 O +ATOM 1209 ND2 ASN A 158 35.218 9.521 38.307 1.00 21.26 N +ATOM 1210 N VAL A 159 36.110 14.329 38.850 1.00 17.19 N +ATOM 1211 CA VAL A 159 35.969 14.999 40.169 1.00 16.69 C +ATOM 1212 C VAL A 159 34.671 14.627 40.827 1.00 17.08 C +ATOM 1213 O VAL A 159 33.596 14.628 40.180 1.00 19.35 O +ATOM 1214 CB VAL A 159 36.046 16.517 40.000 1.00 16.63 C +ATOM 1215 CG1 VAL A 159 36.031 17.251 41.382 1.00 17.35 C +ATOM 1216 CG2 VAL A 159 37.324 16.927 39.294 1.00 18.90 C +ATOM 1217 N ASN A 160 34.698 14.285 42.093 1.00 17.18 N +ATOM 1218 CA ASN A 160 33.389 14.005 42.755 1.00 16.43 C +ATOM 1219 C ASN A 160 32.546 15.308 42.626 1.00 19.55 C +ATOM 1220 O ASN A 160 33.050 16.391 42.851 1.00 17.32 O +ATOM 1221 CB ASN A 160 33.678 13.747 44.225 1.00 19.38 C +ATOM 1222 CG ASN A 160 32.435 13.793 45.159 1.00 20.71 C +ATOM 1223 OD1 ASN A 160 32.197 14.912 45.664 1.00 21.81 O +ATOM 1224 ND2 ASN A 160 31.873 12.595 45.241 1.00 25.77 N +ATOM 1225 N ALA A 161 31.243 15.161 42.337 1.00 17.72 N +ATOM 1226 CA ALA A 161 30.462 16.333 42.015 1.00 17.40 C +ATOM 1227 C ALA A 161 30.136 17.227 43.210 1.00 16.91 C +ATOM 1228 O ALA A 161 30.016 18.442 42.976 1.00 18.04 O +ATOM 1229 CB ALA A 161 29.181 15.902 41.281 1.00 19.02 C +ATOM 1230 N ASP A 162 30.110 16.695 44.433 1.00 17.55 N +ATOM 1231 CA ASP A 162 29.947 17.560 
45.581 1.00 17.61 C +ATOM 1232 C ASP A 162 31.155 18.476 45.769 1.00 16.85 C +ATOM 1233 O ASP A 162 31.049 19.653 46.024 1.00 18.90 O +ATOM 1234 CB ASP A 162 29.735 16.724 46.881 1.00 19.52 C +ATOM 1235 CG ASP A 162 28.471 15.933 46.912 1.00 22.84 C +ATOM 1236 OD1 ASP A 162 27.447 16.380 46.350 1.00 22.62 O +ATOM 1237 OD2 ASP A 162 28.460 14.830 47.495 1.00 22.68 O +ATOM 1238 N GLN A 163 32.378 17.895 45.588 1.00 17.99 N +ATOM 1239 CA GLN A 163 33.580 18.735 45.682 1.00 18.29 C +ATOM 1240 C GLN A 163 33.664 19.731 44.501 1.00 14.88 C +ATOM 1241 O GLN A 163 34.148 20.838 44.713 1.00 18.64 O +ATOM 1242 CB GLN A 163 34.800 17.776 45.577 1.00 18.14 C +ATOM 1243 CG GLN A 163 34.936 16.947 46.915 1.00 18.79 C +ATOM 1244 CD GLN A 163 36.062 15.916 46.851 1.00 19.44 C +ATOM 1245 OE1 GLN A 163 36.627 15.662 45.768 1.00 20.45 O +ATOM 1246 NE2 GLN A 163 36.323 15.241 47.938 1.00 24.56 N +ATOM 1247 N ALA A 164 33.220 19.291 43.320 1.00 15.89 N +ATOM 1248 CA ALA A 164 33.235 20.273 42.208 1.00 16.68 C +ATOM 1249 C ALA A 164 32.247 21.439 42.491 1.00 15.93 C +ATOM 1250 O ALA A 164 32.645 22.569 42.276 1.00 15.88 O +ATOM 1251 CB ALA A 164 32.821 19.622 40.905 1.00 19.00 C +ATOM 1252 N ALA A 165 31.098 21.090 43.058 1.00 15.34 N +ATOM 1253 CA ALA A 165 30.137 22.174 43.375 1.00 16.36 C +ATOM 1254 C ALA A 165 30.637 23.144 44.417 1.00 16.89 C +ATOM 1255 O ALA A 165 30.486 24.348 44.342 1.00 17.80 O +ATOM 1256 CB ALA A 165 28.858 21.470 43.848 1.00 17.75 C +ATOM 1257 N THR A 166 31.364 22.572 45.424 1.00 17.61 N +ATOM 1258 CA THR A 166 31.933 23.455 46.439 1.00 19.26 C +ATOM 1259 C THR A 166 32.978 24.369 45.858 1.00 17.12 C +ATOM 1260 O THR A 166 33.056 25.573 46.147 1.00 19.04 O +ATOM 1261 CB THR A 166 32.537 22.659 47.634 1.00 20.02 C +ATOM 1262 OG1 THR A 166 31.343 22.175 48.303 1.00 20.09 O +ATOM 1263 CG2 THR A 166 33.399 23.476 48.554 1.00 21.65 C +ATOM 1264 N ALA A 167 33.852 23.824 44.971 1.00 17.28 N +ATOM 1265 CA ALA A 167 34.868 24.660 44.365 1.00 17.51 C +ATOM 1266 C ALA 
A 167 34.242 25.762 43.488 1.00 15.61 C +ATOM 1267 O ALA A 167 34.754 26.883 43.504 1.00 17.29 O +ATOM 1268 CB ALA A 167 35.829 23.725 43.575 1.00 17.71 C +ATOM 1269 N LEU A 168 33.203 25.335 42.755 1.00 16.59 N +ATOM 1270 CA LEU A 168 32.541 26.398 41.939 1.00 17.54 C +ATOM 1271 C LEU A 168 31.810 27.427 42.819 1.00 17.01 C +ATOM 1272 O LEU A 168 31.882 28.611 42.463 1.00 18.26 O +ATOM 1273 CB LEU A 168 31.581 25.737 40.979 1.00 17.96 C +ATOM 1274 CG LEU A 168 31.023 26.748 39.942 1.00 17.08 C +ATOM 1275 CD1 LEU A 168 32.195 27.231 39.061 1.00 17.92 C +ATOM 1276 CD2 LEU A 168 29.982 26.087 39.049 1.00 19.51 C +ATOM 1277 N ALA A 169 31.284 26.997 43.984 1.00 17.63 N +ATOM 1278 CA ALA A 169 30.642 28.008 44.837 1.00 18.82 C +ATOM 1279 C ALA A 169 31.651 28.988 45.320 1.00 19.21 C +ATOM 1280 O ALA A 169 31.467 30.231 45.355 1.00 20.71 O +ATOM 1281 CB ALA A 169 30.020 27.251 46.043 1.00 18.23 C +ATOM 1282 N ALA A 170 32.897 28.532 45.677 1.00 17.83 N +ATOM 1283 CA ALA A 170 33.882 29.489 46.076 1.00 19.83 C +ATOM 1284 C ALA A 170 34.325 30.410 44.938 1.00 21.62 C +ATOM 1285 O ALA A 170 34.466 31.615 45.122 1.00 23.83 O +ATOM 1286 CB ALA A 170 35.135 28.717 46.588 1.00 19.84 C +ATOM 1287 N THR A 171 34.438 29.850 43.716 1.00 19.14 N +ATOM 1288 CA THR A 171 34.834 30.667 42.574 1.00 17.47 C +ATOM 1289 C THR A 171 33.797 31.793 42.295 1.00 19.67 C +ATOM 1290 O THR A 171 34.247 32.894 41.976 1.00 19.30 O +ATOM 1291 CB THR A 171 34.802 29.764 41.333 1.00 19.81 C +ATOM 1292 OG1 THR A 171 35.790 28.709 41.565 1.00 18.94 O +ATOM 1293 CG2 THR A 171 35.251 30.469 40.059 1.00 18.53 C +ATOM 1294 N LEU A 172 32.520 31.470 42.401 1.00 17.73 N +ATOM 1295 CA LEU A 172 31.485 32.481 42.041 1.00 17.18 C +ATOM 1296 C LEU A 172 30.969 33.225 43.251 1.00 20.83 C +ATOM 1297 O LEU A 172 30.145 34.155 43.039 1.00 22.31 O +ATOM 1298 CB LEU A 172 30.289 31.726 41.453 1.00 19.79 C +ATOM 1299 CG LEU A 172 30.527 30.913 40.209 1.00 17.36 C +ATOM 1300 CD1 LEU A 172 29.298 30.115 39.783 1.00 17.99 
C +ATOM 1301 CD2 LEU A 172 31.070 31.752 39.059 1.00 17.46 C +ATOM 1302 N GLY A 173 31.376 32.844 44.466 1.00 20.92 N +ATOM 1303 CA GLY A 173 30.757 33.509 45.652 1.00 21.75 C +ATOM 1304 C GLY A 173 29.295 33.094 45.730 1.00 22.21 C +ATOM 1305 O GLY A 173 28.407 33.879 46.172 1.00 24.06 O +ATOM 1306 N ALA A 174 28.879 31.890 45.360 1.00 19.28 N +ATOM 1307 CA ALA A 174 27.531 31.424 45.273 1.00 18.58 C +ATOM 1308 C ALA A 174 27.007 30.695 46.524 1.00 21.21 C +ATOM 1309 O ALA A 174 27.793 30.041 47.216 1.00 23.17 O +ATOM 1310 CB ALA A 174 27.389 30.396 44.101 1.00 21.89 C +ATOM 1311 N ASP A 175 25.687 30.865 46.728 1.00 20.01 N +ATOM 1312 CA ASP A 175 25.010 30.018 47.686 1.00 22.80 C +ATOM 1313 C ASP A 175 25.007 28.583 47.143 1.00 21.87 C +ATOM 1314 O ASP A 175 25.159 28.445 45.892 1.00 20.54 O +ATOM 1315 CB ASP A 175 23.561 30.485 47.793 1.00 25.57 C +ATOM 1316 CG ASP A 175 23.372 31.936 48.144 1.00 43.82 C +ATOM 1317 OD1 ASP A 175 24.113 32.521 48.948 1.00 28.18 O +ATOM 1318 OD2 ASP A 175 22.448 32.589 47.581 1.00 55.72 O +ATOM 1319 N LEU A 176 24.885 27.567 47.952 1.00 20.48 N +ATOM 1320 CA LEU A 176 24.878 26.212 47.475 1.00 19.26 C +ATOM 1321 C LEU A 176 23.838 25.328 48.100 1.00 17.62 C +ATOM 1322 O LEU A 176 23.691 25.300 49.369 1.00 21.35 O +ATOM 1323 CB LEU A 176 26.297 25.629 47.769 1.00 20.33 C +ATOM 1324 CG LEU A 176 26.534 24.145 47.482 1.00 17.72 C +ATOM 1325 CD1 LEU A 176 26.459 23.898 45.950 1.00 18.81 C +ATOM 1326 CD2 LEU A 176 27.969 23.760 47.956 1.00 19.88 C +ATOM 1327 N ILE A 177 23.164 24.529 47.337 1.00 18.99 N +ATOM 1328 CA ILE A 177 22.247 23.498 47.763 1.00 20.00 C +ATOM 1329 C ILE A 177 22.642 22.145 47.186 1.00 19.70 C +ATOM 1330 O ILE A 177 22.821 22.088 45.935 1.00 19.83 O +ATOM 1331 CB ILE A 177 20.763 23.774 47.358 1.00 20.59 C +ATOM 1332 CG1 ILE A 177 20.236 25.032 48.032 1.00 25.66 C +ATOM 1333 CG2 ILE A 177 19.929 22.535 47.725 1.00 28.06 C +ATOM 1334 CD1 ILE A 177 18.834 25.490 47.606 1.00 26.68 C +ATOM 1335 N LEU A 178 22.947 
21.105 47.892 1.00 17.69 N +ATOM 1336 CA LEU A 178 23.322 19.771 47.465 1.00 19.04 C +ATOM 1337 C LEU A 178 22.092 18.903 47.454 1.00 19.98 C +ATOM 1338 O LEU A 178 21.614 18.561 48.576 1.00 22.49 O +ATOM 1339 CB LEU A 178 24.461 19.195 48.339 1.00 19.93 C +ATOM 1340 CG LEU A 178 25.667 20.118 48.413 1.00 18.30 C +ATOM 1341 CD1 LEU A 178 26.710 19.591 49.432 1.00 23.64 C +ATOM 1342 CD2 LEU A 178 26.360 20.053 47.021 1.00 23.52 C +ATOM 1343 N LEU A 179 21.547 18.516 46.333 1.00 19.42 N +ATOM 1344 CA LEU A 179 20.364 17.693 46.267 1.00 17.95 C +ATOM 1345 C LEU A 179 20.666 16.224 46.043 1.00 22.44 C +ATOM 1346 O LEU A 179 21.365 15.939 45.003 1.00 27.29 O +ATOM 1347 CB LEU A 179 19.407 18.109 45.153 1.00 20.37 C +ATOM 1348 CG LEU A 179 18.745 19.470 45.269 1.00 27.94 C +ATOM 1349 CD1 LEU A 179 17.782 19.603 44.069 1.00 27.45 C +ATOM 1350 CD2 LEU A 179 17.932 19.584 46.560 1.00 26.32 C +ATOM 1351 N SER A 180 20.077 15.358 46.832 1.00 22.62 N +ATOM 1352 CA SER A 180 20.370 13.944 46.766 1.00 29.57 C +ATOM 1353 C SER A 180 19.088 13.111 46.878 1.00 25.08 C +ATOM 1354 O SER A 180 18.005 13.690 46.908 1.00 27.50 O +ATOM 1355 CB SER A 180 21.311 13.538 47.908 1.00 38.50 C +ATOM 1356 OG SER A 180 20.855 14.036 49.163 1.00 47.12 O +ATOM 1357 N ASP A 181 19.295 11.803 46.950 1.00 26.62 N +ATOM 1358 CA ASP A 181 18.152 10.899 46.989 1.00 29.14 C +ATOM 1359 C ASP A 181 17.654 10.702 48.421 1.00 31.25 C +ATOM 1360 O ASP A 181 16.669 9.993 48.634 1.00 37.68 O +ATOM 1361 CB AASP A 181 18.480 9.507 46.470 0.50 31.25 C +ATOM 1362 CG AASP A 181 19.418 9.418 45.298 0.50 36.64 C +ATOM 1363 OD1AASP A 181 19.242 10.136 44.300 0.50 38.06 O +ATOM 1364 OD2AASP A 181 20.344 8.583 45.394 0.50 31.41 O +ATOM 1365 CB BASP A 181 18.564 9.536 46.384 0.50 31.25 C +ATOM 1366 CG BASP A 181 19.692 8.862 47.167 0.50 36.64 C +ATOM 1367 OD1BASP A 181 20.184 9.438 48.212 0.50 38.06 O +ATOM 1368 OD2BASP A 181 20.151 7.720 46.783 0.50 31.41 O +ATOM 1369 N VAL A 182 18.369 11.181 49.403 1.00 28.04 N +ATOM 
1370 CA VAL A 182 17.970 11.073 50.797 1.00 28.71 C +ATOM 1371 C VAL A 182 17.727 12.472 51.370 1.00 26.52 C +ATOM 1372 O VAL A 182 18.303 13.472 50.919 1.00 26.46 O +ATOM 1373 CB VAL A 182 19.039 10.375 51.666 1.00 36.77 C +ATOM 1374 CG1 VAL A 182 19.411 9.037 51.053 1.00 42.68 C +ATOM 1375 CG2 VAL A 182 20.233 11.291 51.845 1.00 39.47 C +ATOM 1376 N SER A 183 16.857 12.502 52.379 1.00 27.43 N +ATOM 1377 CA SER A 183 16.524 13.761 53.024 1.00 31.64 C +ATOM 1378 C SER A 183 17.589 14.207 53.992 1.00 31.22 C +ATOM 1379 O SER A 183 17.399 14.355 55.226 1.00 39.19 O +ATOM 1380 CB SER A 183 15.125 13.660 53.700 1.00 38.85 C +ATOM 1381 OG SER A 183 15.315 12.936 54.910 1.00 50.28 O +ATOM 1382 N GLY A 184 18.796 14.511 53.471 1.00 28.06 N +ATOM 1383 CA GLY A 184 19.867 15.064 54.269 1.00 27.03 C +ATOM 1384 C GLY A 184 20.724 13.934 54.840 1.00 23.18 C +ATOM 1385 O GLY A 184 20.787 12.810 54.327 1.00 31.02 O +ATOM 1386 N ILE A 185 21.395 14.266 55.929 1.00 21.16 N +ATOM 1387 CA ILE A 185 22.272 13.344 56.632 1.00 21.46 C +ATOM 1388 C ILE A 185 21.443 12.628 57.704 1.00 24.63 C +ATOM 1389 O ILE A 185 20.694 13.250 58.450 1.00 23.29 O +ATOM 1390 CB ILE A 185 23.469 14.070 57.263 1.00 20.87 C +ATOM 1391 CG1 ILE A 185 24.222 14.802 56.135 1.00 21.99 C +ATOM 1392 CG2 ILE A 185 24.404 13.051 57.902 1.00 25.40 C +ATOM 1393 CD1 ILE A 185 25.428 15.528 56.616 1.00 26.85 C +ATOM 1394 N LEU A 186 21.553 11.328 57.721 1.00 22.57 N +ATOM 1395 CA LEU A 186 20.794 10.491 58.651 1.00 28.35 C +ATOM 1396 C LEU A 186 21.634 9.974 59.802 1.00 30.06 C +ATOM 1397 O LEU A 186 22.834 9.758 59.724 1.00 26.27 O +ATOM 1398 CB LEU A 186 20.161 9.312 57.930 1.00 25.96 C +ATOM 1399 CG LEU A 186 19.477 9.617 56.605 1.00 27.78 C +ATOM 1400 CD1 LEU A 186 19.037 8.339 55.925 1.00 33.99 C +ATOM 1401 CD2 LEU A 186 18.325 10.612 56.771 1.00 26.32 C +ATOM 1402 N ASP A 187 20.962 9.864 60.966 1.00 27.50 N +ATOM 1403 CA ASP A 187 21.602 9.408 62.187 1.00 25.55 C +ATOM 1404 C ASP A 187 21.609 7.887 62.220 1.00 
27.91 C +ATOM 1405 O ASP A 187 21.159 7.205 61.293 1.00 30.39 O +ATOM 1406 CB ASP A 187 20.988 10.048 63.440 1.00 25.94 C +ATOM 1407 CG ASP A 187 19.558 9.546 63.691 1.00 26.13 C +ATOM 1408 OD1 ASP A 187 19.150 8.523 63.113 1.00 25.46 O +ATOM 1409 OD2 ASP A 187 18.852 10.230 64.469 1.00 29.49 O +ATOM 1410 N GLY A 188 22.004 7.368 63.375 1.00 32.72 N +ATOM 1411 CA GLY A 188 22.181 5.925 63.550 1.00 31.29 C +ATOM 1412 C GLY A 188 20.893 5.143 63.391 1.00 42.82 C +ATOM 1413 O GLY A 188 20.906 3.933 63.157 1.00 40.42 O +ATOM 1414 N LYS A 189 19.764 5.830 63.550 1.00 34.63 N +ATOM 1415 CA LYS A 189 18.446 5.215 63.409 1.00 32.84 C +ATOM 1416 C LYS A 189 17.795 5.506 62.085 1.00 34.79 C +ATOM 1417 O LYS A 189 16.619 5.206 61.846 1.00 37.76 O +ATOM 1418 CB LYS A 189 17.594 5.736 64.584 1.00 33.65 C +ATOM 1419 CG LYS A 189 18.119 5.253 65.924 1.00 47.47 C +ATOM 1420 CD LYS A 189 17.141 5.456 67.069 1.00 56.96 C +ATOM 1421 CE LYS A 189 17.876 5.363 68.399 1.00 64.13 C +ATOM 1422 NZ LYS A 189 16.998 5.574 69.581 1.00 69.50 N +ATOM 1423 N GLY A 190 18.534 6.103 61.137 1.00 31.15 N +ATOM 1424 CA GLY A 190 18.015 6.424 59.813 1.00 28.82 C +ATOM 1425 C GLY A 190 17.081 7.634 59.838 1.00 23.67 C +ATOM 1426 O GLY A 190 16.339 7.754 58.875 1.00 29.05 O +ATOM 1427 N GLN A 191 17.221 8.483 60.864 1.00 24.25 N +ATOM 1428 CA GLN A 191 16.419 9.711 60.928 1.00 26.68 C +ATOM 1429 C GLN A 191 17.204 10.955 60.508 1.00 23.95 C +ATOM 1430 O GLN A 191 18.388 11.147 60.825 1.00 25.11 O +ATOM 1431 CB GLN A 191 15.800 9.961 62.323 1.00 26.55 C +ATOM 1432 CG GLN A 191 14.847 8.803 62.691 1.00 26.54 C +ATOM 1433 CD GLN A 191 13.983 9.117 63.910 1.00 29.47 C +ATOM 1434 OE1 GLN A 191 14.300 9.927 64.764 1.00 29.58 O +ATOM 1435 NE2 GLN A 191 12.853 8.406 63.971 1.00 25.21 N +ATOM 1436 N ARG A 192 16.509 11.889 59.870 1.00 22.63 N +ATOM 1437 CA ARG A 192 17.084 13.137 59.386 1.00 25.09 C +ATOM 1438 C ARG A 192 17.768 13.882 60.509 1.00 21.79 C +ATOM 1439 O ARG A 192 17.177 14.074 61.602 1.00 22.05 O 
+ATOM 1440 CB ARG A 192 15.983 14.022 58.752 1.00 22.66 C +ATOM 1441 CG ARG A 192 16.359 15.481 58.504 1.00 25.80 C +ATOM 1442 CD ARG A 192 15.187 16.255 57.881 1.00 24.89 C +ATOM 1443 NE ARG A 192 15.317 17.692 57.955 1.00 22.78 N +ATOM 1444 CZ ARG A 192 14.441 18.669 57.961 1.00 22.82 C +ATOM 1445 NH1 ARG A 192 13.170 18.251 57.905 1.00 27.47 N +ATOM 1446 NH2 ARG A 192 14.757 19.922 57.965 1.00 25.54 N +ATOM 1447 N ILE A 193 18.970 14.415 60.286 1.00 21.83 N +ATOM 1448 CA ILE A 193 19.630 15.311 61.237 1.00 20.68 C +ATOM 1449 C ILE A 193 19.401 16.741 60.792 1.00 21.80 C +ATOM 1450 O ILE A 193 19.825 17.087 59.648 1.00 22.74 O +ATOM 1451 CB ILE A 193 21.134 15.019 61.368 1.00 22.15 C +ATOM 1452 CG1 ILE A 193 21.294 13.590 61.904 1.00 22.82 C +ATOM 1453 CG2 ILE A 193 21.813 16.069 62.253 1.00 19.45 C +ATOM 1454 CD1 ILE A 193 22.767 13.151 61.761 1.00 21.72 C +ATOM 1455 N ALA A 194 18.783 17.673 61.497 1.00 20.93 N +ATOM 1456 CA ALA A 194 18.377 18.972 60.998 1.00 19.11 C +ATOM 1457 C ALA A 194 19.543 19.906 60.821 1.00 21.15 C +ATOM 1458 O ALA A 194 19.543 20.652 59.792 1.00 20.36 O +ATOM 1459 CB ALA A 194 17.364 19.589 62.003 1.00 20.93 C +ATOM 1460 N GLU A 195 20.532 19.941 61.709 1.00 21.34 N +ATOM 1461 CA GLU A 195 21.653 20.877 61.591 1.00 19.80 C +ATOM 1462 C GLU A 195 22.968 20.137 61.838 1.00 20.73 C +ATOM 1463 O GLU A 195 23.034 19.208 62.635 1.00 25.31 O +ATOM 1464 CB GLU A 195 21.514 21.986 62.634 1.00 22.78 C +ATOM 1465 CG GLU A 195 20.223 22.785 62.452 1.00 26.60 C +ATOM 1466 CD GLU A 195 20.042 23.882 63.488 1.00 31.14 C +ATOM 1467 OE1 GLU A 195 19.913 23.553 64.681 1.00 29.69 O +ATOM 1468 OE2 GLU A 195 19.983 25.027 62.987 1.00 26.17 O +ATOM 1469 N MET A 196 24.018 20.628 61.210 1.00 21.62 N +ATOM 1470 CA MET A 196 25.321 19.934 61.289 1.00 22.28 C +ATOM 1471 C MET A 196 26.427 20.966 61.410 1.00 25.22 C +ATOM 1472 O MET A 196 26.451 22.047 60.849 1.00 25.64 O +ATOM 1473 CB MET A 196 25.521 19.177 59.971 1.00 27.49 C +ATOM 1474 CG MET A 196 26.851 
18.431 59.839 1.00 26.00 C +ATOM 1475 SD MET A 196 26.816 17.034 61.026 1.00 25.31 S +ATOM 1476 CE MET A 196 25.237 16.304 60.569 1.00 29.75 C +ATOM 1477 N THR A 197 27.307 20.706 62.369 1.00 23.97 N +ATOM 1478 CA THR A 197 28.515 21.501 62.573 1.00 25.92 C +ATOM 1479 C THR A 197 29.696 20.564 62.298 1.00 20.78 C +ATOM 1480 O THR A 197 29.531 19.364 62.227 1.00 22.67 O +ATOM 1481 CB THR A 197 28.650 22.003 64.023 1.00 28.08 C +ATOM 1482 OG1 THR A 197 28.745 20.837 64.892 1.00 25.59 O +ATOM 1483 CG2 THR A 197 27.454 22.855 64.403 1.00 29.37 C +ATOM 1484 N ALA A 198 30.909 21.173 62.256 1.00 22.73 N +ATOM 1485 CA ALA A 198 32.108 20.321 62.103 1.00 21.82 C +ATOM 1486 C ALA A 198 32.335 19.377 63.313 1.00 20.37 C +ATOM 1487 O ALA A 198 32.701 18.268 63.028 1.00 22.71 O +ATOM 1488 CB ALA A 198 33.301 21.240 61.920 1.00 23.69 C +ATOM 1489 N ALA A 199 32.022 19.888 64.487 1.00 23.74 N +ATOM 1490 CA ALA A 199 32.231 19.047 65.672 1.00 23.64 C +ATOM 1491 C ALA A 199 31.313 17.833 65.583 1.00 27.76 C +ATOM 1492 O ALA A 199 31.662 16.723 65.931 1.00 27.51 O +ATOM 1493 CB ALA A 199 31.970 19.837 66.942 1.00 30.34 C +ATOM 1494 N LYS A 200 30.033 18.106 65.250 1.00 25.12 N +ATOM 1495 CA LYS A 200 29.076 17.011 65.171 1.00 24.08 C +ATOM 1496 C LYS A 200 29.419 16.031 64.113 1.00 21.07 C +ATOM 1497 O LYS A 200 29.324 14.810 64.269 1.00 24.53 O +ATOM 1498 CB LYS A 200 27.648 17.575 64.943 1.00 23.85 C +ATOM 1499 CG LYS A 200 26.603 16.481 64.819 1.00 26.44 C +ATOM 1500 CD LYS A 200 25.191 16.927 64.527 1.00 40.87 C +ATOM 1501 CE LYS A 200 24.565 17.877 65.527 1.00 35.38 C +ATOM 1502 NZ LYS A 200 23.085 18.051 65.238 1.00 28.46 N +ATOM 1503 N ALA A 201 29.860 16.498 62.895 1.00 22.18 N +ATOM 1504 CA ALA A 201 30.238 15.614 61.849 1.00 20.56 C +ATOM 1505 C ALA A 201 31.469 14.757 62.240 1.00 19.60 C +ATOM 1506 O ALA A 201 31.465 13.591 61.882 1.00 25.13 O +ATOM 1507 CB ALA A 201 30.571 16.369 60.536 1.00 23.00 C +ATOM 1508 N GLU A 202 32.423 15.411 62.924 1.00 23.59 N +ATOM 1509 CA 
GLU A 202 33.538 14.590 63.482 1.00 27.73 C +ATOM 1510 C GLU A 202 33.041 13.457 64.393 1.00 25.98 C +ATOM 1511 O GLU A 202 33.450 12.318 64.272 1.00 29.67 O +ATOM 1512 CB GLU A 202 34.472 15.461 64.298 1.00 25.38 C +ATOM 1513 CG GLU A 202 35.760 14.732 64.780 1.00 25.13 C +ATOM 1514 CD GLU A 202 36.546 15.577 65.702 1.00 23.35 C +ATOM 1515 OE1 GLU A 202 36.265 16.631 66.233 1.00 25.81 O +ATOM 1516 OE2 GLU A 202 37.717 15.079 65.958 1.00 27.68 O +ATOM 1517 N GLN A 203 32.093 13.786 65.251 1.00 24.97 N +ATOM 1518 CA GLN A 203 31.554 12.767 66.177 1.00 26.01 C +ATOM 1519 C GLN A 203 30.883 11.665 65.404 1.00 25.10 C +ATOM 1520 O GLN A 203 31.044 10.486 65.687 1.00 31.84 O +ATOM 1521 CB GLN A 203 30.568 13.436 67.121 1.00 33.15 C +ATOM 1522 CG GLN A 203 29.799 12.507 68.042 1.00 44.68 C +ATOM 1523 CD GLN A 203 28.468 13.061 68.509 1.00 58.34 C +ATOM 1524 OE1 GLN A 203 28.338 14.117 69.125 1.00 64.88 O +ATOM 1525 NE2 GLN A 203 27.407 12.306 68.211 1.00 61.71 N +ATOM 1526 N LEU A 204 30.012 12.039 64.427 1.00 24.46 N +ATOM 1527 CA LEU A 204 29.349 11.010 63.651 1.00 23.60 C +ATOM 1528 C LEU A 204 30.185 10.118 62.808 1.00 24.64 C +ATOM 1529 O LEU A 204 29.894 8.983 62.410 1.00 31.80 O +ATOM 1530 CB LEU A 204 28.218 11.683 62.810 1.00 27.24 C +ATOM 1531 CG LEU A 204 27.130 12.304 63.687 1.00 26.37 C +ATOM 1532 CD1 LEU A 204 26.278 13.284 62.866 1.00 30.16 C +ATOM 1533 CD2 LEU A 204 26.298 11.211 64.343 1.00 31.48 C +ATOM 1534 N ILE A 205 31.314 10.692 62.325 1.00 24.11 N +ATOM 1535 CA ILE A 205 32.278 9.897 61.559 1.00 29.17 C +ATOM 1536 C ILE A 205 33.032 8.941 62.508 1.00 25.07 C +ATOM 1537 O ILE A 205 33.230 7.779 62.161 1.00 35.15 O +ATOM 1538 CB AILE A 205 33.277 10.888 60.930 0.50 19.93 C +ATOM 1539 CG1AILE A 205 32.559 11.744 59.890 0.50 21.30 C +ATOM 1540 CG2AILE A 205 34.469 10.188 60.294 0.50 23.89 C +ATOM 1541 CD1AILE A 205 33.366 12.750 59.109 0.50 20.09 C +ATOM 1542 CB BILE A 205 33.300 10.810 60.870 0.50 19.93 C +ATOM 1543 CG1BILE A 205 32.648 11.802 59.904 
0.50 21.30 C +ATOM 1544 CG2BILE A 205 34.336 10.045 60.044 0.50 23.89 C +ATOM 1545 CD1BILE A 205 31.869 11.118 58.779 0.50 20.09 C +ATOM 1546 N GLU A 206 33.343 9.425 63.698 1.00 27.72 N +ATOM 1547 CA GLU A 206 34.038 8.615 64.721 1.00 25.29 C +ATOM 1548 C GLU A 206 33.160 7.434 65.115 1.00 32.40 C +ATOM 1549 O GLU A 206 33.627 6.304 65.317 1.00 36.98 O +ATOM 1550 CB GLU A 206 34.305 9.493 65.965 1.00 24.93 C +ATOM 1551 CG GLU A 206 35.492 10.442 65.807 1.00 24.71 C +ATOM 1552 CD GLU A 206 35.736 11.296 67.013 1.00 31.24 C +ATOM 1553 OE1 GLU A 206 36.536 12.259 66.947 1.00 34.00 O +ATOM 1554 OE2 GLU A 206 35.132 11.096 68.084 1.00 40.77 O +ATOM 1555 N GLN A 207 31.843 7.688 65.136 1.00 36.82 N +ATOM 1556 CA GLN A 207 30.870 6.653 65.502 1.00 32.40 C +ATOM 1557 C GLN A 207 30.492 5.794 64.334 1.00 26.78 C +ATOM 1558 O GLN A 207 29.634 4.899 64.534 1.00 36.07 O +ATOM 1559 CB GLN A 207 29.629 7.327 66.077 1.00 30.77 C +ATOM 1560 CG GLN A 207 30.003 8.177 67.296 1.00 36.05 C +ATOM 1561 CD GLN A 207 28.744 8.859 67.816 1.00 47.55 C +ATOM 1562 OE1 GLN A 207 27.910 9.342 67.047 1.00 48.74 O +ATOM 1563 NE2 GLN A 207 28.575 8.874 69.130 1.00 56.71 N +ATOM 1564 N GLY A 208 31.028 5.988 63.151 1.00 31.42 N +ATOM 1565 CA GLY A 208 30.716 5.134 62.002 1.00 26.27 C +ATOM 1566 C GLY A 208 29.285 5.325 61.479 1.00 36.32 C +ATOM 1567 O GLY A 208 28.744 4.490 60.739 1.00 33.98 O +ATOM 1568 N ILE A 209 28.663 6.445 61.823 1.00 29.57 N +ATOM 1569 CA ILE A 209 27.303 6.739 61.276 1.00 27.50 C +ATOM 1570 C ILE A 209 27.343 7.359 59.882 1.00 39.10 C +ATOM 1571 O ILE A 209 26.495 7.038 59.038 1.00 32.00 O +ATOM 1572 CB AILE A 209 26.584 7.651 62.280 0.50 21.66 C +ATOM 1573 CG1AILE A 209 26.447 6.983 63.661 0.50 20.53 C +ATOM 1574 CG2AILE A 209 25.225 8.150 61.811 0.50 19.70 C +ATOM 1575 CD1AILE A 209 25.443 5.884 63.704 0.50 30.87 C +ATOM 1576 CB BILE A 209 26.572 7.682 62.251 0.50 21.66 C +ATOM 1577 CG1BILE A 209 26.443 7.124 63.668 0.50 20.53 C +ATOM 1578 CG2BILE A 209 25.147 8.013 
61.802 0.50 19.70 C +ATOM 1579 CD1BILE A 209 25.714 8.074 64.620 0.50 30.87 C +ATOM 1580 N ILE A 210 28.250 8.313 59.662 1.00 29.49 N +ATOM 1581 CA ILE A 210 28.453 8.899 58.329 1.00 35.89 C +ATOM 1582 C ILE A 210 29.578 8.070 57.646 1.00 25.94 C +ATOM 1583 O ILE A 210 30.608 8.048 58.289 1.00 31.25 O +ATOM 1584 CB ILE A 210 28.908 10.369 58.458 1.00 26.24 C +ATOM 1585 CG1 ILE A 210 27.706 11.246 58.860 1.00 29.60 C +ATOM 1586 CG2 ILE A 210 29.523 10.961 57.196 1.00 34.92 C +ATOM 1587 CD1 ILE A 210 28.066 12.622 59.289 1.00 24.20 C +ATOM 1588 N THR A 211 29.255 7.534 56.509 1.00 32.26 N +ATOM 1589 CA THR A 211 30.137 6.727 55.718 1.00 43.96 C +ATOM 1590 C THR A 211 29.946 6.989 54.221 1.00 40.63 C +ATOM 1591 O THR A 211 29.050 7.605 53.651 1.00 40.14 O +ATOM 1592 CB THR A 211 29.922 5.218 55.990 1.00 45.68 C +ATOM 1593 OG1 THR A 211 28.689 4.774 55.432 1.00 40.84 O +ATOM 1594 CG2 THR A 211 29.946 4.989 57.495 1.00 50.97 C +ATOM 1595 N ASP A 212 30.953 6.424 53.560 1.00 50.02 N +ATOM 1596 CA ASP A 212 31.178 6.411 52.139 1.00 47.29 C +ATOM 1597 C ASP A 212 31.157 7.831 51.579 1.00 33.52 C +ATOM 1598 O ASP A 212 31.919 8.681 52.049 1.00 40.97 O +ATOM 1599 CB ASP A 212 30.267 5.484 51.352 1.00 55.38 C +ATOM 1600 CG ASP A 212 29.296 6.151 50.410 1.00 63.02 C +ATOM 1601 OD1 ASP A 212 29.400 7.361 50.129 1.00 69.89 O +ATOM 1602 OD2 ASP A 212 28.381 5.463 49.906 1.00 74.24 O +ATOM 1603 N GLY A 213 30.378 8.011 50.538 1.00 38.75 N +ATOM 1604 CA GLY A 213 30.391 9.300 49.832 1.00 41.93 C +ATOM 1605 C GLY A 213 29.722 10.347 50.718 1.00 37.44 C +ATOM 1606 O GLY A 213 29.735 11.522 50.399 1.00 40.21 O +ATOM 1607 N MET A 214 29.187 9.889 51.860 1.00 36.70 N +ATOM 1608 CA MET A 214 28.452 10.864 52.665 1.00 33.13 C +ATOM 1609 C MET A 214 29.386 11.757 53.446 1.00 26.52 C +ATOM 1610 O MET A 214 29.210 12.913 53.734 1.00 34.08 O +ATOM 1611 CB MET A 214 27.379 10.299 53.600 1.00 32.32 C +ATOM 1612 CG MET A 214 26.539 11.453 54.185 1.00 41.75 C +ATOM 1613 SD MET A 214 25.537 12.219 
52.869 1.00 52.83 S +ATOM 1614 CE MET A 214 25.740 13.983 53.185 1.00 52.18 C +ATOM 1615 N ILE A 215 30.592 11.165 53.683 1.00 31.67 N +ATOM 1616 CA ILE A 215 31.732 11.678 54.353 1.00 28.70 C +ATOM 1617 C ILE A 215 32.310 12.756 53.399 1.00 29.67 C +ATOM 1618 O ILE A 215 32.518 13.896 53.767 1.00 28.09 O +ATOM 1619 CB ILE A 215 32.869 10.691 54.677 1.00 32.82 C +ATOM 1620 CG1 ILE A 215 32.514 9.749 55.856 1.00 32.48 C +ATOM 1621 CG2 ILE A 215 34.105 11.426 55.173 1.00 31.16 C +ATOM 1622 CD1 ILE A 215 33.693 8.871 56.241 1.00 38.44 C +ATOM 1623 N VAL A 216 32.331 12.388 52.125 1.00 30.16 N +ATOM 1624 CA VAL A 216 32.810 13.322 51.101 1.00 31.80 C +ATOM 1625 C VAL A 216 31.785 14.457 50.954 1.00 21.07 C +ATOM 1626 O VAL A 216 32.246 15.603 50.880 1.00 25.35 O +ATOM 1627 CB VAL A 216 32.994 12.565 49.796 1.00 28.16 C +ATOM 1628 CG1 VAL A 216 33.287 13.471 48.597 1.00 29.82 C +ATOM 1629 CG2 VAL A 216 34.169 11.578 49.933 1.00 30.45 C +ATOM 1630 N LYS A 217 30.510 14.125 50.970 1.00 23.27 N +ATOM 1631 CA LYS A 217 29.472 15.133 50.841 1.00 21.79 C +ATOM 1632 C LYS A 217 29.498 16.146 51.983 1.00 24.66 C +ATOM 1633 O LYS A 217 29.449 17.358 51.749 1.00 23.51 O +ATOM 1634 CB LYS A 217 28.077 14.535 50.654 1.00 25.90 C +ATOM 1635 CG LYS A 217 27.047 15.536 50.151 1.00 28.71 C +ATOM 1636 CD LYS A 217 25.624 15.031 50.217 1.00 30.25 C +ATOM 1637 CE LYS A 217 25.413 13.825 49.316 1.00 35.66 C +ATOM 1638 NZ LYS A 217 25.887 14.192 47.945 1.00 32.82 N +ATOM 1639 N VAL A 218 29.509 15.686 53.224 1.00 24.46 N +ATOM 1640 CA VAL A 218 29.514 16.563 54.383 1.00 21.61 C +ATOM 1641 C VAL A 218 30.726 17.428 54.481 1.00 22.62 C +ATOM 1642 O VAL A 218 30.821 18.555 54.929 1.00 23.11 O +ATOM 1643 CB VAL A 218 29.267 15.841 55.740 1.00 22.66 C +ATOM 1644 CG1 VAL A 218 30.512 15.062 56.216 1.00 28.55 C +ATOM 1645 CG2 VAL A 218 28.906 16.808 56.860 1.00 26.38 C +ATOM 1646 N ASN A 219 31.917 16.881 54.186 1.00 24.70 N +ATOM 1647 CA ASN A 219 33.151 17.619 54.219 1.00 22.89 C +ATOM 1648 C 
ASN A 219 33.129 18.687 53.092 1.00 20.19 C +ATOM 1649 O ASN A 219 33.553 19.807 53.383 1.00 21.74 O +ATOM 1650 CB ASN A 219 34.394 16.751 53.985 1.00 25.98 C +ATOM 1651 CG ASN A 219 34.735 15.843 55.143 1.00 47.87 C +ATOM 1652 OD1 ASN A 219 33.860 15.200 55.716 1.00 54.97 O +ATOM 1653 ND2 ASN A 219 36.027 15.816 55.443 1.00 43.28 N +ATOM 1654 N ALA A 220 32.547 18.380 51.941 1.00 21.69 N +ATOM 1655 CA ALA A 220 32.431 19.384 50.884 1.00 19.96 C +ATOM 1656 C ALA A 220 31.481 20.497 51.339 1.00 19.62 C +ATOM 1657 O ALA A 220 31.768 21.679 51.121 1.00 22.02 O +ATOM 1658 CB ALA A 220 31.957 18.764 49.569 1.00 21.25 C +ATOM 1659 N ALA A 221 30.361 20.159 51.977 1.00 19.62 N +ATOM 1660 CA ALA A 221 29.435 21.162 52.479 1.00 18.81 C +ATOM 1661 C ALA A 221 30.007 22.041 53.605 1.00 17.47 C +ATOM 1662 O ALA A 221 29.859 23.245 53.584 1.00 19.58 O +ATOM 1663 CB ALA A 221 28.180 20.427 52.943 1.00 19.78 C +ATOM 1664 N LEU A 222 30.756 21.325 54.514 1.00 18.65 N +ATOM 1665 CA LEU A 222 31.418 22.147 55.511 1.00 19.27 C +ATOM 1666 C LEU A 222 32.471 23.148 55.001 1.00 20.19 C +ATOM 1667 O LEU A 222 32.634 24.249 55.509 1.00 21.52 O +ATOM 1668 CB LEU A 222 32.082 21.190 56.586 1.00 19.94 C +ATOM 1669 CG LEU A 222 31.079 20.507 57.531 1.00 23.57 C +ATOM 1670 CD1 LEU A 222 31.698 19.252 58.182 1.00 22.52 C +ATOM 1671 CD2 LEU A 222 30.591 21.534 58.549 1.00 25.45 C +ATOM 1672 N ASP A 223 33.206 22.649 53.963 1.00 20.96 N +ATOM 1673 CA ASP A 223 34.240 23.536 53.397 1.00 24.02 C +ATOM 1674 C ASP A 223 33.533 24.747 52.787 1.00 21.34 C +ATOM 1675 O ASP A 223 33.918 25.911 52.935 1.00 22.64 O +ATOM 1676 CB ASP A 223 34.959 22.750 52.309 1.00 20.83 C +ATOM 1677 CG ASP A 223 36.034 23.573 51.644 1.00 25.71 C +ATOM 1678 OD1 ASP A 223 36.558 24.518 52.281 1.00 36.60 O +ATOM 1679 OD2 ASP A 223 36.421 23.275 50.493 1.00 36.17 O +ATOM 1680 N ALA A 224 32.419 24.498 52.084 1.00 19.85 N +ATOM 1681 CA ALA A 224 31.675 25.577 51.445 1.00 20.77 C +ATOM 1682 C ALA A 224 31.106 26.561 52.470 1.00 
21.11 C +ATOM 1683 O ALA A 224 31.219 27.768 52.227 1.00 21.60 O +ATOM 1684 CB ALA A 224 30.544 25.045 50.580 1.00 18.57 C +ATOM 1685 N ALA A 225 30.558 26.081 53.579 1.00 21.79 N +ATOM 1686 CA ALA A 225 30.043 26.980 54.595 1.00 21.00 C +ATOM 1687 C ALA A 225 31.123 27.857 55.208 1.00 22.43 C +ATOM 1688 O ALA A 225 30.884 29.042 55.439 1.00 23.81 O +ATOM 1689 CB ALA A 225 29.377 26.109 55.678 1.00 22.52 C +ATOM 1690 N ARG A 226 32.281 27.232 55.462 1.00 24.98 N +ATOM 1691 CA ARG A 226 33.321 28.083 56.090 1.00 25.33 C +ATOM 1692 C ARG A 226 33.874 29.082 55.072 1.00 28.39 C +ATOM 1693 O ARG A 226 34.220 30.204 55.415 1.00 29.50 O +ATOM 1694 CB ARG A 226 34.407 27.281 56.750 1.00 35.01 C +ATOM 1695 CG ARG A 226 34.975 26.100 56.019 1.00 37.04 C +ATOM 1696 CD ARG A 226 36.247 25.665 56.805 1.00 36.76 C +ATOM 1697 NE ARG A 226 35.842 24.773 57.876 1.00 37.58 N +ATOM 1698 CZ ARG A 226 35.696 23.462 57.788 1.00 28.86 C +ATOM 1699 NH1 ARG A 226 35.933 22.807 56.678 1.00 33.00 N +ATOM 1700 NH2 ARG A 226 35.317 22.748 58.858 1.00 34.87 N +ATOM 1701 N THR A 227 33.932 28.604 53.808 1.00 23.23 N +ATOM 1702 CA THR A 227 34.513 29.481 52.785 1.00 27.24 C +ATOM 1703 C THR A 227 33.634 30.649 52.383 1.00 26.32 C +ATOM 1704 O THR A 227 34.127 31.737 52.063 1.00 35.64 O +ATOM 1705 CB THR A 227 34.899 28.683 51.520 1.00 22.28 C +ATOM 1706 OG1 THR A 227 35.749 27.607 51.901 1.00 27.04 O +ATOM 1707 CG2 THR A 227 35.486 29.532 50.411 1.00 25.16 C +ATOM 1708 N LEU A 228 32.318 30.426 52.363 1.00 24.93 N +ATOM 1709 CA LEU A 228 31.376 31.468 52.004 1.00 29.14 C +ATOM 1710 C LEU A 228 30.873 32.244 53.222 1.00 26.29 C +ATOM 1711 O LEU A 228 30.341 33.342 53.094 1.00 30.17 O +ATOM 1712 CB LEU A 228 30.170 30.819 51.316 1.00 33.54 C +ATOM 1713 CG LEU A 228 30.331 29.840 50.170 1.00 36.05 C +ATOM 1714 CD1 LEU A 228 29.052 29.018 49.902 1.00 34.69 C +ATOM 1715 CD2 LEU A 228 30.706 30.580 48.873 1.00 33.06 C +ATOM 1716 N GLY A 229 30.959 31.653 54.414 1.00 27.76 N +ATOM 1717 CA GLY A 229 
30.383 32.278 55.608 1.00 27.35 C +ATOM 1718 C GLY A 229 28.859 32.178 55.580 1.00 34.14 C +ATOM 1719 O GLY A 229 28.138 32.980 56.176 1.00 36.27 O +ATOM 1720 N ARG A 230 28.269 31.221 54.869 1.00 25.48 N +ATOM 1721 CA ARG A 230 26.837 31.045 54.783 1.00 26.11 C +ATOM 1722 C ARG A 230 26.496 29.562 54.948 1.00 24.68 C +ATOM 1723 O ARG A 230 27.285 28.694 54.558 1.00 26.62 O +ATOM 1724 CB ARG A 230 26.279 31.510 53.449 1.00 27.93 C +ATOM 1725 CG ARG A 230 26.245 32.925 52.947 1.00 42.47 C +ATOM 1726 CD ARG A 230 26.137 32.942 51.420 1.00 48.52 C +ATOM 1727 NE ARG A 230 26.991 33.946 50.830 1.00 51.91 N +ATOM 1728 CZ ARG A 230 27.344 34.074 49.565 1.00 53.94 C +ATOM 1729 NH1 ARG A 230 26.869 33.198 48.680 1.00 31.65 N +ATOM 1730 NH2 ARG A 230 28.147 35.076 49.228 1.00 55.00 N +ATOM 1731 N PRO A 231 25.343 29.210 55.508 1.00 24.23 N +ATOM 1732 CA PRO A 231 24.925 27.843 55.567 1.00 22.46 C +ATOM 1733 C PRO A 231 24.765 27.170 54.203 1.00 20.92 C +ATOM 1734 O PRO A 231 24.412 27.817 53.216 1.00 26.04 O +ATOM 1735 CB PRO A 231 23.565 27.946 56.282 1.00 27.15 C +ATOM 1736 CG PRO A 231 23.060 29.299 55.875 1.00 35.76 C +ATOM 1737 CD PRO A 231 24.302 30.180 55.961 1.00 31.06 C +ATOM 1738 N VAL A 232 24.927 25.875 54.182 1.00 19.90 N +ATOM 1739 CA VAL A 232 24.729 25.072 52.988 1.00 17.54 C +ATOM 1740 C VAL A 232 23.823 23.917 53.351 1.00 22.52 C +ATOM 1741 O VAL A 232 24.015 23.170 54.312 1.00 22.59 O +ATOM 1742 CB VAL A 232 26.121 24.534 52.548 1.00 22.04 C +ATOM 1743 CG1 VAL A 232 25.969 23.664 51.308 1.00 26.45 C +ATOM 1744 CG2 VAL A 232 27.135 25.643 52.343 1.00 24.66 C +ATOM 1745 N ASP A 233 22.847 23.716 52.469 1.00 21.00 N +ATOM 1746 CA ASP A 233 21.879 22.676 52.729 1.00 22.60 C +ATOM 1747 C ASP A 233 22.130 21.393 51.932 1.00 21.61 C +ATOM 1748 O ASP A 233 22.521 21.558 50.766 1.00 20.69 O +ATOM 1749 CB ASP A 233 20.453 23.101 52.304 1.00 24.61 C +ATOM 1750 CG ASP A 233 19.867 24.176 53.190 1.00 40.17 C +ATOM 1751 OD1 ASP A 233 20.020 23.976 54.396 1.00 35.33 O 
+ATOM 1752 OD2 ASP A 233 19.309 25.130 52.611 1.00 47.75 O +ATOM 1753 N ILE A 234 21.933 20.306 52.702 1.00 21.43 N +ATOM 1754 CA ILE A 234 21.819 19.028 51.941 1.00 20.98 C +ATOM 1755 C ILE A 234 20.413 18.539 51.909 1.00 21.56 C +ATOM 1756 O ILE A 234 19.803 18.330 52.956 1.00 21.74 O +ATOM 1757 CB ILE A 234 22.744 17.987 52.607 1.00 19.42 C +ATOM 1758 CG1 ILE A 234 24.181 18.383 52.354 1.00 21.42 C +ATOM 1759 CG2 ILE A 234 22.475 16.588 52.075 1.00 22.55 C +ATOM 1760 CD1 ILE A 234 25.174 17.573 53.170 1.00 21.50 C +ATOM 1761 N ALA A 235 19.683 18.293 50.835 1.00 19.36 N +ATOM 1762 CA ALA A 235 18.284 17.936 50.846 1.00 22.06 C +ATOM 1763 C ALA A 235 17.881 17.010 49.730 1.00 23.69 C +ATOM 1764 O ALA A 235 18.715 16.759 48.835 1.00 22.75 O +ATOM 1765 CB ALA A 235 17.518 19.257 50.763 1.00 22.43 C +ATOM 1766 N SER A 236 16.681 16.464 49.685 1.00 23.68 N +ATOM 1767 CA SER A 236 16.245 15.515 48.689 1.00 24.89 C +ATOM 1768 C SER A 236 15.533 16.172 47.508 1.00 22.96 C +ATOM 1769 O SER A 236 14.850 17.197 47.716 1.00 27.12 O +ATOM 1770 CB SER A 236 15.277 14.517 49.327 1.00 24.11 C +ATOM 1771 OG SER A 236 14.779 13.611 48.349 1.00 26.80 O +ATOM 1772 N TRP A 237 15.712 15.615 46.346 1.00 26.16 N +ATOM 1773 CA TRP A 237 15.009 16.005 45.125 1.00 28.98 C +ATOM 1774 C TRP A 237 13.753 15.178 44.885 1.00 29.81 C +ATOM 1775 O TRP A 237 13.104 15.351 43.835 1.00 26.48 O +ATOM 1776 CB TRP A 237 15.927 15.797 43.896 1.00 32.89 C +ATOM 1777 CG TRP A 237 16.434 14.372 43.809 1.00 35.76 C +ATOM 1778 CD1 TRP A 237 17.691 13.960 44.168 1.00 48.89 C +ATOM 1779 CD2 TRP A 237 15.737 13.178 43.422 1.00 38.58 C +ATOM 1780 NE1 TRP A 237 17.813 12.595 43.990 1.00 41.26 N +ATOM 1781 CE2 TRP A 237 16.621 12.096 43.521 1.00 47.71 C +ATOM 1782 CE3 TRP A 237 14.444 12.945 42.948 1.00 46.53 C +ATOM 1783 CZ2 TRP A 237 16.252 10.786 43.206 1.00 31.62 C +ATOM 1784 CZ3 TRP A 237 14.071 11.647 42.617 1.00 46.87 C +ATOM 1785 CH2 TRP A 237 14.965 10.583 42.743 1.00 34.48 C +ATOM 1786 N ARG A 238 
13.449 14.261 45.780 1.00 23.51 N +ATOM 1787 CA ARG A 238 12.391 13.286 45.575 1.00 28.62 C +ATOM 1788 C ARG A 238 10.955 13.820 45.687 1.00 27.90 C +ATOM 1789 O ARG A 238 10.171 13.399 44.837 1.00 34.68 O +ATOM 1790 CB ARG A 238 12.519 12.111 46.575 1.00 28.34 C +ATOM 1791 CG ARG A 238 13.769 11.282 46.298 1.00 38.77 C +ATOM 1792 CD ARG A 238 13.671 9.960 47.067 1.00 41.16 C +ATOM 1793 NE ARG A 238 14.865 9.138 46.854 1.00 43.93 N +ATOM 1794 CZ ARG A 238 14.978 8.221 45.895 1.00 52.69 C +ATOM 1795 NH1 ARG A 238 13.962 8.020 45.061 1.00 49.65 N +ATOM 1796 NH2 ARG A 238 16.108 7.527 45.826 1.00 51.00 N +ATOM 1797 N HIS A 239 10.660 14.716 46.598 1.00 26.97 N +ATOM 1798 CA HIS A 239 9.285 15.108 46.891 1.00 32.36 C +ATOM 1799 C HIS A 239 8.942 16.512 46.366 1.00 25.66 C +ATOM 1800 O HIS A 239 9.333 17.508 46.913 1.00 29.79 O +ATOM 1801 CB HIS A 239 9.022 15.107 48.405 1.00 28.52 C +ATOM 1802 CG HIS A 239 9.481 13.800 49.012 1.00 32.26 C +ATOM 1803 ND1 HIS A 239 9.173 12.603 48.424 1.00 31.16 N +ATOM 1804 CD2 HIS A 239 10.219 13.546 50.114 1.00 48.01 C +ATOM 1805 CE1 HIS A 239 9.724 11.627 49.152 1.00 33.74 C +ATOM 1806 NE2 HIS A 239 10.348 12.184 50.175 1.00 43.29 N +ATOM 1807 N ALA A 240 8.113 16.426 45.338 1.00 34.03 N +ATOM 1808 CA ALA A 240 7.651 17.547 44.556 1.00 29.51 C +ATOM 1809 C ALA A 240 7.182 18.745 45.340 1.00 27.65 C +ATOM 1810 O ALA A 240 7.608 19.902 45.102 1.00 29.10 O +ATOM 1811 CB ALA A 240 6.535 17.035 43.641 1.00 35.27 C +ATOM 1812 N GLU A 241 6.345 18.487 46.372 1.00 25.19 N +ATOM 1813 CA GLU A 241 5.777 19.589 47.139 1.00 27.28 C +ATOM 1814 C GLU A 241 6.782 20.397 47.937 1.00 26.52 C +ATOM 1815 O GLU A 241 6.517 21.496 48.379 1.00 28.02 O +ATOM 1816 CB GLU A 241 4.687 19.116 48.117 1.00 26.40 C +ATOM 1817 CG GLU A 241 5.175 18.405 49.358 1.00 29.82 C +ATOM 1818 CD GLU A 241 5.572 16.998 49.100 1.00 24.30 C +ATOM 1819 OE1 GLU A 241 5.918 16.293 50.140 1.00 31.28 O +ATOM 1820 OE2 GLU A 241 5.625 16.374 48.042 1.00 24.47 O +ATOM 1821 N GLN A 242 
7.967 19.756 48.172 1.00 24.39 N +ATOM 1822 CA GLN A 242 8.961 20.460 48.965 1.00 26.75 C +ATOM 1823 C GLN A 242 9.931 21.347 48.140 1.00 25.13 C +ATOM 1824 O GLN A 242 10.592 22.153 48.792 1.00 25.67 O +ATOM 1825 CB GLN A 242 9.875 19.418 49.682 1.00 26.27 C +ATOM 1826 CG GLN A 242 8.986 18.659 50.701 1.00 34.20 C +ATOM 1827 CD GLN A 242 9.716 17.547 51.417 1.00 44.02 C +ATOM 1828 OE1 GLN A 242 10.932 17.446 51.309 1.00 41.07 O +ATOM 1829 NE2 GLN A 242 9.048 16.674 52.159 1.00 38.91 N +ATOM 1830 N LEU A 243 9.853 21.105 46.839 1.00 22.29 N +ATOM 1831 CA LEU A 243 10.888 21.818 46.034 1.00 23.53 C +ATOM 1832 C LEU A 243 10.835 23.308 46.062 1.00 24.74 C +ATOM 1833 O LEU A 243 11.868 24.005 46.228 1.00 24.28 O +ATOM 1834 CB LEU A 243 10.804 21.272 44.605 1.00 27.22 C +ATOM 1835 CG LEU A 243 11.146 19.774 44.490 1.00 30.89 C +ATOM 1836 CD1 LEU A 243 11.083 19.251 43.067 1.00 36.90 C +ATOM 1837 CD2 LEU A 243 12.514 19.501 45.096 1.00 29.65 C +ATOM 1838 N PRO A 244 9.670 23.900 45.867 1.00 23.52 N +ATOM 1839 CA PRO A 244 9.629 25.381 45.868 1.00 30.12 C +ATOM 1840 C PRO A 244 10.169 26.024 47.111 1.00 29.69 C +ATOM 1841 O PRO A 244 10.980 26.973 47.129 1.00 28.49 O +ATOM 1842 CB PRO A 244 8.164 25.661 45.557 1.00 27.86 C +ATOM 1843 CG PRO A 244 7.687 24.481 44.769 1.00 27.94 C +ATOM 1844 CD PRO A 244 8.425 23.278 45.346 1.00 24.19 C +ATOM 1845 N ALA A 245 9.726 25.586 48.299 1.00 30.26 N +ATOM 1846 CA ALA A 245 10.242 26.117 49.562 1.00 32.15 C +ATOM 1847 C ALA A 245 11.741 25.895 49.792 1.00 31.98 C +ATOM 1848 O ALA A 245 12.450 26.738 50.349 1.00 33.12 O +ATOM 1849 CB ALA A 245 9.506 25.467 50.734 1.00 39.88 C +ATOM 1850 N LEU A 246 12.203 24.709 49.393 1.00 29.35 N +ATOM 1851 CA LEU A 246 13.611 24.368 49.457 1.00 32.09 C +ATOM 1852 C LEU A 246 14.408 25.393 48.673 1.00 35.78 C +ATOM 1853 O LEU A 246 15.355 25.991 49.204 1.00 32.13 O +ATOM 1854 CB LEU A 246 13.803 22.941 48.961 1.00 35.27 C +ATOM 1855 CG LEU A 246 15.268 22.467 48.852 1.00 38.36 C +ATOM 1856 CD1 LEU 
A 246 16.002 22.558 50.176 1.00 44.94 C +ATOM 1857 CD2 LEU A 246 15.277 21.048 48.310 1.00 38.03 C +ATOM 1858 N PHE A 247 14.046 25.658 47.402 1.00 25.54 N +ATOM 1859 CA PHE A 247 14.821 26.652 46.643 1.00 25.93 C +ATOM 1860 C PHE A 247 14.735 28.083 47.170 1.00 32.98 C +ATOM 1861 O PHE A 247 15.610 28.917 46.882 1.00 36.91 O +ATOM 1862 CB PHE A 247 14.405 26.613 45.185 1.00 31.21 C +ATOM 1863 CG PHE A 247 14.593 25.293 44.512 1.00 26.11 C +ATOM 1864 CD1 PHE A 247 14.023 25.006 43.283 1.00 30.49 C +ATOM 1865 CD2 PHE A 247 15.445 24.324 45.073 1.00 32.33 C +ATOM 1866 CE1 PHE A 247 14.216 23.802 42.677 1.00 32.29 C +ATOM 1867 CE2 PHE A 247 15.620 23.100 44.465 1.00 39.22 C +ATOM 1868 CZ PHE A 247 15.022 22.844 43.251 1.00 34.59 C +ATOM 1869 N ASN A 248 13.749 28.394 47.964 1.00 31.49 N +ATOM 1870 CA ASN A 248 13.538 29.693 48.589 1.00 41.03 C +ATOM 1871 C ASN A 248 14.252 29.824 49.934 1.00 47.55 C +ATOM 1872 O ASN A 248 14.231 30.908 50.521 1.00 47.10 O +ATOM 1873 CB ASN A 248 12.048 30.004 48.746 1.00 36.95 C +ATOM 1874 CG ASN A 248 11.792 31.498 48.835 1.00 48.60 C +ATOM 1875 OD1 ASN A 248 10.891 31.971 49.535 1.00 40.94 O +ATOM 1876 ND2 ASN A 248 12.588 32.295 48.113 1.00 39.08 N +ATOM 1877 N GLY A 249 14.794 28.732 50.464 1.00 39.73 N +ATOM 1878 CA GLY A 249 15.681 28.813 51.625 1.00 38.71 C +ATOM 1879 C GLY A 249 15.224 28.069 52.868 1.00 40.69 C +ATOM 1880 O GLY A 249 16.022 27.990 53.804 1.00 48.32 O +ATOM 1881 N MET A 250 14.079 27.473 52.887 1.00 35.40 N +ATOM 1882 CA MET A 250 13.442 26.704 53.944 1.00 49.78 C +ATOM 1883 C MET A 250 14.280 25.436 54.144 1.00 45.65 C +ATOM 1884 O MET A 250 14.847 24.872 53.202 1.00 42.49 O +ATOM 1885 CB MET A 250 11.979 26.452 53.594 1.00 43.16 C +ATOM 1886 CG MET A 250 11.000 25.824 54.579 1.00 58.89 C +ATOM 1887 SD MET A 250 9.941 24.548 53.910 1.00 70.40 S +ATOM 1888 CE MET A 250 8.230 25.103 53.862 1.00 39.65 C +ATOM 1889 N PRO A 251 14.420 25.028 55.396 1.00 51.19 N +ATOM 1890 CA PRO A 251 15.202 23.857 55.780 1.00 
47.08 C +ATOM 1891 C PRO A 251 14.434 22.570 55.626 1.00 40.68 C +ATOM 1892 O PRO A 251 13.554 22.216 56.424 1.00 37.97 O +ATOM 1893 CB PRO A 251 15.498 24.191 57.247 1.00 42.98 C +ATOM 1894 CG PRO A 251 14.239 24.806 57.739 1.00 44.97 C +ATOM 1895 CD PRO A 251 13.530 25.391 56.538 1.00 50.50 C +ATOM 1896 N MET A 252 14.787 21.797 54.594 1.00 33.05 N +ATOM 1897 CA MET A 252 14.107 20.546 54.301 1.00 30.21 C +ATOM 1898 C MET A 252 14.923 19.272 54.589 1.00 23.34 C +ATOM 1899 O MET A 252 14.440 18.134 54.485 1.00 27.09 O +ATOM 1900 CB MET A 252 13.859 20.582 52.763 1.00 34.27 C +ATOM 1901 CG MET A 252 12.841 21.613 52.290 1.00 38.48 C +ATOM 1902 SD MET A 252 11.566 22.068 53.468 1.00 44.86 S +ATOM 1903 CE MET A 252 10.696 20.519 53.622 1.00 37.10 C +ATOM 1904 N GLY A 253 16.187 19.506 54.868 1.00 24.24 N +ATOM 1905 CA GLY A 253 17.096 18.359 55.032 1.00 20.34 C +ATOM 1906 C GLY A 253 18.078 18.662 56.121 1.00 23.58 C +ATOM 1907 O GLY A 253 17.654 18.800 57.296 1.00 22.18 O +ATOM 1908 N THR A 254 19.371 18.695 55.843 1.00 19.16 N +ATOM 1909 CA THR A 254 20.396 18.994 56.812 1.00 19.66 C +ATOM 1910 C THR A 254 21.057 20.314 56.592 1.00 20.88 C +ATOM 1911 O THR A 254 21.617 20.434 55.435 1.00 20.88 O +ATOM 1912 CB THR A 254 21.467 17.893 56.946 1.00 18.67 C +ATOM 1913 OG1 THR A 254 20.817 16.643 57.197 1.00 21.57 O +ATOM 1914 CG2 THR A 254 22.481 18.243 57.977 1.00 21.01 C +ATOM 1915 N ARG A 255 21.061 21.300 57.428 1.00 18.66 N +ATOM 1916 CA ARG A 255 21.661 22.600 57.173 1.00 17.10 C +ATOM 1917 C ARG A 255 23.029 22.505 57.820 1.00 21.70 C +ATOM 1918 O ARG A 255 23.200 22.250 59.017 1.00 22.02 O +ATOM 1919 CB ARG A 255 20.846 23.740 57.836 1.00 20.60 C +ATOM 1920 CG ARG A 255 21.426 25.130 57.575 1.00 21.88 C +ATOM 1921 CD ARG A 255 20.355 26.223 57.552 1.00 26.32 C +ATOM 1922 NE ARG A 255 19.523 26.019 56.380 1.00 27.38 N +ATOM 1923 CZ ARG A 255 18.422 26.707 56.054 1.00 35.09 C +ATOM 1924 NH1 ARG A 255 18.047 27.695 56.851 1.00 44.84 N +ATOM 1925 NH2 ARG A 255 
17.776 26.360 54.932 1.00 32.78 N +ATOM 1926 N ILE A 256 24.093 22.632 57.012 1.00 22.66 N +ATOM 1927 CA ILE A 256 25.467 22.575 57.487 1.00 21.82 C +ATOM 1928 C ILE A 256 25.857 23.989 57.811 1.00 20.21 C +ATOM 1929 O ILE A 256 25.683 25.011 57.110 1.00 27.87 O +ATOM 1930 CB ILE A 256 26.339 22.070 56.295 1.00 21.81 C +ATOM 1931 CG1 ILE A 256 25.758 20.747 55.799 1.00 26.92 C +ATOM 1932 CG2 ILE A 256 27.806 22.086 56.679 1.00 30.03 C +ATOM 1933 CD1 ILE A 256 25.681 19.530 56.621 1.00 31.83 C +ATOM 1934 N LEU A 257 26.293 24.201 59.069 1.00 27.12 N +ATOM 1935 CA LEU A 257 26.712 25.415 59.680 1.00 39.28 C +ATOM 1936 C LEU A 257 28.226 25.480 59.934 1.00 45.68 C +ATOM 1937 O LEU A 257 28.793 24.561 60.559 1.00 39.14 O +ATOM 1938 CB LEU A 257 26.088 25.578 61.079 1.00 30.65 C +ATOM 1939 CG LEU A 257 24.570 25.458 61.099 1.00 33.76 C +ATOM 1940 CD1 LEU A 257 24.058 25.412 62.521 1.00 34.06 C +ATOM 1941 CD2 LEU A 257 23.943 26.616 60.322 1.00 46.47 C +ATOM 1942 N ALA A 258 28.808 26.602 59.556 1.00 45.54 N +ATOM 1943 CA ALA A 258 30.250 26.760 59.853 1.00 56.77 C +ATOM 1944 C ALA A 258 30.462 27.856 60.896 1.00 59.90 C +ATOM 1945 O ALA A 258 29.442 28.446 61.325 1.00 66.55 O +ATOM 1946 CB ALA A 258 31.062 27.042 58.613 1.00 44.82 C +TER 1947 ALA A 258 +HETATM 1948 CA NLG A1259 32.235 10.774 40.715 1.00 22.94 C +HETATM 1949 C NLG A1259 32.002 9.560 40.196 1.00 27.29 C +HETATM 1950 OXT NLG A1259 32.795 8.778 39.354 1.00 27.10 O +HETATM 1951 O NLG A1259 31.047 8.757 40.505 1.00 28.71 O +HETATM 1952 CB NLG A1259 31.615 11.808 39.808 1.00 19.40 C +HETATM 1953 CG NLG A1259 30.040 11.630 39.688 1.00 19.32 C +HETATM 1954 CD NLG A1259 29.398 12.025 41.011 1.00 21.73 C +HETATM 1955 OE1 NLG A1259 29.827 12.681 41.976 1.00 22.44 O +HETATM 1956 OE2 NLG A1259 28.273 11.447 41.024 1.00 30.01 O +HETATM 1957 C7 NLG A1259 34.525 10.593 41.676 1.00 23.12 C +HETATM 1958 C8 NLG A1259 35.827 10.722 41.547 1.00 22.01 C +HETATM 1959 O7 NLG A1259 34.054 9.818 42.554 1.00 24.98 O +HETATM 1960 
N2 NLG A1259 33.746 10.909 40.942 1.00 24.96 N +HETATM 1961 PG ANP A1260 25.926 11.715 42.530 0.70 40.34 P +HETATM 1962 O1G ANP A1260 26.330 13.066 42.292 0.70 30.03 O +HETATM 1963 O2G ANP A1260 27.036 10.834 43.026 0.70 38.16 O +HETATM 1964 O3G ANP A1260 25.409 11.202 41.281 0.70 40.83 O +HETATM 1965 PB ANP A1260 24.919 11.701 45.361 0.70 40.37 P +HETATM 1966 O1B ANP A1260 26.159 12.453 45.681 0.70 32.20 O +HETATM 1967 O2B ANP A1260 23.648 12.326 45.700 0.70 48.11 O +HETATM 1968 N3B ANP A1260 24.927 11.416 43.822 0.70 35.31 N +HETATM 1969 PA ANP A1260 25.982 9.653 47.111 0.70 48.34 P +HETATM 1970 O1A ANP A1260 25.679 8.147 47.176 0.70 55.19 O +HETATM 1971 O2A ANP A1260 27.311 9.768 46.464 0.70 54.10 O +HETATM 1972 O3A ANP A1260 24.803 10.392 46.284 0.70 48.69 O +HETATM 1973 O5' ANP A1260 25.910 10.014 48.731 0.70 29.14 O +HETATM 1974 C5' ANP A1260 24.696 9.710 49.602 0.70 27.84 C +HETATM 1975 C4' ANP A1260 24.603 8.420 49.897 0.70 27.30 C +HETATM 1976 O4' ANP A1260 25.224 8.531 51.213 0.70 27.39 O +HETATM 1977 C3' ANP A1260 23.176 7.882 50.334 0.70 27.32 C +HETATM 1978 O3' ANP A1260 22.226 7.477 49.415 0.70 25.24 O +HETATM 1979 C2' ANP A1260 23.651 6.854 51.465 0.70 27.34 C +HETATM 1980 O2' ANP A1260 23.819 5.518 50.717 0.70 28.12 O +HETATM 1981 C1' ANP A1260 25.000 7.345 51.937 0.70 27.43 C +HETATM 1982 N9 ANP A1260 25.165 7.467 53.245 1.00 27.73 N +HETATM 1983 C8 ANP A1260 26.116 6.890 54.068 1.00 27.44 C +HETATM 1984 N7 ANP A1260 26.103 7.205 55.305 1.00 27.70 N +HETATM 1985 C5 ANP A1260 25.068 8.066 55.352 1.00 26.20 C +HETATM 1986 C6 ANP A1260 24.564 8.744 56.448 1.00 26.22 C +HETATM 1987 N6 ANP A1260 24.960 8.733 57.748 1.00 25.50 N +HETATM 1988 N1 ANP A1260 23.474 9.582 56.215 1.00 26.89 N +HETATM 1989 C2 ANP A1260 22.961 9.687 54.921 1.00 23.86 C +HETATM 1990 N3 ANP A1260 23.365 9.083 53.806 1.00 26.35 N +HETATM 1991 C4 ANP A1260 24.464 8.254 54.105 1.00 26.45 C +HETATM 1992 MG MG A1261 28.109 11.489 45.492 1.00 38.96 MG +HETATM 1993 O HOH A2001 27.394 
37.718 40.786 1.00 42.58 O +HETATM 1994 O HOH A2002 29.198 36.463 44.102 1.00 34.65 O +HETATM 1995 O HOH A2003 23.383 38.663 46.260 1.00 38.98 O +HETATM 1996 O HOH A2004 17.322 10.410 31.849 1.00 52.58 O +HETATM 1997 O HOH A2005 10.814 7.678 39.500 1.00 51.69 O +HETATM 1998 O HOH A2006 15.591 11.823 30.563 1.00 33.28 O +HETATM 1999 O HOH A2007 14.550 8.001 32.855 1.00 52.52 O +HETATM 2000 O HOH A2008 24.052 2.465 29.064 1.00 47.91 O +HETATM 2001 O HOH A2009 24.499 5.640 29.191 1.00 51.21 O +HETATM 2002 O HOH A2010 39.602 39.630 39.531 1.00 52.37 O +HETATM 2003 O HOH A2011 17.266 2.782 30.492 1.00 56.25 O +HETATM 2004 O HOH A2012 4.181 15.769 35.037 1.00 54.29 O +HETATM 2005 O HOH A2013 40.339 0.178 50.671 1.00 54.51 O +HETATM 2006 O HOH A2014 32.836 3.318 52.148 1.00 61.99 O +HETATM 2007 O HOH A2015 5.030 23.022 35.897 1.00 47.11 O +HETATM 2008 O HOH A2016 6.911 25.760 36.234 1.00 35.12 O +HETATM 2009 O HOH A2017 10.092 26.683 42.665 1.00 29.50 O +HETATM 2010 O HOH A2018 42.720 12.857 26.716 1.00 57.66 O +HETATM 2011 O HOH A2019 6.451 28.308 36.500 1.00 43.26 O +HETATM 2012 O HOH A2020 38.222 4.117 25.761 1.00 69.22 O +HETATM 2013 O HOH A2021 13.708 35.753 34.573 1.00 35.44 O +HETATM 2014 O HOH A2022 18.508 31.378 36.336 1.00 35.00 O +HETATM 2015 O HOH A2023 12.503 29.893 33.477 1.00 38.42 O +HETATM 2016 O HOH A2024 12.157 36.835 44.638 1.00 34.06 O +HETATM 2017 O HOH A2025 12.030 29.385 23.601 1.00 45.69 O +HETATM 2018 O HOH A2026 14.781 36.412 36.863 1.00 35.00 O +HETATM 2019 O HOH A2027 7.384 19.197 25.416 1.00 73.27 O +HETATM 2020 O HOH A2028 16.139 43.152 36.151 1.00 34.59 O +HETATM 2021 O HOH A2029 20.480 39.313 39.868 1.00 37.48 O +HETATM 2022 O HOH A2030 16.512 33.252 38.952 1.00 28.76 O +HETATM 2023 O HOH A2031 16.406 36.220 44.179 1.00 33.41 O +HETATM 2024 O HOH A2032 21.050 31.497 35.307 1.00 27.28 O +HETATM 2025 O HOH A2033 47.976 14.499 36.123 1.00 36.88 O +HETATM 2026 O HOH A2034 50.246 15.746 39.516 1.00 33.28 O +HETATM 2027 O HOH A2035 29.483 15.115 
36.406 1.00 21.48 O +HETATM 2028 O HOH A2036 24.318 4.404 31.445 1.00 39.73 O +HETATM 2029 O HOH A2037 37.950 37.393 38.935 1.00 53.95 O +HETATM 2030 O HOH A2038 23.573 3.218 40.209 1.00 66.28 O +HETATM 2031 O HOH A2039 18.176 2.512 33.969 1.00 60.06 O +HETATM 2032 O HOH A2040 15.393 35.952 29.999 1.00 66.48 O +HETATM 2033 O HOH A2041 19.413 31.294 23.346 1.00 45.29 O +HETATM 2034 O HOH A2042 50.354 14.776 32.651 1.00 34.68 O +HETATM 2035 O HOH A2043 36.501 14.449 51.823 1.00 39.73 O +HETATM 2036 O HOH A2044 37.146 24.068 46.889 1.00 32.58 O +HETATM 2037 O HOH A2045 39.230 35.106 40.744 1.00 56.90 O +HETATM 2038 O HOH A2046 38.233 3.218 51.430 1.00 45.71 O +HETATM 2039 O HOH A2047 19.775 29.010 49.281 1.00 50.21 O +HETATM 2040 O HOH A2048 34.503 4.096 49.885 1.00 46.45 O +HETATM 2041 O HOH A2049 33.966 2.560 38.194 1.00 33.23 O +HETATM 2042 O HOH A2050 36.146 1.999 39.692 1.00 43.35 O +HETATM 2043 O HOH A2051 22.144 5.583 56.051 1.00 49.45 O +HETATM 2044 O HOH A2052 19.462 14.587 65.009 1.00 32.84 O +HETATM 2045 O HOH A2053 16.290 11.831 68.228 1.00 33.23 O +HETATM 2046 O HOH A2054 9.108 17.667 56.084 1.00 96.26 O +HETATM 2047 O HOH A2055 40.330 6.121 28.762 1.00 29.68 O +HETATM 2048 O HOH A2056 43.802 8.044 29.070 1.00 51.29 O +HETATM 2049 O HOH A2057 44.044 1.575 33.026 1.00 37.01 O +HETATM 2050 O HOH A2058 36.889 0.068 29.613 1.00 48.90 O +HETATM 2051 O HOH A2059 38.978 -2.040 30.240 1.00 57.82 O +HETATM 2052 O HOH A2060 42.470 9.903 24.523 1.00 45.47 O +HETATM 2053 O HOH A2061 40.718 11.136 25.827 1.00 35.97 O +HETATM 2054 O HOH A2062 42.105 10.914 27.471 1.00 40.32 O +HETATM 2055 O HOH A2063 37.491 4.459 28.747 1.00 33.62 O +HETATM 2056 O HOH A2064 31.021 7.057 28.589 1.00 61.37 O +HETATM 2057 O HOH A2065 35.945 18.560 50.536 1.00 38.94 O +HETATM 2058 O AHOH A2066 29.676 17.690 27.048 0.50 17.91 O +HETATM 2059 O HOH A2067 38.307 27.917 48.677 1.00 36.42 O +HETATM 2060 O HOH A2068 26.746 6.950 28.432 1.00 31.63 O +HETATM 2061 O HOH A2069 29.565 20.584 28.722 
1.00 17.47 O +HETATM 2062 O HOH A2070 19.788 10.052 30.492 1.00 49.06 O +HETATM 2063 O HOH A2071 5.062 13.888 41.895 1.00 39.66 O +HETATM 2064 O HOH A2072 19.578 23.066 25.739 1.00 23.74 O +HETATM 2065 O HOH A2073 12.410 14.303 27.919 1.00 55.94 O +HETATM 2066 O HOH A2074 13.607 27.624 24.098 1.00 41.46 O +HETATM 2067 O HOH A2075 16.024 28.398 24.570 1.00 47.96 O +HETATM 2068 O HOH A2076 7.670 21.512 29.427 1.00 39.95 O +HETATM 2069 O HOH A2077 8.569 21.554 25.041 1.00 50.27 O +HETATM 2070 O HOH A2078 11.590 28.817 30.978 1.00 30.99 O +HETATM 2071 O HOH A2079 7.690 23.903 28.913 1.00 54.43 O +HETATM 2072 O HOH A2080 13.400 30.829 30.355 1.00 39.48 O +HETATM 2073 O HOH A2081 18.532 25.554 26.383 1.00 22.36 O +HETATM 2074 O HOH A2082 15.856 31.232 29.248 1.00 36.20 O +HETATM 2075 O HOH A2083 21.127 28.323 25.252 1.00 21.91 O +HETATM 2076 O HOH A2084 40.788 24.119 30.620 1.00 26.36 O +HETATM 2077 O HOH A2085 31.608 22.169 27.607 1.00 16.52 O +HETATM 2078 O HOH A2086 37.481 24.014 27.932 1.00 17.93 O +HETATM 2079 O HOH A2087 36.668 32.398 33.336 1.00 23.29 O +HETATM 2080 O HOH A2088 41.737 32.249 33.376 1.00 49.99 O +HETATM 2081 O HOH A2089 40.868 27.129 29.537 1.00 32.88 O +HETATM 2082 O HOH A2090 41.423 29.606 36.893 1.00 37.60 O +HETATM 2083 O HOH A2091 40.836 25.054 35.067 1.00 32.59 O +HETATM 2084 O HOH A2092 46.387 21.363 36.669 1.00 28.10 O +HETATM 2085 O HOH A2093 43.753 21.321 42.394 1.00 21.31 O +HETATM 2086 O HOH A2094 47.928 19.393 43.229 1.00 22.85 O +HETATM 2087 O HOH A2095 48.113 16.717 38.269 1.00 27.80 O +HETATM 2088 O HOH A2096 47.534 12.306 47.569 1.00 30.68 O +HETATM 2089 O HOH A2097 47.506 6.208 38.961 1.00 30.82 O +HETATM 2090 O HOH A2098 54.915 8.066 41.347 1.00 48.78 O +HETATM 2091 O HOH A2099 44.128 1.855 43.765 1.00 25.85 O +HETATM 2092 O HOH A2100 47.164 8.194 32.420 1.00 47.18 O +HETATM 2093 O HOH A2101 43.759 11.045 41.808 1.00 21.51 O +HETATM 2094 O HOH A2102 38.266 17.946 45.024 1.00 23.51 O +HETATM 2095 O HOH A2103 38.073 20.045 46.548 
1.00 28.23 O +HETATM 2096 O HOH A2104 41.771 25.616 47.761 1.00 41.57 O +HETATM 2097 O HOH A2105 43.893 24.507 49.263 1.00 41.76 O +HETATM 2098 O HOH A2106 41.935 30.692 41.220 1.00 43.91 O +HETATM 2099 O HOH A2107 41.762 31.787 38.545 1.00 33.18 O +HETATM 2100 O HOH A2108 38.537 31.925 42.590 1.00 28.54 O +HETATM 2101 O HOH A2109 39.736 35.658 36.567 1.00 42.27 O +HETATM 2102 O HOH A2110 33.774 30.813 34.939 1.00 17.99 O +HETATM 2103 O HOH A2111 32.769 38.238 33.422 1.00 29.20 O +HETATM 2104 O HOH A2112 32.515 36.804 41.023 1.00 36.76 O +HETATM 2105 O HOH A2113 29.170 35.435 40.551 1.00 26.52 O +HETATM 2106 O HOH A2114 33.328 38.453 36.290 1.00 35.36 O +HETATM 2107 O HOH A2115 30.519 39.619 29.061 1.00 57.91 O +HETATM 2108 O HOH A2116 21.218 34.160 34.151 1.00 36.63 O +HETATM 2109 O HOH A2117 29.363 40.706 31.602 1.00 43.91 O +HETATM 2110 O HOH A2118 30.417 39.586 33.500 1.00 42.54 O +HETATM 2111 O HOH A2119 19.887 34.546 26.834 1.00 50.99 O +HETATM 2112 O HOH A2120 18.407 31.070 30.972 1.00 35.49 O +HETATM 2113 O HOH A2121 17.075 33.546 29.184 1.00 33.60 O +HETATM 2114 O HOH A2122 17.000 34.578 32.540 1.00 50.30 O +HETATM 2115 O HOH A2123 21.567 33.099 22.637 1.00 28.64 O +HETATM 2116 O HOH A2124 24.818 35.951 23.985 1.00 40.70 O +HETATM 2117 O HOH A2125 30.279 18.509 30.295 1.00 17.18 O +HETATM 2118 O HOH A2126 41.274 23.654 33.345 1.00 34.39 O +HETATM 2119 O HOH A2127 42.671 22.758 35.704 1.00 25.18 O +HETATM 2120 O HOH A2128 39.443 21.760 35.002 1.00 17.55 O +HETATM 2121 O HOH A2129 48.329 15.989 34.084 1.00 30.41 O +HETATM 2122 O HOH A2130 48.063 24.494 30.094 1.00 34.02 O +HETATM 2123 O HOH A2131 51.606 22.842 31.105 1.00 56.10 O +HETATM 2124 O HOH A2132 48.445 19.459 37.083 1.00 30.12 O +HETATM 2125 O HOH A2133 52.338 22.591 33.247 1.00 56.31 O +HETATM 2126 O HOH A2134 43.268 12.067 30.004 1.00 30.86 O +HETATM 2127 O HOH A2135 29.578 12.369 47.514 1.00 31.98 O +HETATM 2128 O HOH A2136 37.244 14.231 43.429 1.00 18.84 O +HETATM 2129 O HOH A2137 36.134 21.441 
46.761 1.00 26.98 O +HETATM 2130 O HOH A2138 38.119 13.283 49.611 1.00 40.18 O +HETATM 2131 O HOH A2139 33.532 26.879 48.837 1.00 29.72 O +HETATM 2132 O HOH A2140 36.767 34.045 42.434 1.00 35.06 O +HETATM 2133 O HOH A2141 33.588 35.647 42.612 1.00 34.42 O +HETATM 2134 O HOH A2142 23.974 35.173 49.195 1.00 37.69 O +HETATM 2135 O HOH A2143 21.486 33.866 50.133 1.00 56.08 O +HETATM 2136 O HOH A2144 21.581 27.013 50.722 1.00 46.97 O +HETATM 2137 O HOH A2145 22.032 13.466 51.474 1.00 37.80 O +HETATM 2138 O HOH A2146 16.892 9.045 65.761 1.00 34.47 O +HETATM 2139 O HOH A2147 20.181 12.335 65.949 1.00 50.65 O +HETATM 2140 O HOH A2148 22.137 5.523 58.951 1.00 58.46 O +HETATM 2141 O HOH A2149 15.989 5.854 57.435 1.00 56.34 O +HETATM 2142 O HOH A2150 12.163 6.743 61.522 1.00 35.28 O +HETATM 2143 O HOH A2151 15.046 12.458 65.594 1.00 29.77 O +HETATM 2144 O HOH A2152 17.533 12.888 64.232 1.00 29.34 O +HETATM 2145 O HOH A2153 10.077 19.427 58.152 1.00 42.01 O +HETATM 2146 O HOH A2154 17.468 21.705 58.283 1.00 25.36 O +HETATM 2147 O HOH A2155 19.432 21.076 65.523 1.00 28.11 O +HETATM 2148 O HOH A2156 19.576 25.657 60.823 1.00 44.66 O +HETATM 2149 O HOH A2157 28.660 21.584 67.547 1.00 37.67 O +HETATM 2150 O HOH A2158 32.028 22.808 64.934 1.00 33.35 O +HETATM 2151 O HOH A2159 20.351 18.687 64.437 1.00 24.82 O +HETATM 2152 O HOH A2160 22.012 15.553 65.937 1.00 43.77 O +HETATM 2153 O HOH A2161 22.137 18.003 67.899 1.00 43.88 O +HETATM 2154 O HOH A2162 23.879 21.584 65.741 1.00 50.61 O +HETATM 2155 O HOH A2163 23.353 20.157 67.041 1.00 49.46 O +HETATM 2156 O HOH A2164 32.838 6.760 60.068 1.00 34.17 O +HETATM 2157 O HOH A2165 27.235 1.916 62.905 1.00 56.19 O +HETATM 2158 O HOH A2166 30.323 2.978 48.512 1.00 53.40 O +HETATM 2159 O HOH A2167 34.953 16.132 50.323 1.00 27.15 O +HETATM 2160 O HOH A2168 36.044 25.932 48.981 1.00 36.30 O +HETATM 2161 O HOH A2169 35.439 20.621 49.336 1.00 28.71 O +HETATM 2162 O HOH A2170 37.541 23.961 54.588 1.00 42.31 O +HETATM 2163 O HOH A2171 33.309 31.128 
58.074 1.00 42.36 O +HETATM 2164 O HOH A2172 36.707 32.926 52.529 1.00 60.37 O +HETATM 2165 O HOH A2173 29.893 36.479 47.928 1.00 44.64 O +HETATM 2166 O HOH A2174 24.844 28.705 50.654 1.00 29.34 O +HETATM 2167 O HOH A2175 18.107 21.936 55.524 1.00 30.04 O +HETATM 2168 O HOH A2176 11.441 15.682 41.661 1.00 33.13 O +HETATM 2169 O HOH A2177 9.381 14.153 42.479 1.00 40.68 O +HETATM 2170 O HOH A2178 14.764 5.671 43.373 1.00 57.43 O +HETATM 2171 O HOH A2179 11.509 8.865 44.400 1.00 65.36 O +HETATM 2172 O HOH A2180 11.462 8.529 42.509 1.00 50.29 O +HETATM 2173 O HOH A2181 12.129 16.181 48.209 1.00 32.48 O +HETATM 2174 O HOH A2182 7.669 10.347 46.167 1.00 60.54 O +HETATM 2175 O HOH A2183 6.852 13.911 44.368 1.00 39.49 O +HETATM 2176 O HOH A2184 7.446 23.926 48.989 1.00 33.38 O +HETATM 2177 O HOH A2185 6.102 16.447 52.745 1.00 33.95 O +HETATM 2178 O HOH A2186 11.331 28.371 44.618 1.00 33.06 O +HETATM 2179 O HOH A2187 8.073 29.267 48.881 1.00 49.10 O +HETATM 2180 O HOH A2188 16.797 25.199 51.199 1.00 49.90 O +HETATM 2181 O HOH A2189 12.012 17.187 54.442 1.00 42.04 O +HETATM 2182 O HOH A2190 15.014 16.702 52.094 1.00 29.51 O +HETATM 2183 O HOH A2191 12.498 15.761 54.481 1.00 87.15 O +HETATM 2184 O HOH A2192 16.376 30.118 56.735 1.00 48.04 O +HETATM 2185 O HOH A2193 31.188 24.102 62.114 1.00 37.72 O +HETATM 2186 O HOH A2194 32.331 9.917 44.583 1.00 31.37 O +HETATM 2187 O HOH A2195 28.852 13.544 44.255 1.00 27.10 O +HETATM 2188 O HOH A2196 29.761 8.553 42.730 1.00 43.20 O +HETATM 2189 O HOH A2197 24.295 8.703 41.218 1.00 44.13 O +HETATM 2190 O HOH A2198 23.458 14.300 44.584 1.00 38.88 O +CONECT 1948 1949 1952 1960 +CONECT 1949 1948 1950 1951 +CONECT 1950 1949 +CONECT 1951 1949 +CONECT 1952 1948 1953 +CONECT 1953 1952 1954 +CONECT 1954 1953 1955 1956 +CONECT 1955 1954 +CONECT 1956 1954 +CONECT 1957 1958 1959 1960 +CONECT 1958 1957 +CONECT 1959 1957 +CONECT 1960 1948 1957 +CONECT 1961 1962 1963 1964 1968 +CONECT 1962 1961 +CONECT 1963 1961 1992 +CONECT 1964 1961 +CONECT 1965 1966 
1967 1968 1972 +CONECT 1966 1965 1992 +CONECT 1967 1965 +CONECT 1968 1961 1965 +CONECT 1969 1970 1971 1972 1973 +CONECT 1970 1969 +CONECT 1971 1969 1992 +CONECT 1972 1965 1969 +CONECT 1973 1969 1974 +CONECT 1974 1973 1975 +CONECT 1975 1974 1976 1977 +CONECT 1976 1975 1981 +CONECT 1977 1975 1978 1979 +CONECT 1978 1977 +CONECT 1979 1977 1980 1981 +CONECT 1980 1979 +CONECT 1981 1976 1979 1982 +CONECT 1982 1981 1983 1991 +CONECT 1983 1982 1984 +CONECT 1984 1983 1985 +CONECT 1985 1984 1986 1991 +CONECT 1986 1985 1987 1988 +CONECT 1987 1986 +CONECT 1988 1986 1989 +CONECT 1989 1988 1990 +CONECT 1990 1989 1991 +CONECT 1991 1982 1985 1990 +CONECT 1992 1963 1966 1971 2127 +CONECT 1992 2187 +CONECT 2127 1992 +CONECT 2187 1992 +MASTER 345 0 3 13 14 0 10 6 2189 1 48 20 +END diff --git a/testdata/1gs5_Repair_0_ST.fxout b/testdata/1gs5_Repair_0_ST.fxout new file mode 100644 index 0000000..e643de5 --- /dev/null +++ b/testdata/1gs5_Repair_0_ST.fxout @@ -0,0 +1 @@ +argB/1gs5_Repair.pdb -33.0386 -201.431 -52.5681 -294.211 -7.26582 380.883 -402.154 11.2723 141.699 388.729 0 0 0 5.37873 170.686 -3.95905 0 0 0 0 0.587221 0 259 diff --git a/testdata/MDH-Eukaryota-test.fasta b/testdata/MDH-Eukaryota-test.fasta new file mode 100644 index 0000000..b637d40 --- /dev/null +++ b/testdata/MDH-Eukaryota-test.fasta @@ -0,0 +1,300 @@ +>9606.ENSP00000327070 +MLSALARPASAALRRSFSTSAQNNAKVAVLGASGGIGQPLSLLLKNSPLVSRLTLYDIAH +TPGVAADLSHIETKAAVKGYLGPEQLPDCLKGCDVVVIPA +>2711.XP_006466391.1 +MQQPTSGANQRIARIAAHLHPPTLQIEGESSGLGRMDCRAKGGSPGFKVAVLGAAGGIGQ +PLAMLMKINPLVSVLHLYDVVNTPGVTADISHMDTNAVVR +>2711.XP_006477460.1 +MAATSATTFSIRSTIAFGPKAGQLPPSKPSGVRFNSKNSLVSFSGLKAVTSVICESNTSF +LNKESCSALRSTFARKAQSSEQRPQYALQPQASFKVAVLG +>2711.XP_006478245.1 +MLQAEVLGLDPRDVDVPVVGGHAGVTILPLLSQVKPPCSFTQEETEYLTNRIQNGGTEVV +EAKAGAGSATLSMAYAAVKFADACLRGLRGDAGVVECAFV +>2711.XP_006485676.1 +MRSSVLRSVKTLAKPAGARGYSSESVPDRKVAVLGAAGGIGQPLALLMKLNPLVSRLALY +DIANTPGVAADVGHINTRSEVAGYMGNDQLGQALEDSDVV +>2711.XP_006486803.1 
+MEFSSEANQRIARISAHLYPPNLQMEENSCLRQAKCRAKGGAAGFKVAILGAAGGIGQPL +AMLMKINPLVSVLHLYDVVNTPGVTADISHMDTGAVVRGF +>2711.XP_006494638.1 +MLQAEVLGLDPRDVDVPVVGGHAGVTILPLLSQVKPPCSFTQEETEYLTNRIQNGGTEVV +EAKAGAGSATLSMAYAAVKFADACLRGLRGDAGVVECAFV +>2850.Phatr42398 +MSSASKKVAVLGAAGGIGQPLSMLLKLSPAIGELACYDIVGTPGVAADLSHIPTRARVSG +CLPAAGAWPPRGNEGLGEALTGADVVVIPAGVPRKPGMTR +>2880.D8LQM3 +MSAVARIQLASKVAAPMASKALGVSSSRFFTGTARAQNKVTVVGAAGGIGQPMSLLLKLS +GKVEHLSLFDIVNTPGVAADISHCNSKGKVTGHKGAEEMA +>2903.EOD05272 +MAGFKVCVVGGAGGIGQPLSMLMAMDPNVAELCVYDLTIAMIPADGVAADLSHLNKAAKV +KAYAFDKDARAADVAGECLTGCDLVLVPAGVPRKPGQDRA +>2903.EOD19958 +MLRAAPSLLRRSARAYSSSSSHVKVAVLGAAGGIGQPLSLLCKLSDSIDEVACYDVVGTP +GVAADLSHCPTKAVITGDLPSAGTWPPSGNSGLERTLTGA +>2903.EOD23190 +MPGYKVCVVGGAGGIGQPLSMLMAMDPNVAELCVYDLTIAMIPADGVAADLGHLNKAAKV +KAYAFDKDARAAEVAGECLTGCDLVLVPAGVPRKPGQDRA +>3055.EDO96543 +MSLQSSIRADSNCTLPNNPVCVLLPVDFIVAAMASSTSSAMAKWAAQAARGFAAAAPSSG +KGRKVAVLGAAGGIGQPLSMLMKMNSQVSSLSLYDIAGTP +>3055.EDP03144 +MLLANRVNAGAARRVSGRAAAPIAVRAGRRSLVCEARKVALLGAAGGIGQPLALLLKMNK +FVTELALYDIANVVGVAADLSHCNTPVKVTGYTGPEELGA +>3055.EDP06365 +MADPLNRIQKIASHLDPAKPRKFKVALLGAAGGIGQPLSLLLKMSPYVSDLALYDVANTP +GVAADVSHMSTAARVRGYLGPDQLGAALTGAALVIIPAGV +>3067.XP_002953466.1 +MASQSSASLLKWAQAASRGFAAAAASGPGRKVAVLGAAGGIGQPLSMLMKMNAQVSQLSL +YDVIGTPGVAADVSHINTKAQAKGFDKDGLAEALRGCDLV +>3067.XP_002954828.1 +MAALNRIQKIASHLDPPKLFKFKVAVLGAAGGIGQPLSMLLKMSPYISELSLYDVANTPG +VAADVSHMSTAARVKGYLGPDQLPAALAGCHLVIIPAGVP +>3067.XP_002957197.1 +MVARSSRRSLRCEARKVALLGAGGGIGQPLALLLKMNKFVTELALYDIVGVAGVAADLSH +CNTPVKVTAFTGPEELAGCLSGADLVVIPAGVPRKPGMTR +>3075.A0A087SC94 +MDRVSRLSAHFVHDTQGLAGSVHPEATSASGSGKFNVALLGAAGGIGQPLALLLKQSAYI +KELRLYDVANTAGVAADLSHIATGARVTAHSGAEALGTAL +>3075.A0A087SG45 +MNSLFRASRDLLRASATRGYASASFPDRKVAVLGAAGGIGQPLSLLLKLNPYVTELALYD +IAGTPGVAADISHINSKGRVKGYAGEDQLGEALKGADVIV +>3075.A0A087SLQ1 +MSVLACSSTRPAATPCVAGVQPRAKPSRAGPITASLRVVTPAFRRADNVQLRSVRSSAAP +QGRTLGATVEAKNVALLGAAGGIGQPLALLLKLNPQITEL +>3218.PP1S122_52V6.1 
+MLSHCNTTIPSHQPASLPNKGCIVGMWGAESFCRMGTARVAAFIRCGCHLESRMRACSVG +GDAAGLQGQQLWARGKRTVAVLGGAGGIGQPLSLLLKLNP +>3218.PP1S201_6V6.1 +MAARFAAAGLLKRALSSAPQQQVRCMSSQTPKRKVAVLGAAGGIGQPLGLLMKLNPLVTD +LSLYDIAGTPGVASDLSHINTGANVEGFAGEQELAKALKG +>3218.PP1S26_26V6.1 +MASMATTAFHAATAANRACLSSIAASSASPASCRSVSFSSFRLAAASGLPGLSLSSASVR +GGFVRLQSDGVSKVSVQGMPVQVRADSSASAGPKSGSSTF +>3218.PP1S38_300V6.1 +MEEANARAQVRMARIASHMRAPEGNSMVGLEREPTRARGAAPGFKVAVLGAAGGIGQPLS +LLMKMHPLVSTLHLYDVFNTPGVVADLSHTNTSAVVRGFL +>3218.PP1S39_428V6.1 +MEMANVRAQVRLARIASHMEAPERNIMTGVEREATRARGAAPGFKVAILGAAGGIGQPLS +LLMKMSPLVSTLHLYDVFNTPGVVADLSHTNTSAVVRGFL +>3218.PP1S79_110V6.1 +MASTATAFNAATAANGVRLNSIAASCASSASCRSVSFSSLRPAAASRLSSLNSSLRGGFI +VVQGDVAWRQDVRGMPVQVRADASGAAAPKSGSSTFKVAV +>3218.PP1S91_247V6.1 +MAARSVAVGLLKRALSSQQQVRGMSSATPKRKVAVLGAAGGIGQPLGLLMKLNPLVTDLS +LYDIAGTPGVACDISHINTGANVEGFAGEEDLAKALKGCD +>3641.EOX91815 +MQPNNSQVNRRIATISAHLNPPNYSQMEGGSGLGRANCRAKGGSAGFKVAILGAAGGIGQ +PLAMLMKMNPLVSVLHLYDVVNAPGVTADISHMDTGAVVR +>3641.EOX97285 +MFKSIHSWHLEGNIIPTPPFNFHPLSRKRKEMEFSSEANQRIARISAHLHPPNHQMKESS +ALRRADCRAKGGAPGFKVAILGAAGGIGQPLAMLMKMNPL +>3641.EOY13192 +MFRSVARSAAGKHLLRRGYATDSVPDRKVAVLGAAGGIGQPLALLMKLNPLVSQLALYDI +ANTPGVAADVSHINTRSEVAGYVGEEQLGQALEGSDVVII +>3641.EOY21869 +MMVNILSRERRCIRYTKEKGKILGRENSAAKRVDLKECEMAATSATSFSIGSTVSLGSRG +CSLPQKKPFSVRFTSQNSLTSFSGLKAATSVNCESESSFL +>3641.EOY28058 +MKITMLGSAVAALKKAAAASPSTCASTHLLSRSYYSAGSYPERKVAILGAAGGIGQPLAL +LMKLNPFVSSLSLYDIANTPGVAADVSHINYPAQVAGYVG +>3649.evm.model.supercontig_129.41 +MQPAQDANQRIARISAHINPPNLEMEESSGLSRVNCRAKGGSTGFKVAILGAAGGIGQPL +ALLMKMNPLVSVLHLYDVVNTPGVTADISHMDTGAVVRGF +>3649.evm.model.supercontig_131.66 +MSGWMMVKSSGRQLLRRGYATVAAPERKVAVLGAAGGIGQPLALLMKLNPLVSKLALYDI +ANTPGVAADVGHVNTRSEVTGYMGEDQLGQALEGSDVVII +>3649.evm.model.supercontig_20.65 +MEFNADINQRIATISAHLRPSTPQMEESFGVARGDCRSKGGAPGFKVAILGAAGGIGQPL +AMLMKMNPLVSVLHLYDVVNSPGVTADLGHMDTGAVVRGF +>3649.evm.model.supercontig_423.5 +MAATSATTFSIGSTASFGSRVRLQAQSKPAGVRFNAPVLSSFNGLKAAASLSCESESSFL 
+GRESTAALRSSFAPKVKKSEQRSQYGLQTQASYKVAVLGA +>3656.XP_008440462.1 +MQPIPDVNQRIARISAHLHPPKYQMEESSVLRRANCRAKGGAPGFRVAILGAAGGIGQPL +AMLMKMNPLVSVLHLYDVVNAPGVTADISHMDTGAVVRGF +>3656.XP_008451622.1 +MAATSATILSIGATESLNCKLSSFSHSKSASLRINSHETLQSFCGLKADSSLRCDSESSF +LGKQSSAALWRHLAPSAQRVNLNVRKNLQPQASYKVAVLG +>3656.XP_008451713.1 +MKASILRSVRSAVSRSSSSNRLLTRTFATESVPERKVAVLGAAGGIGQPLALLMKLNPLV +SKLALYDIAGTPGVAADVGHVNTRSEVTGYVGEEQLGKAL +>3656.XP_008453677.1 +LLIKMSPLVATLNLYDIANVKGVAADISHCNTPSKVQDFTGPSELANALKGVDVVVIPAG +VPRKPGMTRDDLFNINAGIVKSLVEAVADNCPDAFIHIIS +>3659.XP_004136050.1 +MAATSATILSIGATESLNSKLNSFSLSKSASLRISSHETLQSFCGLKSDSSLRCDLESSF +LGKQSRAALWRHLAPSAQRVNSNACKNLQPQASYKVAVLG +>3659.XP_004137217.1 +MKASILRSVRSAVSRSSSSNHLLTRTFATESVPERKVAVLGAAGGIGQPLALLMKLNPLV +SKLALYDIGATPGVAADVGHVNTRSEVTGYMGEEQLGKAL +>3659.XP_004138301.1 +MAATSVTSLSIGATASLNTKLNLFSQSKSASPRINSLKLQSFCGLKADSSLRCDSESSFL +GKQSSAALWRHLAPSAQRENLNLCKSLQPQASYKVAVLGA +>3659.XP_004143423.1 +MQPIPDVNQRIARISAHLHPPKYQMEESSVLRRANCRAKGGAPGFKVAILGAAGGIGQPL +AMLMKMNPLVSVLHLYDVVNAPGVTADISHMDTGAVVRGF +>3659.XP_004154973.1 +MAATSVTSLSIGATASLNTKLNLFSQSKSASPRINSLKLQSFCGLKADSSLRCDSESSFL +GKQSSAALWRHLAPSAQRENLNLCKSLQPQASYKVAVLGA +>3659.XP_004156521.1 +MKASILRSVRSAVSRSSSSNHLLTRTFATESVPERKVAVLGAAGGIGQPLALLMKLNPLV +SKLALYDIGATPGVAADVGHVNTRSEVTGYMGEEQLGKAL +>3659.XP_004160537.1 +MAATSATILSIGATESLNSKLNSFSLSKSASLRISSHETLQSFCGLKSDSSLRCDLESSF +LGKQSRAALWRHLAPSAQRVNSNACKNLQPQASYKVAVLG +>3659.XP_004160930.1 +MQPIPDVNQRIARISAHLHPPKYQMEESSVLRRANCRAKGGAPGFKVAILGAAGGIGQPL +AMLMKMNPLVSVLHLYDVVNAPGVTADISHMDTGAVVRGF +>3694.POPTR_0001s29420.1 +MESIREASQRIARISAHLQPPNSQTEESCVLKRADCRAKGGAPGFKVAILGAAGGIGQPL +AMLMKMNPSVSVLHLYDVVNTPGVTADIGHMDTGAVVRGF +>3694.POPTR_0001s38560.1 +MRNSMLRSIKSLTTSPSSHVLRRGYASEAVPERKVAVLGAAGGIGQSLSLLMKLNPLVSN +LALYDIANTPGVAADVSHINTRSEVVGYASDAELGKALEG +>3694.POPTR_0004s05340.1 +MKAAVLRSSRAALRPCTCRHLVGRSYSSTESSPESKVAILGAAGGIGQPLALLMKLNPLI +SSLSLYDIANTPGVAADVSHINSRAQVAGYAGEEQLGEAL +>3694.POPTR_0004s11170.1 
+MAATSAATFSAGSTVAFGTKASQLPQSKPSAVRFKSQKSLATFSGLKAATFVKCESESSF +LGKESSAALRGSVVPKAQKSSQKSQYHLNPQASYKVAILG +>3694.POPTR_0007s14510.1 +MQQSNLRIARIAAHINPPNLQMVEEDLGLERVNCRAKGASSGFKVAILGAAGGIGQPLAM +LMKMNPLVSLLHLYDVVNAPGVTADISHMDTSAVVRGFLG +>3694.POPTR_0009s08520.1 +MESVANQRIARVSAHLQPPNSQMEESCVLKRTDCRAKGGAPGFKVAILGAAGGIGQPLAM +LMKMNPLVSVLHLYDVVNAPGVTADISHMDTGAVVRGFLG +>3694.POPTR_0011s09860.1 +MMLRSIKSLATSPSSHILRRGYASEAVPDRKVAVLGAAGGIGQPLALLMKLNPLVSSLAL +YDIANTPGVAADVSHINTRSEVSGYSGEAELGKALEGADV +>3694.POPTR_0017s00780.1 +AAPKSSNLSDDDIKALTWRTQDGGTEVVEAKAGKGSATLSMAYAGAVFADACLKGLNGVP +DIVECSFVQSSITDLPFFASKGLESFKPELKASIEKGVEF +>3694.POPTR_0017s00790.1 +MKAAVLRSSRAALRPCTSRHLVGRSYSSTESRPERKVAILGAAGGIGQPLALLLKLNPLI +SSLSLYDIANTPGVAADVSHINSRAQVAGYAGEEQLVEAL +>3694.POPTR_0017s13630.1 +MAATSAATFSIGSTISLGTKGSQLPQSKPLSVRFNSQNTLATFSGLKAAIFVKCESESSF +LGKESSAALRGAAAPKAQKSSQRSQYRLNPQASYKVAILG +>3694.POPTR_0017s13640.1 +MAAASAATFSVGSAFSFGTKASQLPQSKLSSVRFNSQSSLATFSGLKAATFVTCESESSF +LGKESNAALRCSVAPKAQKSSQRSQHRLNPQASYKVAVLG +>3702.AT1G53240.1 +MFRSMLVRSSASAKQAVIRRSFSSGSVPERKVAILGAAGGIGQPLALLMKLNPLVSSLSL +YDIANTPGVAADVGHINTRSEVVGYMGDDNLAKALEGADL +>3702.AT2G22780.1 +MDPNQRIARISAHLNPPNLHNQIADGSGLNRVACRAKGGSPGFKVAILGAAGGIGQPLAM +LMKMNPLVSVLHLYDVANAPGVTADISHMDTSAVVRGFLG +>3702.AT3G15020.1 +MFRSMIVRSASPVKQGLLRRGFASESVPDRKVVILGAAGGIGQPLSLLMKLNPLVSSLSL +YDIANTPGVAADVGHINTRSQVSGYMGDDDLGKALEGADL +>3702.AT3G47520.1 +MATATSASLFSTVSSSYSKASSIPHSRLQSVKFNSVPSFTGLKSTSLISGSDSSSLAKTL +RGSVTKAQTSDKKPYGFKINASYKVAVLGAAGGIGQPLSL +>3702.AT3G53910.1 +MFLRNSDPYAMISFLKSLIRALDGDDDVFDFAFVASSVTELPYFATRTKIGKKRIEEVID +SDLQGLAKYEERAIKAIKPRVKVTIEKDITLLQRTFVAIS +>3702.AT5G09660.4 +MEFRGDANQRIARISAHLTPQMEAKNSVIGRENCRAKGGNPGFKVAILGAAGGIGQSLSL +LMKMNPLVSLLHLYDVVNAPGVTADVSHMDTGAVVRGFLG +>3711.Bra009397.1-P +MEFRGDATQRIAMISAHLQPSFTSQMEGKNTVMGRENCRGKGGKAGFKVAILGAAGGIGQ +SLSLLMKMNPLVSLLHLYDVVNAPGVTADVSHMDTGAVVR +>3711.Bra018137.1-P +MAAASSISIGSTVPRASSSSSSSSLPQSRAQAVNFNYSLPRFTALRSSTLLSGPDSSSFA 
+KSLRGSVTKPQSTDTKPYGLNINASYKVSVLGAAGGIGQP +>3711.Bra019504.1-P +MSHLVSTLHLYNIANVKRVVADLSLCNTHSQVLAFTGPSELADCLKDVNVMVIPAGVPRK +HSMTRNTVNSTVPIAAQVLTKKGVYDPKKLFGVTTLDVVR +>3711.Bra019790.1-P +MASSSFSVSYSSTTSSLPVFRTSQAVVFSSTSKFHTLTPRSSSYGKSLSTKAHASSDNKK +LYVENVNCSSKVTIIGSSLGIGPALSTSLKKSPLVSTLRF +>3711.Bra028624.1-P +MEFRGDANKRIAMISAHLQPSFTPQMEAKNSVMGLESCRAKGGNPGFKVAILGAAGGIGQ +SLSLLMKMNPLVSLLHLYDVVNAPGVTADVSHMDTGAVVR +>3711.Bra030204.1-P +MDANQRIARISAHLNPPNLDQIGSGSGLEGVGCRAKGGSPGFKVAILGAAGGIGQPLAML +MKMNPLVSLLHLYDVANAPGVTADISHMDTSAIVRGFLGQ +>3711.Bra030951.1-P +MFRSALVRSSASAKQSLLRRSFSSGSVPERKVAILGAAGGIGQPLALLMKLNPLVSSLSL +YDIANTPGVAADVGHINTRSQVVGYMGDDNLAKALEGADL +>3711.Bra038112.1-P +MFRSMLVRSSSSAKQSLIRRNLSSGSVPERKVAILGAAGGIGQPLALLMKLNPLVSSLSL +YDIANTPGVAADVGHINTRSEPGMTRDDLFNINAGIVKNL +>3711.Bra039662.1-P +MFRSVIVRSSSSAKQSLLRRSFSSSVPERKVAILGAAGGIGQPLALLMKLNPLVSSLSLF +DIANTPGVAADVGHINTRSEVVGYMGDDELAKALEGADLV +>3712.Bo2g009460.1 +MEFRGDANKRIAMISAHLQPSFTPQMEAKNSVMGLESCRAKGGNPGFKVAILGAAGGIGQ +SLSLLMKMNPLVSLLHLYDVVNAPGVTADVSHMDTGAVVR +>3712.Bo3g042870.1 +MASKDVRLLLNTWRHQKPPHPPVHIAQKINDDMRNRIAILLRCQNGQWDELRVRWTSSCT +LPDRKWTLYARGRSQISRRKMAAATSLTSCGFCSLCSPLQ +>3712.Bo3g115020.1 +MRTKEKQHSSHSFTRLTTLSFTSPHSPCHTCLALQHSLSSRRHTALPLAPRCHTAVSLVP +RRHKSPSLLNNAHIMFSFEYRSKCLSFRLNRSFRRDFTEK +>3712.Bo3g134610.1 +MAATSAASSISIGSNLSRATSSSSRAQAVNFNYSLPRFTALRSSTLLSGPESSSFAKSLR +GSVMKSQSTDTKPYGLNINASYKVAVLGAAGGIGQPLSLL +>3712.Bo3g167150.1 +MGVTMLDDAEVMSHNPREVVVPVVGGHAIVTILPLLSQVKPPCSFTQKEIEYLTDRMENG +GIEVVKAKAGAAVKSADACLKGLRGNANIVECAFVATHVT +>3712.Bo3g183840.1 +QKHPWKWKRIKKQRVETYLIIIECLAKFSPCKMFRSALVRSSASAKQSLLRRSFSSGSVP +ERKVAILGAAGGIGQPLALLMKLNPLVSSLSLYDIANTPG +>3712.Bo4g151040.1 +MDANQRIARISAHLNPPNLDQIGSGSGLERVGCRAKGGSPGFKVAILGAAGGIGQPLAML +MKMNPLVSLLHLYDVANAPGVTADISHMDTSAIVRGFLGQ +>3712.Bo5g016610.1 +MSAEVLKQRGVYDPKKLFGLMTPETELARAFVAERFVLYVEDVHVPVIGGHCSLTALPLF +SKTTPPYREFFEARGAERFVLSLLRALGGANDMFQCCFVE +>3712.Bo5g092980.1 +MKRTKMSAKKNTQEEGSSQREKQRPKKWDKSDTTHYNNMKKVAVPATQLACPETMTILGI 
+KTDIEGLFQKMGLGQLCNLNEPTYPELVRQFIASAYVTRP +>3712.Bo6g029380.1 +MEAQKWWRLKQEKVQLHCRWCNYAGALFADACLKGLNGVPDVEECSYVQSTITELPFFAS +KVRLGKNGVEDVLDLGPLSDFEKEGLEALKPKLKSFIEKG +>3712.Bo6g029400.1 +MFRCMLVRSSSSAKQSLMRRNLSSGSVPERKVAILGAAGGIGQPLALLMKLNPLVSSLSL +YDIANTPGVAADVGHINTRSEVVGYMGDDNLAKALEGADL +>3712.Bo6g031300.1 +MFRSVIVRSSSSAKQSLLRRSFSSSSSSVPERKVAILGAAGGIGQPLALLMKLNPLVSSL +SLFDIANTPGVAADVGHINTRSEVVGYMGDDELAKALEGA +>3712.Bo7g062050.1 +MGDKFDLKKLMGVTMLDAVSRANTFVAEVMSHNPREVVVPVVGGHARVTILPLLSQVKLP +CSFTQKEIEYLTDRMENGGIEVVKAKYGAVKFADACLKGL +>3712.Bo9g173890.1 +MEFRGDANQRIAMISAHLQPSFTSQMEEKNSVMGRENCRGKGGKAGFKVAILGAAGGIGQ +SLSLLMKMNPLVSLLHLYDVVNAPGVTADVSHMDTGAVVR +>3750.XP_008342624.1 +MAYAAVKFADACLRGLRGDAGVVECAFLASQVTELPFFASKVRLGRTGAEEIYPLGPLNE +YERAGLEKAKKELAASIQKGVSFVRK +>3750.XP_008342632.1 +MQQQPSPEVNAXQRIARISAHLDPPNLQMENAATVSRLNCRAKGGAAGFKVAILGAAGGI +GQPLALLMKMNPLVSVIHLYDVVNTPGVTSDISHMDTGAV +>3750.XP_008351884.1 +MAATSAAAFSVGTNCSLGHKAAAFQQSKPCALRFNSQNPLKSSFNGLKATPSFNCETETS +FSGKETASALRASFARKAHKEALVVQSQFQPQASYKVAVL +>3750.XP_008360846.1 +MAATSAAAFSVGTNCSLGHKAAAFQQSKPCALRFNSQNPLKSSFNGLKATPSFNCETETS +FSGKETASALRASFARKAHKEALVVQSQFQPQASYKVAVL +>3750.XP_008365871.1 +MENAATVNWLNCRAKGGTAGYKVAILGAVGGIGQPLAMLMKMNPLVSVLHLYDVVNTPGV +TSDISQMDTGTVMRGFLGQQQLDEALTRMELVIIPIGVPR +>3750.XP_008367914.1 +MRPSMSIARSVHRVARRSYSSASVPERKVAVLGAAGGIGQPLALLMKLNPLVSHLSLYDI +AGTPGVAADVSHINTRSEVKGYAGEEQLAQALEGADVVII +>3750.XP_008372893.1 +MESSVGANGRIAKISAHLFPPNSQVEDGSALSRGDCRAKGGAPGFKVAIVGAAGGIGQPL +AMLMKMNPLVSVLHLYDVVNAPGVTADISHMDTGAVVRGF +>3750.XP_008374550.1 +MAATSAATFSIGTNCSLGHKAASFQQTKPCALRFNSQNLLKSSFNGLKATTSFNCETETS +FSGKETAKALRASFARKAHKDAQVVQSQFQPQASYKVAVL +>3750.XP_008378631.1 +MAAKMMSAVGXKGIRSGIGHNGRVALPKQVNVPIKVTIQQSLRSQLVVKKHNLEVKATHN +IGTQTNEENPDVTITYKVAVLGDLSRVVGGSLIDSVSFKG +>3750.XP_008393801.1 +MQXHPSSEVNANQRIARISAHLDPPNLQMENAATVNRLNCRAKGGTAGYKVAILGAAGGI +GQPLAMLMKMNPLVSVLHLYDVVNTPGVTSDISHMDTGAV +>3760.EMJ01799 +MEPSVEANGRIARISAHLFPPNLQMEDGSALRRVDCRAKGGAPGFKVAILGAAGGIGQPL 
+AMLMKINPLVSVLHLYDVVNAPGVTADISHMDTGAVVRGF diff --git a/testdata/MDH-Human-seed-test.fasta b/testdata/MDH-Human-seed-test.fasta new file mode 100644 index 0000000..ed097de --- /dev/null +++ b/testdata/MDH-Human-seed-test.fasta @@ -0,0 +1,3 @@ +>2711.XP_006486803.1 +MEFSSEANQRIARISAHLYPPNLQMEENSCLRQAKCRAKGGAAGFKVAILGAAGGIGQPL +AMLMKINPLVSVLHLYDVVNTPGVTADISHMDTGAVVRGF \ No newline at end of file diff --git a/testdata/argB-short.fasta b/testdata/argB-short.fasta new file mode 100644 index 0000000..496dc9d --- /dev/null +++ b/testdata/argB-short.fasta @@ -0,0 +1,2 @@ +>sp|P0A6C8|ARGB_ECOLI Acetylglutamate kinase OS=Escherichia coli (strain K12) OX=83333 GN=argB PE=1 SV=1 +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK diff --git a/testdata/argB.fasta b/testdata/argB.fasta new file mode 100644 index 0000000..edfd5d6 --- /dev/null +++ b/testdata/argB.fasta @@ -0,0 +1,6 @@ +>sp|P0A6C8|ARGB_ECOLI Acetylglutamate kinase OS=Escherichia coli (strain K12) OX=83333 GN=argB PE=1 SV=1 +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA diff --git a/testdata/dataset-with-energies-short-sequences.fasta b/testdata/dataset-with-energies-short-sequences.fasta new file mode 100644 index 0000000..35b501a --- /dev/null +++ b/testdata/dataset-with-energies-short-sequences.fasta @@ -0,0 +1,62 @@ +>sp|P0A6C8|ARGB_ECOLI:-33.0386 sp|P0A6C8|ARGB_ECOLI Acetylglutamate kinase OS=Escherichia coli (strain K12) OX=83333 GN=argB PE=1 SV=1 +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_1:-31.0518 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA160R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLIIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_2:-30.2729 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA92I; 
+MMNPLIIKLGGVLLDSEEALERLFSANVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_3:-29.6667 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7N; +MMNPLINKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_4:-32.3344 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA130N; +MMNPLIIKLGGVLLDQEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_5:-31.6647 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA200C; +MMNPLIAKLGGVLLDSEEALERLFSALVNYRESAQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_6:-34.089 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA95F; +MMNPLIINLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_7:-32.867 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA156F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHSGGCVVDELMKGLNLPVK +>1gs5_Repair_8:-32.611 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA219T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLGLPVK +>1gs5_Repair_9:-31.4941 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA228G; +MMNPLIIKLGGVLLDSAEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_10:-32.0178 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA228V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGCGCVVDELMKGLNLPVK +>1gs5_Repair_11:-32.4719 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA82Q; +MMNPEIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_12:-32.652 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDDLMKGLNLPVK +>1gs5_Repair_13:-29.6071 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA105V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRERHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_14:-35.2219 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA213N; +MMNPLIIKLGGVLLDSEEALARLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_15:-29.3677 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA159N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVA +>1gs5_Repair_16:-33.8303 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA195L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESMQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_17:-31.903 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA241H; +MMNPLIIKCGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_18:-33.9048 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA195W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVVELMKGLNLPVK +>1gs5_Repair_19:-29.816 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27K; +MMNPLIIKLGGVLLDSEEALERLFSAKVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_20:-34.2157 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA217V; +MMNPLIIKLGGVLDDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_21:-29.3014 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9K; +MMNPLIIKKGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_22:-31.1338 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA187R; +MMNPLIIKLGGVLLDSEEALERLFSALVRYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_23:-33.0669 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA211V; +MNNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_24:-32.141 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRASHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_25:-31.394 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA189V; 
+MMNPLIIKLGGVLVDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_26:-32.2089 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKYLNLGVK +>1gs5_Repair_27:-32.624 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA212C; +MMNPLIIKLGGVLLDSAEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_28:-30.9174 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA143L; +MMNPLIIKLGGVLLDSEEALERLFSALVNQRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_29:-32.5227 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22A; +MMNPLIIKLGGVLLDSEEALEALFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +>1gs5_Repair_30:-33.9382 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA236F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK \ No newline at end of file diff --git a/testdata/dataset-with-energies.fasta b/testdata/dataset-with-energies.fasta new file mode 100644 index 0000000..ce8355a --- /dev/null +++ b/testdata/dataset-with-energies.fasta @@ -0,0 +1,7206 @@ +>sp|P0A6C8|ARGB_ECOLI:-33.0386 sp|P0A6C8|ARGB_ECOLI Acetylglutamate kinase OS=Escherichia coli (strain K12) OX=83333 GN=argB PE=1 SV=1 +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_1:-31.0518 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA160R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVRADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-30.2729 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA92I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWIKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-29.6667 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7N; +MMNPLINKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-32.3344 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA130N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSNKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_5:-31.6647 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA200C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAACAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_6:-34.089 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA95F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKFQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_7:-32.867 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA156F; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQFMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:-32.611 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA219T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVTAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-31.4941 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA228G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTGGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_10:-32.0178 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA228V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTVGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-32.4719 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA82Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAQTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-32.652 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDDLMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_13:-29.6071 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA105V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLVDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-35.2219 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA213N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDNMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_15:-29.3677 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA159N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNNNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_16:-33.8303 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA195L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIALMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_17:-31.903 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA241H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +HQLPALFNGMPMGTRILA +>1gs5_Repair_18:-33.9048 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA195W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAWMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_19:-29.816 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27K; +MMNPLIIKLGGVLLDSEEALERLFSAKVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-34.2157 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA217V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVVVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-29.3014 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9K; +MMNPLIIKKGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_22:-31.1338 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA187R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILRGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-33.0669 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA211V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIVDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-32.141 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KCNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_25:-31.394 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA189V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGVGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-32.2089 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLGVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_27:-32.624 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA212C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITCGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_28:-30.9174 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA143L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLLVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_29:-32.5227 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22A; +MMNPLIIKLGGVLLDSEEALEALFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-33.9382 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA236F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAFWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-32.8051 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA203D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEDLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_32:-34.9039 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16W; +MMNPLIIKLGGVLLDWEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-33.9807 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA183K; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVKGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-31.9067 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA82T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALATTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-29.533 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA234T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDTASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-33.2717 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDILMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_37:-30.4215 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23H; +MMNPLIIKLGGVLLDSEEALERHFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-32.5834 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA108S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGSSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-31.4086 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA244S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLSALFNGMPMGTRILA +>1gs5_Repair_40:-31.7296 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA210V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIVTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_41:-31.0455 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA103C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLCLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-31.869 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA162N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNANQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-30.2227 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA102Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGQFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-34.0947 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA32K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRKSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:-28.9551 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23A; +MMNPLIIKLGGVLLDSEEALERAFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_46:-32.26 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA221S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNASLDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_47:-32.6453 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA90D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLDWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-31.438 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA168F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATAFAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-29.8207 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA144N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPNVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-28.6934 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA179A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILAS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_51:-28.2283 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA38G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPGVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-34.2114 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA188L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDLKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_53:-33.447 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA84I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTINKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_54:-32.7159 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA206T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLITQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_55:-30.6764 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVCGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-32.7722 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA134V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIVSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-29.5986 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA164M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQMATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:-30.6696 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA20K; +MMNPLIIKLGGVLLDSEEAKERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_59:-32.8649 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA163E; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADEAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_60:-24.0175 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA68P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVPPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-34.281 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9W; +MMNPLIIKWGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-29.7105 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA220P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNPALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_63:-26.7639 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7R; +MMNPLIRKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-32.0013 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19E; +MMNPLIIKLGGVLLDSEEELERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-28.7694 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA172A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATAGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_66:-33.9719 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA207R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIERGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:-32.336 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA225S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDASRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_68:-33.2603 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA121Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +YVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_69:-32.6182 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA239Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRQA +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-31.2624 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA222H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAHDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-33.9783 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA113R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVRQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:-27.455 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA179D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILDS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-33.3464 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA72A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADAIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-33.2303 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHKRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_75:-33.3051 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA139M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLEMGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-29.5643 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA101Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVQLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_77:-30.2039 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA249L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNLMPMGTRILA +>1gs5_Repair_78:-28.8757 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4G; +MMNGLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_79:-25.1468 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA125Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLQQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_80:-36.2089 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA236M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAMWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-31.5382 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA57V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNVPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_82:-33.0632 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA116H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLHEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_83:-33.1951 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA227Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARYLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_84:-27.154 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6S; +MMNPLSIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-30.7794 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA161Q; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNQDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-33.4119 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8N; +MMNPLIINLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_87:-30.905 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA187Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILQGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-25.2809 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA44T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGTGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-31.1808 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA214V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGVIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_90:-30.75 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA48C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVCDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_91:-32.5909 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA206D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIDQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-33.2546 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA153S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDSGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_93:-26.3466 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA172R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATRGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_94:-28.1705 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVFGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_95:-21.1115 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA218Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKYNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-28.1018 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA171E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAELGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-26.9043 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA38H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPHVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-32.4467 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA163A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADAAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_99:-33.5187 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA207N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIENGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-28.7075 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA243D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQDPALFNGMPMGTRILA +>1gs5_Repair_1:-27.5915 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA185K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGKLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-33.1566 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVWELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-32.9325 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA150T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGTTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-33.1049 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA152V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTVEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_5:-32.1818 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA74K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIKIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_6:-33.3728 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA230F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGFPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_7:-30.69 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA208C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQCIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:-31.9619 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA169V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALVATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-32.7939 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA60W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVW +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_10:-33.8251 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA32R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRRSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-32.0773 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA138T; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLTNGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-12.8556 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA225Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAYRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_13:-33.3556 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15T; +MMNPLIIKLGGVLLTSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-27.5172 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA162R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNARQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_15:-32.3222 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA250Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGQPMGTRILA +>1gs5_Repair_16:-28.1893 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA144S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPSVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_17:-32.9647 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA134E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIESLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_18:-33.0846 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17L; +MMNPLIIKLGGVLLDSLEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_19:-26.8619 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA44V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGVGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-29.8666 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA174T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGTDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-29.798 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA243Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQYPALFNGMPMGTRILA +>1gs5_Repair_22:-28.215 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA104T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFTGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-33.7458 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA177M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLMLLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-33.0522 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA32A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRASHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_25:-30.9391 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA124S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGSAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-31.7873 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA82F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAFTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_27:-27.3848 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA43P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHPGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_28:-32.4224 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA239R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRRA +EQLPALFNGMPMGTRILA +>1gs5_Repair_29:-27.5609 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA232E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPEDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-16.6319 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA128D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPDSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-27.6053 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA256S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRSLA +>1gs5_Repair_32:-32.495 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15W; +MMNPLIIKLGGVLLWSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-34.3919 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA170F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAFTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-27.2263 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA125N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLNQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-31.7937 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA136T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSTLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-33.2983 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA138W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLWNGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_37:-34.3721 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA207M; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEMGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-33.1377 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15N; +MMNPLIIKLGGVLLNSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-33.2177 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA206H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIHQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_40:-32.3156 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA251V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMVMGTRILA +>1gs5_Repair_41:-31.5215 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA63W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKWGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-19.8024 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA107L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDLDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-32.2133 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26S; +MMNPLIIKLGGVLLDSEEALERLFSSLVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-33.6733 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA153F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDFGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:-29.5334 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA133A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLANSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_46:-36.7957 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12K; +MMNPLIIKLGGKLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_47:-32.3831 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA207E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEEGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-27.5497 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA210S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGISTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-32.21 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA232L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPLDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-31.9647 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA209Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGQITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_51:-32.9451 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21F; +MMNPLIIKLGGVLLDSEEALFRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-30.1373 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA105D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLDDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_53:-35.2035 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA183M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVMGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_54:-31.0009 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA127A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQAGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_55:-16.0214 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA79Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGYLAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-28.7441 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA105Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLYDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-31.0373 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA142F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYFPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:-31.8485 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA105F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLFDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_59:-32.166 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA111S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVSVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_60:-26.3751 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA161W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNWDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-32.6849 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA94I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKIHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-32.9406 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA106H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGHGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_63:-32.5425 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2K; 
+MKNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-30.5892 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA127H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQHGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-26.6371 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA112Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKQTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_66:-31.699 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA75C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDCITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:-31.4974 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7V; +MMNPLIVKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_68:-33.854 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA242S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +ESLPALFNGMPMGTRILA +>1gs5_Repair_69:-30.7409 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA109R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDRVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-30.3364 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA243T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQTPALFNGMPMGTRILA +>1gs5_Repair_71:-32.691 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA101D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVDLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:-33.7423 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVNELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-33.2086 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA217R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVRVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-30.3319 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA190A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKAQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_75:-32.5527 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA216K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIKKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-29.8133 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA76H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIHTGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_77:-29.8987 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA148A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSAGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_78:-29.1872 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA255H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTHILA +>1gs5_Repair_79:-34.0549 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA181I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +IVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_80:-30.8807 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA135P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINPLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-33.796 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA183L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVLGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_82:-26.8653 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA174N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGNDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_83:-34.1705 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA83F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGFANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_84:-31.6695 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA166L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAALALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-28.6374 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA43T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHTGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-32.6338 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA245H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPHLFNGMPMGTRILA +>1gs5_Repair_87:-34.2729 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA230L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGLPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-32.0005 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA215E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMEVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-32.9837 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35C; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHCRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_90:-29.1524 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA140M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENMYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_91:-33.9083 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA170R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALARTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-31.3244 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA211P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIPDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_93:-33.0398 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA94Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKYHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_94:-32.111 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLQVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_95:-33.0668 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27I; +MMNPLIIKLGGVLLDSEEALERLFSAIVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-33.0505 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA118F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEFLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-32.193 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA131V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPVLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-31.5194 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA258Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILQ +>1gs5_Repair_99:-28.2942 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA122D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HDGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-33.1727 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA236W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAWWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_1:-28.4878 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36K,IA185N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQKPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGNLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-33.4141 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22W,DA49Y; +MMNPLIIKLGGVLLDSEEALEWLFSALVNYRESHQRPLVIVHGGGCVVYELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-29.023 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA180R,AA224I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLR +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDIARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-32.1547 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18V,EA117K; +MMNPLIIKLGGVLLDSEVALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDKELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_5:-29.532 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA74K,SA147E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIKIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSEIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_6:-15.917 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA128T,QA155H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPTSPKLINSLLENGYLPVVSSIGVTDEGHLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_7:-24.2848 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA187C,MA196R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILCGKGQRIAERTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:-33.4906 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19S,GA188L; +MMNPLIIKLGGVLLDSEESLERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDLKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-32.6878 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33C,DA74M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRECHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIMIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA 
+>1gs5_Repair_10:-30.6572 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30G,SA183P; +MMNPLIIKLGGVLLDSEEALERLFSALVNGRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVPGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-32.8017 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA118W,EA138Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEWLG +HVGLAQPGSPKLINSLLYNGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-31.8147 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA189E,QA242E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGEGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EELPALFNGMPMGTRILA +>1gs5_Repair_13:-31.1473 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA86I,AA201T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANITLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKTEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-19.1258 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA236F,TA254R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAFWRHA +EQLPALFNGMPMGRRILA +>1gs5_Repair_15:-19.8512 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA52L,GA253V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELLKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMVTRILA +>1gs5_Repair_16:-27.9323 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA131L,IA209P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPLLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGPITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_17:-31.995 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA14H,VA100Y; +MMNPLIIKLGGVLHDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAYGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_18:-18.9509 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA130I,VA159K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSIKLINSLLENGYLPVVSSIGVTDEGQLMNKNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_19:-32.7644 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35S,DA74M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHSRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIMIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-30.2256 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3A,IA210Q; +MMAPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIQTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-25.045 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA83R,GA149K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGRANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIKVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_22:-28.2226 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42K,AA194F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVKGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIFEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-29.7068 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA51S,LA136E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDESMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSELENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-25.088 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA11N,DA223S; +MMNPLIIKLGNVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALSAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_25:-29.6147 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42N,NA63C; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVNGGGCVVDELMKGLNLPVK +KKCGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-27.4348 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13H,EA18V; +MMNPLIIKLGGVHLDSEVALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_27:-31.315 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA61D,LA124M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +DKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGMAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_28:-30.8752 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50P,SA183H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDPLMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVHGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_29:-28.3366 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16G,HA42E; +MMNPLIIKLGGVLLDGEEALERLFSALVNYRESHQRPLVIVEGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-29.7733 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA47C,LA88C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCCVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTCLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-27.4383 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA246A,GA249S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPAAFNSMPMGTRILA +>1gs5_Repair_32:-26.7526 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA76D,LA88G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIDTGALAGTANKTGLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-30.2708 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31L,MA196A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYLESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEATAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-33.0049 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17M,EA138A; +MMNPLIIKLGGVLLDSMEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLANGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-33.5947 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA114K,DA175H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTKLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAHLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-32.3873 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA98M,EA241Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIMAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +QQLPALFNGMPMGTRILA +>1gs5_Repair_37:-1.44801 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA128F,AA167W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPFSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATWLAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-32.3341 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA101Q,EA138I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVQLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLINGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-30.9288 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA66N,PA231N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLNVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRNVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_40:-17.3634 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA57V,AA164R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNVPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQRATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_41:-31.9462 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA131H,QA242V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPHLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EVLPALFNGMPMGTRILA +>1gs5_Repair_42:-28.1214 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA143I,MA196H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLIVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEHTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-31.8505 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26S,AA198T; +MMNPLIIKLGGVLLDSEEALERLFSSLVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTTAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-17.154 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA99F,EA153P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAFVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDPGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:-29.4614 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA133A,DA212E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLANSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITEGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA 
+>1gs5_Repair_46:-26.6874 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12K,GA107V; +MMNPLIIKLGGKLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDVDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_47:-25.5385 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA185E,IA209N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGELDGKGQRIAEMTAAKAEQLIEQGNITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-22.7597 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA196S,IA210E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAESTAAKAEQLIEQGIETDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-27.5839 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA38K,VA232T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPKVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPTDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-31.755 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22H,DA212A; +MMNPLIIKLGGVLLDSEEALEHLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITAGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_51:-32.6469 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21F,SA129Y; +MMNPLIIKLGGVLLDSEEALFRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGYPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-28.4626 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49C,GA105P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVCELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLPDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_53:-32.9131 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA242F,FA247L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EFLPALLNGMPMGTRILA +>1gs5_Repair_54:-31.9196 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58A,PA127K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLAVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQKGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_55:-31.0838 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36Y,AA79S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQYPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGSLAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-30.294 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA45Y,GA105N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGYCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLNDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-35.3525 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA66F,LA142M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLFVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYMPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:-27.6804 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA37M,GA105W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRMLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLWDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_59:-32.3514 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA158C,KA189F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMCVNADQAATALAATLGADLILLS +DVSGILDGFGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_60:-31.5207 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15W,AA161V; +MMNPLIIKLGGVLLWSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNVDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-31.565 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA94I,LA228F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKIHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTFGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-27.2606 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA106H,VA145F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGHGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVFSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_63:-30.3351 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2K,HA95V; +MKNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKVQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-27.3041 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA127H,LA246Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQHGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPAQFNGMPMGTRILA +>1gs5_Repair_65:-30.4924 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA194K,AA235L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIKEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDILSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_66:-30.9821 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA187K,HA239D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILKGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRDA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:-28.6535 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7W,LA243H; +MMNPLIWKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQHPALFNGMPMGTRILA +>1gs5_Repair_68:-33.6424 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58S,QA242F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLSVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EFLPALFNGMPMGTRILA +>1gs5_Repair_69:-32.3173 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA206F,PA244A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIFQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLAALFNGMPMGTRILA +>1gs5_Repair_70:-25.1794 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA80R,IA185E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGARAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGELDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-32.9035 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA54V,AA245N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKVLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPNLFNGMPMGTRILA +>1gs5_Repair_72:-23.5395 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA68E,GA229W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVEPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLWRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-12.5148 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:CA46Q,GA107F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGQVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDFDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-30.0784 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28S,AA220V; +MMNPLIIKLGGVLLDSEEALERLFSALSNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNVALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_75:-22.8987 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA112K,AA221C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKKTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNACLDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-28.8676 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA76H,AA92T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIHTGALAGTANKTLLAWTKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_77:-30.0065 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA103A,IA148V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLALGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSVGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_78:-30.5859 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA119G,AA198L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEEGG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTLAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_79:-32.5345 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA70I,FA103Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPIDQIDIITGALAGTANKTLLAWAKKHQIAAVGLYLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_80:-31.4468 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA114F,QA163G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTFLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADGAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-31.8514 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA155R,IA210V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGRLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIVTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_82:-30.3825 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA186G,GA229R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGIGDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLRRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_83:-27.3173 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA136P,LA142Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSPLENGYYPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_84:-31.1673 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA96M,WA237D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHMIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASDRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-30.5937 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA74N,NA139T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQINIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLETGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-25.6681 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA55D,AA161H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGDNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNHDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_87:-31.6515 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA146V,TA166E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVVSIGVTDEGQLMNVNADQAAEALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-33.0664 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA96S,SA183N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHSIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVNGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-34.588 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31Y,AA245F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYYESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPFLFNGMPMGTRILA +>1gs5_Repair_90:-25.6616 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26S,AA161Y; +MMNPLIIKLGGVLLDSEEALERLFSSLVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNYDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_91:-25.655 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA53N,SA109R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMNGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDRVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-32.8026 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA163M,GA173E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADMAATALAATLEADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_93:-32.7653 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA66M,AA220G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLMVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNGALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_94:-31.502 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23Y,IA209E; +MMNPLIIKLGGVLLDSEEALERYFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGEITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_95:-14.8871 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA68R,AA99Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVRPADQIDIITGALAGTANKTLLAWAKKHQIAYVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-30.0517 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65R,LA222K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGRRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAKDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-30.4696 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA38P,GA45T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPPVIVHGGTCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-30.3088 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA190D,LA257Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKDQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRIYA +>1gs5_Repair_99:-12.5424 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA198S,TA254R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTSAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGRRILA +>1gs5_Repair_100:-36.8739 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12K,KA111N; +MMNPLIIKLGGKLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVNVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_1:-32.6968 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA85R,NA160Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTARKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVQADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-30.8122 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA92I,SA109Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWIKKHQIAAVGLFLGDGDQVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-32.8352 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16Q,MA214Q; +MMNPLIIKLGGVLLDQEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGQIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-29.5273 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30C,DA223G; +MMNPLIIKLGGVLLDSEEALERLFSALVNCRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALGAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_5:-28.9048 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7A,KA111R; +MMNPLIAKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVRVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_6:-27.8774 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA180T,LA246S; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLT +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPASFNGMPMGTRILA +>1gs5_Repair_7:-34.3735 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8T,NA29M; +MMNPLIITLGGVLLDSEEALERLFSALVMYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:-33.1982 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA135N,RA192C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINNLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQCIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-29.3148 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA100I,LA104E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAIGLFEGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_10:-30.9104 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA95P,AA98L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKPQILAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-32.8763 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA150Y,EA206I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGYTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIIQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-31.1491 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA132D,EA138H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKDINSLLHNGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_13:-16.2821 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA134M,GA184D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIMSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSDILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-30.1936 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17D,LA20N; +MMNPLIIKLGGVLLDSDEANERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_15:-32.7955 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65C,GA188M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGCRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDMKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_16:-34.2355 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15K,NA219E; +MMNPLIIKLGGVLLKSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVEAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_17:-29.7827 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA220V,LA222K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNVAKDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_18:-26.6887 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA92K,GA249S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWKKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNSMPMGTRILA +>1gs5_Repair_19:-30.3903 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27C,AA198V; +MMNPLIIKLGGVLLDSEEALERLFSACVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTVAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-26.2979 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA221M,AA224T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAMLDTARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-33.0885 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA144L,PA244L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPLVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLLALFNGMPMGTRILA +>1gs5_Repair_22:-35.47 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31H,SA183F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYHESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVFGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-34.0674 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62I,QA72H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KINGLRVTPADHIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-33.105 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28Y,TA83C; +MMNPLIIKLGGVLLDSEEALERLFSALYNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGCANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_25:-27.4423 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21Y,IA234D; +MMNPLIIKLGGVLLDSEEALYRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDDASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-31.356 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA86T,PA130K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANTTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSKKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA 
+>1gs5_Repair_27:-28.2559 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA40T,LA222W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVTVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAWDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_28:-29.9348 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA93R,AA258K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWARKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILK +>1gs5_Repair_29:-29.3925 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41N,IA205V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVINHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLVEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-27.6765 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA154T,PA231I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDETQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRIVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-36.3751 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA239I,QA242L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRIA +ELLPALFNGMPMGTRILA +>1gs5_Repair_32:-33.888 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA109L,TA211P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDLVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIPDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-27.5665 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA48D,LA142D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVDDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYDPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-32.0337 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18F,QA72C; +MMNPLIIKLGGVLLDSEFALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADCIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-31.1373 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA78V,LA80S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITVASAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-25.8186 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA143K,DA175W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLKVVSSIGVTDEGQLMNVNADQAATALAATLGAWLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_37:-26.9686 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA57E,VA232P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNEPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPPDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-27.7236 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA154T,DA233C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDETQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVCIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-26.5391 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22G,GA154V; +MMNPLIIKLGGVLLDSEEALEGLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEVQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_40:-22.4475 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA81S,GA128S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALSGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPSSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_41:-29.3226 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4D,DA233Q; +MMNDLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVQIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-34.0321 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA72Y,DA181T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADYIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +TVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-25.5765 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA52F,SA147W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELFKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSWIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-24.0635 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA118T,AA164H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDETLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQHATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:-32.6052 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2I,KA86E; +MINPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANETLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_46:-31.1761 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA89V,LA257V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLVAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRIVA +>1gs5_Repair_47:-29.9817 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30G,SA135F; +MMNPLIIKLGGVLLDSEEALERLFSALVNGRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINFLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-29.0448 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA53T,IA148P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMTGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSPGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-31.8311 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21L,IA75E; +MMNPLIIKLGGVLLDSEEALLRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDEITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-33.1714 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA106H,TA227Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGHGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARQLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_51:-29.2627 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA168I,LA222R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATAIAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAARDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-31.3163 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA88H,EA153G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTHLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDGGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_53:-27.0998 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA75D,MA157G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDDITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLGNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_54:-27.8961 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA193P,HA239C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRPAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRCA +EQLPALFNGMPMGTRILA +>1gs5_Repair_55:-27.7685 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA168E,AA225V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATAEAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAVRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-31.6478 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA67A,TA87Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRATPADQIDIITGALAGTANKQLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-32.6543 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA74E,LA228R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIEIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTRGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:-33.5705 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA53F,AA198D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMFGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTDAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_59:-34.4245 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA212G,NA219D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITGGMIVKVDAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_60:-31.2525 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19E,AA70P; +MMNPLIIKLGGVLLDSEEELERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPPDQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-33.5913 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28L,KA93R; +MMNPLIIKLGGVLLDSEEALERLFSALLNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWARKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-26.1769 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA70G,TA254D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPGDQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGDRILA +>1gs5_Repair_63:-26.034 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA80D,MA157D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGADAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLDNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-31.9664 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36V,GA45W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQVPLVIVHGGWCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-27.8607 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA198Y,IA256E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTYAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRELA +>1gs5_Repair_66:-27.2031 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA193G,DA223P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRGAEMTAAKAEQLIEQGIITDGMIVKVNAALPAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:-31.2264 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA38I,KA61S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPIVIVHGGGCVVDELMKGLNLPVK +SKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_68:-29.0164 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65D,IA148N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGDRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSNGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_69:-30.987 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA76E,AA240R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIETGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHR +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-27.9601 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA132W,AA221P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKWINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAPLDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-16.643 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA195D,AA225Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIADMTAAKAEQLIEQGIITDGMIVKVNAALDAYRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:-31.8956 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA76T,AA98F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDITTGALAGTANKTLLAWAKKHQIFAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-34.2986 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA72L,TA87G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADLIDIITGALAGTANKGLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-18.527 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA166L,IA185W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAALALAATLGADLILLS +DVSGWLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_75:-33.0812 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22K,TA227C; +MMNPLIIKLGGVLLDSEEALEKLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARCLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-32.6947 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8H,DA162S; +MMNPLIIHLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNASQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_77:-21.0408 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA147W,LA246Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSWIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPAQFNGMPMGTRILA +>1gs5_Repair_78:-15.1119 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA191L,GA253I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGLRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMITRILA +>1gs5_Repair_79:-27.8533 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9N,IA234V; +MMNPLIIKNGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDVASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_80:-27.3779 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9R,PA127R; +MMNPLIIKRGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQRGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-32.3804 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41L,LA156Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVILHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQYMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_82:-28.8588 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA127L,GA208S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQLGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQSIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_83:-28.3756 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA137Q,GA213V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLQENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDVMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_84:11.7743 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA149H,GA253H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIHVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMHTRILA +>1gs5_Repair_85:-30.859 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18A,LA27Y; +MMNPLIIKLGGVLLDSEAALERLFSAYVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-32.5999 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA116W,TA151K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLWEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVKDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_87:-31.1872 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA61D,QA96Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +DKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHYIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-26.4273 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA176M,IA210P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADMILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIPTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-27.4883 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA92W,KA189M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWWKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGMGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_90:-29.8925 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2C,IA148N; +MCNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSNGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_91:-33.6149 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA116F,KA200D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLFEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAADAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-28.2147 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA68N,KA200P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVNPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAPAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_93:-27.8885 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24C,KA94E; +MMNPLIIKLGGVLLDSEEALERLCSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKEHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_94:-16.0983 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA82V,GA123I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAVTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVILAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_95:-17.9031 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35Y,GA123L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHYRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVLLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-29.9096 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA191S,GA208M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGSRIAEMTAAKAEQLIEQMIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-6.971 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA146Y,QA203T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVYSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAETLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-29.7375 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26V,GA43N; +MMNPLIIKLGGVLLDSEEALERLFSVLVNYRESHQRPLVIVHNGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_99:-30.4154 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8L,IA133S; +MMNPLIILLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLSNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-22.0152 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA162W,VA218R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNAWQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKRNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_1:-28.8366 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA85R,NA160Q,LA172H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTARKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVQADQAATALAATHGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-26.8981 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA39A,LA102S,DA106A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLAIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGSFLGAGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-30.3477 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25V,AA201D,AA245F; +MMNPLIIKLGGVLLDSEEALERLFVALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKDEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPFLFNGMPMGTRILA +>1gs5_Repair_4:-29.909 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA75F,TA77D,MA252E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDFIDGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPEGTRILA +>1gs5_Repair_5:-20.0688 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA57N,VA110R,KA217P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNNPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSRKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVPVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_6:-32.1007 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA56A,SA129C,TA227Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLALPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGCPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARQLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_7:-34.8313 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36L,CA46D,NA134W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQLPLVIVHGGGDVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIWSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:-30.1082 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15N,TA166D,EA195A; +MMNPLIIKLGGVLLNSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAADALAATLGADLILLS +DVSGILDGKGQRIAAMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-25.6334 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA95L,VA100E,LA104H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKLQIAAEGLFHGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_10:-32.1049 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58F,HA95L,AA98S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLFVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKLQISAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-32.8313 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA150Y,EA153I,EA206L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGYTDIGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLILQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-26.2574 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42D,DA74H,DA116A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVDGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIHIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLAEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_13:9.99434 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34M,NA134C,GA184F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESMQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLICSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSFILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-31.6075 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA77D,AA90D,NA158H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIIDGALAGTANKTLLDWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMHVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_15:-28.0106 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65C,AA161M,GA188A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGCRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNMDQAATALAATLGADLILLS +DVSGILDAKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_16:-31.7959 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15K,IA73C,NA219H; +MMNPLIIKLGGVLLKSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQCDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVHAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_17:-33.9 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8V,AA221K,DA223W; +MMNPLIIVLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAKLWAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_18:-33.4455 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA90K,AA92S,AA170F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLKWSKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAFTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_19:-30.7666 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27C,HA34V,AA198Y; +MMNPLIIKLGGVLLDSEEALERLFSACVNYRESVQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTYAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-29.7998 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA182K,VA216S,LA222A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DKSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMISKVNAAADAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-31.7041 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA69L,VA144L,PA244Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTLADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPLVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLYALFNGMPMGTRILA +>1gs5_Repair_22:-30.8712 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31M,AA167I,KA217T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYMESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATILAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVTVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-24.7852 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17L,AA92W,LA115R; +MMNPLIIKLGGVLLDSLEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWWKKHQIAAVGLFLGDGDSVKVTQRDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-31.2874 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28Y,LA38C,TA83K; +MMNPLIIKLGGVLLDSEEALERLFSALYNYRESHQRPCVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGKANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_25:-32.7893 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21Y,SA236D,AA240T; +MMNPLIIKLGGVLLDSEEALYRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIADWRHT +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-29.9575 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA86T,PA130K,TA197W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANTTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSKKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMWAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_27:-16.8312 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA119T,AA167W,SA236Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEETG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATWLAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAQWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_28:-31.0331 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA93R,QA191K,AA258I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWARKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGKRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILI +>1gs5_Repair_29:-29.429 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41N,KA86V,IA205L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVINHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANVTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLLEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-31.9799 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35T,QA155L,DA233Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHTRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGLLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVYIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-24.391 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13Q,TA254M,RA255L; +MMNPLIIKLGGVQLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGMLILA +>1gs5_Repair_32:-7.84324 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA88Y,TA166E,GA184R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTYLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAAEALAATLGADLILLS +DVSRILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-30.6168 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA51K,IA97N,RA192V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDEKMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQNAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQVIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-24.4643 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18H,TA68R,QA191L; +MMNPLIIKLGGVLLDSEHALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVRPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGLRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-31.0476 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA86P,WA91F,DA181M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANPTLLAFAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +MVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-29.6463 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA71Q,GA105F,IA177N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPAQQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLFDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLNLLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_37:-23.6802 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13W,IA193Q,AA198H; +MMNPLIIKLGGVWLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRQAEMTHAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-30.0117 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27I,VA59T,TA171K; +MMNPLIIKLGGVLLDSEEALERLFSAIVNYRESHQRPLVIVHGGGCVVDELMKGLNLPTK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAKLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-21.4318 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA101V,GA107Q,AA170L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVVLFLGDQDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALALTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_40:-26.7814 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18Y,DA187A,AA224V; +MMNPLIIKLGGVLLDSEYALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILAGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDVARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_41:-26.8453 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA43W,AA99P,GA101Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHWGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAPVQLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-31.7995 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA131E,AA194C,PA231Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPELINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRICEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRQVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-31.7379 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:WA91Q,EA153R,DA212K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAQAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDRGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITKGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-24.9966 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA146L,TA151I,QA155S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVLSIGVIDEGSLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:5.44743 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA171W,LA204S,GA208P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAWLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQSIEQPIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_46:-31.9737 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA111A,EA118K,RA226N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVAVTQLDEKLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAANTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_47:-33.9596 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2F,QA35P,SA135L; +MFNPLIIKLGGVLLDSEEALERLFSALVNYRESHPRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINLLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-32.3547 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34M,EA202Y,PA244N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESMQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAYQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLNALFNGMPMGTRILA +>1gs5_Repair_49:-10.911 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA139A,LA176E,AA225Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLEAGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADEILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAYRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-32.7099 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA32F,VA67I,AA170L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRFSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRITPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALALTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_51:-29.2587 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41Q,AA92F,KA111L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIQHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWFKKHQIAAVGLFLGDGDSVLVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-32.5816 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA79N,DA212T,SA236L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGNLAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITTGMIVKVNAALDAARTLGRPVDIALWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_53:-30.6736 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA54K,KA200M,FA247Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKKLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAMAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALQNGMPMGTRILA +>1gs5_Repair_54:-31.0922 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA74T,LA104M,PA130K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQITIITGALAGTANKTLLAWAKKHQIAAVGLFMGDGDSVKVTQLDEELG +HVGLAQPGSKKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_55:-30.8737 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA80G,GA213N,AA220G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAGAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDNMIVKVNGALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-29.8929 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA67L,PA127S,NA160W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRLTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQSGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVWADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-33.4502 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8E,EA21K,DA175Q; +MMNPLIIELGGVLLDSEEALKRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAQLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:-28.5808 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA104S,LA124W,MA252L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFSGDGDSVKVTQLDEELG +HVGWAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPLGTRILA +>1gs5_Repair_59:-26.1527 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41S,NA63T,RA226F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVISHGGGCVVDELMKGLNLPVK +KKTGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAAFTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_60:-24.013 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA101S,DA162Y,IA256S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVSLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNAYQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRSLA +>1gs5_Repair_61:-30.3309 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65D,GA82S,GA101P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGDRVTPADQIDIITGALASTANKTLLAWAKKHQIAAVPLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-22.7769 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA77Y,LA132R,AA221K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIIYGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKRINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAKLDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_63:-26.5097 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19E,SA129D,IA210F; +MMNPLIIKLGGVLLDSEEELERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGDPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIFTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-21.4385 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25A,AA169E,LA172D; +MMNPLIIKLGGVLLDSEEALERLFAALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALEATDGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-29.6662 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA93R,IA209S,EA241V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWARKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGSITDGMIVKVNAALDAARTLGRPVDIASWRHA +VQLPALFNGMPMGTRILA +>1gs5_Repair_66:-32.8118 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA131A,LA142M,LA257F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPALINSLLENGYMPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRIFA +>1gs5_Repair_67:-26.8475 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58T,TA77W,AA125I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLTVK +KKNGLRVTPADQIDIIWGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLIQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_68:-31.7475 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA56G,QA191I,MA196V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLGLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGIRIAEVTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_69:-33.6596 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27H,VA47I,DA223M; +MMNPLIIKLGGVLLDSEEALERLFSAHVNYRESHQRPLVIVHGGGCIVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALMAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-38.3389 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA72R,SA109L,TA113W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADRIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDLVKVWQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-32.1107 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62D,LA88I,WA91L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KDNGLRVTPADQIDIITGALAGTANKTILALAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:-26.2603 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA59A,QA72T,AA225D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPAK +KKNGLRVTPADTIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDADRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-31.7191 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58L,DA74A,VA150C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLLVK +KKNGLRVTPADQIAIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGCTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-29.6401 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA117M,GA140S,AA245L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDMELG +HVGLAQPGSPKLINSLLENSYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPLLFNGMPMGTRILA +>1gs5_Repair_75:-24.9714 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13Q,GA101I,LA137E; +MMNPLIIKLGGVQLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVILFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLEENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-20.6696 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA72L,AA240P,GA253L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADLIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHP +EQLPALFNGMPMLTRILA +>1gs5_Repair_77:-22.728 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4G,QA96P,QA155I; +MMNGLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHPIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGILMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_78:-25.27 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA104E,MA157A,TA197F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFEGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLANVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMFAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_79:-25.37 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15G,AA165Q,GA188Y; +MMNPLIIKLGGVLLGSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAQTALAATLGADLILLS +DVSGILDYKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_80:-28.3729 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA70E,WA91N,MA214C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPEDQIDIITGALAGTANKTLLANAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGCIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-23.7075 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA95C,GA120P,AA161P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKCQIAAVGLFLGDGDSVKVTQLDEELP +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNPDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_82:-26.062 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17I,DA74R,MA196D; +MMNPLIIKLGGVLLDSIEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIRIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEDTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_83:-18.5236 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6G,LA23A,LA168E; +MMNPLGIKLGGVLLDSEEALERAFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATAEAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_84:-28.0311 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA139K,GA173I,LA222H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLEKGYLPVVSSIGVTDEGQLMNVNADQAATALAATLIADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAHDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-21.9175 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA191P,LA246N,IA256F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGPRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPANFNGMPMGTRFLA +>1gs5_Repair_86:-17.2357 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62E,IA215V,GA253E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KENGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMVVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMETRILA +>1gs5_Repair_87:-28.6791 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3V,GA101Q,AA194N; +MMVPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVQLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRINEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-31.0012 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17K,LA55W,KA217E; +MMNPLIIKLGGVLLDSKEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGWNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVEVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-27.5999 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA158G,VA159N,LA186M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMGNNADQAATALAATLGADLILLS +DVSGIMDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_90:-21.4194 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30F,IA133Q,AA225E; +MMNPLIIKLGGVLLDSEEALERLFSALVNFRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLQNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAERTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_91:-28.3092 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:WA91Q,AA169S,MA214T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAQAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALSATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGTIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-24.6349 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA130I,VA182A,LA246S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSIKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DASGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPASFNGMPMGTRILA +>1gs5_Repair_93:-26.9243 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7L,GA82E,SA109H; +MMNPLILKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAETANKTLLAWAKKHQIAAVGLFLGDGDHVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_94:-30.3287 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA40K,VA216F,AA225C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVKVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIFKVNAALDACRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_95:-37.1931 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33K,DA162E,EA202F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYREKHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNAEQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAFQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-32.7508 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA83S,KA86C,DA223V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGSANCTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALVAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-0.059201 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA107I,GA123K,HA239K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDIDSVKVTQLDEELG +HVKLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRKA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-21.523 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10P,LA104Y,DA175A; +MMNPLIIKLPGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFYGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAALILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_99:-27.3865 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA110C,AA224N,AA225S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSCKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDNSRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-24.3541 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA59Y,AA167R,FA247K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPYK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATRLAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALKNGMPMGTRILA +>1gs5_Repair_1:-28.0856 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36K,IA185N,DA187N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQKPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGNLNGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-29.3548 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA81Q,LA119Q,LA228H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALQGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEEQG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTHGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-24.1151 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA122R,DA187I,SA236C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HRGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILIGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIACWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-27.9485 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18V,EA118K,VA144D; +MMNPLIIKLGGVLLDSEVALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEKLG +HVGLAQPGSPKLINSLLENGYLPDVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_5:-24.8636 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7K,DA181Q,LA243P; +MMNPLIKKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +QVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQPPALFNGMPMGTRILA +>1gs5_Repair_6:-28.6846 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA39S,TA211G,WA237N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLSIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIGDGMIVKVNAALDAARTLGRPVDIASNRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_7:-23.9841 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA146D,DA187R,MA196N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVDSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILRGKGQRIAENTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:-33.2005 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19S,DA49L,GA188A; +MMNPLIIKLGGVLLDSEESLERLFSALVNYRESHQRPLVIVHGGGCVVLELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDAKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-33.2049 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33C,DA74M,LA119M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRECHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIMIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEEMG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_10:-16.9145 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30G,SA183P,GA184P; +MMNPLIIKLGGVLLDSEEALERLFSALVNGRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVPPILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-31.9087 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA118W,EA138Y,KA200Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEWLG +HVGLAQPGSPKLINSLLYNGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAQAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-23.2432 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA157E,GA190E,LA243A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLENVNADQAATALAATLGADLILLS +DVSGILDGKEQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQAPALFNGMPMGTRILA +>1gs5_Repair_13:-25.5398 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA86I,LA104T,AA201R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANITLLAWAKKHQIAAVGLFTGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKREQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-27.0282 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA227F,SA236R,TA254Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARFLGRPVDIARWRHA +EQLPALFNGMPMGQRILA +>1gs5_Repair_15:5.24616 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA52L,AA169V,GA253F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELLKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALVATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMFTRILA +>1gs5_Repair_16:-23.3318 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA131L,AA201P,IA209P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPLLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKPEQLIEQGPITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_17:-19.2619 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65F,VA122C,VA159F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGFRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HCGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNFNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_18:-29.5785 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA114L,VA144K,DA162S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTLLDEELG +HVGLAQPGSPKLINSLLENGYLPKVSSIGVTDEGQLMNVNASQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_19:-21.5993 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA81C,LA168Y,AA169Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALCGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATAYQATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-33.097 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3Q,NA160S,TA227L; +MMQPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVSADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARLLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-22.4509 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA140R,AA161K,TA166L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENRYLPVVSSIGVTDEGQLMNVNKDQAALALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_22:-27.5286 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42K,AA98F,AA194G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVKGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIFAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIGEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-19.0191 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA98M,AA167F,AA199F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIMAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATFLAATLGADLILLS +DVSGILDGKGQRIAEMTAFKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-26.0735 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA11I,TA83I,SA129H; +MMNPLIIKLGIVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGIANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGHPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_25:-26.8897 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA137N,IA185A,HA239K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLNENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGALDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRKA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-33.9099 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA127A,DA175Y,RA238F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQAGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAYLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWFHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_27:-26.3669 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA139G,DA187A,LA222D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLEGGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILAGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAADDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_28:-22.3713 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA122T,LA124H,AA164D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HTGHAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQDATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_29:-31.5799 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA102W,EA118I,LA228S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGWFLGDGDSVKVTQLDEILG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTSGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-27.2401 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA32A,DA74C,RA255Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRASHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQICIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTYILA +>1gs5_Repair_31:-30.4961 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19Y,DA223Q,DA233C; +MMNPLIIKLGGVLLDSEEYLERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALQAARTLGRPVCIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_32:-32.5521 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA78T,TA197R,MA250I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITTALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMRAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGIPMGTRILA +>1gs5_Repair_33:-29.2927 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15V,MA52D,RA66M; +MMNPLIIKLGGVLLVSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELDKGLNLPVK +KKNGLMVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-19.1259 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17Y,VA39N,GA44E; +MMNPLIIKLGGVLLDSYEALERLFSALVNYRESHQRPLNIVHGEGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-29.1694 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA150L,RA230Y,TA254G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGLTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGYPVDIASWRHA +EQLPALFNGMPMGGRILA +>1gs5_Repair_36:-24.0751 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10N,VA48P,AA92R; +MMNPLIIKLNGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVPDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWRKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_37:-36.0966 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12E,IA148V,WA237I; +MMNPLIIKLGGELLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSVGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASIRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-33.0932 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA14K,DA15L,LA222M; +MMNPLIIKLGGVLKLSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAMDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-24.9757 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA135L,AA169R,GA190Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINLLLENGYLPVVSSIGVTDEGQLMNVNADQAATALRATLGADLILLS +DVSGILDGKQQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_40:-28.4496 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24Y,IA40H,RA255N; +MMNPLIIKLGGVLLDSEEALERLYSALVNYRESHQRPLVHVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTNILA +>1gs5_Repair_41:-33.4115 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15T,DA175T,MA250F; +MMNPLIIKLGGVLLTSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGATLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGFPMGTRILA +>1gs5_Repair_42:-6.82682 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2R,GA107W,KA200D; +MRNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDWDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAADAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-31.7128 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA122M,AA161M,TA227Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HMGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNMDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARQLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-29.3139 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23D,KA217L,GA229R; +MMNPLIIKLGGVLLDSEEALERDFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVLVNAALDAARTLRRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:-28.0078 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41A,MA52C,AA81V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIAHGGGCVVDELCKGLNLPVK +KKNGLRVTPADQIDIITGALVGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_46:-30.333 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12K,DA106V,GA107N; +MMNPLIIKLGGKLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGVNDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_47:-32.4985 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA45E,VA144N,GA188W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGECVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPNVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDWKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:6.77979 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65P,GA123E,GA184D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGPRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVELAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSDILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-26.6444 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA75K,LA176R,RA192A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDKITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADRILLS +DVSGILDGKGQAIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-25.9257 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA144S,DA187W,AA194D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPSVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILWGKGQRIDEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_51:-28.9605 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA150I,LA172H,EA202C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGITDEGQLMNVNADQAATALAATHGADLILLS +DVSGILDGKGQRIAEMTAAKACQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-32.0767 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25Y,AA26L,LA186N; +MMNPLIIKLGGVLLDSEEALERLFYLLVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGINDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_53:-24.8056 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA113C,GA140M,LA246F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVCQLDEELG +HVGLAQPGSPKLINSLLENMYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPAFFNGMPMGTRILA +>1gs5_Repair_54:-9.12831 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA149E,VA150H,MA196Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIEHTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEYTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_55:-32.7309 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA63R,VA100A,WA237C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKRGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAAGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASCRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-8.19367 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:CA46Y,GA107H,QA126P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGYVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDHDSVKVTQLDEELG +HVGLAPPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-28.0566 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49M,AA98F,VA218R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVMELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIFAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKRNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:-22.4518 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA113G,LA137H,LA142S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVGQLDEELG +HVGLAQPGSPKLINSLHENGYSPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_59:-27.4252 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28C,LA119G,RA226G; +MMNPLIIKLGGVLLDSEEALERLFSALCNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEEGG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAAGTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_60:-30.3693 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA5V,DA106H,VA182N; +MMNPVIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGHGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DNSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-31.642 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:CA46F,LA55A,AA167T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGFVVDELMKGANLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATTLAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-27.8679 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA104G,NA134D,SA147N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFGGDGDSVKVTQLDEELG +HVGLAQPGSPKLIDSLLENGYLPVVSNIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_63:-29.2604 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA126A,NA134H,RA255F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAAPGSPKLIHSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTFILA +>1gs5_Repair_64:-30.5544 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA145M,LA222K,PA231S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVMSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAKDAARTLGRSVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-33.8505 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24L,NA56R,EA153G; +MMNPLIIKLGGVLLDSEEALERLLSALVNYRESHQRPLVIVHGGGCVVDELMKGLRLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDGGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_66:-28.0778 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA11C,GA101K,DA175P; +MMNPLIIKLGCVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVKLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAPLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:-32.4742 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58H,SA180Q,RA238F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLHVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLQ +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWFHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_68:-27.885 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA48R,NA158K,AA194G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVRDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMKVNADQAATALAATLGADLILLS +DVSGILDGKGQRIGEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_69:-20.2904 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA179S,LA204G,AA235E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILSS +DVSGILDGKGQRIAEMTAAKAEQGIEQGIITDGMIVKVNAALDAARTLGRPVDIESWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-21.596 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA37D,GA149T,TA211R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRDLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSITVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIRDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-32.2413 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA72A,AA170C,EA195N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADAIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALACTLGADLILLS +DVSGILDGKGQRIANMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:-15.1771 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA90C,LA168W,VA232H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLCWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATAWAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPHDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-27.0132 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19Y,TA171K,KA200D; +MMNPLIIKLGGVLLDSEEYLERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAKLGADLILLS +DVSGILDGKGQRIAEMTAADAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-24.9324 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA69L,VA122A,LA136P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTLADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HAGLAQPGSPKLINSPLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_75:-25.849 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18C,FA24T,NA29K; +MMNPLIIKLGGVLLDSECALERLTSALVKYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-29.2069 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA89K,LA222K,AA245D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLKAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAKDAARTLGRPVDIASWRHA +EQLPDLFNGMPMGTRILA +>1gs5_Repair_77:-21.8278 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23S,LA115T,AA221P; +MMNPLIIKLGGVLLDSEEALERSFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQTDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAPLDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_78:-18.9151 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA123M,WA237G,HA239D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVMLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASGRDA +EQLPALFNGMPMGTRILA +>1gs5_Repair_79:-22.7762 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65E,AA99N,AA221D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGERVTPADQIDIITGALAGTANKTLLAWAKKHQIANVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNADLDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_80:-19.9538 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2T,GA64P,LA124H; +MTNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNPLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGHAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-27.5166 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA83N,VA159A,DA212P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGNANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNANADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITPGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_82:-9.17239 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16C,EA195Y,TA254F; +MMNPLIIKLGGVLLDCEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAYMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGFRILA +>1gs5_Repair_83:-28.0092 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA37L,LA88Q,KA111H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRLLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTQLAWAKKHQIAAVGLFLGDGDSVHVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_84:-16.8282 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA120D,VA144P,AA235G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELD +HVGLAQPGSPKLINSLLENGYLPPVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIGSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-21.951 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA148D,LA168G,WA237D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSDGVTDEGQLMNVNADQAATAGAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASDRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-19.4006 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50A,AA99Y,IA210Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDALMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAYVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIQTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_87:-26.2148 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30L,VA159C,LA246H; +MMNPLIIKLGGVLLDSEEALERLFSALVNLRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNCNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPAHFNGMPMGTRILA +>1gs5_Repair_88:-29.2127 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA11K,AA81H,NA160E; +MMNPLIIKLGKVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALHGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVEADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-26.0916 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA43M,DA108H,GA229T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHMGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGHSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLTRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_90:-31.2086 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA78I,GA190E,MA250Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITIALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKEQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGQPMGTRILA +>1gs5_Repair_91:-23.4085 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA96H,PA143K,RA230E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHHIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLKVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGEPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-21.3926 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA120S,VA216A,TA254I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELS +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIAKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGIRILA +>1gs5_Repair_93:-28.7603 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA96M,AA225S,GA249D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHMIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDASRTLGRPVDIASWRHA +EQLPALFNDMPMGTRILA +>1gs5_Repair_94:-32.499 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15A,RA66Q,KA86D; +MMNPLIIKLGGVLLASEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLQVTPADQIDIITGALAGTANDTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_95:-20.0998 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA125S,AA161F,LA168G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLSQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNFDQAATAGAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-29.5548 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19L,TA68M,NA219H; +MMNPLIIKLGGVLLDSEELLERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVMPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVHAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-27.0055 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA111L,EA153P,LA168D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVLVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDPGQLMNVNADQAATADAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-29.2158 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA90Q,VA122F,VA232N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLQWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HFGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPNDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_99:-29.9337 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31P,GA188W,QA191D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYPESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDWKGDRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-33.1425 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12D,VA144K,EA206M; +MMNPLIIKLGGDLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPKVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIMQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_1:-21.9584 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36K,IA185N,DA187N,AA235Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQKPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGNLNGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIYSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-31.6822 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA92Q,SA135Q,DA223I,PA231H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWQKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINQLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALIAARTLGRHVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-26.7204 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10R,VA122H,DA187E,SA236G; +MMNPLIIKLRGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HHGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILEGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAGWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-32.1535 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18V,EA118K,VA182D,GA188S; +MMNPLIIKLGGVLLDSEVALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEKLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DDSGILDSKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_5:3.20467 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7S,IA75T,VA110C,AA221W; +MMNPLISKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDTITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSCKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAWLDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_6:-24.9949 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13D,DA49R,WA91S,AA240T; +MMNPLIIKLGGVDLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVRELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLASAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHT +EQLPALFNGMPMGTRILA +>1gs5_Repair_7:-23.1229 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA103Y,KA189A,GA208Q,FA247D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLYLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGAGQRIAEMTAAKAEQLIEQQIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALDNGMPMGTRILA +>1gs5_Repair_8:-11.7928 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58C,KA94Q,DA175H,GA184L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLCVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKQHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAHLILLS +DVSLILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-30.0729 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA109G,IA133S,IA193M,SA236M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDGVKVTQLDEELG +HVGLAQPGSPKLSNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRMAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAMWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_10:-25.4483 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18F,AA161R,TA166Q,SA180V; +MMNPLIIKLGGVLLDSEFALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNRDQAAQALAATLGADLILLV +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-28.3127 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58E,AA84Y,TA151C,NA219W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLEVK +KKNGLRVTPADQIDIITGALAGTYNKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVCDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVWAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-36.2185 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15L,SA16L,EA21W,HA121M; +MMNPLIIKLGGVLLLLEEALWRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +MVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_13:-23.9417 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7N,FA24G,AA98Q,HA121N; +MMNPLINKLGGVLLDSEEALERLGSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIQAVGLFLGDGDSVKVTQLDEELG +NVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-31.7215 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA134L,SA183V,IA193D,PA231K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLILSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVVGILDGKGQRDAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRKVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_15:-15.7446 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42F,EA50C,LA137Y,AA258Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVFGGGCVVDCLMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLYENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILQ +>1gs5_Repair_16:-30.0587 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17T,NA219K,AA245P,FA247V; +MMNPLIIKLGGVLLDSTEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVKAALDAARTLGRPVDIASWRHA +EQLPPLVNGMPMGTRILA +>1gs5_Repair_17:-14.6693 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31V,SA147F,AA165R,MA250V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYVESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSFIGVTDEGQLMNVNADQARTALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGVPMGTRILA +>1gs5_Repair_18:-30.5988 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA151M,IA210M,SA236W,LA257Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVMDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIMTDGMIVKVNAALDAARTLGRPVDIAWWRHA +EQLPALFNGMPMGTRIQA +>1gs5_Repair_19:-30.5763 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA138C,IA177H,IA193E,HA239V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLCNGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLHLLS +DVSGILDGKGQREAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRVA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-23.1029 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27G,GA54V,LA132A,GA229S; +MMNPLIIKLGGVLLDSEEALERLFSAGVNYRESHQRPLVIVHGGGCVVDELMKVLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKAINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLSRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-29.717 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22Q,TA83S,VA100N,YA141E; +MMNPLIIKLGGVLLDSEEALEQLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGSANKTLLAWAKKHQIAANGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGELPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_22:-25.0094 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21P,HA34E,WA91V,GA173H; +MMNPLIIKLGGVLLDSEEALPRLFSALVNYRESEQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAVAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLHADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-30.0492 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA150K,NA160T,AA220I,DA233A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGKTDEGQLMNVTADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNIALDAARTLGRPVAIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-33.8537 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25Y,VA47A,QA155A,EA206S; +MMNPLIIKLGGVLLDSEEALERLFYALVNYRESHQRPLVIVHGGGCAVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGALMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLISQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_25:-23.7633 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10N,HA42P,GA173E,AA198T; +MMNPLIIKLNGVLLDSEEALERLFSALVNYRESHQRPLVIVPGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLEADLILLS +DVSGILDGKGQRIAEMTTAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-29.6891 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA51Q,EA118V,LA222F,LA243H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDEQMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEVLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAFDAARTLGRPVDIASWRHA +EQHPALFNGMPMGTRILA +>1gs5_Repair_27:-0.790461 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4Y,KA61N,IA177S,TA254H; +MMNYLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +NKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLSLLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGHRILA +>1gs5_Repair_28:-26.2829 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34R,DA71V,LA176H,IA185A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESRQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPAVQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADHILLS +DVSGALDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_29:-10.1556 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA82A,KA111A,LA115I,GA123E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAATANKTLLAWAKKHQIAAVGLFLGDGDSVAVTQIDEELG +HVELAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-35.119 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50T,RA66M,KA111H,RA238D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDTLMKGLNLPVK +KKNGLMVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVHVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWDHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-31.4088 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49I,GA105L,DA108W,LA228F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVIELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLLDGWSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTFGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_32:-29.5675 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA71S,GA78V,NA134P,SA147L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPASQIDIITVALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIPSLLENGYLPVVSLIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-20.8653 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30H,TA68Q,TA197K,KA200V; +MMNPLIIKLGGVLLDSEEALERLFSALVNHRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVQPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMKAAVAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-6.96941 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26N,VA59S,YA141Q,GA184E; +MMNPLIIKLGGVLLDSEEALERLFSNLVNYRESHQRPLVIVHGGGCVVDELMKGLNLPSK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGQLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSEILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-25.818 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA133M,TA151G,LA172R,IA210L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLMNSLLENGYLPVVSSIGVGDEGQLMNVNADQAATALAATRGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGILTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-18.032 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA40N,KA60L,GA128E,KA189M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVNVHGGGCVVDELMKGLNLPVL +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPESPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGMGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_37:-23.0821 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA82R,KA189H,AA194H,IA234W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALARTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGHGQRIHEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDWASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-33.3923 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15S,GA82V,GA101P,RA192Y; +MMNPLIIKLGGVLLSSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAVTANKTLLAWAKKHQIAAVPLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQYIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-31.3453 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36P,LA243M,NA248A,MA252P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQPPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQMPALFAGMPPGTRILA +>1gs5_Repair_40:-22.2299 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA47W,EA118P,LA137D,FA247V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCWVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEPLG +HVGLAQPGSPKLINSLDENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALVNGMPMGTRILA +>1gs5_Repair_41:-26.1393 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25R,LA119R,GA173C,NA219P; +MMNPLIIKLGGVLLDSEEALERLFRALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEERG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLCADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVPAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-30.4413 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34K,HA95P,QA96E,KA111S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESKQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKPEIAAVGLFLGDGDSVSVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-30.4825 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2T,KA53F,AA79I,NA139S; +MTNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMFGLNLPVK +KKNGLRVTPADQIDIITGILAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLESGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-32.3547 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26L,LA51Y,AA90F,AA240C; +MMNPLIIKLGGVLLDSEEALERLFSLLVNYRESHQRPLVIVHGGGCVVDEYMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLFWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHC +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:-19.0972 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA94Y,VA159H,LA176H,SA236E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKYHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNHNADQAATALAATLGADHILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAEWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_46:-24.3691 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA121K,PA143D,VA144S,TA166M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +KVGLAQPGSPKLINSLLENGYLDSVSSIGVTDEGQLMNVNADQAAMALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_47:-33.4459 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA94W,DA108K,KA111F,RA192K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKWHQIAAVGLFLGDGKSVFVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQKIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-32.2905 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA55F,LA119G,DA181F,DA223R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGFNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEEGG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +FVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALRAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-25.4058 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA97D,SA129R,GA149C,LA156V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQDAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGRPKLINSLLENGYLPVVSSICVTDEGQVMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-29.0343 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21W,VA47Y,SA109P,LA204K; +MMNPLIIKLGGVLLDSEEALWRLFSALVNYRESHQRPLVIVHGGGCYVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDPVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQKIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_51:-31.9154 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35G,QA126V,LA137I,SA236A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHGRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAVPGSPKLINSLIENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAAWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-4.01148 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2D,VA112W,AA125I,TA254G; +MDNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKWTQLDEELG +HVGLIQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGGRILA +>1gs5_Repair_53:-21.4864 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12R,KA93N,AA125E,MA196C; +MMNPLIIKLGGRLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWANKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLEQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAECTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_54:-31.0046 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26G,VA48I,QA163L,IA193Q; +MMNPLIIKLGGVLLDSEEALERLFSGLVNYRESHQRPLVIVHGGGCVIDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADLAATALAATLGADLILLS +DVSGILDGKGQRQAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_55:-30.3834 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA45D,KA60M,IA76D,NA134Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGDCVVDELMKGLNLPVM +KKNGLRVTPADQIDIDTGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIQSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-24.2782 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35R,AA99D,MA196R,RA230I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHRRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIADVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAERTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGIPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-28.7248 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA63A,GA82I,NA160I,AA167T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKAGLRVTPADQIDIITGALAITANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVIADQAATTLAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:-26.6399 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23C,IA73G,QA126T,QA163M; +MMNPLIIKLGGVLLDSEEALERCFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQGDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLATPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADMAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_59:-31.138 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA134G,DA152M,EA241S,MA252V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIGSLLENGYLPVVSSIGVTMEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +SQLPALFNGMPVGTRILA +>1gs5_Repair_60:-10.5228 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA5A,SA16M,LA119Q,AA174R; +MMNPAIIKLGGVLLDMEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEEQG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGRDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-29.6099 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6L,FA24W,LA156I,MA214V; +MMNPLLIKLGGVLLDSEEALERLWSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQIMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGVIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-29.2196 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA94W,VA100G,LA102F,VA150G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKWHQIAAGGFFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGGTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_63:-26.8503 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA99V,IA193K,EA202V,VA232P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAVVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRKAEMTAAKAVQLIEQGIITDGMIVKVNAALDAARTLGRPPDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-27.4112 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA99R,TA113H,QA114P,QA203D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIARVGLFLGDGDSVKVHPLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEDLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-24.6847 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA150F,GA154Q,AA169P,DA175N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGFTDEQQLMNVNADQAATALPATLGANLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_66:-22.7931 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA138Y,LA168R,AA169R,AA220T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLYNGYLPVVSSIGVTDEGQLMNVNADQAATARRATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNTALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:-25.9584 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27S,LA57K,DA223G,GA249F; +MMNPLIIKLGGVLLDSEEALERLFSASVNYRESHQRPLVIVHGGGCVVDELMKGLNKPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALGAARTLGRPVDIASWRHA +EQLPALFNFMPMGTRILA +>1gs5_Repair_68:-33.9822 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36Q,VA100Q,NA139I,DA181N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQQPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAQGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLEIGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +NVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_69:-25.8976 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26F,QA155E,GA188L,LA222A; +MMNPLIIKLGGVLLDSEEALERLFSFLVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGELMNVNADQAATALAATLGADLILLS +DVSGILDLKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAADAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-24.3358 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA61T,LA168N,LA178G,DA223Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +TKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATANAATLGADLIGLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALYAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-24.014 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9D,NA85I,FA103A,VA216H; +MMNPLIIKDGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAIKTLLAWAKKHQIAAVGLALGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIHKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:-27.2437 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA14P,VA39I,VA144F,GA229N; +MMNPLIIKLGGVLPDSEEALERLFSALVNYRESHQRPLIIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPFVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLNRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-23.6627 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19R,VA41T,VA122S,IA215H; +MMNPLIIKLGGVLLDSEERLERLFSALVNYRESHQRPLVITHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HSGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMHVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-21.654 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62D,GA120I,NA219M,SA236I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KDNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELI +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVMAALDAARTLGRPVDIAIWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_75:-26.337 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16Q,AA167L,AA170F,GA208S; +MMNPLIIKLGGVLLDQEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATLLAFTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQSIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-33.3541 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA130H,NA160E,SA183N,RA230W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSHKLINSLLENGYLPVVSSIGVTDEGQLMNVEADQAATALAATLGADLILLS +DVNGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGWPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_77:-23.8328 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA108A,AA164T,LA172S,GA173M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGASVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQTATALAATSMADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_78:-26.9206 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26W,HA34V,IA75S,MA250E; +MMNPLIIKLGGVLLDSEEALERLFSWLVNYRESVQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDSITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGEPMGTRILA +>1gs5_Repair_79:-28.3212 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25A,EA32Q,MA250C,TA254G; +MMNPLIIKLGGVLLDSEEALERLFAALVNYRQSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGCPMGGRILA +>1gs5_Repair_80:-28.438 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:WA91P,SA180N,EA195F,NA219K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAPAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLN +DVSGILDGKGQRIAFMTAAKAEQLIEQGIITDGMIVKVKAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-31.144 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA48A,WA91T,SA129Y,SA236L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVADELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLATAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGYPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIALWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_82:-31.8109 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8W,NA29A,LA176I,AA245I; +MMNPLIIWLGGVLLDSEEALERLFSALVAYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADIILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPILFNGMPMGTRILA +>1gs5_Repair_83:-18.3174 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA84Y,DA108Q,PA130E,VA218N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTYNKTLLAWAKKHQIAAVGLFLGDGQSVKVTQLDEELG +HVGLAQPGSEKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKNNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_84:-21.0248 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18P,AA92Y,IA210P,PA231A; +MMNPLIIKLGGVLLDSEPALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWYKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIPTDGMIVKVNAALDAARTLGRAVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-22.0302 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA43A,LA178G,DA187T,KA200Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHAGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLIGLS +DVSGILTGKGQRIAEMTAAQAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-26.6663 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22G,DA71G,EA195R,IA234A; +MMNPLIIKLGGVLLDSEEALEGLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPAGQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIARMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDAASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_87:-31.7528 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33V,LA65W,SA183H,AA235G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYREVHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGWRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVHGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIGSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-25.7082 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7C,MA157A,AA220Q,NA248D; +MMNPLICKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLANVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNQALDAARTLGRPVDIASWRHA +EQLPALFDGMPMGTRILA +>1gs5_Repair_89:-26.0932 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA63W,GA154E,QA191Y,MA196I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKWGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEEQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGYRIAEITAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_90:-31.6088 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15T,NA29I,DA106T,MA252Y; +MMNPLIIKLGGVLLTSEEALERLFSALVIYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGTGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPYGTRILA +>1gs5_Repair_91:-11.8562 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA162T,FA247S,GA253M,IA256A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNATQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALSNGMPMMTRALA +>1gs5_Repair_92:-31.7426 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA72Y,NA134H,SA135H,DA187F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADYIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIHHLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILFGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_93:-30.4076 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA48E,PA58K,DA71N,DA152I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVEDELMKGLNLKVK +KKNGLRVTPANQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTIEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_94:-35.6801 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27F,QA114L,EA118F,AA245L; +MMNPLIIKLGGVLLDSEEALERLFSAFVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTLLDEFLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPLLFNGMPMGTRILA +>1gs5_Repair_95:-1.66384 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24G,MA52K,IA75E,VA159Y; +MMNPLIIKLGGVLLDSEEALERLGSALVNYRESHQRPLVIVHGGGCVVDELKKGLNLPVK +KKNGLRVTPADQIDEITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNYNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-27.0876 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23V,TA77Q,AA125V,LA137V; +MMNPLIIKLGGVLLDSEEALERVFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIIQGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLVQPGSPKLINSLVENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-32.695 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62V,SA129T,GA188Y,PA251E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KVNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGTPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDYKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMEMGTRILA +>1gs5_Repair_98:-29.7407 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA105P,SA109N,EA206V,AA225T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLPDGDNVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIVQGIITDGMIVKVNAALDATRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_99:-31.8381 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33E,LA65K,KA200M,EA202L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYREEHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGKRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAMALQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-15.2325 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA55F,GA184M,TA211E,LA257S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGFNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSMILDGKGQRIAEMTAAKAEQLIEQGIIEDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRISA +>1gs5_Repair_1:-26.6998 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA85R,FA103E,NA160I,LA172C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTARKTLLAWAKKHQIAAVGLELGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVIADQAATALAATCGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-23.6616 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA106G,GA154R,QA203F,GA229V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGGGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDERQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEFLIEQGIITDGMIVKVNAALDAARTLVRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-29.5592 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18P,HA42F,RA226L,SA236Q; +MMNPLIIKLGGVLLDSEPALERLFSALVNYRESHQRPLVIVFGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAALTLGRPVDIAQWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-31.3342 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA55Y,LA65T,DA74C,NA158K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGYNLPVK +KKNGTRVTPADQICIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMKVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_5:-34.1476 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA45W,VA47M,GA173D,DA233P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGWCMVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLDADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVPIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_6:-30.6962 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13M,GA43N,GA105A,DA212S; +MMNPLIIKLGGVMLDSEEALERLFSALVNYRESHQRPLVIVHNGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLADGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITSGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_7:-23.8092 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35T,LA80F,KA86M,AA125R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHTRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAFAGTANMTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLRQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:-30.807 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50Y,LA102Q,PA130M,DA175I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDYLMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGQFLGDGDSVKVTQLDEELG +HVGLAQPGSMKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAILILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-3.2826 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24P,GA44P,LA137I,PA143H; +MMNPLIIKLGGVLLDSEEALERLPSALVNYRESHQRPLVIVHGPGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLIENGYLHVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_10:-32.2353 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58K,DA108Y,KA111V,QA126W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLKVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGYSVVVTQLDEELG +HVGLAWPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-8.63491 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA79Y,KA94S,QA114K,LA243C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGYLAGTANKTLLAWAKSHQIAAVGLFLGDGDSVKVTKLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQCPALFNGMPMGTRILA +>1gs5_Repair_12:-12.1867 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41D,GA120R,GA128K,TA227R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIDHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELR +HVGLAQPKSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARRLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_13:-27.548 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34V,AA161L,VA216C,VA232K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESVQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNLDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMICKVNAALDAARTLGRPKDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-11.2283 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25P,AA201G,QA207P,GA253D; +MMNPLIIKLGGVLLDSEEALERLFPALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKGEQLIEPGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMDTRILA +>1gs5_Repair_15:-29.8732 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA83Y,SA236C,PA244I,LA246T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGYANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIACWRHA +EQLIATFNGMPMGTRILA +>1gs5_Repair_16:-23.3965 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15Y,IA73W,IA148W,TA171A; +MMNPLIIKLGGVLLYSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQWDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSWGVTDEGQLMNVNADQAATALAAALGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_17:-32.1998 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA47Y,LA80W,LA136I,KA217L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCYVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAWAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSILENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVLVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_18:-28.9673 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA108Q,DA223K,GA229Q,GA249E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGQSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALKAARTLQRPVDIASWRHA +EQLPALFNEMPMGTRILA +>1gs5_Repair_19:-10.8248 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA32F,GA44A,DA108A,GA123Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRFSHQRPLVIVHGAGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGASVKVTQLDEELG +HVQLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:4.44471 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA39Y,HA42L,GA44N,GA123K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLYIVLGNGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVKLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-15.1579 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62W,LA178N,TA197H,GA253R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KWNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLINLS +DVSGILDGKGQRIAEMHAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMRTRILA +>1gs5_Repair_22:-25.0598 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33I,YA141E,IA148S,SA180T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYREIHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGELPVVSSSGVTDEGQLMNVNADQAATALAATLGADLILLT +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-24.6874 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6P,LA102W,VA110I,VA182C; +MMNPLPIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGWFLGDGDSIKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DCSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-20.8916 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA196H,LA204G,GA208M,PA251Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEHTAAKAEQGIEQMIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMYMGTRILA +>1gs5_Repair_25:-30.611 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA55A,RA66S,IA76L,EA153G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGANLPVK +KKNGLSVTPADQIDILTGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDGGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-23.1204 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8I,VA39T,VA47I,MA196P; +MMNPLIIILGGVLLDSEEALERLFSALVNYRESHQRPLTIVHGGGCIVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEPTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_27:-21.5327 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA100G,LA115N,AA167K,IA193A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAGGLFLGDGDSVKVTQNDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATKLAATLGADLILLS +DVSGILDGKGQRAAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_28:-24.3597 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9E,KA60M,DA187P,DA223F; +MMNPLIIKEGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVM +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILPGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALFAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_29:0.381792 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25M,WA91C,GA123R,LA168C; +MMNPLIIKLGGVLLDSEEALERLFMALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLACAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVRLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATACAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-27.2991 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25H,LA57I,AA92Y,IA133K; +MMNPLIIKLGGVLLDSEEALERLFHALVNYRESHQRPLVIVHGGGCVVDELMKGLNIPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWYKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLKNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-35.6998 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33C,QA126F,LA136M,VA182E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRECHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAFPGSPKLINSMLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DESGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_32:-29.5429 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8C,VA110S,DA152H,GA173L; +MMNPLIICLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSSKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTHEGQLMNVNADQAATALAATLLADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-26.0332 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA133S,SA135V,KA189W,PA251D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLSNVLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGWGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMDMGTRILA +>1gs5_Repair_34:-9.135 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35S,MA157N,AA174H,AA258L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHSRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLNNVNADQAATALAATLGHDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILL +>1gs5_Repair_35:-21.4307 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA51T,PA69K,PA130C,AA174N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDETMKGLNLPVK +KKNGLRVTKADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSCKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGNDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-22.4597 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33T,RA230A,LA257P,AA258F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRETHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGAPVDIASWRHA +EQLPALFNGMPMGTRIPF +>1gs5_Repair_37:-25.7452 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33K,GA44L,DA108V,EA206W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYREKHQRPLVIVHGLGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGVSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIWQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-27.6608 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21A,NA56G,AA79N,IA193A; +MMNPLIIKLGGVLLDSEEALARLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLGLPVK +KKNGLRVTPADQIDIITGNLAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRAAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-37.5103 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3L,SA16D,TA113H,NA219I; +MMLPLIIKLGGVLLDDEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVHQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVIAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_40:-26.5237 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58F,LA115W,VA144N,LA176I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLFVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQWDEELG +HVGLAQPGSPKLINSLLENGYLPNVSSIGVTDEGQLMNVNADQAATALAATLGADIILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_41:-25.4121 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21S,VA28Y,AA164Q,DA175H; +MMNPLIIKLGGVLLDSEEALSRLFSALYNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQQATALAATLGAHLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-30.8323 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58G,LA102N,KA200L,KA217E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLGVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGNFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAALAEQLIEQGIITDGMIVEVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-31.0701 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA56L,PA69H,TA87W,PA251M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLLLPVK +KKNGLRVTHADQIDIITGALAGTANKWLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMMMGTRILA +>1gs5_Repair_44:-29.6758 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36F,QA72K,RA230C,TA254N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQFPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADKIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGCPVDIASWRHA +EQLPALFNGMPMGNRILA +>1gs5_Repair_45:-7.79619 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA20K,LA23D,DA152W,GA184V; +MMNPLIIKLGGVLLDSEEAKERDFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTWEGQLMNVNADQAATALAATLGADLILLS +DVSVILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_46:-31.6354 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA77R,QA114H,IA148A,DA152P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIIRGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTHLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSAGVTPEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_47:-30.26 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA101I,AA125C,VA150F,GA173H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVILFLGDGDSVKVTQLDEELG +HVGLCQPGSPKLINSLLENGYLPVVSSIGFTDEGQLMNVNADQAATALAATLHADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-24.1658 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7N,YA141E,MA196T,AA201V; +MMNPLINKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGELPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAETTAAKVEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-23.4878 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42A,VA145G,KA189S,AA235V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVAGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVGSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGSGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIVSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-23.8015 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6G,WA91M,IA209P,DA212G; +MMNPLGIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAMAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGPITGGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_51:-33.2133 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA71L,KA111T,SA183G,TA211D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPALQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVTVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVGGILDGKGQRIAEMTAAKAEQLIEQGIIDDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-26.3341 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA75M,EA118T,PA127A,LA137D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDMITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDETLG +HVGLAQAGSPKLINSLDENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_53:-15.5682 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA83D,DA108G,AA164Y,IA185M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGDANKTLLAWAKKHQIAAVGLFLGDGGSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQYATALAATLGADLILLS +DVSGMLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_54:-29.2377 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13W,GA43E,VA182D,MA252L; +MMNPLIIKLGGVWLDSEEALERLFSALVNYRESHQRPLVIVHEGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DDSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPLGTRILA +>1gs5_Repair_55:-21.4145 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA5H,LA13Y,GA82E,IA209C; +MMNPHIIKLGGVYLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAETANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGCITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-27.514 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21T,KA94D,LA115I,AA169L; +MMNPLIIKLGGVLLDSEEALTRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKDHQIAAVGLFLGDGDSVKVTQIDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALLATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-20.8214 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9N,FA24N,TA211Y,TA254M; +MMNPLIIKNGGVLLDSEEALERLNSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIYDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGMRILA +>1gs5_Repair_58:-28.1022 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31S,GA105D,NA160F,QA191K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYSESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLDDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVFADQAATALAATLGADLILLS +DVSGILDGKGKRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_59:-23.9432 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41N,TA77N,SA147W,DA233K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVINHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIINGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSWIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVKIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_60:-17.2101 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22I,IA97R,LA104Y,AA125I; +MMNPLIIKLGGVLLDSEEALEILFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQRAAVGLFYGDGDSVKVTQLDEELG +HVGLIQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-18.1031 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA96N,VA150S,GA253M,RA255G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHNIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGSTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMMTGILA +>1gs5_Repair_62:-31.142 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA100H,KA200Q,SA236H,MA252N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAHGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAQAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAHWRHA +EQLPALFNGMPNGTRILA +>1gs5_Repair_63:-15.449 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA99W,LA104G,YA141P,AA169Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAWVGLFGGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGPLPVVSSIGVTDEGQLMNVNADQAATALQATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-33.7446 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3L,VA28I,DA49Y,KA93W; +MMLPLIIKLGGVLLDSEEALERLFSALINYRESHQRPLVIVHGGGCVVYELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAWKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:6.63968 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA116C,GA149Q,NA158V,TA171W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLCEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIQVTDEGQLMVVNADQAATALAAWLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_66:-11.7975 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA81Q,GA184V,IA210T,AA245C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALQGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSVILDGKGQRIAEMTAAKAEQLIEQGITTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPCLFNGMPMGTRILA +>1gs5_Repair_67:-13.967 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36Q,IA40M,GA64I,KA94E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQQPLVMVHGGGCVVDELMKGLNLPVK +KKNILRVTPADQIDIITGALAGTANKTLLAWAKEHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_68:-22.0587 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA5S,LA27H,IA205G,EA241T; +MMNPSIIKLGGVLLDSEEALERLFSAHVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLGEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +TQLPALFNGMPMGTRILA +>1gs5_Repair_69:-25.0557 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA43H,LA176S,VA182M,IA215L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHHGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADSILLS +DMSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMLVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-26.666 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA56E,LA102Q,DA152W,AA221V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLELPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGQFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTWEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAVLDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-8.88878 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25C,IA76C,PA143Y,AA194T; +MMNPLIIKLGGVLLDSEEALERLFCALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDICTGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLYVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRITEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:-26.184 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA72L,TA87G,LA176C,FA247V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADLIDIITGALAGTANKGLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADCILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALVNGMPMGTRILA +>1gs5_Repair_73:-34.215 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA83L,EA118W,TA166M,LA186D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGLANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEWLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAAMALAATLGADLILLS +DVSGIDDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-31.8814 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22L,EA32S,TA113C,LA124T; +MMNPLIIKLGGVLLDSEEALELLFSALVNYRSSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVCQLDEELG +HVGTAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_75:-22.3095 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28Q,GA107V,VA122I,EA195Q; +MMNPLIIKLGGVLLDSEEALERLFSALQNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDVDSVKVTQLDEELG +HIGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAQMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-33.1636 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA29Q,GA78H,QA163A,TA211M; +MMNPLIIKLGGVLLDSEEALERLFSALVQYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITHALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADAAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIMDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_77:-22.9515 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34I,TA151S,AA201Y,AA235D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESIQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVSDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKYEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIDSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_78:-24.891 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA53V,LA65G,EA118T,GA190I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMVGLNLPVK +KKNGGRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDETLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKIQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_79:-15.5479 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9R,PA143R,LA178F,PA244M; +MMNPLIIKRGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLRVVSSIGVTDEGQLMNVNADQAATALAATLGADLIFLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLMALFNGMPMGTRILA +>1gs5_Repair_80:-19.4959 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30S,EA32V,EA118C,MA157P; +MMNPLIIKLGGVLLDSEEALERLFSALVNSRVSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDECLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLPNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-8.2002 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA48C,GA120H,AA167P,LA246W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVCDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELH +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATPLAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPAWFNGMPMGTRILA +>1gs5_Repair_82:-30.7802 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9V,VA100R,SA109A,LA124D; +MMNPLIIKVGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAARGLFLGDGDAVKVTQLDEELG +HVGDAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_83:-23.486 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36L,AA84Q,AA99P,IA256P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQLPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTQNKTLLAWAKKHQIAPVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRPLA +>1gs5_Repair_84:-25.9486 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28N,TA171C,MA214I,AA258F; +MMNPLIIKLGGVLLDSEEALERLFSALNNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAACLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGIIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILF +>1gs5_Repair_85:-34.5499 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3E,TA77V,TA151P,TA211E; +MMEPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIIVGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVPDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIEDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-25.6012 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA88N,GA188C,LA222E,AA224T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTNLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDCKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAEDTARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_87:-0.646233 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36N,EA50T,GA149W,GA213E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQNPLVIVHGGGCVVDTLMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIWVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDEMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-27.35 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA37H,AA201W,MA214G,AA235M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRHLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKWEQLIEQGIITDGGIVKVNAALDAARTLGRPVDIMSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-20.5839 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA96M,PA143D,DA152K,AA161F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHMIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLDVVSSIGVTKEGQLMNVNFDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_90:-26.2285 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA54C,IA76T,KA94Q,GA154T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKCLNLPVK +KKNGLRVTPADQIDITTGALAGTANKTLLAWAKQHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDETQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_91:-25.5755 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58T,VA100S,LA178S,SA180V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLTVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAASGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLISLV +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-12.1761 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA68Q,GA107R,AA167K,EA206M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVQPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDRDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATKLAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIMQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_93:-28.7234 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12G,LA104C,IA205M,IA210S; +MMNPLIIKLGGGLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFCGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLMEQGISTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_94:-33.0391 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33N,QA35V,KA62Q,AA81Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRENHVRPLVIVHGGGCVVDELMKGLNLPVK +KQNGLRVTPADQIDIITGALQGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_95:-30.6326 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26R,GA54D,KA60D,LA222V; +MMNPLIIKLGGVLLDSEEALERLFSRLVNYRESHQRPLVIVHGGGCVVDELMKDLNLPVD +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAVDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-25.8208 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA75T,AA98T,GA107A,AA201E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDTITGALAGTANKTLLAWAKKHQITAVGLFLGDADSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKEEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-25.1898 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24G,RA36P,LA65T,DA181C; +MMNPLIIKLGGVLLDSEEALERLGSALVNYRESHQPPLVIVHGGGCVVDELMKGLNLPVK +KKNGTRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +CVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-33.0371 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22K,EA50T,VA59H,AA161G; +MMNPLIIKLGGVLLDSEEALEKLFSALVNYRESHQRPLVIVHGGGCVVDTLMKGLNLPHK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNGDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_99:-23.0416 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA187H,IA210K,AA235K,LA257Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILHGKGQRIAEMTAAKAEQLIEQGIKTDGMIVKVNAALDAARTLGRPVDIKSWRHA +EQLPALFNGMPMGTRIQA +>1gs5_Repair_100:-29.1645 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36C,LA51C,AA92N,KA111S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQCPLVIVHGGGCVVDECMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWNKKHQIAAVGLFLGDGDSVSVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_1:-28.1672 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA85R,FA103E,DA152I,NA160E,LA172A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTARKTLLAWAKKHQIAAVGLELGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTIEGQLMNVEADQAATALAATAGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-26.7995 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA132Q,GA173R,EA206F,IA215V,VA232F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKQINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLRADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIFQGIITDGMVVKVNAALDAARTLGRPFDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-34.3816 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16F,EA18F,HA42L,QA203G,TA227C; +MMNPLIIKLGGVLLDFEFALERLFSALVNYRESHQRPLVIVLGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEGLIEQGIITDGMIVKVNAALDAARCLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-29.5912 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA55Y,LA65T,DA74C,QA155K,NA158S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGYNLPVK +KKNGTRVTPADQICIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGKLMSVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_5:-12.3229 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA20F,LA65D,DA71P,GA123N,LA186D; +MMNPLIIKLGGVLLDSEEAFERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGDRVTPAPQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVNLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGIDDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_6:-25.2881 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13M,GA43N,KA94A,LA136S,MA214Q; +MMNPLIIKLGGVMLDSEEALERLFSALVNYRESHQRPLVIVHNGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKAHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSSLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGQIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA 
+>1gs5_Repair_7:-18.2407 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35T,LA80F,KA86M,AA125R,LA204S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHTRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAFAGTANMTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLRQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQSIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:0.08031 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50G,LA51F,VA110H,TA171H,AA194I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDGFMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSHKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAHLGADLILLS +DVSGILDGKGQRIIEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-30.342 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA131P,NA139P,TA166I,SA236H,MA250Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPPLINSLLEPGYLPVVSSIGVTDEGQLMNVNADQAAIALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAHWRHA +EQLPALFNGQPMGTRILA +>1gs5_Repair_10:-22.1944 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA114V,TA197K,GA208F,IA256P,LA257H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTVLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMKAAKAEQLIEQFIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRPHA +>1gs5_Repair_11:-27.5345 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65Y,DA74S,DA181K,TA197C,LA204C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGYRVTPADQISIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +KVSGILDGKGQRIAEMCAAKAEQCIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA 
+EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-25.9062 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41D,DA106R,VA145L,GA229R,VA232L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIDHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGRGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVLSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLRRPLDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_13:-32.607 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34V,EA117L,AA161E,VA216K,VA232I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESVQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDLELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNEDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIKKVNAALDAARTLGRPIDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:13.6963 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25P,LA176Q,AA201P,QA207D,GA253F; +MMNPLIIKLGGVLLDSEEALERLFPALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADQILLS +DVSGILDGKGQRIAEMTAAKPEQLIEDGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMFTRILA +>1gs5_Repair_15:-26.6592 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58Y,TA83C,SA236I,PA244T,LA246E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLYVK +KKNGLRVTPADQIDIITGALAGCANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAIWRHA +EQLTAEFNGMPMGTRILA +>1gs5_Repair_16:-22.9232 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15Y,IA73W,IA148W,NA160A,TA171V; +MMNPLIIKLGGVLLYSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQWDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSWGVTDEGQLMNVAADQAATALAAVLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_17:-25.6859 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA47Y,LA80W,GA120L,LA136K,KA217I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCYVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAWAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELL +HVGLAQPGSPKLINSKLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVIVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_18:-26.9763 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA108Q,EA117K,DA223G,GA229E,GA249E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGQSVKVTQLDKELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALGAARTLERPVDIASWRHA +EQLPALFNEMPMGTRILA +>1gs5_Repair_19:-24.7231 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA32G,GA82D,DA108L,IA148H,DA152C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRGSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALADTANKTLLAWAKKHQIAAVGLFLGDGLSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSHGVTCEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-13.0304 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA43V,GA78L,AA90D,GA123K,TA227Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHVGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITLALAGTANKTLLDWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVKLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARYLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-26.4229 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49S,LA104P,VA145A,SA183M,LA186H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVSELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFPGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVASSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVMGIHDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_22:-26.3611 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18L,KA53E,TA87P,KA94T,AA240H; +MMNPLIIKLGGVLLDSELALERLFSALVNYRESHQRPLVIVHGGGCVVDELMEGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKPLLAWAKTHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHH +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-25.0774 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6P,LA102W,VA110I,DA181E,VA182G; +MMNPLPIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGWFLGDGDSIKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +EGSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-23.242 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4H,QA191H,IA205M,IA209Y,MA252H; +MMNHLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGHRIAEMTAAKAEQLMEQGYITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPHGTRILA +>1gs5_Repair_25:-29.1638 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22A,LA55S,RA66L,IA76Q,KA200T; +MMNPLIIKLGGVLLDSEEALEALFSALVNYRESHQRPLVIVHGGGCVVDELMKGSNLPVK +KKNGLLVTPADQIDIQTGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAATAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-29.5841 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8I,VA39T,VA47I,EA138P,IA215E; +MMNPLIIILGGVLLDSEEALERLFSALVNYRESHQRPLTIVHGGGCIVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLPNGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMEVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_27:-26.3491 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA52N,QA72K,AA169R,IA177R,NA219Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELNKGLNLPVK +KKNGLRVTPADKIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALRATLGADLRLLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVYAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_28:-27.2295 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9E,KA60M,KA189P,QA203F,WA237G; +MMNPLIIKEGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVM +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGPGQRIAEMTAAKAEFLIEQGIITDGMIVKVNAALDAARTLGRPVDIASGRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_29:-17.4855 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25M,WA91C,SA109R,GA123C,LA168C; +MMNPLIIKLGGVLLDSEEALERLFMALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLACAKKHQIAAVGLFLGDGDRVKVTQLDEELG +HVCLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATACAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-30.2377 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25H,LA57I,AA92Y,FA103L,LA243Q; +MMNPLIIKLGGVLLDSEEALERLFHALVNYRESHQRPLVIVHGGGCVVDELMKGLNIPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWYKKHQIAAVGLLLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQQPALFNGMPMGTRILA +>1gs5_Repair_31:-28.54 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA11C,SA33M,QA126M,LA136E,VA182Q; 
+MMNPLIIKLGCVLLDSEEALERLFSALVNYREMHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAMPGSPKLINSELENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DQSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_32:-18.1952 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8C,VA110S,LA156G,AA174L,LA179S; +MMNPLIICLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSSKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQGMNVNADQAATALAATLGLDLILSS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-30.9038 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8S,NA85V,VA112T,SA135D,AA198R; +MMNPLIISLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAVKTLLAWAKKHQIAAVGLFLGDGDSVKTTQLDEELG +HVGLAQPGSPKLINDLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTRAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-32.7446 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27I,QA35M,LA57M,NA158T,DA175T; +MMNPLIIKLGGVLLDSEEALERLFSAIVNYRESHMRPLVIVHGGGCVVDELMKGLNMPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMTVNADQAATALAATLGATLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-17.1975 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA72G,GA128N,TA166D,KA189Y,EA206H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADGIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPNSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAADALAATLGADLILLS +DVSGILDGYGQRIAEMTAAKAEQLIHQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-31.3103 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15K,SA33K,FA103I,KA131F,GA249I; +MMNPLIIKLGGVLLKSEEALERLFSALVNYREKHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLILGDGDSVKVTQLDEELG +HVGLAQPGSPFLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNIMPMGTRILA +>1gs5_Repair_37:-12.7223 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA105P,LA115G,NA160C,VA218H,IA234S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLPDGDSVKVTQGDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVCADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKHNAALDAARTLGRPVDSASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-26.1989 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA88Q,QA126R,GA149A,GA208D,IA234L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTQLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLARPGSPKLINSLLENGYLPVVSSIAVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQDIITDGMIVKVNAALDAARTLGRPVDLASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-27.2985 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42L,QA163A,DA212R,GA229V,NA248E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVLGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADAAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITRGMIVKVNAALDAARTLVRPVDIASWRHA +EQLPALFEGMPMGTRILA +>1gs5_Repair_40:-28.4541 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9P,VA12L,KA62F,NA160K,DA233Y; +MMNPLIIKPGGLLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KFNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVKADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVYIASWRHA +EQLPALFNGMPMGTRILA 
+>1gs5_Repair_41:-22.9947 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22T,GA44N,KA62M,LA80C,LA176V; +MMNPLIIKLGGVLLDSEEALETLFSALVNYRESHQRPLVIVHGNGCVVDELMKGLNLPVK +KMNGLRVTPADQIDIITGACAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADVILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-9.81459 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18W,DA74L,AA174S,AA225Y,EA241R; +MMNPLIIKLGGVLLDSEWALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQILIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGSDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAYRTLGRPVDIASWRHA +RQLPALFNGMPMGTRILA +>1gs5_Repair_43:-25.928 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6H,NA29G,HA34T,SA129P,NA139D; +MMNPLHIKLGGVLLDSEEALERLFSALVGYRESTQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGPPKLINSLLEDGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-25.0765 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23S,AA84M,QA155V,EA195K,MA214Q; +MMNPLIIKLGGVLLDSEEALERSFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTMNKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGVLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAKMTAAKAEQLIEQGIITDGQIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:-19.1196 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28P,WA91S,SA146T,VA150H,AA221I; +MMNPLIIKLGGVLLDSEEALERLFSALPNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLASAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVTSIGHTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAILDAARTLGRPVDIASWRHA 
+EQLPALFNGMPMGTRILA +>1gs5_Repair_46:-29.2438 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24Y,NA56Y,LA88K,VA182I,LA186C; +MMNPLIIKLGGVLLDSEEALERLYSALVNYRESHQRPLVIVHGGGCVVDELMKGLYLPVK +KKNGLRVTPADQIDIITGALAGTANKTKLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DISGICDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_47:-27.8132 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21S,FA24A,SA33C,QA114M,NA139A; +MMNPLIIKLGGVLLDSEEALSRLASALVNYRECHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTMLDEELG +HVGLAQPGSPKLINSLLEAGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-29.3351 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8H,AA19S,EA21A,KA111S,GA213W; +MMNPLIIHLGGVLLDSEESLARLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVSVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDWMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-29.5429 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA48N,AA81C,AA90F,KA111D,GA213Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVNDELMKGLNLPVK +KKNGLRVTPADQIDIITGALCGTANKTLLFWAKKHQIAAVGLFLGDGDSVDVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDQMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-24.9631 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9T,EA21V,VA47P,EA202M,IA256K; +MMNPLIIKTGGVLLDSEEALVRLFSALVNYRESHQRPLVIVHGGGCPVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAMQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRKLA +>1gs5_Repair_51:-24.7714 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21S,DA71M,MA157C,LA178A,GA208V; +MMNPLIIKLGGVLLDSEEALSRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPAMQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLCNVNADQAATALAATLGADLIALS +DVSGILDGKGQRIAEMTAAKAEQLIEQVIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-1.21452 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24E,PA130Q,SA146Y,LA222S,MA250I; +MMNPLIIKLGGVLLDSEEALERLESALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSQKLINSLLENGYLPVVYSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAASDAARTLGRPVDIASWRHA +EQLPALFNGIPMGTRILA +>1gs5_Repair_53:-19.7391 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10A,VA47H,KA53Q,AA99R,QA242P; +MMNPLIIKLAGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCHVDELMQGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIARVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EPLPALFNGMPMGTRILA +>1gs5_Repair_54:11.0616 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62V,DA106G,VA112Y,QA114E,SA146Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KVNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGGGDSVKYTELDEELG +HVGLAQPGSPKLINSLLENGYLPVVYSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_55:-18.3013 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24D,LA65V,KA94S,VA122P,KA217S; +MMNPLIIKLGGVLLDSEEALERLDSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGVRVTPADQIDIITGALAGTANKTLLAWAKSHQIAAVGLFLGDGDSVKVTQLDEELG 
+HPGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVSVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-23.1207 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10T,GA11C,RA22L,DA187C,PA244V; +MMNPLIIKLTCVLLDSEEALELLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILCGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLVALFNGMPMGTRILA +>1gs5_Repair_57:-10.9297 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8Q,LA9Y,PA143W,DA162N,LA176I; +MMNPLIIQYGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLWVVSSIGVTDEGQLMNVNANQAATALAATLGADIILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:-12.6677 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA105Y,GA107P,GA149V,DA152Y,EA241D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLYDPDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIVVTYEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +DQLPALFNGMPMGTRILA +>1gs5_Repair_59:-26.5266 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21D,GA45P,IA148E,SA236R,MA252K; +MMNPLIIKLGGVLLDSEEALDRLFSALVNYRESHQRPLVIVHGGPCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSEGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIARWRHA +EQLPALFNGMPKGTRILA +>1gs5_Repair_60:-16.1787 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA99V,AA125R,PA127H,DA152Y,AA245D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAVVGLFLGDGDSVKVTQLDEELG +HVGLRQHGSPKLINSLLENGYLPVVSSIGVTYEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPDLFNGMPMGTRILA +>1gs5_Repair_61:-21.3737 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA110C,VA122P,NA160R,SA180I,LA186G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSCKVTQLDEELG +HPGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVRADQAATALAATLGADLILLI +DVSGIGDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-28.0277 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27T,DA106M,TA151F,IA215K,WA237P; +MMNPLIIKLGGVLLDSEEALERLFSATVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGMGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVFDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMKVKVNAALDAARTLGRPVDIASPRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_63:-22.8032 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28K,NA29S,LA55C,TA166Q,VA218F; +MMNPLIIKLGGVLLDSEEALERLFSALKSYRESHQRPLVIVHGGGCVVDELMKGCNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAAQALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKFNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-24.7792 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA97F,LA119N,LA168M,LA204R,DA223Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQFAAVGLFLGDGDSVKVTQLDEENG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATAMAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQRIEQGIITDGMIVKVNAALQAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-26.0616 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30F,VA48Y,LA57P,LA136F,NA248S; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNFRESHQRPLVIVHGGGCVYDELMKGLNPPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSFLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFSGMPMGTRILA +>1gs5_Repair_66:-21.3666 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6K,AA70R,PA130S,VA144K,MA214H; +MMNPLKIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPRDQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSSKLINSLLENGYLPKVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGHIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:-27.6591 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2T,GA11A,EA117P,AA161T,MA250G; +MTNPLIIKLGAVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDPELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNTDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGGPMGTRILA +>1gs5_Repair_68:-26.9165 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA146G,TA166W,LA179N,KA189V,EA195C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVGSIGVTDEGQLMNVNADQAAWALAATLGADLILNS +DVSGILDGVGQRIACMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_69:-31.1724 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17H,CA46D,VA47Q,QA96T,TA166E; +MMNPLIIKLGGVLLDSHEALERLFSALVNYRESHQRPLVIVHGGGDQVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHTIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAAEALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-6.27847 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41D,GA128Y,IA193F,GA208L,DA223C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIDHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPYSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRFAEMTAAKAEQLIEQLIITDGMIVKVNAALCAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-15.4409 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA87M,DA116A,GA128L,PA143S,DA162N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKMLLAWAKKHQIAAVGLFLGDGDSVKVTQLAEELG +HVGLAQPLSPKLINSLLENGYLSVVSSIGVTDEGQLMNVNANQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:1.34533 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30R,GA54D,SA180A,GA184H,MA214S; +MMNPLIIKLGGVLLDSEEALERLFSALVNRRESHQRPLVIVHGGGCVVDELMKDLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLA +DVSHILDGKGQRIAEMTAAKAEQLIEQGIITDGSIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-30.1418 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8R,QA72V,TA77H,IA148A,DA212A; +MMNPLIIRLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADVIDIIHGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSAGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITAGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-28.9862 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA52I,KA60R,PA69H,SA135K,NA160T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELIKGLNLPVR +KKNGLRVTHADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINKLLENGYLPVVSSIGVTDEGQLMNVTADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA 
+>1gs5_Repair_75:-22.0838 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2H,NA85V,DA187Q,VA218H,RA230Y; +MHNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAVKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILQGKGQRIAEMTAAKAEQLIEQGIITDGMIVKHNAALDAARTLGYPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-17.1291 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15K,GA82H,LA132P,GA149Q,IA193C; +MMNPLIIKLGGVLLKSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAHTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKPINSLLENGYLPVVSSIQVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRCAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_77:-26.298 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7C,LA23M,NA56K,LA179T,EA241K; +MMNPLICKLGGVLLDSEEALERMFSALVNYRESHQRPLVIVHGGGCVVDELMKGLKLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILTS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +KQLPALFNGMPMGTRILA +>1gs5_Repair_78:-29.0275 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16V,PA127R,EA153F,GA190F,NA219C; +MMNPLIIKLGGVLLDVEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQRGSPKLINSLLENGYLPVVSSIGVTDFGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKFQRIAEMTAAKAEQLIEQGIITDGMIVKVCAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_79:-27.4401 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9C,VA12Y,MA157C,AA164G,IA205S; +MMNPLIIKCGGYLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLCNVNADQGATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLSEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA 
+EQLPALFNGMPMGTRILA +>1gs5_Repair_80:-16.857 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA11P,LA20S,IA76T,TA77E,MA157T; +MMNPLIIKLGPVLLDSEEASERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDITEGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLTNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-16.675 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA116P,AA167P,LA176C,IA185Y,GA249M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLPEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATPLAATLGADCILLS +DVSGYLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNMMPMGTRILA +>1gs5_Repair_82:-31.0566 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9V,EA32R,IA76A,KA93D,NA134M; +MMNPLIIKVGGVLLDSEEALERLFSALVNYRRSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIATGALAGTANKTLLAWADKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIMSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_83:-24.8908 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8I,RA36Q,AA84P,AA99P,IA256K; +MMNPLIIILGGVLLDSEEALERLFSALVNYRESHQQPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTPNKTLLAWAKKHQIAPVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRKLA +>1gs5_Repair_84:-17.6976 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12M,AA99S,LA104N,LA179Q,IA234W; +MMNPLIIKLGGMLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIASVGLFNGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILQS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDWASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-16.5148 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA44I,SA183V,IA205F,IA215Y,LA222P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGIGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVVGILDGKGQRIAEMTAAKAEQLFEQGIITDGMYVKVNAAPDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-26.3497 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25M,QA35E,PA69I,EA153I,LA172D; +MMNPLIIKLGGVLLDSEEALERLFMALVNYRESHERPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTIADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDIGQLMNVNADQAATALAATDGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_87:7.07756 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA134E,GA184F,MA196G,AA198F,WA237Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIESLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSFILDGKGQRIAEGTFAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASQRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-21.2246 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50A,NA63Q,AA81G,SA147K,GA253S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDALMKGLNLPVK +KKQGLRVTPADQIDIITGALGGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSKIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMSTRILA +>1gs5_Repair_89:-26.0954 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30A,GA105D,SA180A,RA192G,EA241S; +MMNPLIIKLGGVLLDSEEALERLFSALVNARESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLDDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLA +DVSGILDGKGQGIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +SQLPALFNGMPMGTRILA +>1gs5_Repair_90:-29.9909 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3W,VA48L,PA130M,TA151N,AA235P; +MMWPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVLDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSMKLINSLLENGYLPVVSSIGVNDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIPSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_91:-27.9831 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18T,YA30E,GA54H,DA74A,LA179F; +MMNPLIIKLGGVLLDSETALERLFSALVNERESHQRPLVIVHGGGCVVDELMKHLNLPVK +KKNGLRVTPADQIAIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILFS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-15.1423 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31Q,HA42E,GA44H,EA50L,QA191T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYQESHQRPLVIVEGHGCVVDLLMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGTRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_93:-19.2824 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17Q,KA111I,GA120V,DA223P,RA230K; +MMNPLIIKLGGVLLDSQEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVIVTQLDEELV +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALPAARTLGKPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_94:-30.5766 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA14R,QA35E,PA37F,TA87S,RA238T; +MMNPLIIKLGGVLRDSEEALERLFSALVNYRESHERFLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKSLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWTHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_95:-25.1015 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33L,TA83A,EA118P,LA228Y,VA232A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRELHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGAANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEPLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTYGRPADIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-25.1305 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27R,HA34Q,KA93D,AA221I,AA235M; +MMNPLIIKLGGVLLDSEEALERLFSARVNYRESQQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWADKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAILDAARTLGRPVDIMSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-21.4791 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA48N,VA59N,GA107T,SA236Q,LA257R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVNDELMKGLNLPNK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDTDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAQWRHA +EQLPALFNGMPMGTRIRA +>1gs5_Repair_98:-30.9773 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36C,VA47M,DA74R,DA212W,PA244A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQCPLVIVHGGGCMVDELMKGLNLPVK +KKNGLRVTPADQIRIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITWGMIVKVNAALDAARTLGRPVDIASWRHA +EQLAALFNGMPMGTRILA +>1gs5_Repair_99:-18.5895 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36Q,LA38R,GA120V,VA159A,RA192M; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQQPRVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELV +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNANADQAATALAATLGADLILLS +DVSGILDGKGQMIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-29.9879 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA40V,DA49E,NA139Q,AA201H,DA223F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVVVHGGGCVVEELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLEQGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKHEQLIEQGIITDGMIVKVNAALFAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_1:-16.2248 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36K,IA185N,DA187N,VA218W,AA235E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQKPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGNLNGKGQRIAEMTAAKAEQLIEQGIITDGMIVKWNAALDAARTLGRPVDIESWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-32.886 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA92Q,SA135Q,DA223I,RA226I,PA231E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWQKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINQLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALIAAITLGREVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-19.5906 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10H,KA61A,KA62T,AA161N,IA215G; +MMNPLIIKLHGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +ATNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNNDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMGVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-20.0813 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18V,EA118K,VA182D,GA188S,GA253M; +MMNPLIIKLGGVLLDSEVALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEKLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DDSGILDSKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMMTRILA +>1gs5_Repair_5:-21.007 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7S,IA177T,DA187E,NA219W,GA249L; +MMNPLISKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLTLLS +DVSGILEGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVWAALDAARTLGRPVDIASWRHA +EQLPALFNLMPMGTRILA +>1gs5_Repair_6:-27.0883 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28N,AA84V,AA164G,IA185K,QA203V; +MMNPLIIKLGGVLLDSEEALERLFSALNNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTVNKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQGATALAATLGADLILLS +DVSGKLDGKGQRIAEMTAAKAEVLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_7:-26.5689 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49Y,NA160A,AA164G,TA197D,AA225K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVYELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVAADQGATALAATLGADLILLS +DVSGILDGKGQRIAEMDAAKAEQLIEQGIITDGMIVKVNAALDAKRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:-26.1628 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15H,NA63L,LA88N,LA104N,TA211C; +MMNPLIIKLGGVLLHSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKLGLRVTPADQIDIITGALAGTANKTNLAWAKKHQIAAVGLFNGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIICDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA 
+>1gs5_Repair_9:-27.4735 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA103G,GA190S,EA195M,TA197M,TA211I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLGLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKSQRIAMMMAAKAEQLIEQGIIIDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_10:-27.19 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30V,SA109R,LA119I,EA195M,IA215R; +MMNPLIIKLGGVLLDSEEALERLFSALVNVRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDRVKVTQLDEEIG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAMMTAAKAEQLIEQGIITDGMRVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-30.7658 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA180E,DA187Y,KA217C,DA223W,AA258C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLE +DVSGILYGKGQRIAEMTAAKAEQLIEQGIITDGMIVCVNAALWAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILC +>1gs5_Repair_12:-34.8769 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15L,SA16L,EA21W,HA121M,EA241Q; +MMNPLIIKLGGVLLLLEEALWRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +MVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +QQLPALFNGMPMGTRILA +>1gs5_Repair_13:-19.4695 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7N,FA24G,WA91E,AA98D,HA121G; +MMNPLINKLGGVLLDSEEALERLGSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAEAKKHQIDAVGLFLGDGDSVKVTQLDEELG +GVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA 
+EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-32.2636 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA132I,NA134V,SA183D,IA193M,PA231M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKIIVSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVDGILDGKGQRMAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRMVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_15:-25.3398 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA29F,LA57C,QA191Y,MA214E,AA225M; +MMNPLIIKLGGVLLDSEEALERLFSALVFYRESHQRPLVIVHGGGCVVDELMKGLNCPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGYRIAEMTAAKAEQLIEQGIITDGEIVKVNAALDAMRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_16:-21.5547 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17T,GA208K,NA219P,AA245V,FA247N; +MMNPLIIKLGGVLLDSTEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQKIITDGMIVKVPAALDAARTLGRPVDIASWRHA +EQLPVLNNGMPMGTRILA +>1gs5_Repair_17:-16.6805 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31V,VA144F,SA147A,AA165V,GA253L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYVESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPFVSAIGVTDEGQLMNVNADQAVTALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMLTRILA +>1gs5_Repair_18:-15.6277 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31F,GA123M,YA141T,SA180Q,EA202D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYFESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVMLAQPGSPKLINSLLENGTLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLQ 
+DVSGILDGKGQRIAEMTAAKADQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_19:23.5818 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35C,GA44I,TA151E,IA177V,GA184Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHCRPLVIVHGIGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVEDEGQLMNVNADQAATALAATLGADLVLLS +DVSYILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-27.9805 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27G,GA54V,LA132A,RA230S,DA233E; +MMNPLIIKLGGVLLDSEEALERLFSAGVNYRESHQRPLVIVHGGGCVVDELMKVLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKAINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGSPVEIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-30.6777 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22Q,TA83S,VA100N,YA141E,QA203L; +MMNPLIIKLGGVLLDSEEALEQLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGSANKTLLAWAKKHQIAANGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGELPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAELLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_22:8.70522 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:WA91F,HA95E,AA221V,RA230H,GA253Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAFAKKEQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAVLDAARTLGHPVDIASWRHA +EQLPALFNGMPMYTRILA +>1gs5_Repair_23:-30.7491 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA131M,VA150S,NA160I,AA220R,DA233W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPMLINSLLENGYLPVVSSIGSTDEGQLMNVIADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNRALDAARTLGRPVWIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-28.5437 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9Y,SA25A,GA44A,NA139S,RA255N; +MMNPLIIKYGGVLLDSEEALERLFAALVNYRESHQRPLVIVHGAGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLESGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTNILA +>1gs5_Repair_25:-22.0465 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10N,IA75P,PA130E,AA167T,GA229E; +MMNPLIIKLNGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDPITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSEKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATTLAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLERPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-26.1072 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA51Q,EA118V,SA146M,LA222H,LA243Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDEQMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEVLG +HVGLAQPGSPKLINSLLENGYLPVVMSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAHDAARTLGRPVDIASWRHA +EQYPALFNGMPMGTRILA +>1gs5_Repair_27:-17.1244 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4Y,KA61N,GA123S,IA177H,TA254A; +MMNYLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +NKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVSLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLHLLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGARILA +>1gs5_Repair_28:-12.4909 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA120A,LA178T,PA231G,LA243E,IA256Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELA +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLITLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRGVDIASWRHA +EQEPALFNGMPMGTRYLA +>1gs5_Repair_29:-26.2885 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA63R,GA101Q,VA110C,LA136E,AA161Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKRGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVQLFLGDGDSCKVTQLDEELG +HVGLAQPGSPKLINSELENGYLPVVSSIGVTDEGQLMNVNQDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-26.4395 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA32T,AA70M,LA102H,LA104N,TA197E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRTSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPMDQIDIITGALAGTANKTLLAWAKKHQIAAVGHFNGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMEAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-31.6076 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49I,GA105L,DA108W,LA228F,LA257N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVIELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLLDGWSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTFGRPVDIASWRHA +EQLPALFNGMPMGTRINA +>1gs5_Repair_32:-29.9753 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA71S,GA78V,NA134P,SA147L,EA206R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPASQIDIITVALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIPSLLENGYLPVVSLIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIRQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-14.7597 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA11I,YA30Q,TA68K,TA197V,KA200R; 
+MMNPLIIKLGIVLLDSEEALERLFSALVNQRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVKPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMVAARAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-24.9292 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26N,VA59S,LA119Q,EA153Q,QA155P; +MMNPLIIKLGGVLLDSEEALERLFSNLVNYRESHQRPLVIVHGGGCVVDELMKGLNLPSK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEEQG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDQGPLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-26.8692 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA87K,IA133G,TA151R,LA172I,IA210L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKKLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLGNSLLENGYLPVVSSIGVRDEGQLMNVNADQAATALAATIGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGILTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-18.9746 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA40N,KA60L,GA128E,IA148M,KA189W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVNVHGGGCVVDELMKGLNLPVL +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPESPKLINSLLENGYLPVVSSMGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGWGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_37:-23.1198 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA82R,IA177H,GA190H,AA194W,KA217Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALARTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLHLLS +DVSGILDGKHQRIWEMTAAKAEQLIEQGIITDGMIVYVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:-30.2711 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15S,GA54V,GA82P,GA101Y,RA192F; +MMNPLIIKLGGVLLSSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKVLNLPVK +KKNGLRVTPADQIDIITGALAPTANKTLLAWAKKHQIAAVYLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQFIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:-21.7619 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36P,SA109K,PA244A,GA249P,GA253A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQPPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDKVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLAALFNPMPMATRILA +>1gs5_Repair_40:-15.5711 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19R,SA146Q,QA203N,LA246V,FA247E; +MMNPLIIKLGGVLLDSEERLERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVQSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAENLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPAVENGMPMGTRILA +>1gs5_Repair_41:-24.0846 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA82A,KA111I,KA200A,AA224E,RA230M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAATANKTLLAWAKKHQIAAVGLFLGDGDSVIVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAAAEQLIEQGIITDGMIVKVNAALDEARTLGMPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-25.7279 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA106R,SA109L,VA159K,DA233G,MA250Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGRGDLVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNKNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVGIASWRHA +EQLPALFNGQPMGTRILA 
+>1gs5_Repair_43:-29.5981 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28C,DA175F,KA189L,GA190K,EA202S; +MMNPLIIKLGGVLLDSEEALERLFSALCNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAFLILLS +DVSGILDGLKQRIAEMTAAKASQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-2.65304 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35P,AA81K,GA107W,LA204P,LA228Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHPRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALKGTANKTLLAWAKKHQIAAVGLFLGDWDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQPIEQGIITDGMIVKVNAALDAARTQGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:-19.3979 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2A,EA18R,LA104V,VA159M,FA247P; +MANPLIIKLGGVLLDSERALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFVGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNMNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALPNGMPMGTRILA +>1gs5_Repair_46:-25.1581 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2W,GA154I,QA203V,NA248G,LA257C; +MWNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEIQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEVLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFGGMPMGTRICA +>1gs5_Repair_47:-23.5494 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA74K,HA95Q,SA129N,FA247H,GA249L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIKIITGALAGTANKTLLAWAKKQQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGNPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA 
+EQLPALHNLMPMGTRILA +>1gs5_Repair_48:-20.5083 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13W,RA22C,TA68E,RA192W,MA214Q; +MMNPLIIKLGGVWLDSEEALECLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVEPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQWIAEMTAAKAEQLIEQGIITDGQIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-24.714 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA90C,DA116A,GA120M,AA201K,DA223G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLCWAKKHQIAAVGLFLGDGDSVKVTQLAEELM +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKKEQLIEQGIITDGMIVKVNAALGAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-25.6189 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA80G,DA116W,IA209P,TA211F,NA219T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAGAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLWEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGPIFDGMIVKVTAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_51:-28.7055 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA84L,LA119I,QA126V,AA240R,LA243F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTLNKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEEIG +HVGLAVPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHR +EQFPALFNGMPMGTRILA +>1gs5_Repair_52:-23.895 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3F,NA85M,VA218Q,AA225M,RA226D; +MMFPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAMKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKQNAALDAMDTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_53:-24.0125 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10I,MA52N,AA90Y,LA137M,VA159S; +MMNPLIIKLIGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELNKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLYWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLMENGYLPVVSSIGVTDEGQLMNSNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_54:-25.3049 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34A,VA47S,WA91V,HA95Q,IA185A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESAQRPLVIVHGGGCSVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAVAKKQQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGALDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_55:-23.7247 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41S,EA50P,NA63I,TA83A,AA225T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVISHGGGCVVDPLMKGLNLPVK +KKIGLRVTPADQIDIITGALAGAANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDATRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-23.0716 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10K,LA132C,VA182M,EA206V,RA255E; +MMNPLIIKLKGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKCINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DMSGILDGKGQRIAEMTAAKAEQLIVQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTEILA +>1gs5_Repair_57:-19.6319 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA29I,GA43T,NA219S,AA224N,IA234R; +MMNPLIIKLGGVLLDSEEALERLFSALVIYRESHQRPLVIVHTGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVSAALDNARTLGRPVDRASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:-24.3861 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA55C,VA122G,AA220T,EA241M,LA257V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGCNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HGGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNTALDAARTLGRPVDIASWRHA +MQLPALFNGMPMGTRIVA +>1gs5_Repair_59:-27.6696 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25Q,LA156M,NA158S,GA249V,LA257K; +MMNPLIIKLGGVLLDSEEALERLFQALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQMMSVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNVMPMGTRIKA +>1gs5_Repair_60:-22.3717 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16A,LA20D,LA38K,LA115D,IA215K; +MMNPLIIKLGGVLLDAEEADERLFSALVNYRESHQRPKVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQDDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMKVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-28.5486 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6E,VA67S,IA215M,DA233I,PA251I; +MMNPLEIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRSTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMMVKVNAALDAARTLGRPVIIASWRHA +EQLPALFNGMIMGTRILA +>1gs5_Repair_62:-7.57806 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA67I,VA122C,GA123D,LA168T,PA244A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRITPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HCDLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATATAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLAALFNGMPMGTRILA +>1gs5_Repair_63:-23.7885 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA127A,KA131A,LA137V,DA162K,KA189R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQAGSPALINSLVENGYLPVVSSIGVTDEGQLMNVNAKQAATALAATLGADLILLS +DVSGILDGRGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-30.0452 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA70T,FA103D,EA118T,PA130D,TA211W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPTDQIDIITGALAGTANKTLLAWAKKHQIAAVGLDLGDGDSVKVTQLDETLG +HVGLAQPGSDKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIWDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-2.08457 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:CA46K,GA123A,AA169W,DA187T,TA227D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGKVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVALAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALWATLGADLILLS +DVSGILTGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARDLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_66:-28.2949 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30W,DA49F,DA74K,FA103A,SA147G; +MMNPLIIKLGGVLLDSEEALERLFSALVNWRESHQRPLVIVHGGGCVVFELMKGLNLPVK +KKNGLRVTPADQIKIITGALAGTANKTLLAWAKKHQIAAVGLALGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSGIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:-23.101 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9K,LA156C,AA169I,VA182G,MA214G; 
+MMNPLIIKKGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQCMNVNADQAATALIATLGADLILLS +DGSGILDGKGQRIAEMTAAKAEQLIEQGIITDGGIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_68:-23.9875 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA54C,GA78P,LA102H,TA171E,DA233I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKCLNLPVK +KKNGLRVTPADQIDIITPALAGTANKTLLAWAKKHQIAAVGHFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAELGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVIIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_69:-9.08198 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA59I,GA149F,IA185S,AA225V,GA229K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPIK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIFVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGSLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAVRTLKRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-21.7533 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18N,SA33T,PA37M,LA89E,SA146Q; +MMNPLIIKLGGVLLDSENALERLFSALVNYRETHQRMLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLEAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVQSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-19.4801 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9G,IA73K,GA120L,DA175R,TA211V; +MMNPLIIKGGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQKDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELL +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGARLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIVDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:-26.0156 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3F,IA6P,LA38I,TA83D,GA101Y; +MMFPLPIKLGGVLLDSEEALERLFSALVNYRESHQRPIVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGDANKTLLAWAKKHQIAAVYLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-12.9341 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19D,LA57P,EA117L,AA165Q,LA179D; +MMNPLIIKLGGVLLDSEEDLERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNPPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDLELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAQTALAATLGADLILDS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-24.473 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA73M,IA75Q,LA142K,QA191I,RA226P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQMDQITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYKPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGIRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAAPTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_75:-19.8282 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA57A,VA100P,AA125N,LA168W,SA236E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNAPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAPGLFLGDGDSVKVTQLDEELG +HVGLNQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATAWAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAEWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-30.8556 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8Q,GA78L,GA101D,PA130W,AA258Q; +MMNPLIIQLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITLALAGTANKTLLAWAKKHQIAAVDLFLGDGDSVKVTQLDEELG +HVGLAQPGSWKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILQ 
+>1gs5_Repair_77:-11.9045 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA39G,GA64L,QA114C,IA133F,WA237L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLGIVHGGGCVVDELMKGLNLPVK +KKNLLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTCLDEELG +HVGLAQPGSPKLFNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASLRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_78:-29.0148 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA66W,AA92L,LA115S,LA156Y,GA190S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLWVTPADQIDIITGALAGTANKTLLAWLKKHQIAAVGLFLGDGDSVKVTQSDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQYMNVNADQAATALAATLGADLILLS +DVSGILDGKSQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_79:-1.26271 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA20Q,GA123N,AA170T,EA202A,LA246P; +MMNPLIIKLGGVLLDSEEAQERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVNLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALATTLGADLILLS +DVSGILDGKGQRIAEMTAAKAAQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPAPFNGMPMGTRILA +>1gs5_Repair_80:-27.66 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:WA91K,VA100F,IA133G,TA211M,RA238W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAKAKKHQIAAFGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLGNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIMDGMIVKVNAALDAARTLGRPVDIASWWHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-9.6473 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA122H,EA153Y,GA184C,LA243D,LA257P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HHGLAQPGSPKLINSLLENGYLPVVSSIGVTDYGQLMNVNADQAATALAATLGADLILLS +DVSCILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA 
+EQDPALFNGMPMGTRIPA +>1gs5_Repair_82:-24.8601 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA57N,AA99C,IA133K,LA178F,GA208R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNNPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIACVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLKNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLIFLS +DVSGILDGKGQRIAEMTAAKAEQLIEQRIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_83:-8.98549 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65N,AA99V,AA165Y,WA237T,FA247N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGNRVTPADQIDIITGALAGTANKTLLAWAKKHQIAVVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAYTALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASTRHA +EQLPALNNGMPMGTRILA +>1gs5_Repair_84:-19.1682 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA51H,KA93F,LA102C,QA126P,AA225L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDEHMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAFKHQIAAVGCFLGDGDSVKVTQLDEELG +HVGLAPPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDALRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-25.01 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA21Y,KA60G,VA100M,VA122D,LA178R; +MMNPLIIKLGGVLLDSEEALYRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVG +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAMGLFLGDGDSVKVTQLDEELG +HDGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLIRLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-29.5708 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA14R,PA127I,SA129L,RA226T,AA245Y; +MMNPLIIKLGGVLRDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQIGLPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAATTLGRPVDIASWRHA +EQLPYLFNGMPMGTRILA +>1gs5_Repair_87:-7.17497 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41N,QA191H,EA195K,AA225W,RA238S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVINHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGHRIAKMTAAKAEQLIEQGIITDGMIVKVNAALDAWRTLGRPVDIASWSHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-18.3082 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42S,LA57T,LA89R,IA148K,GA208P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVSGGGCVVDELMKGLNTPVK +KKNGLRVTPADQIDIITGALAGTANKTLRAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSKGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQPIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-27.9839 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35D,LA136D,YA141T,QA207I,MA250L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHDRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSDLENGTLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEIGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGLPMGTRILA +>1gs5_Repair_90:-13.923 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19R,PA37F,LA115Y,GA128T,GA188R; +MMNPLIIKLGGVLLDSEERLERLFSALVNYRESHQRFLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQYDEELG +HVGLAQPTSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDRKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_91:-32.7398 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12T,FA103W,DA175V,AA199P,IA209G; +MMNPLIIKLGGTLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLWLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAVLILLS +DVSGILDGKGQRIAEMTAPKAEQLIEQGGITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-24.4422 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36P,VA122A,AA169N,NA219L,TA254S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQPPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HAGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALNATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVLAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGSRILA +>1gs5_Repair_93:-36.6147 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA14W,DA71M,NA134H,SA183F,NA248Q; +MMNPLIIKLGGVLWDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPAMQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIHSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVFGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFQGMPMGTRILA +>1gs5_Repair_94:-26.9913 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA53Y,NA56T,AA79E,QA191D,LA257R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMYGLTLPVK +KKNGLRVTPADQIDIITGELAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGDRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRIRA +>1gs5_Repair_95:-31.2346 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15F,AA98Q,NA160A,LA222K,GA249R; +MMNPLIIKLGGVLLFSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIQAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVAADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAKDAARTLGRPVDIASWRHA +EQLPALFNRMPMGTRILA +>1gs5_Repair_96:-20.3419 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA14A,PA127H,GA173L,AA240V,IA256E; +MMNPLIIKLGGVLADSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQHGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLLADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHV +EQLPALFNGMPMGTRELA +>1gs5_Repair_97:-33.3728 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35E,RA36V,VA47T,LA228F,HA239T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHEVPLVIVHGGGCTVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTFGRPVDIASWRTA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-27.3793 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA56F,RA66S,SA180Y,AA235V,WA237S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLFLPVK +KKNGLSVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLY +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIVSSRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_99:-26.7737 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12K,IA75S,PA143C,AA174P,RA238F; +MMNPLIIKLGGKLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDSITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLCVVSSIGVTDEGQLMNVNADQAATALAATLGPDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWFHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-26.7652 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA100H,EA138I,AA169N,LA222F,LA228V; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAHGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLINGYLPVVSSIGVTDEGQLMNVNADQAATALNATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAFDAARTVGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_1:-28.7747 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA85R,FA103E,DA152I,NA160E,LA172A,EA202M; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTARKTLLAWAKKHQIAAVGLELGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTIEGQLMNVEADQAATALAATAGADLILLS +DVSGILDGKGQRIAEMTAAKAMQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-24.1926 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17G,LA132R,GA173F,EA206V,IA215P,VA232I; +MMNPLIIKLGGVLLDSGEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKRINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLFADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIVQGIITDGMPVKVNAALDAARTLGRPIDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-30.7959 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16F,EA18F,HA42L,LA204Q,RA238E,MA252W; +MMNPLIIKLGGVLLDFEFALERLFSALVNYRESHQRPLVIVLGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQQIEQGIITDGMIVKVNAALDAARTLGRPVDIASWEHA +EQLPALFNGMPWGTRILA +>1gs5_Repair_4:-15.341 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65S,IA75T,TA77R,AA99F,RA226M,GA249H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGSRVTPADQIDTIRGALAGTANKTLLAWAKKHQIAFVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAAMTLGRPVDIASWRHA +EQLPALFNHMPMGTRILA +>1gs5_Repair_5:-10.8189 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA20F,LA65D,DA71P,EA117N,GA123D,LA186Y; +MMNPLIIKLGGVLLDSEEAFERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGDRVTPAPQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDNELG +HVDLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGIYDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_6:-26.3773 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13M,GA43N,KA94A,LA136S,AA161G,MA214V; +MMNPLIIKLGGVMLDSEEALERLFSALVNYRESHQRPLVIVHNGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKAHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSSLENGYLPVVSSIGVTDEGQLMNVNGDQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGVIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_7:-17.4314 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35T,LA80F,KA86M,AA125R,AA201S,LA204G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHTRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAFAGTANMTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLRQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKSEQGIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:5.68375 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50G,LA51F,VA110H,TA171H,IA193H,AA194F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDGFMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSHKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAHLGADLILLS +DVSGILDGKGQRHFEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-25.197 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA131P,NA139P,TA166I,SA236H,MA250Q,IA256F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPPLINSLLEPGYLPVVSSIGVTDEGQLMNVNADQAAIALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAHWRHA +EQLPALFNGQPMGTRFLA +>1gs5_Repair_10:-33.093 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA66V,SA135K,EA195F,AA198P,IA209H,LA222H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLVVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINKLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAFMTPAKAEQLIEQGHITDGMIVKVNAAHDAARTLGRPVDIASWRHA 
+EQLPALFNGMPMGTRILA +>1gs5_Repair_11:-22.5921 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA63S,AA98K,IA148C,DA152E,EA206G,AA225L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKSGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIKAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSCGVTEEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIGQGIITDGMIVKVNAALDALRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-16.1681 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42D,GA43R,TA171L,KA200R,VA232L,IA234L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVDRGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAALLGADLILLS +DVSGILDGKGQRIAEMTAARAEQLIEQGIITDGMIVKVNAALDAARTLGRPLDLASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_13:-24.267 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34V,EA118L,GA123C,VA145K,GA190L,SA236Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESVQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDELLG +HVCLAQPGSPKLINSLLENGYLPVKSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKLQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAQWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-4.4709 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25P,LA176Q,GA190P,AA201C,QA207F,GA253Q; +MMNPLIIKLGGVLLDSEEALERLFPALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADQILLS +DVSGILDGKPQRIAEMTAAKCEQLIEFGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMQTRILA +>1gs5_Repair_15:-30.5333 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA58Y,QA72C,IA76L,HA95T,AA161Q,WA237I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLYVK +KKNGLRVTPADCIDILTGALAGTANKTLLAWAKKTQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNQDQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASIRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_16:-20.569 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15Y,IA73W,IA148W,NA160A,TA171V,TA227D; +MMNPLIIKLGGVLLYSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQWDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSWGVTDEGQLMNVAADQAATALAAVLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARDLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_17:-23.6772 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA47Y,LA80W,GA120L,LA136K,GA190L,KA217I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCYVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAWAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELL +HVGLAQPGSPKLINSKLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKLQRIAEMTAAKAEQLIEQGIITDGMIVIVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_18:-22.1336 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA85Q,KA111L,QA155G,AA225Q,RA226Q,HA239S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAQKTLLAWAKKHQIAAVGLFLGDGDSVLVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGGLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAQQTLGRPVDIASWRSA +EQLPALFNGMPMGTRILA +>1gs5_Repair_19:-28.6869 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA32G,GA82D,DA108L,QA126I,IA148D,DA152K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRGSHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALADTANKTLLAWAKKHQIAAVGLFLGDGLSVKVTQLDEELG +HVGLAIPGSPKLINSLLENGYLPVVSSDGVTKEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:6.5998 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA43V,GA78L,AA90D,KA111L,GA123Y,TA227R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHVGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITLALAGTANKTLLDWAKKHQIAAVGLFLGDGDSVLVTQLDEELG 
+HVYLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARRLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-24.2621 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30A,GA44A,GA45K,KA62M,TA77C,PA127V; +MMNPLIIKLGGVLLDSEEALERLFSALVNARESHQRPLVIVHGAKCVVDELMKGLNLPVK +KMNGLRVTPADQIDIICGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQVGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_22:2.09002 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31H,GA64M,FA103Q,TA113F,EA117N,AA125H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYHESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNMLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLQLGDGDSVKVFQLDNELG +HVGLHQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_23:-9.36483 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6C,DA71H,VA112E,LA179G,DA223C,VA232R; +MMNPLCIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPAHQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKETQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILGS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALCAARTLGRPRDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-25.7668 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4H,LA38G,NA85M,FA103Y,VA182H,GA213A; +MMNHLIIKLGGVLLDSEEALERLFSALVNYRESHQRPGVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAMKTLLAWAKKHQIAAVGLYLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DHSGILDGKGQRIAEMTAAKAEQLIEQGIITDAMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_25:-25.7426 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18A,RA22S,LA55I,RA66G,IA76T,KA200D; +MMNPLIIKLGGVLLDSEAALESLFSALVNYRESHQRPLVIVHGGGCVVDELMKGINLPVK 
+KKNGLGVTPADQIDITTGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAADAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-9.00113 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36P,VA39E,EA50Q,TA68F,AA99L,GA140N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQPPLEIVHGGGCVVDQLMKGLNLPVK +KKNGLRVFPADQIDIITGALAGTANKTLLAWAKKHQIALVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENNYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_27:11.2869 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA59A,KA61R,AA79Y,SA109W,LA137Y,IA210A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPAK +RKNGLRVTPADQIDIITGYLAGTANKTLLAWAKKHQIAAVGLFLGDGDWVKVTQLDEELG +HVGLAQPGSPKLINSLYENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIATDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_28:-15.6429 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9E,RA31M,VA110F,TA166M,RA192H,MA196E; +MMNPLIIKEGGVLLDSEEALERLFSALVNYMESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSFKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAAMALAATLGADLILLS +DVSGILDGKGQHIAEETAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_29:-12.9865 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25M,WA91C,SA109R,GA123C,LA168C,IA210Q; +MMNPLIIKLGGVLLDSEEALERLFMALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLACAKKHQIAAVGLFLGDGDRVKVTQLDEELG +HVCLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATACAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIQTDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-35.453 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25H,LA57I,AA92Y,FA103L,DA212G,DA233T; 
+MMNPLIIKLGGVLLDSEEALERLFHALVNYRESHQRPLVIVHGGGCVVDELMKGLNIPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWYKKHQIAAVGLLLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITGGMIVKVNAALDAARTLGRPVTIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-19.9074 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA20N,QA72H,GA78K,GA154P,MA157F,GA208D; +MMNPLIIKLGGVLLDSEEANERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADHIDIITKALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEPQLFNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQDIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_32:-19.0617 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA89S,TA113A,LA115M,IA148S,AA174S,GA208P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLSAWAKKHQIAAVGLFLGDGDSVKVAQMDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSSGVTDEGQLMNVNADQAATALAATLGSDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQPIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_33:-27.7462 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28Y,LA57R,LA65R,VA182P,VA216M,LA257D; +MMNPLIIKLGGVLLDSEEALERLFSALYNYRESHQRPLVIVHGGGCVVDELMKGLNRPVK +KKNGRRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DPSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIMKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRIDA +>1gs5_Repair_34:-23.5209 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA48N,TA68S,SA135Q,DA162Y,GA208V,NA248C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVNDELMKGLNLPVK +KKNGLRVSPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINQLLENGYLPVVSSIGVTDEGQLMNVNAYQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQVIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFCGMPMGTRILA +>1gs5_Repair_35:-7.28887 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA75G,LA88Q,DA162W,AA165P,IA210S,GA229L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDGITGALAGTANKTQLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNAWQAPTALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGISTDGMIVKVNAALDAARTLLRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_36:-21.7841 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62V,NA85A,LA104Q,VA112K,VA122Y,WA237R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KVNGLRVTPADQIDIITGALAGTAAKTLLAWAKKHQIAAVGLFQGDGDSVKKTQLDEELG +HYGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASRRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_37:-21.8183 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12C,KA62C,GA107S,DA187L,PA244G,TA254M; +MMNPLIIKLGGCLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KCNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDSDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILLGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLGALFNGMPMGMRILA +>1gs5_Repair_38:-31.183 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12S,AA79M,TA113Y,PA130D,AA167E,DA223T; +MMNPLIIKLGGSLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGMLAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVYQLDEELG +HVGLAQPGSDKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATELAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALTAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_39:1.26988 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA79Y,TA87N,NA134P,TA197L,SA236T,GA253E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGYLAGTANKNLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIPSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMLAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIATWRHA +EQLPALFNGMPMETRILA +>1gs5_Repair_40:-20.1869 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA14F,MA52T,LA119S,QA126C,TA171P,KA217D; +MMNPLIIKLGGVLFDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELTKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEESG +HVGLACPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAPLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVDVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_41:-18.9484 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA39P,CA46A,GA54N,MA196Y,AA224V,PA231D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLPIVHGGGAVVDELMKNLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEYTAAKAEQLIEQGIITDGMIVKVNAALDVARTLGRDVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-10.9041 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31D,TA87H,QA126H,GA128Y,TA151S,EA195G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYDESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKHLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAHPYSPKLINSLLENGYLPVVSSIGVSDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAGMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-6.42352 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA43F,NA63C,LA136S,PA143V,SA146F,LA204T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHFGGCVVDELMKGLNLPVK +KKCGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSSLENGYLVVVFSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQTIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_44:-27.7372 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA11M,EA50V,GA54V,VA100I,AA167T,AA201M; +MMNPLIIKLGMVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDVLMKVLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAIGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATTLAATLGADLILLS +DVSGILDGKGQRIAEMTAAKMEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_45:-9.59572 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2A,LA80W,YA141G,KA189V,QA203L,TA254H; +MANPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAWAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGGLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGVGQRIAEMTAAKAELLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGHRILA +>1gs5_Repair_46:-11.2984 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA110N,GA149S,LA172S,IA177E,IA185C,IA256C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSNKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSISVTDEGQLMNVNADQAATALAATSGADLELLS +DVSGCLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRCLA +>1gs5_Repair_47:-22.7023 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49N,IA73M,IA97Y,IA148N,SA180N,TA227E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVNELMKGLNLPVK +KKNGLRVTPADQMDIITGALAGTANKTLLAWAKKHQYAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSNGVTDEGQLMNVNADQAATALAATLGADLILLN +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARELGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-28.4488 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4A,VA47T,NA160K,RA192L,MA196V,DA233E; +MMNALIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCTVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVKADQAATALAATLGADLILLS +DVSGILDGKGQLIAEVTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVEIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-27.5237 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3V,LA9G,PA58A,VA59K,EA206M,TA211H; +MMVPLIIKGGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLAKK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIMQGIIHDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-23.4286 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9P,GA10E,CA46L,VA216M,TA254N,AA258L; +MMNPLIIKPEGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGLVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIMKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGNRILL +>1gs5_Repair_51:-16.7447 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA85H,LA115S,AA225M,PA231E,AA235C,FA247A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAHKTLLAWAKKHQIAAVGLFLGDGDSVKVTQSDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAMRTLGREVDICSWRHA +EQLPALANGMPMGTRILA +>1gs5_Repair_52:-10.1248 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35F,NA63F,GA64D,VA67P,AA224S,LA243A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHFRPLVIVHGGGCVVDELMKGLNLPVK +KKFDLRPTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDSARTLGRPVDIASWRHA +EQAPALFNGMPMGTRILA +>1gs5_Repair_53:-28.2302 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA47N,LA115E,LA124S,DA175F,IA205V,GA249E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCNVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQEDEELG +HVGSAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGAFLILLS +DVSGILDGKGQRIAEMTAAKAEQLVEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNEMPMGTRILA +>1gs5_Repair_54:-15.6373 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4W,IA7D,DA49P,KA131G,SA236V,IA256T; 
+MMNWLIDKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVPELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPGLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIAVWRHA +EQLPALFNGMPMGTRTLA +>1gs5_Repair_55:-17.9905 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3K,GA11W,TA87W,TA113K,GA190L,GA213V; +MMKPLIIKLGWVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKWLLAWAKKHQIAAVGLFLGDGDSVKVKQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKLQRIAEMTAAKAEQLIEQGIITDVMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-15.4978 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30I,QA72R,AA79F,AA92M,TA166D,LA178S; +MMNPLIIKLGGVLLDSEEALERLFSALVNIRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADRIDIITGFLAGTANKTLLAWMKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAADALAATLGADLISLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-28.0478 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA38F,LA168N,LA176V,SA183F,DA212I,RA238E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPFVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATANAATLGADVILLS +DVFGILDGKGQRIAEMTAAKAEQLIEQGIITIGMIVKVNAALDAARTLGRPVDIASWEHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_58:0.728451 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36N,GA123Q,IA133P,GA140P,NA219Q,AA225N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQNPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVQLAQPGSPKLPNSLLENPYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVQAALDANRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_59:-22.4388 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19L,VA67F,TA68I,PA69W,IA133K,LA178V; +MMNPLIIKLGGVLLDSEELLERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRFIWADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLKNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLIVLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_60:-33.2947 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42L,LA65W,PA69I,LA132W,NA158M,NA219K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVLGGGCVVDELMKGLNLPVK +KKNGWRVTIADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKWINSLLENGYLPVVSSIGVTDEGQLMMVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVKAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-27.9997 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2A,LA80C,AA84G,NA139V,AA194W,AA240Y; +MANPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGACAGTGNKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLEVGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIWEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHY +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-28.7058 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41L,QA96L,KA111H,KA131N,TA151P,IA205N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVILHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHLIAAVGLFLGDGDSVHVTQLDEELG +HVGLAQPGSPNLINSLLENGYLPVVSSIGVPDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLNEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_63:-21.2721 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA29T,NA85H,AA125S,LA176V,AA235P,NA248W; +MMNPLIIKLGGVLLDSEEALERLFSALVTYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAHKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLSQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADVILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIPSWRHA 
+EQLPALFWGMPMGTRILA +>1gs5_Repair_64:-0.565605 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30Q,KA62M,AA79Y,IA133G,QA155A,TA227P; +MMNPLIIKLGGVLLDSEEALERLFSALVNQRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KMNGLRVTPADQIDIITGYLAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLGNSLLENGYLPVVSSIGVTDEGALMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARPLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-19.2293 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA53P,DA106C,SA109R,QA155V,AA170S,NA248D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMPGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGCGDRVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGVLMNVNADQAATALASTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFDGMPMGTRILA +>1gs5_Repair_66:-27.5801 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19S,IA40E,DA152P,LA168V,IA215R,DA223T; +MMNPLIIKLGGVLLDSEESLERLFSALVNYRESHQRPLVEVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTPEGQLMNVNADQAATAVAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMRVKVNAALTAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:-2.10982 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2P,IA40S,GA82N,GA123K,LA136D,FA247S; +MPNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVSVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALANTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVKLAQPGSPKLINSDLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALSNGMPMGTRILA +>1gs5_Repair_68:-26.1465 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA14G,NA85M,GA105M,IA215T,RA226Q,FA247N; +MMNPLIIKLGGVLGDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAMKTLLAWAKKHQIAAVGLFLMDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMTVKVNAALDAAQTLGRPVDIASWRHA +EQLPALNNGMPMGTRILA +>1gs5_Repair_69:-5.73447 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA155V,LA204W,AA220Y,DA223E,PA231T,GA253I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGVLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQWIEQGIITDGMIVKVNYALEAARTLGRTVDIASWRHA +EQLPALFNGMPMITRILA +>1gs5_Repair_70:-19.2105 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28Y,GA44N,RA66N,PA69V,TA113V,LA172F; +MMNPLIIKLGGVLLDSEEALERLFSALYNYRESHQRPLVIVHGNGCVVDELMKGLNLPVK +KKNGLNVTVADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVVQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATFGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_71:-20.3651 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17C,NA56D,QA96P,IA177N,MA196F,EA241Y; +MMNPLIIKLGGVLLDSCEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLDLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHPIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLNLLS +DVSGILDGKGQRIAEFTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +YQLPALFNGMPMGTRILA +>1gs5_Repair_72:-22.6667 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49F,GA140W,VA145A,LA156N,LA179A,NA219R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVFELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENWYLPVASSIGVTDEGQNMNVNADQAATALAATLGADLILAS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVRAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-31.903 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA61P,VA145L,AA169G,SA183C,EA206R,MA214K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +PKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVLSSIGVTDEGQLMNVNADQAATALGATLGADLILLS +DVCGILDGKGQRIAEMTAAKAEQLIRQGIITDGKIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-24.1954 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13Q,SA33H,GA43E,IA73D,LA178K,SA180K; +MMNPLIIKLGGVQLDSEEALERLFSALVNYREHHQRPLVIVHEGGCVVDELMKGLNLPVK +KKNGLRVTPADQDDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLIKLK +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_75:-28.431 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:WA91E,DA116E,NA134H,KA189N,TA211L,MA250I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAEAKKHQIAAVGLFLGDGDSVKVTQLEEELG +HVGLAQPGSPKLIHSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGNGQRIAEMTAAKAEQLIEQGIILDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGIPMGTRILA +>1gs5_Repair_76:-25.1641 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4M,DA74T,QA96V,KA111C,PA130N,LA132C; +MMNMLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQITIITGALAGTANKTLLAWAKKHVIAAVGLFLGDGDSVCVTQLDEELG +HVGLAQPGSNKCINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_77:-31.0889 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36W,AA90R,LA104Q,SA109I,DA116F,AA199M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQWPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLRWAKKHQIAAVGLFQGDGDIVKVTQLFEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAMKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_78:-6.93701 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6C,DA15I,GA107L,PA130R,IA177P,AA258F; +MMNPLCIKLGGVLLISEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDLDSVKVTQLDEELG +HVGLAQPGSRKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLPLLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILF +>1gs5_Repair_79:-23.9705 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10E,LA65C,DA71C,TA83N,MA214R,FA247V; +MMNPLIIKLEGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGCRVTPACQIDIITGALAGNANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGRIVKVNAALDAARTLGRPVDIASWRHA +EQLPALVNGMPMGTRILA +>1gs5_Repair_80:-31.7093 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13V,EA21H,SA25L,AA90S,GA101A,TA211A; +MMNPLIIKLGGVVLDSEEALHRLFLALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLSWAKKHQIAAVALFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIIADGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_81:-18.3334 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9H,DA74L,AA98T,AA164N,IA185H,EA241Q; +MMNPLIIKHGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQILIITGALAGTANKTLLAWAKKHQITAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQNATALAATLGADLILLS +DVSGHLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +QQLPALFNGMPMGTRILA +>1gs5_Repair_82:-25.2741 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA96V,IA97K,GA101R,VA144A,GA188F,IA205R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHVKAAVRLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPAVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDFKGQRIAEMTAAKAEQLREQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_83:-21.7332 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA40D,DA49R,TA68N,SA129T,GA208C,LA228S; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVDVHGGGCVVRELMKGLNLPVK +KKNGLRVNPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGTPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQCIITDGMIVKVNAALDAARTSGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_84:-18.7431 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA54T,GA140T,MA157P,VA182G,LA222M,DA223C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKTLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENTYLPVVSSIGVTDEGQLPNVNADQAATALAATLGADLILLS +DGSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAMCAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-25.7287 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42A,DA74M,LA88E,SA183G,LA186Y,IA209N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVAGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIMIITGALAGTANKTELAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVGGIYDGKGQRIAEMTAAKAEQLIEQGNITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_86:-27.7745 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36N,PA37R,EA50R,AA170M,GA208T,LA257M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQNRLVIVHGGGCVVDRLMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAMTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQTIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRIMA +>1gs5_Repair_87:-24.6741 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23W,IA40R,LA65W,KA189M,GA190W,RA230H; +MMNPLIIKLGGVLLDSEEALERWFSALVNYRESHQRPLVRVHGGGCVVDELMKGLNLPVK +KKNGWRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGMWQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGHPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-25.2738 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA2C,AA99D,LA178F,AA220M,DA233R,IA234R; +MCNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIADVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLIFLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNMALDAARTLGRPVRRASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-25.6439 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA39M,AA79C,AA81K,GA154D,DA187V,GA229K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLMIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGCLKGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEDQLMNVNADQAATALAATLGADLILLS +DVSGILVGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLKRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_90:-21.8745 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA34Q,QA35R,VA41R,LA55M,NA219G,LA246A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESQRRPLVIRHGGGCVVDELMKGMNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVGAALDAARTLGRPVDIASWRHA +EQLPAAFNGMPMGTRILA +>1gs5_Repair_91:-29.8623 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19D,VA48I,AA70T,EA117C,DA187L,AA221G; +MMNPLIIKLGGVLLDSEEDLERLFSALVNYRESHQRPLVIVHGGGCVIDELMKGLNLPVK +KKNGLRVTPTDQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDCELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILLGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAGLDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-15.5724 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA59A,AA70T,VA122D,AA225R,RA226C,IA256F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPAK +KKNGLRVTPTDQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HDGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDARCTLGRPVDIASWRHA 
+EQLPALFNGMPMGTRFLA +>1gs5_Repair_93:-0.403951 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:TA171W,AA201K,GA213N,PA231M,SA236V,PA244T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAWLGADLILLS +DVSGILDGKGQRIAEMTAAKKEQLIEQGIITDNMIVKVNAALDAARTLGRMVDIAVWRHA +EQLTALFNGMPMGTRILA +>1gs5_Repair_94:-27.221 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA5N,SA33N,WA91K,DA162C,AA164M,AA170R; +MMNPNIIKLGGVLLDSEEALERLFSALVNYRENHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAKAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNACQMATALARTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_95:-24.3828 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA5E,LA80R,PA127T,VA150E,DA223P,RA226Q; +MMNPEIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGARAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQTGSPKLINSLLENGYLPVVSSIGETDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALPAAQTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-30.2045 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12H,EA50F,TA68G,AA174S,NA219I,AA240C; +MMNPLIIKLGGHLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDFLMKGLNLPVK +KKNGLRVGPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGSDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVIAALDAARTLGRPVDIASWRHC +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-15.024 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA5V,RA36S,IA73W,GA123M,TA151G,VA232M; +MMNPVIIKLGGVLLDSEEALERLFSALVNYRESHQSPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQWDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVMLAQPGSPKLINSLLENGYLPVVSSIGVGDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPMDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-22.7753 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA38V,DA74V,WA91G,LA115K,LA136K,AA169G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPVVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIVIITGALAGTANKTLLAGAKKHQIAAVGLFLGDGDSVKVTQKDEELG +HVGLAQPGSPKLINSKLENGYLPVVSSIGVTDEGQLMNVNADQAATALGATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_99:-26.1392 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16D,RA36E,LA51R,AA92S,KA111M,AA224Y; +MMNPLIIKLGGVLLDDEEALERLFSALVNYRESHQEPLVIVHGGGCVVDERMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWSKKHQIAAVGLFLGDGDSVMVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDYARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-24.209 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8H,LA27F,GA105V,GA128A,SA180L,MA252Q; +MMNPLIIHLGGVLLDSEEALERLFSAFVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLVDGDSVKVTQLDEELG +HVGLAQPASPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLL +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPQGTRILA +>1gs5_Repair_1:-20.884 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36K,SA183N,IA185N,DA187Y,VA218C,AA235R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQKPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVNGNLYGKGQRIAEMTAAKAEQLIEQGIITDGMIVKCNAALDAARTLGRPVDIRSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_2:-30.8804 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA92Q,LA115Q,SA135H,DA223I,RA226Q,PA231E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWQKKHQIAAVGLFLGDGDSVKVTQQDEELG 
+HVGLAQPGSPKLINHLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALIAAQTLGREVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_3:-24.5684 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10H,KA61A,KA62T,FA103R,EA153H,VA216R; +MMNPLIIKLHGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +ATNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLRLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDHGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIRKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_4:-29.1696 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16V,EA18K,EA118D,VA182P,PA251K,IA256L; +MMNPLIIKLGGVLLDVEKALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEDLG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DPSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMKMGTRLLA +>1gs5_Repair_5:-15.084 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7S,LA55T,IA177C,DA187W,NA219L,GA249V; +MMNPLISKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGTNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLCLLS +DVSGILWGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVLAALDAARTLGRPVDIASWRHA +EQLPALFNVMPMGTRILA +>1gs5_Repair_6:-27.3771 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13V,TA87Q,NA158K,AA174V,VA216W,FA247Y; +MMNPLIIKLGGVVLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKQLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMKVNADQAATALAATLGVDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIWKVNAALDAARTLGRPVDIASWRHA +EQLPALYNGMPMGTRILA +>1gs5_Repair_7:-32.1125 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA47L,AA92Q,EA138R,SA146C,GA208L,HA239S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCLVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWQKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLRNGYLPVVCSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQLIITDGMIVKVNAALDAARTLGRPVDIASWRSA +EQLPALFNGMPMGTRILA +>1gs5_Repair_8:-19.7978 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17C,VA28F,GA78N,GA107D,QA163A,IA185N; +MMNPLIIKLGGVLLDSCEALERLFSALFNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITNALAGTANKTLLAWAKKHQIAAVGLFLGDDDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADAAATALAATLGADLILLS +DVSGNLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_9:-18.5587 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:HA42G,LA51S,QA72M,VA112M,GA140L,LA222E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVGGGGCVVDESMKGLNLPVK +KKNGLRVTPADMIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKMTQLDEELG +HVGLAQPGSPKLINSLLENLYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAEDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_10:-22.9902 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30V,SA109R,LA119I,VA216K,MA252R,LA257I; +MMNPLIIKLGGVLLDSEEALERLFSALVNVRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDRVKVTQLDEEIG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIKKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPRGTRIIA +>1gs5_Repair_11:11.449 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA76E,GA107Y,SA180C,DA187W,VA218D,AA224E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIETGALAGTANKTLLAWAKKHQIAAVGLFLGDYDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLC +DVSGILWGKGQRIAEMTAAKAEQLIEQGIITDGMIVKDNAALDEARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_12:-30.0902 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15M,SA16E,VA28K,HA121Q,LA222W,LA243I; 
+MMNPLIIKLGGVLLMEEEALERLFSALKNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +QVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAWDAARTLGRPVDIASWRHA +EQIPALFNGMPMGTRILA +>1gs5_Repair_13:-21.4256 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7N,FA24G,GA101E,EA195N,AA198H,AA201R; +MMNPLINKLGGVLLDSEEALERLGSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVELFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIANMTHAKREQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_14:-29.8128 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA132I,NA134V,GA173D,SA183K,IA193F,PA231E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKIIVSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLDADLILLS +DVKGILDGKGQRFAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGREVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_15:-20.673 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA29F,LA57C,LA142Y,QA191E,MA214K,AA225K; +MMNPLIIKLGGVLLDSEEALERLFSALVFYRESHQRPLVIVHGGGCVVDELMKGLNCPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYYPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGERIAEMTAAKAEQLIEQGIITDGKIVKVNAALDAKRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_16:-24.0116 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17T,NA134K,GA208P,NA219V,AA245D,FA247L; +MMNPLIIKLGGVLLDSTEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIKSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQPIITDGMIVKVVAALDAARTLGRPVDIASWRHA +EQLPDLLNGMPMGTRILA +>1gs5_Repair_17:-7.05469 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31V,QA126P,VA144A,SA147V,AA165L,GA253K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYVESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAPPGSPKLINSLLENGYLPAVSVIGVTDEGQLMNVNADQALTALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMKTRILA +>1gs5_Repair_18:28.6646 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31F,EA50M,GA123W,YA141Q,SA180D,EA202R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYFESHQRPLVIVHGGGCVVDMLMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVWLAQPGSPKLINSLLENGQLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLD +DVSGILDGKGQRIAEMTAAKARQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_19:0.831022 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:QA35C,VA41H,GA44E,TA151V,IA177Y,GA184E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHCRPLVIHHGEGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVVDEGQLMNVNADQAATALAATLGADLYLLS +DVSEILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_20:-18.2032 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA27G,GA54V,GA107A,IA133S,NA134E,LA178V; +MMNPLIIKLGGVLLDSEEALERLFSAGVNYRESHQRPLVIVHGGGCVVDELMKVLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDADSVKVTQLDEELG +HVGLAQPGSPKLSESLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLIVLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_21:-17.243 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23E,RA36L,LA104M,AA161K,PA244V,FA247Q; +MMNPLIIKLGGVLLDSEEALEREFSALVNYRESHQLPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFMGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNKDQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLVALQNGMPMGTRILA +>1gs5_Repair_22:-21.386 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15P,LA80E,EA153V,GA208H,RA255Y,LA257G; +MMNPLIIKLGGVLLPSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGAEAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDVGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQHIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTYIGA +>1gs5_Repair_23:-23.2912 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA85A,NA134W,LA176G,EA206Q,VA218W,HA239N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTAAKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLIWSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADGILLS +DVSGILDGKGQRIAEMTAAKAEQLIQQGIITDGMIVKWNAALDAARTLGRPVDIASWRNA +EQLPALFNGMPMGTRILA +>1gs5_Repair_24:-22.4392 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9Y,SA25A,GA43A,GA44S,EA50R,AA79R; +MMNPLIIKYGGVLLDSEEALERLFAALVNYRESHQRPLVIVHASGCVVDRLMKGLNLPVK +KKNGLRVTPADQIDIITGRLAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_25:-25.2368 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA10A,VA48M,DA71L,IA76N,LA104E,DA106Y; +MMNPLIIKLAGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVMDELMKGLNLPVK +KKNGLRVTPALQIDINTGALAGTANKTLLAWAKKHQIAAVGLFEGYGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_26:-19.3234 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31T,EA117I,EA118K,AA125I,GA208D,IA256F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYTESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDIKLG 
+HVGLIQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQDIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRFLA +>1gs5_Repair_27:-32.6557 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8T,KA60I,KA61I,DA71L,LA80M,GA249A; +MMNPLIITLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVI +IKNGLRVTPALQIDIITGAMAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNAMPMGTRILA +>1gs5_Repair_28:-13.9992 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA5T,AA98W,AA99M,AA174K,GA229V,AA240G; +MMNPTIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIWMVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGKDLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLVRPVDIASWRHG +EQLPALFNGMPMGTRILA +>1gs5_Repair_29:-21.5658 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA40T,LA115W,TA151D,TA197M,VA218R,RA238D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVTVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQWDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVDDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMMAAKAEQLIEQGIITDGMIVKRNAALDAARTLGRPVDIASWDHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_30:-8.67797 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA50N,IA76P,LA89I,SA109W,GA173A,AA224W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDNLMKGLNLPVK +KKNGLRVTPADQIDIPTGALAGTANKTLIAWAKKHQIAAVGLFLGDGDWVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLAADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDWARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_31:-26.7514 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA22F,TA77N,NA85P,QA114N,EA202Q,HA239S; +MMNPLIIKLGGVLLDSEEALEFLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIINGALAGTAPKTLLAWAKKHQIAAVGLFLGDGDSVKVTNLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAQQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRSA +EQLPALFNGMPMGTRILA +>1gs5_Repair_32:-6.32721 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25D,GA64N,LA156N,AA169K,SA180G,NA248I; +MMNPLIIKLGGVLLDSEEALERLFDALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNNLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQNMNVNADQAATALKATLGADLILLG +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFIGMPMGTRILA +>1gs5_Repair_33:-14.2105 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA6P,TA113L,AA174N,TA197K,GA208T,VA216A; +MMNPLPIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVLQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGNDLILLS +DVSGILDGKGQRIAEMKAAKAEQLIEQTIITDGMIAKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_34:-23.8692 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA93P,GA107N,TA151M,DA152N,TA166Q,RA238H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAPKHQIAAVGLFLGDNDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVMNEGQLMNVNADQAAQALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWHHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_35:-25.8011 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8D,GA54M,GA101W,LA176E,SA236D,MA252G; +MMNPLIIDLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKMLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVWLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADEILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIADWRHA +EQLPALFNGMPGGTRILA +>1gs5_Repair_36:-29.0026 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA47K,HA121W,AA201N,NA219S,AA220E,PA251D; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCKVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +WVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKNEQLIEQGIITDGMIVKVSEALDAARTLGRPVDIASWRHA +EQLPALFNGMDMGTRILA +>1gs5_Repair_37:-21.1578 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA70M,GA82W,HA95T,LA104F,KA217G,GA229A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPMDQIDIITGALAWTANKTLLAWAKKTQIAAVGLFFGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVGVNAALDAARTLARPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_38:2.45411 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA17S,VA67C,IA73W,LA119G,YA141Q,TA254Y; +MMNPLIIKLGGVLLDSSEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRCTPADQWDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEEGG +HVGLAQPGSPKLINSLLENGQLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGYRILA +>1gs5_Repair_39:-15.8054 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA29H,AA84E,IA133C,DA162H,LA172W,PA244Q; +MMNPLIIKLGGVLLDSEEALERLFSALVHYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTENKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLCNSLLENGYLPVVSSIGVTDEGQLMNVNAHQAATALAATWGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLQALFNGMPMGTRILA +>1gs5_Repair_40:-30.3543 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15W,SA16N,GA78F,KA131Q,YA141V,LA222E; +MMNPLIIKLGGVLLWNEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITFALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPQLINSLLENGVLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAAEDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_41:-0.35956 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18L,EA21I,PA37Q,DA49S,IA73T,GA107Y; +MMNPLIIKLGGVLLDSELALIRLFSALVNYRESHQRQLVIVHGGGCVVSELMKGLNLPVK +KKNGLRVTPADQTDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDYDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_42:-27.328 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA54M,NA56M,KA61D,AA125I,EA202F,AA220C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKMLMLPVK +DKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLIQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAFQLIEQGIITDGMIVKVNCALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_43:-21.9597 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA16M,LA23P,HA95M,EA153H,LA168H,MA250N; +MMNPLIIKLGGVLLDMEEALERPFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKMQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDHGQLMNVNADQAATAHAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGNPMGTRILA +>1gs5_Repair_44:-27.1307 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41A,DA116E,AA198V,EA206I,GA213R,LA243C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIAHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLEEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTVAKAEQLIIQGIITDRMIVKVNAALDAARTLGRPVDIASWRHA +EQCPALFNGMPMGTRILA +>1gs5_Repair_45:-35.0682 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12K,AA90V,LA102N,SA109G,NA219V,MA252L; +MMNPLIIKLGGKLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLVWAKKHQIAAVGNFLGDGDGVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVVAALDAARTLGRPVDIASWRHA 
+EQLPALFNGMPLGTRILA +>1gs5_Repair_46:-28.0815 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8N,KA86F,PA130Y,NA139M,IA209E,AA258V; +MMNPLIINLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANFTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSYKLINSLLEMGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGEITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILV +>1gs5_Repair_47:-27.4956 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:PA4D,VA47Q,QA96Y,NA139K,TA166A,QA191H; +MMNDLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCQVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHYIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLEKGYLPVVSSIGVTDEGQLMNVNADQAAAALAATLGADLILLS +DVSGILDGKGHRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_48:-28.9398 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA7K,GA45R,LA89A,DA175C,GA213S,WA237C; +MMNPLIKKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGRCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLAAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGACLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDSMIVKVNAALDAARTLGRPVDIASCRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_49:-17.7491 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62T,TA68W,TA83N,VA144T,DA187H,AA194N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KTNGLRVWPADQIDIITGALAGNANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPTVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILHGKGQRINEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_50:-25.8367 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33I,AA81I,QA163C,EA202W,IA209H,FA247I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYREIHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALIGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADCAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAWQLIEQGHITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALINGMPMGTRILA +>1gs5_Repair_51:-19.5374 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA13T,LA27V,TA113I,QA191P,LA204S,AA235L; +MMNPLIIKLGGVTLDSEEALERLFSAVVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVIQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGPRIAEMTAAKAEQSIEQGIITDGMIVKVNAALDAARTLGRPVDILSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_52:-25.0581 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA12S,QA35I,AA92P,VA144S,NA160C,QA191L; +MMNPLIIKLGGSLLDSEEALERLFSALVNYRESHIRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWPKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPSVSSIGVTDEGQLMNVCADQAATALAATLGADLILLS +DVSGILDGKGLRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_53:-16.9855 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18K,MA52N,LA80T,PA127S,PA143T,AA164D; +MMNPLIIKLGGVLLDSEKALERLFSALVNYRESHQRPLVIVHGGGCVVDELNKGLNLPVK +KKNGLRVTPADQIDIITGATAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQSGSPKLINSLLENGYLTVVSSIGVTDEGQLMNVNADQDATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_54:-25.2049 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49L,VA122E,QA126H,LA186A,PA244Q,GA249M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVLELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HEGLAHPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGIADGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLQALFNMMPMGTRILA +>1gs5_Repair_55:-23.5939 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA31Y,TA83W,LA179N,IA210F,RA230D,AA235I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYYESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGWANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILNS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIFTDGMIVKVNAALDAARTLGDPVDIISWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_56:-12.0913 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA44E,VA48Q,LA51N,GA107Q,QA191K,VA216G; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGEGCVQDENMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDQDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGKRIAEMTAAKAEQLIEQGIITDGMIGKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_57:-26.5659 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41I,GA43Q,TA68D,TA77I,SA183W,PA251N; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIIHQGGCVVDELMKGLNLPVK +KKNGLRVDPADQIDIIIGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVWGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMNMGTRILA +>1gs5_Repair_58:-25.643 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA28A,QA126T,LA176D,GA188I,KA189Q,VA216H; +MMNPLIIKLGGVLLDSEEALERLFSALANYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLATPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADDILLS +DVSGILDIQGQRIAEMTAAKAEQLIEQGIITDGMIHKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_59:-5.5929 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA26F,GA54I,GA128L,NA134I,GA149Q,NA158Y; +MMNPLIIKLGGVLLDSEEALERLFSFLVNYRESHQRPLVIVHGGGCVVDELMKILNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPLSPKLIISLLENGYLPVVSSIQVTDEGQLMYVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_60:-26.6977 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA94T,IA97N,QA163V,GA173E,MA214V,DA233E; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLAWAKTHQNAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADVAATALAATLEADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGVIVKVNAALDAARTLGRPVEIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_61:-11.8777 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA44Q,LA57T,TA68G,KA94W,LA176G,QA203D; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGQGCVVDELMKGLNTPVK +KKNGLRVGPADQIDIITGALAGTANKTLLAWAKWHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADGILLS +DVSGILDGKGQRIAEMTAAKAEDLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_62:-23.6775 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:YA30H,AA81S,NA160L,SA183P,AA220H,PA244Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNHRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALSGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVLADQAATALAATLGADLILLS +DVPGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNHALDAARTLGRPVDIASWRHA +EQLQALFNGMPMGTRILA +>1gs5_Repair_63:-25.2495 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA15A,RA31I,PA37F,KA62D,VA145T,AA225M; +MMNPLIIKLGGVLLASEEALERLFSALVNYIESHQRFLVIVHGGGCVVDELMKGLNLPVK +KDNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVTSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAMRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_64:-7.57756 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA55N,DA74K,LA88C,GA184M,LA186K,AA235R; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGNNLPVK +KKNGLRVTPADQIKIITGALAGTANKTCLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSMIKDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIRSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_65:-29.5922 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18N,DA49A,KA61H,TA151Y,EA202F,PA231L; 
+MMNPLIIKLGGVLLDSENALERLFSALVNYRESHQRPLVIVHGGGCVVAELMKGLNLPVK +HKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVYDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAFQLIEQGIITDGMIVKVNAALDAARTLGRLVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_66:-10.248 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9K,EA138C,LA156H,AA169H,VA182G,MA214W; +MMNPLIIKKGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLCNGYLPVVSSIGVTDEGQHMNVNADQAATALHATLGADLILLS +DGSGILDGKGQRIAEMTAAKAEQLIEQGIITDGWIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_67:2.42973 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA54C,GA78P,TA87H,LA102E,TA171H,IA234Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKCLNLPVK +KKNGLRVTPADQIDIITPALAGTANKHLLAWAKKHQIAAVGEFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAHLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDYASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_68:-19.5474 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA59I,QA96F,GA149S,IA185V,AA225K,GA229F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPIK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHFIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSISVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGVLDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAKRTLFRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_69:-24.9271 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18N,LA20T,SA33M,PA37E,LA89Q,SA146A; +MMNPLIIKLGGVLLDSENATERLFSALVNYREMHQRELVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLQAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVASIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_70:-16.9914 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA9G,IA73K,GA82L,HA121R,AA220V,RA255F; +MMNPLIIKGGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQKDIITGALALTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +RVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNVALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTFILA +>1gs5_Repair_71:-22.6523 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3F,IA6P,EA21L,LA38D,TA83Y,GA101F; +MMFPLPIKLGGVLLDSEEALLRLFSALVNYRESHQRPDVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGYANKTLLAWAKKHQIAAVFLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_72:-20.3957 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19D,LA57P,KA61I,EA117Q,AA165C,LA179T; +MMNPLIIKLGGVLLDSEEDLERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNPPVK +IKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDQELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQACTALAATLGADLILTS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_73:-22.3449 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA73M,IA75Q,LA142K,MA157H,QA191P,TA227C; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQMDQITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYKPVVSSIGVTDEGQLHNVNADQAATALAATLGADLILLS +DVSGILDGKGPRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARCLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_74:-23.0157 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:MA52S,IA76R,DA106W,AA167Q,AA170S,NA248Q; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELSKGLNLPVK +KKNGLRVTPADQIDIRTGALAGTANKTLLAWAKKHQIAAVGLFLGWGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATQLASTLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA 
+EQLPALFQGMPMGTRILA +>1gs5_Repair_75:-27.8659 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA8Q,GA78L,GA101D,FA103W,PA130E,GA140Y; +MMNPLIIQLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITLALAGTANKTLLAWAKKHQIAAVDLWLGDGDSVKVTQLDEELG +HVGLAQPGSEKLINSLLENYYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_76:-9.99167 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA39G,GA64L,GA78C,QA114F,IA133K,RA238A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLGIVHGGGCVVDELMKGLNLPVK +KKNLLRVTPADQIDIITCALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTFLDEELG +HVGLAQPGSPKLKNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWAHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_77:-26.5065 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA66W,AA92L,LA115S,LA156Y,TA166P,GA190K; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLWVTPADQIDIITGALAGTANKTLLAWLKKHQIAAVGLFLGDGDSVKVTQSDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQYMNVNADQAAPALAATLGADLILLS +DVSGILDGKKQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_78:-10.6641 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA20Q,LA80N,GA123T,AA170R,EA202P,LA246Q; +MMNPLIIKLGGVLLDSEEAQERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGANAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVTLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALARTLGADLILLS +DVSGILDGKGQRIAEMTAAKAPQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPAQFNGMPMGTRILA +>1gs5_Repair_79:-29.2557 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:IA40M,WA91F,VA100G,IA133F,TA211W,HA239Y; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVMVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAFAKKHQIAAGGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLFNSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS 
+DVSGILDGKGQRIAEMTAAKAEQLIEQGIIWDGMIVKVNAALDAARTLGRPVDIASWRYA +EQLPALFNGMPMGTRILA +>1gs5_Repair_80:-3.33226 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:WA91H,VA122W,EA153C,GA184D,LA243P,LA257F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAHAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HWGLAQPGSPKLINSLLENGYLPVVSSIGVTDCGQLMNVNADQAATALAATLGADLILLS +DVSDILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQPPALFNGMPMGTRIFA +>1gs5_Repair_81:-7.85702 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA81D,GA123D,TA166L,GA229F,PA231R,MA252T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALDGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVDLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAALALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLFRRVDIASWRHA +EQLPALFNGMPTGTRILA +>1gs5_Repair_82:-24.1735 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA65N,AA99V,TA166Y,LA179W,LA246N,NA248F; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGNRVTPADQIDIITGALAGTANKTLLAWAKKHQIAVVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAAYALAATLGADLILWS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPANFFGMPMGTRILA +>1gs5_Repair_83:-19.0028 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23H,LA51F,KA93C,LA102P,QA126L,AA225P; +MMNPLIIKLGGVLLDSEEALERHFSALVNYRESHQRPLVIVHGGGCVVDEFMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWACKHQIAAVGPFLGDGDSVKVTQLDEELG +HVGLALPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAPRTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_84:-19.7225 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA19Y,EA21H,KA60F,LA137D,VA216R,HA239T; +MMNPLIIKLGGVLLDSEEYLHRLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVF +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG 
+HVGLAQPGSPKLINSLDENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIRKVNAALDAARTLGRPVDIASWRTA +EQLPALFNGMPMGTRILA +>1gs5_Repair_85:-32.2882 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:DA49S,KA86V,QA163P,SA183Y,EA202T,PA244M; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVSELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANVTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADPAATALAATLGADLILLS +DVYGILDGKGQRIAEMTAAKATQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLMALFNGMPMGTRILA +>1gs5_Repair_86:-29.4757 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:VA41M,LA51N,LA55D,AA70K,AA90N,TA151P; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIMHGGGCVVDENMKGDNLPVK +KKNGLRVTPKDQIDIITGALAGTANKTLLNWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVPDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_87:-7.94646 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:NA3I,LA57P,TA83I,AA84W,QA126V,VA182G; +MMIPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNPPVK +KKNGLRVTPADQIDIITGALAGIWNKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAVPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DGSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_88:-19.0727 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:GA64C,GA78R,AA90P,LA142W,LA156W,LA186H; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNCLRVTPADQIDIITRALAGTANKTLLPWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYWPVVSSIGVTDEGQWMNVNADQAATALAATLGADLILLS +DVSGIHDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_89:-18.3142 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:WA91D,YA141F,MA157F,KA189H,LA246R,FA247S; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK 
+KKNGLRVTPADQIDIITGALAGTANKTLLADAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGFLPVVSSIGVTDEGQLFNVNADQAATALAATLGADLILLS +DVSGILDGHGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPARSNGMPMGTRILA +>1gs5_Repair_90:-20.3898 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:FA24H,LA51S,NA56V,TA171V,IA177A,LA186T; +MMNPLIIKLGGVLLDSEEALERLHSALVNYRESHQRPLVIVHGGGCVVDESMKGLVLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAAVLGADLALLS +DVSGITDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_91:-10.372 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18L,AA26Y,PA37C,HA42E,LA137Q,LA204D; +MMNPLIIKLGGVLLDSELALERLFSYLVNYRESHQRCLVIVEGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLQENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQDIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_92:-29.9811 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:RA36Q,IA75V,QA114N,EA138S,KA200G,EA202I; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQQPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDVITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTNLDEELG +HVGLAQPGSPKLINSLLSNGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAGAIQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_93:-32.3303 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA53Y,TA87H,EA153K,QA155C,DA233L,LA257A; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMYGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKHLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDKGCLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVLIASWRHA +EQLPALFNGMPMGTRIAA +>1gs5_Repair_94:-15.7568 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA33T,KA62R,LA115Y,PA130K,RA238H,GA253L; 
+MMNPLIIKLGGVLLDSEEALERLFSALVNYRETHQRPLVIVHGGGCVVDELMKGLNLPVK +KRNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQYDEELG +HVGLAQPGSKKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWHHA +EQLPALFNGMPMLTRILA +>1gs5_Repair_95:-18.5359 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA23D,KA53L,LA65P,LA124D,EA202I,LA204D; +MMNPLIIKLGGVLLDSEEALERDFSALVNYRESHQRPLVIVHGGGCVVDELMLGLNLPVK +KKNGPRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGDSVKVTQLDEELG +HVGDAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAIQDIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_96:-8.89719 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:AA90Q,QA96P,VA122N,AA125M,DA181N,VA232W; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KKNGLRVTPADQIDIITGALAGTANKTLLQWAKKHPIAAVGLFLGDGDSVKVTQLDEELG +HNGLMQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +NVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPWDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_97:-32.2026 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:KA62Y,DA108G,PA143C,AA194L,AA201M,RA226L; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVK +KYNGLRVTPADQIDIITGALAGTANKTLLAWAKKHQIAAVGLFLGDGGSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLCVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRILEMTAAKMEQLIEQGIITDGMIVKVNAALDAALTLGRPVDIASWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_98:-14.4696 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:LA55P,PA69L,AA81I,LA89C,GA107P,AA235T; +MMNPLIIKLGGVLLDSEEALERLFSALVNYRESHQRPLVIVHGGGCVVDELMKGPNLPVK +KKNGLRVTLADQIDIITGALIGTANKTLCAWAKKHQIAAVGLFLGDPDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDITSWRHA +EQLPALFNGMPMGTRILA +>1gs5_Repair_99:-27.9348 
reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:EA18I,VA48M,IA75P,KA94T,LA186C,HA239K; +MMNPLIIKLGGVLLDSEIALERLFSALVNYRESHQRPLVIVHGGGCVMDELMKGLNLPVK +KKNGLRVTPADQIDPITGALAGTANKTLLAWAKTHQIAAVGLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGICDGKGQRIAEMTAAKAEQLIEQGIITDGMIVKVNAALDAARTLGRPVDIASWRKA +EQLPALFNGMPMGTRILA +>1gs5_Repair_100:-21.8819 reference-uniprot:sp|P0A6C8|ARGB_ECOLI||refence-pdb:1gs5_Repair||mutations:SA25W,KA60T,IA73Q,GA101D,GA208P,GA249S; +MMNPLIIKLGGVLLDSEEALERLFWALVNYRESHQRPLVIVHGGGCVVDELMKGLNLPVT +KKNGLRVTPADQQDIITGALAGTANKTLLAWAKKHQIAAVDLFLGDGDSVKVTQLDEELG +HVGLAQPGSPKLINSLLENGYLPVVSSIGVTDEGQLMNVNADQAATALAATLGADLILLS +DVSGILDGKGQRIAEMTAAKAEQLIEQPIITDGMIVKVNAALDAARTLGRPVDIASWRHA +EQLPALFNSMPMGTRILA