# Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
# SPDX-License-Identifier: MIT-0

import re

# Rare / ambiguous amino-acid codes that are collapsed to the unknown
# residue "X" before tokenization. Compiled once at import time.
_RARE_AA_PATTERN = re.compile(r"[UZOB]")


def prep_seq(seq: str) -> str:
    """Space-separate an amino-acid sequence and mask rare residues.

    A single space is inserted between consecutive residues, then every
    occurrence of the rare amino-acid codes U, Z, O and B is replaced
    by X.
    ref: https://huggingface.co/Rostlab/prot_bert.

    Only the uppercase codes are replaced; lowercase letters are left
    untouched.

    Args:
        seq: A string of amino-acid one-letter codes, e.g. ``"MKUB"``.

    Returns:
        The space-separated sequence with U, Z, O and B replaced by X,
        e.g. ``"M K X X"``. An empty input yields an empty string.
    """
    # Joining first keeps the one-character-per-token layout; the
    # substitution never touches the inserted spaces.
    seq_spaced = " ".join(seq)
    return _RARE_AA_PATTERN.sub("X", seq_spaced)