Skip to content

Commit

Permalink
tokenizers
Browse files: browse the repository at this point in the history
  • Loading branch information
0x00b1 committed Jul 19, 2024
1 parent a2fb9f1 commit 3815cb3
Showing 1 changed file with 12 additions and 2 deletions.
14 changes: 12 additions & 2 deletions tests/beignet/tokenizers/test__protein_tokenizer.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,12 @@ class TestProteinmMLMTokenizer:
def test_3Di_tokenizer(self):
inputs = ["GdPfQaPfIlSvRvLvEcQvClGpId"]

- path = importlib.resources.files("lobster") / "assets" / "3di_tokenizer"
+ path = (
+ importlib.resources.files("beignet")
+ / "data"
+ / "tokenizers"
+ / "3di_tokenizer"
+ )

tokenizer = ProteinTokenizerTransform.from_pretrained(path)
tokenized_inputs = tokenizer(inputs)
Expand All @@ -21,7 +26,12 @@ def test_3Di_tokenizer(self):
def test_cdna_tokenizer(self):
inputs = 4 * ["ATCGTACGATCGTACGATCGUN"]

- path = importlib.resources.files("lobster") / "assets" / "cdna_tokenizer"
+ path = (
+ importlib.resources.files("beignet")
+ / "data"
+ / "tokenizers"
+ / "cdna_tokenizer"
+ )

tokenizer = ProteinTokenizerTransform.from_pretrained(path)
tokenized_inputs = tokenizer(inputs)
Expand Down

0 comments on commit 3815cb3

Please sign in to comment.