# Copyright (c) 2024 Microsoft Corporation.
# Licensed under the MIT License

"""Unit tests for the tokenizer returned by ``get_tokenizer``."""

from graphrag.tokenizer.get_tokenizer import get_tokenizer


def test_encode_basic():
    """Check that encoding ``"abc def"`` yields the expected token ids.

    The tokenizer is obtained from ``get_tokenizer()`` with no arguments.
    """
    expected = [26682, 1056]
    result = get_tokenizer().encode("abc def")
    assert result == expected, (
        f"Encoding failed to return expected tokens, sent {result}"
    )


def test_num_tokens_empty_input():
    """Check that encoding the empty string produces zero tokens."""
    encoded = get_tokenizer().encode("")
    token_count = len(encoded)
    assert token_count == 0, "Token count for empty input should be 0"