conftest.py 697 B

123456789101112131415161718
  1. # Copyright (c) Meta Platforms, Inc. and affiliates.
  2. # This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
  3. import pytest
  4. from transformers import LlamaTokenizer
  5. @pytest.fixture
  6. def setup_tokenizer():
  7. def _helper(tokenizer):
  8. #Align with Llama 2 tokenizer
  9. tokenizer.from_pretrained.return_value = LlamaTokenizer.from_pretrained("decapoda-research/llama-7b-hf")
  10. tokenizer.from_pretrained.return_value.add_special_tokens({'bos_token': '<s>', 'eos_token': '</s>'})
  11. tokenizer.from_pretrained.return_value.bos_token_id = 1
  12. tokenizer.from_pretrained.return_value.eos_token_id = 2
  13. return _helper