# datasets.py
# Copyright (c) Meta Platforms, Inc. and affiliates.
# This software may be used and distributed according to the terms of the Llama 2 Community License Agreement.
from dataclasses import dataclass
  4. @dataclass
  5. class samsum_dataset:
  6. dataset: str = "samsum_dataset"
  7. train_split: str = "train"
  8. test_split: str = "validation"
  9. @dataclass
  10. class grammar_dataset:
  11. dataset: str = "grammar_dataset"
  12. train_split: str = "src/llama_recipes/datasets/grammar_dataset/gtrain_10k.csv"
  13. test_split: str = "src/llama_recipes/datasets/grammar_dataset/grammar_validation.csv"
  14. @dataclass
  15. class alpaca_dataset:
  16. dataset: str = "alpaca_dataset"
  17. train_split: str = "train"
  18. test_split: str = "val"
  19. data_path: str = "src/llama_recipes/datasets/alpaca_data.json"
  20. @dataclass
  21. class custom_dataset:
  22. dataset: str = "custom_dataset"
  23. file: str = "examples/custom_dataset.py"
  24. train_split: str = "train"
  25. test_split: str = "validation"