doc(datasets): update docstrings and tests

This commit is contained in:
Sergey Penkovsky
2025-10-17 10:49:45 +03:00
parent 38c271ca3c
commit 613d784565
10 changed files with 563 additions and 177 deletions

View File

@@ -16,7 +16,7 @@ import torch
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
from llm.tokenizers import BPETokenizer
-from llm.training.dataset import TextDataset
+from llm.datasets.text_dataset import TextDataset
from llm.training.trainer import Trainer
from shared.data import (