diff --git a/OpenOrca.py b/OpenOrca.py index 47e77f6..3d4f215 100644 --- a/OpenOrca.py +++ b/OpenOrca.py @@ -21,8 +21,8 @@ class CustomDataset(DatasetBuilder): split_generators = [] for folder in folders: split_generators.extend([ - SplitGenerator(name=f'{folder}_train', gen_kwargs={'filepath': os.path.join(base_path, folder, f'{folder}-train.jsonl')}), - SplitGenerator(name=f'{folder}_test', gen_kwargs={'filepath': os.path.join(base_path, folder, f'{folder}-test.jsonl')}), + SplitGenerator(name=f'{folder.replace("-", "_")}_train', gen_kwargs={"filepath": f'{folder}/train.jsonl'}), + SplitGenerator(name=f'{folder.replace("-", "_")}_test', gen_kwargs={"filepath": f'{folder}/test.jsonl'}), ]) return split_generators