Merge pull request #17 from DL4DS/dataloaderfix
Browse files
code/modules/data_loader.py
CHANGED
@@ -39,12 +39,14 @@ class DataLoader:
|
|
39 |
chunk_size=config["splitter_options"]["chunk_size"],
|
40 |
chunk_overlap=config["splitter_options"]["chunk_overlap"],
|
41 |
separators=config["splitter_options"]["chunk_separators"],
|
|
|
42 |
)
|
43 |
else:
|
44 |
self.splitter = RecursiveCharacterTextSplitter(
|
45 |
chunk_size=config["splitter_options"]["chunk_size"],
|
46 |
chunk_overlap=config["splitter_options"]["chunk_overlap"],
|
47 |
separators=config["splitter_options"]["chunk_separators"],
|
|
|
48 |
)
|
49 |
else:
|
50 |
self.splitter = None
|
|
|
39 |
chunk_size=config["splitter_options"]["chunk_size"],
|
40 |
chunk_overlap=config["splitter_options"]["chunk_overlap"],
|
41 |
separators=config["splitter_options"]["chunk_separators"],
|
42 |
+
disallowed_special=()
|
43 |
)
|
44 |
else:
|
45 |
self.splitter = RecursiveCharacterTextSplitter(
|
46 |
chunk_size=config["splitter_options"]["chunk_size"],
|
47 |
chunk_overlap=config["splitter_options"]["chunk_overlap"],
|
48 |
separators=config["splitter_options"]["chunk_separators"],
|
49 |
+
disallowed_special=()
|
50 |
)
|
51 |
else:
|
52 |
self.splitter = None
|