Update 2025-04-13_15:16:39
This commit is contained in:
11
raw_training_data.py
Normal file
11
raw_training_data.py
Normal file
@ -0,0 +1,11 @@
|
||||
import os

# Default locations used when the script is run directly.
content_dir = "./content"
output_file = "raw_training_data.txt"


def build_raw_training_data(content_dir=content_dir, output_file=output_file):
    """Concatenate every ``.txt`` file in *content_dir* into *output_file*.

    Each source file becomes exactly one line of the output: surrounding
    whitespace is stripped and internal line breaks are replaced by single
    spaces, so the "one text per line" format holds even for multi-line
    inputs. Files that are empty after stripping are skipped.

    Args:
        content_dir: Directory scanned (non-recursively) for ``.txt`` files.
        output_file: Path of the UTF-8 text file to (over)write.

    Returns:
        The number of texts written to *output_file*.

    Raises:
        OSError: If *content_dir* cannot be listed or a file cannot be
            opened (e.g. ``FileNotFoundError`` for a missing directory).
        UnicodeDecodeError: If a source file is not valid UTF-8.
    """
    output_abs = os.path.abspath(output_file)
    written = 0
    with open(output_file, "w", encoding="utf-8") as f:
        # os.listdir() yields names in arbitrary order; sorting makes the
        # generated file reproducible across runs and machines.
        for txt_file in sorted(os.listdir(content_dir)):
            if not txt_file.endswith(".txt"):
                continue
            path = os.path.join(content_dir, txt_file)
            # Skip directories that merely end in ".txt", and never read the
            # output file back into itself if it lives inside content_dir.
            if not os.path.isfile(path) or os.path.abspath(path) == output_abs:
                continue
            with open(path, "r", encoding="utf-8") as tf:
                raw = tf.read()
            # Flatten the text to a single line; blank lines are dropped so
            # they do not turn into runs of spaces.
            pieces = (line.strip() for line in raw.splitlines())
            text = " ".join(piece for piece in pieces if piece)
            if not text:
                continue
            f.write(text + "\n")  # One text per line
            written += 1
    return written


if __name__ == "__main__":
    build_raw_training_data()
|
Reference in New Issue
Block a user