Update 2025-04-13_15:16:39

This commit is contained in:
2025-04-13 15:16:39 +02:00
commit 0a1a209dac
12 changed files with 986 additions and 0 deletions

11
raw_training_data.py Normal file
View File

@ -0,0 +1,11 @@
import os
# Concatenate every ".txt" file found directly in content_dir into a single
# UTF-8 text file, output_file, one newline-terminated entry per input file.
content_dir = "./content"
output_file = "raw_training_data.txt"

# Resolve the listing BEFORE opening the output: if content_dir is missing,
# os.listdir raises and an existing output file is left untouched instead of
# being truncated to zero bytes first.
# os.listdir returns names in arbitrary order, so sort them to make the
# generated file reproducible from run to run.
txt_files = sorted(
    name for name in os.listdir(content_dir) if name.endswith(".txt")
)

with open(output_file, "w", encoding="utf-8") as f:
    for txt_file in txt_files:
        txt_path = os.path.join(content_dir, txt_file)
        # A directory (or other non-regular entry) named "*.txt" cannot be
        # read as text; skip it rather than aborting the whole run.
        if not os.path.isfile(txt_path):
            continue
        with open(txt_path, "r", encoding="utf-8") as tf:
            text = tf.read().strip()
        # Each file's text is written followed by a single newline.
        # NOTE: strip() only trims leading/trailing whitespace, so a file that
        # contains internal newlines still spans several lines in the output.
        f.write(text + "\n")