1. 针对文本每一行开头存在空格的问题进行处理(去除行首空白字符)。
2. 读取文件夹中的 txt 文档,并将处理后的内容写回原文件。
#文本预处理5-去除文字开头的空格
import os
def left_align_text(text: str) -> str:
    """Strip leading whitespace from every line of ``text``.

    The text is split on newline characters; the number and order of
    lines is preserved and nothing is appended to any line.

    Args:
        text: The text to process.

    Returns:
        The text with the leading whitespace of each line removed.
    """
    # No ``ljust`` padding here: padding to the first line's width would
    # only append invisible trailing spaces and turn blank lines into runs
    # of spaces. Stripping alone already left-aligns the text.
    return '\n'.join(line.lstrip() for line in text.split('\n'))
def process_txt_files(folder_path):
    """Rewrite every ``.txt`` file directly inside ``folder_path`` in place.

    Each matching file is read as UTF-8, passed through
    ``left_align_text``, and overwritten with the result. Only the
    entries returned by ``os.listdir`` are considered; subdirectories
    are not descended into.

    Args:
        folder_path: Directory whose ``.txt`` files are processed.

    Raises:
        OSError: If the folder cannot be listed or a file cannot be
            read or written.
        UnicodeDecodeError: If a file is not valid UTF-8.
    """
    for filename in os.listdir(folder_path):
        if not filename.endswith('.txt'):
            continue
        file_path = os.path.join(folder_path, filename)
        # A directory may also carry a ".txt" name; opening it would raise
        # and abort the whole run, so only regular files are processed.
        if not os.path.isfile(file_path):
            continue
        with open(file_path, 'r', encoding='utf-8') as file:
            content = file.read()
        processed_content = left_align_text(content)
        # Write the processed content back to the original file.
        with open(file_path, 'w', encoding='utf-8') as file:
            file.write(processed_content)
# Replace with the path of the folder to process.
folder_path = "C:\\Users\\lenovo\\Desktop"

# Run the in-place rewrite only when executed as a script, so that merely
# importing this module does not modify any files on disk.
if __name__ == "__main__":
    process_txt_files(folder_path)
标签:content,text,lines,空格,file,path,folder,文本,预处理 From: https://blog.csdn.net/weixin_53389235/article/details/139833038