41 lines
1.2 KiB
Python
41 lines
1.2 KiB
Python
|
|
import json
|
|||
|
|
import os
|
|||
|
|
import glob
|
|||
|
|
|
|||
|
|
def convert_json_to_txt(json_file_path):
|
|||
|
|
"""将JSON文件转换为TXT文件,保持换行格式"""
|
|||
|
|
with open(json_file_path, 'r', encoding='utf-8') as f:
|
|||
|
|
data = json.load(f)
|
|||
|
|
|
|||
|
|
# 创建txt文件内容
|
|||
|
|
txt_content = data.get('title', '')
|
|||
|
|
txt_content += '\n\n' # title和content之间有两个换行
|
|||
|
|
txt_content += data.get('content', '')
|
|||
|
|
txt_content += '\n' # content和tag之间有一个换行
|
|||
|
|
txt_content += data.get('tag', '')
|
|||
|
|
|
|||
|
|
# 生成输出文件路径
|
|||
|
|
txt_file_path = os.path.splitext(json_file_path)[0] + '.txt'
|
|||
|
|
|
|||
|
|
# 写入txt文件
|
|||
|
|
with open(txt_file_path, 'w', encoding='utf-8') as f:
|
|||
|
|
f.write(txt_content)
|
|||
|
|
|
|||
|
|
print(f"已转换: {json_file_path} -> {txt_file_path}")
|
|||
|
|
|
|||
|
|
def main():
|
|||
|
|
"""查找并转换所有topic_*/article_judged.json文件"""
|
|||
|
|
# 查找所有topic文件夹下的article_judged.json文件
|
|||
|
|
json_files = glob.glob('topic_*/article_judged.json')
|
|||
|
|
|
|||
|
|
if not json_files:
|
|||
|
|
print("未找到符合条件的JSON文件")
|
|||
|
|
return
|
|||
|
|
|
|||
|
|
for json_file in json_files:
|
|||
|
|
convert_json_to_txt(json_file)
|
|||
|
|
|
|||
|
|
print(f"转换完成,共处理了 {len(json_files)} 个文件")
|
|||
|
|
|
|||
|
|
if __name__ == "__main__":
|
|||
|
|
main()
|