skip to content
Liu Yang's Blog

[Script] Recursive File Search and Content Extraction for Code Files

/ 1 min read

这是我大二的某个时间写的脚本,因为相对有用,特此留存。

import os
from pathlib import Path
# Root directory whose tree will be scanned for source files.
workPath = "./work"
# Destination file that accumulates every extracted source file.
# Opened in append mode, so repeated runs add to the existing content.
totalSourceFile = open(
    "d:\\source.txt",
    mode="a+",
    encoding="utf-8",
)
def getCodeSource(filesdir, output=None):
    """Recursively append C++/Python/header sources under *filesdir* to a file.

    Every regular file whose name ends in ``.cpp``, ``.py`` or ``.h`` is
    printed to stdout and written to *output* as a header line carrying the
    file's base name, followed by the file's full text.

    Args:
        filesdir: Directory to scan; sub-directories are visited recursively.
        output: Writable text file object receiving the dump. When omitted,
            the module-level ``totalSourceFile`` is used.

    Raises:
        OSError: If a directory cannot be listed or a file cannot be opened.
        UnicodeDecodeError: If a matching file is not valid UTF-8.
    """
    if output is None:
        # Default to the shared output file opened at module level.
        output = totalSourceFile

    # Match on the file-name suffix. The earlier substring test used
    # ``filename.find('.py')`` without comparing to 0; ``find`` returns -1
    # (truthy) when the text is absent, so almost every file was accepted.
    wanted_suffixes = ('.cpp', '.py', '.h')

    # os.listdir returns entries in arbitrary order; sort for a stable dump.
    for fileBasename in sorted(os.listdir(filesdir)):
        filename = os.path.join(filesdir, fileBasename)

        if Path(filename).is_dir():
            # Directory: descend into it, writing to the same output.
            getCodeSource(filename, output)
            continue

        if not fileBasename.endswith(wanted_suffixes):
            # Not a cpp/py/h file (this also excludes .html and the like).
            continue

        print(filename)
        # Open before writing the header so an unreadable file leaves no
        # orphan header behind; ``with`` closes the handle even on error.
        with open(filename, encoding="utf-8") as sourcefile:
            # Header line with the file name.
            output.write('\n' + '文件名:' + fileBasename + '文件名' + '\n')
            # File content.
            output.write(sourcefile.read())
# Run the scan over the configured directory, then close the shared output
# file so buffered text is flushed to disk even if the scan fails part-way.
try:
    getCodeSource(workPath)
finally:
    totalSourceFile.close()