Question

我希望在目录中的所有文本文件上运行我的脚本，但是我遇到了很多麻烦。

这是我到目前为止的代码：

data = {}

date = ID = values = None


infile = "z140327b.txt"
outfile = "oz140327b.txt"

sample = 1

with open(infile) as datafile, open(outfile, 'w') as f2:
    for line in datafile:
        if line.lstrip().startswith('!'):
            date = line[1:].strip()
        elif line.lstrip().startswith('?'):
            sample = 2
        elif line.lstrip().startswith('@'):
            ID = line[1:].strip()
            data[ID] = {}
            data[ID]['date'] = date
            tedtime = ID[0:2] + ":" + ID[2:]
            str_1 = str(data[ID])
            f2.write(tedtime + ' ' + date + ',' + str(sample))
        elif line.strip():
            if not ID: 
                continue
            try:
                words = line.split()
                value = float(words[-1]) # last word
                unit = words[-2].lstrip('(').rstrip(')')
                item = {'value': value, 'unit': unit}
                key = ' '.join(words[:-2])
                data[ID][key] = item
            except (ValueError) as err:
                print("Could not parse this line:")
                print(line)
                continue
        else: # if 'empty' line
            ca_str = str(data[ID]['Contact Angle']['value'])
            f2.write(',' + ca_str + '\n')
            ID = None
    ca_str2 = str(data[ID]['Contact Angle']['value'])
    f2.write(',' + ca_str2 + '\n')

此时，我手动添加文件名（infile）和输出文件名（outfile）。我希望输出文件名与输入文件相同，前面加上＆＃39; o＆＃39;，如示例代码所示。

Answer 1

您可以使用glob来获取目录中的所有文件：

from glob import glob
files=glob('*.txt')
for filename in files:
    with open(filename,'r') as f, open('o'+filename,'w') as f1:
         .... 
         #read from f
         #write to f1

只需遍历每个文件名，执行您想要的操作，然后将其写入新文件。确保您的脚本是从您所在的目录运行的，或者您需要将路径传递给glob。

Answer 2

import glob
import os.path

def text_files(target_dir):
    """Return (infile, outfile) tuple for all *.txt files in target_dir."""
    text_files = os.path.join(target_dir, '*.txt')
    for fname in glob.glob(text_files):
        outfile = 'o' + os.path.basename(fname)
        outfile = os.path.join(target_dir, outfile)
        yield fname, outfile


# Search for text files in /tmp
for inf, outf in text_files("/tmp"):
    print inf, outf

在文件夹中的每个文本文件上运行脚本

2 个答案: