Python - 使用模式匹配目录(正则表达式)

时间:2016-02-29 07:21:52

标签: python regex python-2.7

我写了一个循环,它忽略了包含.txt文件的所有子目录。

src = raw_input("Enter source disk location: ")
src = os.path.abspath(src)
dst = raw_input("Enter first destination to copy: ")
dst = os.path.abspath(dst)
dest = raw_input("Enter second destination to move : ")
dest = os.path.abspath(dest) 

path_patter = '(\S+)_(\d+)_(\d+)_(\d+)__(\d+)_(\d+)_(\d+)'

for dir, dirs, files in os.walk(src):
if any(f.endswith('.txt') for f in files):
    dirs[:] = []  # do not recurse into subdirectories
    continue  
files = [os.path.join(dir, f) for f in files ]

for f in files:

    part1 = os.path.dirname(f)
    part2 = os.path.dirname(os.path.dirname(part1))
    part3 = os.path.split(part1)[1]
    path_miss1 = os.path.join(dst, "missing_txt")
    path_miss = os.path.join(path_miss1, part3)
    path_missing = os.path.join(dest, "missing_txt")
    searchFileName = re.search(path_patter, part3)#### update

    if searchFileName:#####update
    try:
        if not os.path.exists(path_miss):
            os.makedirs(path_miss)
        else:
            pass

        if os.path.exists(path_miss):
            distutils.dir_util.copy_tree(part1, path_miss)
        else:
            debug_status += "missing_file\n"
            pass

        if (get_size(path_miss)) == 0:
            os.rmdir(path_miss)
        else:
            pass

        if not os.path.exists(path_missing):
            os.makedirs(path_missing)
        else:
            pass

        if os.path.exists(path_missing):
            shutil.move(part1, path_missing)
        else:
            pass

        if (get_size(path_missing)) == 0:
            os.rmdir(path_missing)
        else:
            pass
    except Exception:
        pass
    else:
    continue

在这种情况下,如何修改此代码以将目录名与正则表达式进行比较。 (它必须忽略带.txt文件的目录)

1 个答案:

答案 0 :(得分:0)

import os
import re

def createEscapedPattern(path,pattern):
    newPath = os.path.normpath(path)
    newPath = newPath.replace("\\","\\\\\\\\")
    return newPath + "\\\\\\\\" +  pattern

def createEscapedPath(path):
    newPath =  os.path.normpath(path)
    return newPath.replace("\\","\\\\")

src = 'C:\\Home\\test'
path_patter = '(\S+)_(\d+)_(\d+)_(\d+)__(\d+)_(\d+)_(\d+)$'
p = re.compile(createEscapedPattern(src,path_patter))
for dir, dirs, files in os.walk(src):
    if any(f.endswith('.txt') for f in files):
        dirs[:] = []
        continue
    if any(p.match(createEscapedPath(dir)) for f in files):
        for f in files:
            print createEscapedPath(dir + "/" + f)
    p = re.compile(createEscapedPattern(dir,path_patter))

我在这里做了几件事,并希望这个例子有所帮助

  • 我为windows fs写了这个,所以使用了两个路径转换函数。
  • 此脚本会忽略dirs与.txt文件一样实现它
  • 此脚本将从您启动脚本的目录开始,并且仅在模式匹配时才打印文件名。这是针对之前规则未忽略的所有子目录完成的。
  • 在python中使用了正则表达式,并为每个目录再次编译,因此得到:'目录/(\ S +)(\ d +)(\ d +)_(\ d +)__ (\ d +)(\ d +)(\ d +)$'