Python字符串和文件操作常用函数分析 - 哈喽比特

882次阅读 | 发布于6年以前
本文实例分析了Python字符串和文件操作常用函数。分享给大家供大家参考。具体如下：

    # -*- coding: UTF-8 -*-
    '''
    Created on 2010-12-27
    @author: sumory
    '''
    import itertools
    def a_containsAnyOf_b(seq,aset):
      '''判断seq中是否含有aset里的一个或者多个项
        seq可以是字符串或者列表
        aset应该是字符串或者列表'''
      for item in itertools.ifilter(aset.__contains__,seq):
        return True
      return False
    def a_allIn_b(seq,aset):
      '''判断seq中的所有项是否都在aset里
        seq可以是字符串或者列表
        aset应该是字符串或者列表'''
      for item in seq:
        if item not in aset:
          return False
      return True
    def a_containsAll_b(seq,aset):
      '''判断seq是否包含aset里的所有项
        seq可以是字符串或者列表
        aset应该是字符串或者列表
             任何一个set对象a，a.difference(b)等价于a-set(b),即返回a中所有不属于b的元素'''
      return not set(aset).difference(seq)

    import string
    #生成所有字符的可复用的字符串
    sumory_allchars=string.maketrans('','')
    def makefilter(keep):
      '''返回一个函数，此函数接受一个源字符串作为参数\
        并返回字符串的一个部分拷贝\
        此拷贝只包括keep中的字符，keep必须是一个普通的字符串\
        调用示例：makefilter('abca ')('abcdefgh ijkal cba')\
        在后面的字符串中保留前面出现的字符 abc a cba
      '''
      #按照sumory_allchars规则剔除sumory_allchars字符串中的keep里的字符
      #这里得到keep在sumory_allchars的补集
      deletechars=sumory_allchars.translate(sumory_allchars,keep)
      #生成并返回需要的过滤函数（作为闭包）
      def realdelete(sourseStr):
        return sourseStr.translate(sumory_allchars,deletechars)
      return realdelete
    def list_removesame(list):
      '''删除list中的重复项'''
      templist=[]
      for c in list:
        if c not in templist:
          templist.append(c)
      return templist
    def re_indent(str,numberofspace):
      '''
      缩进\
      将字符串str中按换行符划分并在每句前加上numberofspace个space\
      再组合成字符串'''
      spaces=numberofspace*' '
      lines=[spaces+line.strip() for line in str.splitlines()]
      return '\n'.join(lines)
    def replace_strby_dict(sourseStr,dict,marker='"',safe=False):
      '''使用字典替换源字符串中的被marker包裹的相应值'''
      #如果safe为True，那么字典中没找到key时不替换
      if safe:
        def lookup(w):
          return dict.get(w,w.join(marker*2))
       #w.join(marker*2)用marker包裹w
      #如果safe为False，那么字典中没找到key时抛异常\
      #若将dict[w]换为dict.get(w)则没找到时返回None
      else:
        def lookup(w):
          return dict[w]
      #根据marker切分源字符串
      splitparts=sourseStr.split(marker)
      #取出切分后的奇数项
      #因为切分后，列表中源字符串中marker包裹的项肯定位于基数部位
      #就算是'"first"s is one'这样的字符串也是如此
      #分割后的第0项为空串，第1项为first
      splitparts[1::2]=map(lookup,splitparts[1::2])
      return ''.join(splitparts)
    def simply_replace_strby_dict(sourseStr,dict,safe=True):
      '''根据dict内容替换sourseStr原串中$标记的子字符串\
      dict= {'name':'sumory','else':'default'}
      $$5 -> $5
      $else -> default
      ${name}'s method -> sumory's method
      '''
      style=string.Template(sourseStr)
      #如果safe，在dict中找不到的话不会替换，照样保留原串
      if safe:
        return style.safe_substitute(dict)
      #false，找不到会抛异常
      else:
        return style.substitute(dict)
    ##################################################
    def scanner(object,linehandler):
      '''用linehandler方法遍历object的每一项'''
      for line in object:
        linehandler(line)
    def printfilelines(path):
      '''读取path路径下的文件屏逐行打印'''
      fileobject=open(path,'r')#open不用放到try里
      try:
        for line in fileobject:
          print(line.rstrip('\n'))
      finally:
        fileobject.close()
    def writelisttofile(path,ilist):
      fileobject=open(path,'w')
      try:
        fileobject.writelines(ilist)
      finally:
        fileobject.close()
    import zipfile
    def listzipfilesinfo(path):
      z=zipfile.ZipFile(path,'r')
      try:
        for filename in z.namelist():
          bytes=z.read(filename)
          print('File:%s Size:%s'%(unicode(filename, 'cp936').decode('utf-8'),len(bytes)))
      finally:
        z.close()

    import os,fnmatch
    def list_all_files(root,patterns='*',single_level=False,yield_folders=False):
      '''列出目录（或者及其子目录下的文件）'''
      #分割模式到列表
      patterns=patterns.split(';')
      for path,subdirs,files in os.walk(root):
        if yield_folders:
          files.extend(subdirs)
        files.sort()
        for name in files:
          for pat in patterns:
            if fnmatch.fnmatch(name, pat):
              yield '/'.join(unicode(os.path.join(path,name),'cp936').split('\\'))
              break
        if single_level:
          break
    def swapextensions(root,before,after):
      if before[:1]!='.':
        before='.'+before
      extensionlen=-len(before)
      if after[:1]!='.':
        after='.'+after
      for path,subdirs,files in os.walk(root):
        for oldfile in files:
          if oldfile[extensionlen:]==before:
            oldfile=os.path.join(path,oldfile)
            newfile=oldfile[:extensionlen]+after
            os.rename(oldfile, newfile)
希望本文所述对大家的Python程序设计有所帮助。