本文就是做一个笔记,可能看起来很乱,仅供参考

file

# 使用 with 会保证文件被关闭
with open(file) as f, open(file1) as f2 ...
    # do some thing with f & f1
    
    f.read() # 返回一个字符串,包含文件内所有内容
    f.read(n) # 返回文件中包含的 n 个字符/文字
    f.readline() # 读取下一个\n 之前的内容,并返回一个字符串
    f.readlines() # 读取文件,返回一个行字符串列表
    
    f.seak(n) # 光标移动到索引位置
    
# 对于临时文件这样处理比较好,如果下面用不到这个文件对象
for line in open(file): 
    print(line)
    
#循环遍历文件
f = open(file)
for line in f: #无需调用 readlines
    print(line)
    
#上面的代码可以简化为
print(line) for line in f

文件打开模式

1.r只读，r+读写，不创建
#w新建只写，w+新建读写，二者都会将文件内容清零
#以w方式打开，不能读出。w+可读写

2.**w+与r+区别：
#r+：可读可写，若文件不存在，报错；w+: 可读可写，若文件不存在，创建

3.r+与a+区别：
    fd = open("1.txt",'w+')  
    fd.write('123')  
    fd = open("1.txt",'r+')  
    fd.write('456')  
    fd = open("1.txt",'a+')  
    fd.write('789') 
# 结果：456789
# 说明r+进行了覆盖写

4.以a,a+的方式打开文件，附加方式打开
#a:附加写方式打开，不可读；读取报错
#a+: 附加读写方式打开
5. wb / wb+  rb / rb+
# 针对二进制文件

递归打印目录

import sys, os
# 用 walk 函数打印目录树
def walk(currdir):
    for (thisdir, subshere, fileshere) in os.walk(currdir):
        print('thisdir-->',thisdir) #该目录下的所有的文件夹
        print('subshere-->', subshere) #当前目录下所有的子目录
        print('fileshere-->',fileshere) #当前目录下所有的文件

# 利用自己写的递归函数遍历目录
def mylister(currdir):
    print('[' + currdir + ']')
    for file in os.listdir(currdir):
        path = os.path.join(currdir, file)
        if not os.path.isdir(path): #判断是否为目录
            print(path)
        else:
            mylister(path)

if __name__ == '__main__':
    mylister(sys.argv[1])
    walk(sys.argv[1])

logging模块

# 一共五种级别的日志
logging.critical(msg)
logging.error(msg)
logging.warning(msg)
logging.info(msg)
logging.debug(msg)


#级别排序为：CRITICAL > ERROR > WARNING > INFO > DEBUG > NOTSET

#默认为WARNING 级别低的不会显示在命令行

#更改日志输出级别
logging.root.setLevel(level=logging.INFO)

gzip, zipfile, tarfile 模块

zilib

[ ] zlib.compress(orginal_string) 对字符串进行加密
[ ] zlib.decompress(compressed_string) 对加密串解密

bz2

    基本使用方法同 zilib, 作用相同,加密方式不同而已

gzip

#压缩
content = "Lots of content here"
with gzip.open('file.txt.gz', 'wb') as f:
    f.write(content)

#解压
with gzip.open('file.txt.gz', 'rb') as f:
    file_content = f.read()
    print file_content
  
#将文件解压出来    
with gzip.open('file.txt.gz', 'rb') as f_in, open('file.txt', 'wb') as f_out:
    shutil.copyfileobj(f_in, f_out)    

#目录下应有 file.txt 文件，
with open("file.txt") as f:
    print f.read()

zipfile

f = zipfile.ZipFile('files.zip','w')

for file in glob.glob("*.txt"):
    f.write(file)
    # 移除压缩完的文件
    os.remove(file)
    
f.close()

f = zipfile.ZipFile('files.zip','r')
f.namelist() #查看压缩包内子文件名 -> []

for file in f.namelist():
    # 读取 file 文件中的内容
    print file, "content:", f.read(file)

f.close()

f.extract() #解压单个文件
f.extractall() # 解压全部文件

tarfile

# 压缩文件
f = tarfile.open("file.txt.tar", "w")
f.add("file.txt")


# 解压同 zipfile
f.extract() #解压单个文件
f.extractall() # 解压全部文件

shutil模块

高级文件夹操作

[ ] shutil.copy(src, dst) 将源文件复制到目标地址(包括文件权限)
[ ] shutil.copyfile(src, dst) 将源文件复制到目标地址(仅文件内容)
[ ] shutil.copytree(src, dst) 复制文件夹
[ ] os.removedirs(dst) 删除非空文件夹(必须是非空文件夹)
[ ] shutil.move 与 os.rename 功能差不多
[ ] shutil.get_archive_formats() 查看直接查看的压缩文件格式('bztar', 'gztar' ,'tar', 'xztar', 'zip')
[ ] shutil.make_archive("test_archive", "zip", "test_dir/") 压缩 test_dir 文件夹,以 zip 格式, 名字为 test_archive

glob模块

[ ] glob.glob('*.py') 获取当前目录下所有的 py 文件

glob 函数支持三种格式的语法:
    * 匹配单个或多个字符
    ? 匹配任意单个字符
    [] 匹配指定范围内的字符，如：[0-9]匹配数字。

json模块

[ ] json.loads(json_string/file) 如果是 json_string 会将 json 转换成 dict 对象,如果是 file, 会从文件中读取 json 转换成 dict 对象
[ ] json.dumps(obj, file) 如果有 file 对象,生成 json 文件,如果没有 file将 obj 变成 json 对象

os模块

[ ] os.remove(path) 或 os.unlink(path) ：删除指定路径的文件。路径可以是全名，也可以是当前工作目录下的路径。
[ ] os.removedirs：删除文件，并删除中间路径中的空文件夹
[ ] os.chdir(path)：将当前工作目录改变为指定的路径
[ ] os.getcwd()：返回当前的工作目录
[ ] os.curdir：表示当前目录的符号
[ ] os.rename(old, new)：重命名文件
[ ] os.renames(old, new)：重命名文件，如果中间路径的文件夹不存在，则创建文件夹
[ ] os.listdir(path)：返回给定目录下的所有文件夹和文件名，不包括 '.' 和 '..' 以及子文件夹下的目录。（'.' 和 '..' 分别指当前目录和父目录）
[ ] os.mkdir(name)：产生新文件夹
[ ] os.makedirs(name)：产生新文件夹，如果中间路径的文件夹不存在，则创建文件夹
[ ] os.listdir(os.curdir) 当前目录下的文件
[ ] os.linesep 系统换行符
[ ] os.sep 系统分隔符
[ ] os.pathsep 系统环境变量分隔符
[ ] os.environ 环境变量(实际是一个dict)

os.path模块:

[ ] os.path.isfile(path) ：检测一个路径是否为普通文件
[ ] os.path.isdir(path)：检测一个路径是否为文件夹
[ ] os.path.exists(path)：检测路径是否存在
[ ] os.path.isabs(path)：检测路径是否为绝对路径
[ ] os.path.split(path)：拆分一个路径为 (head, tail) 两部分
[ ] os.path.join(a, *p)：使用系统的路径分隔符，将各个部分合成一个路径
[ ] os.path.abspath()：返回路径的绝对路径
[ ] os.path.dirname(path)：返回路径中的文件夹部分
[ ] os.path.basename(path)：返回路径中的文件部分
[ ] os.path.splitext(path)：将路径与扩展名分开
[ ] os.path.expanduser(path)：展开 '~' 和 '~user'

dict模块

创建字典
    {key:value}
    dict([(key,value),
          (key,value)])
update
    dict[key] = value
    dict.get(key)
    
pop
    dict.pop(key)
    
in
    key in dict -> bool

list
    dict.keys()   #['cows', 'cats', 'dogs']
    dict.values() #[1, 3, 5]
    dict.items()  #[('cows', 1), ('cats', 3), ('dogs', 5)]

list

创建 list
    [value1,value2]
    list()
    list([value1,value2])

append
    list1 + list2 
    
double 
    list1 * 2 #[1, 2.0, 'hello', 1, 2.0, 'hello']

delect
    del list1[index]
    del list1[index:index]    

in 
    value in list1 -> bool
 
count
    a = [11, 12, 13, 12, 11]
    a.count(11)   # 2

index
    a.index(11)
    
append
    a.append(value)
    
extend
    a = [10, 11, 12, 11]
    a.extend([1, 2]) # a = [10, 11, 12, 11, 1, 2]

insert
    list1.insert(index,value)
    
remove 
    a.remove(11) #a = [10, 12, 11, 1, 2]

pop 
    a = [10, 11, 12, 13, 11]
    a.pop(2) # 12

tuple

创建 tuple
    t = (1,2,3,4)
    t = (1,) #(1,) tuple
    t = (1) #1 int
get 
    t[index]
    
del or update
    不可变

set

创建 set
    set()
    set([1,2,3,1]) #{1, 2, 3}
    {1,2,3,1} #{1, 2, 3}
    ----------
    {} # dict
    set() # set
    ----------
    frozenset([1, 2, 3, 'a', 1]) #不可变的集合

add
    t = {1, 2, 3}
    t.add(value) # {1, 2, 3, 5}
    t.update([4,5,6]) # {1, 2, 3, 4, 5, 6}
    
remove
    t.remove(value)

pop
    t.pop #删除任意一个元素

discard 同 remove ,移除不存在的元素不会报错
    
union
    a = {1, 2, 3, 4}
    b = {3, 4, 5, 6}
    a.union(b) #{1, 2, 3, 4, 5, 6}
    a | b #{1, 2, 3, 4, 5, 6}

intersection
    a.intersection(b) # {3, 4}
    a & b  # {3, 4}
    
difference
    a.difference(b) # {1, 2}
    a - b # {1, 2}
    ---a - b 与 b - a并不一样，b - a 返回的是返回 b 不在 a 的元素组成的集合---
    b.difference(a) # {5, 6}
    b - a  # {5, 6}
    
difference_update
    # 从a中去除所有属于b的元素
    a.difference_update(b)

切片

s = 'hello world'
s[1:3] #'el'
s[:3]  # 'hel'
s[1:-2] #'ello wor'
s[-3:]  #'rld'

Python 部分基础模块

file

文件打开模式

递归打印目录

logging模块

gzip, zipfile, tarfile 模块

zilib

bz2

gzip

zipfile

tarfile

shutil模块

glob模块

json模块

os模块

os.path模块:

dict模块

list

tuple

set

切片

你可能感兴趣的:(Python 部分基础模块)