九、collection系统
先做个练习
练习一:元素分类
有如下值集合 [11,22,33,44,55,66,77,88,99,90...],将所有大于 66 的值保存至字典的第一个key中,将小于 66 的值保存至第二个key的值中。
即: {'k1': 大于66 , 'k2': 小于66}
1 #!/usr/bin/env python 2 # _*_ coding:utf-8 _*_ 3 ''' 4 将一个数字列表分割成字典,'k1'的值为小于66的值,'k2'的值为大于66的值 5 ''' 6 li = [11,22,33,44,55,66,77,88,99,90] 7 dic = {} 8 for ele in li: 9 #先判断是否小于66 10 if ele < 66: 11 #判断是否有'k1'的键,如果有就追加 12 if 'k1' in dic.keys(): 13 dic['k1'].append(ele) 14 else: 15 #创建只有一个元素的列表 16 dic['k1'] = [ele,] 17 else: 18 if 'k2' in dic.keys(): 19 dic['k2'].append(ele); 20 else: 21 dic['k2'] = [ele,] 22 23 print dic 24 25 #打印出字典的键和值,值占4个字符,前面用’*‘填充,打印时要把数值转换成字符串形式 26 for k in dic.keys(): 27 print k 28 if type(dic[k]) == list: 29 for i in dic[k]: 30 print str(i).rjust(4,'*')
练习二:将文件中读出的内容转换成字典
已知文件内容为
alex|123|1
eric|123|1
john|123|1
转换成字典形式
dic = {
'alex':[123,1]
'eric':[123,1]
'john':[123,1]
}
1 #!/usr/bin/env python 2 # _*_ coding:utf-8 _*_ 3 4 ''' 5 想要得到的效果 6 dic = { 7 'alex':[123,1] 8 'eric':[123,1] 9 'john':[123,1] 10 } 11 ''' 12 13 #打开文件,读取文件内容,用的with as,这样可以保证最后文件会被关闭 14 with open('log.txt') as f: 15 #将文件读出来赋值给一个列表 16 line_list = f.readlines(); 17 print line_list 18 dic = {} 19 #遍历列表,将每行再分割成列表 20 for line in line_list: 21 line = line.strip(); 22 ele_list = line.split('|') 23 #把姓名做成字典的key,并把后面所有元素当做这个key的值,这里用的是[1:],取出除了0外,所有的值 24 dic[ele_list[0]] = ele_list[1:] 25 26 #下面是遍历字典的两种方法,推荐使用第一种,因为在字典内容少的时候两种方法都可以 27 #但当字典内容多的时候,第二种方法的字典会先值转换成列表,会消耗时间和占用内存 28 #方法一 29 for k in dic.keys(): 30 print k,dic[k] 31 32 for ele in dic: 33 print ele,dic[ele]; 34 35 #方法二 36 for k,v in dic.items(): 37 print k,v
1、计数器(counter)
Counter是对字典类型的补充,用于追踪值的出现次数
ps:具备字典的所有功能+自己的功能
1 >>> import collections 2 NameError: name 'Counter' is not defined 3 >>> c = collections.Counter('asdfasdfasdfasdf') 4 >>> c 5 Counter({'a': 4, 's': 4, 'd': 4, 'f': 4}) 6 >>>
1 ######################################################################## 2 ### Counter 3 ######################################################################## 4 5 class Counter(dict): 6 '''Dict subclass for counting hashable items. Sometimes called a bag 7 or multiset. Elements are stored as dictionary keys and their counts 8 are stored as dictionary values. 9 10 >>> c = Counter('abcdeabcdabcaba') # count elements from a string 11 12 >>> c.most_common(3) # three most common elements 13 [('a', 5), ('b', 4), ('c', 3)] 14 >>> sorted(c) # list all unique elements 15 ['a', 'b', 'c', 'd', 'e'] 16 >>> ''.join(sorted(c.elements())) # list elements with repetitions 17 'aaaaabbbbcccdde' 18 >>> sum(c.values()) # total of all counts 19 20 >>> c['a'] # count of letter 'a' 21 >>> for elem in 'shazam': # update counts from an iterable 22 ... c[elem] += 1 # by adding 1 to each element's count 23 >>> c['a'] # now there are seven 'a' 24 >>> del c['b'] # remove all 'b' 25 >>> c['b'] # now there are zero 'b' 26 27 >>> d = Counter('simsalabim') # make another counter 28 >>> c.update(d) # add in the second counter 29 >>> c['a'] # now there are nine 'a' 30 31 >>> c.clear() # empty the counter 32 >>> c 33 Counter() 34 35 Note: If a count is set to zero or reduced to zero, it will remain 36 in the counter until the entry is deleted or the counter is cleared: 37 38 >>> c = Counter('aaabbc') 39 >>> c['b'] -= 2 # reduce the count of 'b' by two 40 >>> c.most_common() # 'b' is still in, but its count is zero 41 [('a', 3), ('c', 1), ('b', 0)] 42 43 ''' 44 # References: 45 # http://en.wikipedia.org/wiki/Multiset 46 # http://www.gnu.org/software/smalltalk/manual-base/html_node/Bag.html 47 # http://www.demo2s.com/Tutorial/Cpp/0380__set-multiset/Catalog0380__set-multiset.htm 48 # http://code.activestate.com/recipes/259174/ 49 # Knuth, TAOCP Vol. II section 4.6.3 50 51 def __init__(self, iterable=None, **kwds): 52 '''Create a new, empty Counter object. And if given, count elements 53 from an input iterable. Or, initialize the count from another mapping 54 of elements to their counts. 55 56 >>> c = Counter() # a new, empty counter 57 >>> c = Counter('gallahad') # a new counter from an iterable 58 >>> c = Counter({'a': 4, 'b': 2}) # a new counter from a mapping 59 >>> c = Counter(a=4, b=2) # a new counter from keyword args 60 61 ''' 62 super(Counter, self).__init__() 63 self.update(iterable, **kwds) 64 65 def __missing__(self, key): 66 """ 对于不存在的元素,返回计数器为0 67 >>> c 68 Counter({'a': 12, 'f': 10, 'd': 9, 's': 9, 'c': 3, 'g': 3, 'e': 1}) 69 >>> c['a'] 70 12 71 >>> c['z'] 72 0 73 #原生字典会抛异常 74 >>> a = {1:2,3:4} 75 >>> a[1] 76 2 77 >>> a[55] 78 Traceback (most recent call last): 79 File "", line 1, in 80 KeyError: 55 81 >>> 82 """ 83 'The count of elements not in the Counter is zero.' 84 # Needed so that self[missing_item] does not raise KeyError 85 return 0 86 87 def most_common(self, n=None): 88 """ 列出n个出现次数最多的元素 默认最从多到少排序的,所以看起来就像是截取了前几个元素 89 >>> c = collections.Counter('asdfasdfasdfasdfaaaacccsdfefgasdfasdfgasdfasdgf') 90 >>> c 91 Counter({'a': 12, 'f': 10, 'd': 9, 's': 9, 'c': 3, 'g': 3, 'e': 1}) 92 >>> c.most_common(3) 93 [('a', 12), ('f', 10), ('d', 9)] 94 >>> 95 """ 96 '''List the n most common elements and their counts from the most 97 common to the least. If n is None, then list all element counts. 98 99 >>> Counter('abcdeabcdabcaba').most_common(3) 100 [('a', 5), ('b', 4), ('c', 3)] 101 102 ''' 103 # Emulate Bag.sortedByCount from Smalltalk 104 if n is None: 105 return sorted(self.iteritems(), key=_itemgetter(1), reverse=True) 106 return _heapq.nlargest(n, self.iteritems(), key=_itemgetter(1)) 107 108 def elements(self): 109 """ 计数器中的所有元素,注:此处非所有元素集合,而是包含所有元素集合的迭代器 110 >>> c = collections.Counter('aaaabbbcc') 111 >>> c 112 Counter({'a': 4, 'b': 3, 'c': 2}) 113 #因为是迭代器,所以要用循环取出 114 >>> c.elements() 115116 >>> for ele in c.elements():print ele; 117 ... 118 a 119 a 120 a 121 a 122 c 123 c 124 b 125 b 126 b 127 >>> 128 """ 129 '''Iterator over elements repeating each as many times as its count. 130 131 >>> c = Counter('ABCABC') 132 >>> sorted(c.elements()) 133 ['A', 'A', 'B', 'B', 'C', 'C'] 134 135 # Knuth's example for prime factors of 1836: 2**2 * 3**3 * 17**1 136 >>> prime_factors = Counter({2: 2, 3: 3, 17: 1}) 137 >>> product = 1 138 >>> for factor in prime_factors.elements(): # loop over factors 139 ... product *= factor # and multiply them 140 >>> product 141 142 Note, if an element's count has been set to zero or is a negative 143 number, elements() will ignore it. 144 145 ''' 146 # Emulate Bag.do from Smalltalk and Multiset.begin from C++. 147 return _chain.from_iterable(_starmap(_repeat, self.iteritems())) 148 149 # Override dict methods where necessary 150 151 @classmethod 152 def fromkeys(cls, iterable, v=None): 153 # There is no equivalent method for counters because setting v=1 154 # means that no element can have a count greater than one. 155 raise NotImplementedError( 156 'Counter.fromkeys() is undefined. Use Counter(iterable) instead.') 157 158 def update(self, iterable=None, **kwds): 159 """ 更新计数器,其实就是增加;如果原来没有,则新建,如果有则加一 160 >>> c 161 Counter({'a': 4, 'b': 3, 'c': 2}) 162 >>> c.update('a') 163 >>> c 164 Counter({'a': 5, 'b': 3, 'c': 2}) 165 >>> d = collections.Counter('ccddee') 166 >>> c.update(d) 167 >>> c 168 Counter({'a': 5, 'c': 4, 'b': 3, 'e': 2, 'd': 2}) 169 >>> 170 """ 171 '''Like dict.update() but add counts instead of replacing them. 172 173 Source can be an iterable, a dictionary, or another Counter instance. 174 175 >>> c = Counter('which') 176 >>> c.update('witch') # add elements from another iterable 177 >>> d = Counter('watch') 178 >>> c.update(d) # add elements from another counter 179 >>> c['h'] # four 'h' in which, witch, and watch 180 181 ''' 182 # The regular dict.update() operation makes no sense here because the 183 # replace behavior results in the some of original untouched counts 184 # being mixed-in with all of the other counts for a mismash that 185 # doesn't have a straight-forward interpretation in most counting 186 # contexts. Instead, we implement straight-addition. Both the inputs 187 # and outputs are allowed to contain zero and negative counts. 188 189 if iterable is not None: 190 if isinstance(iterable, Mapping): 191 if self: 192 self_get = self.get 193 for elem, count in iterable.iteritems(): 194 self[elem] = self_get(elem, 0) + count 195 else: 196 super(Counter, self).update(iterable) # fast path when counter is empty 197 else: 198 self_get = self.get 199 for elem in iterable: 200 self[elem] = self_get(elem, 0) + 1 201 if kwds: 202 self.update(kwds) 203 204 def subtract(self, iterable=None, **kwds): 205 """ 相减,原来的计数器中的每一个元素的数量减去后添加的元素的数量 206 >>> c = collections.Counter('aabbcc') 207 >>> c 208 Counter({'a': 2, 'c': 2, 'b': 2}) 209 >>> c.subtract('a') 210 >>> c 211 Counter({'c': 2, 'b': 2, 'a': 1}) 212 >>> 213 """ 214 '''Like dict.update() but subtracts counts instead of replacing them. 215 Counts can be reduced below zero. Both the inputs and outputs are 216 allowed to contain zero and negative counts. 217 218 Source can be an iterable, a dictionary, or another Counter instance. 219 220 >>> c = Counter('which') 221 >>> c.subtract('witch') # subtract elements from another iterable 222 >>> c.subtract(Counter('watch')) # subtract elements from another counter 223 >>> c['h'] # 2 in which, minus 1 in witch, minus 1 in watch 224 >>> c['w'] # 1 in which, minus 1 in witch, minus 1 in watch 225 -1 226 227 ''' 228 if iterable is not None: 229 self_get = self.get 230 if isinstance(iterable, Mapping): 231 for elem, count in iterable.items(): 232 self[elem] = self_get(elem, 0) - count 233 else: 234 for elem in iterable: 235 self[elem] = self_get(elem, 0) - 1 236 if kwds: 237 self.subtract(kwds) 238 239 def copy(self): 240 """ 拷贝 """ 241 'Return a shallow copy.' 242 return self.__class__(self) 243 244 def __reduce__(self): 245 """ 返回一个元组(类型,元组) """ 246 return self.__class__, (dict(self),) 247 248 def __delitem__(self, elem): 249 """ 删除元素 """ 250 'Like dict.__delitem__() but does not raise KeyError for missing values.' 251 if elem in self: 252 super(Counter, self).__delitem__(elem) 253 254 def __repr__(self): 255 if not self: 256 return '%s()' % self.__class__.__name__ 257 items = ', '.join(map('%r: %r'.__mod__, self.most_common())) 258 return '%s({%s})' % (self.__class__.__name__, items) 259 260 # Multiset-style mathematical operations discussed in: 261 # Knuth TAOCP Volume II section 4.6.3 exercise 19 262 # and at http://en.wikipedia.org/wiki/Multiset 263 # 264 # Outputs guaranteed to only include positive counts. 265 # 266 # To strip negative and zero counts, add-in an empty counter: 267 # c += Counter() 268 269 def __add__(self, other): 270 '''Add counts from two counters. 271 272 >>> Counter('abbb') + Counter('bcc') 273 Counter({'b': 4, 'c': 2, 'a': 1}) 274 275 ''' 276 if not isinstance(other, Counter): 277 return NotImplemented 278 result = Counter() 279 for elem, count in self.items(): 280 newcount = count + other[elem] 281 if newcount > 0: 282 result[elem] = newcount 283 for elem, count in other.items(): 284 if elem not in self and count > 0: 285 result[elem] = count 286 return result 287 288 def __sub__(self, other): 289 ''' Subtract count, but keep only results with positive counts. 290 291 >>> Counter('abbbc') - Counter('bccd') 292 Counter({'b': 2, 'a': 1}) 293 294 ''' 295 if not isinstance(other, Counter): 296 return NotImplemented 297 result = Counter() 298 for elem, count in self.items(): 299 newcount = count - other[elem] 300 if newcount > 0: 301 result[elem] = newcount 302 for elem, count in other.items(): 303 if elem not in self and count < 0: 304 result[elem] = 0 - count 305 return result 306 307 def __or__(self, other): 308 '''Union is the maximum of value in either of the input counters. 309 310 >>> Counter('abbb') | Counter('bcc') 311 Counter({'b': 3, 'c': 2, 'a': 1}) 312 313 ''' 314 if not isinstance(other, Counter): 315 return NotImplemented 316 result = Counter() 317 for elem, count in self.items(): 318 other_count = other[elem] 319 newcount = other_count if count < other_count else count 320 if newcount > 0: 321 result[elem] = newcount 322 for elem, count in other.items(): 323 if elem not in self and count > 0: 324 result[elem] = count 325 return result 326 327 def __and__(self, other): 328 ''' Intersection is the minimum of corresponding counts. 329 330 >>> Counter('abbb') & Counter('bcc') 331 Counter({'b': 1}) 332 333 ''' 334 if not isinstance(other, Counter): 335 return NotImplemented 336 result = Counter() 337 for elem, count in self.items(): 338 other_count = other[elem] 339 newcount = count if count < other_count else other_count 340 if newcount > 0: 341 result[elem] = newcount 342 return result
也可以传入列表或元组
1 >>> li = [11,22,33,44,11,22,22] 2 >>> c1 = collections.Counter(li) 3 >>> c1 4 Counter({22: 3, 11: 2, 33: 1, 44: 1}) 5 >>>
2、有序字典(orderedDict)
orderedDict是对字典类型的补充,他记住了字典元素添加的顺序
有序字典和原生字典的使用完全一样
唯一的区别,orderedDict在内部做了一个排序,它其实是在内部维护一个列表,因为列表是有序的
1 class OrderedDict(dict): 2 'Dictionary that remembers insertion order' 3 # An inherited dict maps keys to values. 4 # The inherited dict provides __getitem__, __len__, __contains__, and get. 5 # The remaining methods are order-aware. 6 # Big-O running times for all methods are the same as regular dictionaries. 7 8 # The internal self.__map dict maps keys to links in a doubly linked list. 9 # The circular doubly linked list starts and ends with a sentinel element. 10 # The sentinel element never gets deleted (this simplifies the algorithm). 11 # Each link is stored as a list of length three: [PREV, NEXT, KEY]. 12 13 def __init__(self, *args, **kwds): 14 '''Initialize an ordered dictionary. The signature is the same as 15 regular dictionaries, but keyword arguments are not recommended because 16 their insertion order is arbitrary. 17 18 ''' 19 if len(args) > 1: 20 raise TypeError('expected at most 1 arguments, got %d' % len(args)) 21 try: 22 self.__root 23 except AttributeError: 24 self.__root = root = [] # sentinel node 25 root[:] = [root, root, None] 26 self.__map = {} 27 self.__update(*args, **kwds) 28 29 def __setitem__(self, key, value, dict_setitem=dict.__setitem__): 30 'od.__setitem__(i, y) <==> od[i]=y' 31 # Setting a new item creates a new link at the end of the linked list, 32 # and the inherited dictionary is updated with the new key/value pair. 33 if key not in self: 34 root = self.__root 35 last = root[0] 36 last[1] = root[0] = self.__map[key] = [last, root, key] 37 return dict_setitem(self, key, value) 38 39 def __delitem__(self, key, dict_delitem=dict.__delitem__): 40 'od.__delitem__(y) <==> del od[y]' 41 # Deleting an existing item uses self.__map to find the link which gets 42 # removed by updating the links in the predecessor and successor nodes. 43 dict_delitem(self, key) 44 link_prev, link_next, _ = self.__map.pop(key) 45 link_prev[1] = link_next # update link_prev[NEXT] 46 link_next[0] = link_prev # update link_next[PREV] 47 48 def __iter__(self): 49 'od.__iter__() <==> iter(od)' 50 # Traverse the linked list in order. 51 root = self.__root 52 curr = root[1] # start at the first node 53 while curr is not root: 54 yield curr[2] # yield the curr[KEY] 55 curr = curr[1] # move to next node 56 57 def __reversed__(self): 58 'od.__reversed__() <==> reversed(od)' 59 # Traverse the linked list in reverse order. 60 root = self.__root 61 curr = root[0] # start at the last node 62 while curr is not root: 63 yield curr[2] # yield the curr[KEY] 64 curr = curr[0] # move to previous node 65 66 def clear(self): 67 'od.clear() -> None. Remove all items from od.' 68 root = self.__root 69 root[:] = [root, root, None] 70 self.__map.clear() 71 dict.clear(self) 72 73 # -- the following methods do not depend on the internal structure -- 74 75 def keys(self): 76 'od.keys() -> list of keys in od' 77 return list(self) 78 79 def values(self): 80 'od.values() -> list of values in od' 81 return [self[key] for key in self] 82 83 def items(self): 84 'od.items() -> list of (key, value) pairs in od' 85 return [(key, self[key]) for key in self] 86 87 def iterkeys(self): 88 'od.iterkeys() -> an iterator over the keys in od' 89 return iter(self) 90 91 def itervalues(self): 92 'od.itervalues -> an iterator over the values in od' 93 for k in self: 94 yield self[k] 95 96 def iteritems(self): 97 'od.iteritems -> an iterator over the (key, value) pairs in od' 98 for k in self: 99 yield (k, self[k]) 100 101 update = MutableMapping.update 102 103 __update = update # let subclasses override update without breaking __init__ 104 105 __marker = object() 106 107 def pop(self, key, default=__marker): 108 '''od.pop(k[,d]) -> v, remove specified key and return the corresponding 109 value. If key is not found, d is returned if given, otherwise KeyError 110 is raised. 111 112 ''' 113 if key in self: 114 result = self[key] 115 del self[key] 116 return result 117 if default is self.__marker: 118 raise KeyError(key) 119 return default 120 121 def setdefault(self, key, default=None): 122 'od.setdefault(k[,d]) -> od.get(k,d), also set od[k]=d if k not in od' 123 if key in self: 124 return self[key] 125 self[key] = default 126 return default 127 128 def popitem(self, last=True): 129 '''od.popitem() -> (k, v), return and remove a (key, value) pair. 130 Pairs are returned in LIFO order if last is true or FIFO order if false. 131 132 ''' 133 if not self: 134 raise KeyError('dictionary is empty') 135 key = next(reversed(self) if last else iter(self)) 136 value = self.pop(key) 137 return key, value 138 139 def __repr__(self, _repr_running={}): 140 'od.__repr__() <==> repr(od)' 141 call_key = id(self), _get_ident() 142 if call_key in _repr_running: 143 return '...' 144 _repr_running[call_key] = 1 145 try: 146 if not self: 147 return '%s()' % (self.__class__.__name__,) 148 return '%s(%r)' % (self.__class__.__name__, self.items()) 149 finally: 150 del _repr_running[call_key] 151 152 def __reduce__(self): 153 'Return state information for pickling' 154 items = [[k, self[k]] for k in self] 155 inst_dict = vars(self).copy() 156 for k in vars(OrderedDict()): 157 inst_dict.pop(k, None) 158 if inst_dict: 159 return (self.__class__, (items,), inst_dict) 160 return self.__class__, (items,) 161 162 def copy(self): 163 'od.copy() -> a shallow copy of od' 164 return self.__class__(self) 165 166 @classmethod 167 def fromkeys(cls, iterable, value=None): 168 '''OD.fromkeys(S[, v]) -> New ordered dictionary with keys from S. 169 If not specified, the value defaults to None. 170 171 ''' 172 self = cls() 173 for key in iterable: 174 self[key] = value 175 return self 176 177 def __eq__(self, other): 178 '''od.__eq__(y) <==> od==y. Comparison to another OD is order-sensitive 179 while comparison to a regular mapping is order-insensitive. 180 181 ''' 182 if isinstance(other, OrderedDict): 183 return dict.__eq__(self, other) and all(_imap(_eq, self, other)) 184 return dict.__eq__(self, other) 185 186 def __ne__(self, other): 187 'od.__ne__(y) <==> od!=y' 188 return not self == other 189 190 # -- the following methods support python 3.x style dictionary views -- 191 192 def viewkeys(self): 193 "od.viewkeys() -> a set-like object providing a view on od's keys" 194 return KeysView(self) 195 196 def viewvalues(self): 197 "od.viewvalues() -> an object providing a view on od's values" 198 return ValuesView(self) 199 200 def viewitems(self): 201 "od.viewitems() -> a set-like object providing a view on od's items" 202 return ItemsView(self) 203 204 OrderedDict
3、默认字典(defaultdict)
学习需求:
'''
将一个数字列表分割成字典,'k1'的值为小于66的值,'k2'的值为大于66的值
li = [11,22,33,44,55,66,77,88,99,90]
'''
1 li = [11,22,33,44,55,66,77,88,99,90] 2 dic = {} 3 for ele in li: 4 if ele < 66: 5 if 'k1' in dic.keys(): 6 dic['k1'].append(ele) 7 else: 8 #创建只有一个元素的列表 9 dic['k1'] = [ele,] 10 else: 11 if 'k2' in dic.keys(): 12 dic['k2'].append(ele); 13 else: 14 dic['k2'] = [ele,]
1 from collections import Counter,defaultdict; 2 li = [11,22,33,44,55,66,77,88,99,90,87] 3 my_dic = defaultdict(list) 4 for ele in li: 5 if ele > 66: 6 my_dic['k2'].append(ele) 7 else: 8 my_dic['k1'].append(ele)
defaultdict是对字典类型的补充,他默认给字典的值设置了一个类型,字典默认的是None,可以给字典设置一个默认类型,比如列表,元组等
1 class defaultdict(dict): 2 """ 3 defaultdict(default_factory[, ...]) --> dict with default factory 4 5 The default factory is called without arguments to produce 6 a new value when a key is not present, in __getitem__ only. 7 A defaultdict compares equal to a dict with the same items. 8 All remaining arguments are treated the same as if they were 9 passed to the dict constructor, including keyword arguments. 10 """ 11 def copy(self): # real signature unknown; restored from __doc__ 12 """ D.copy() -> a shallow copy of D. """ 13 pass 14 15 def __copy__(self, *args, **kwargs): # real signature unknown 16 """ D.copy() -> a shallow copy of D. """ 17 pass 18 19 def __getattribute__(self, name): # real signature unknown; restored from __doc__ 20 """ x.__getattribute__('name') <==> x.name """ 21 pass 22 23 def __init__(self, default_factory=None, **kwargs): # known case of _collections.defaultdict.__init__ 24 """ 25 defaultdict(default_factory[, ...]) --> dict with default factory 26 27 The default factory is called without arguments to produce 28 a new value when a key is not present, in __getitem__ only. 29 A defaultdict compares equal to a dict with the same items. 30 All remaining arguments are treated the same as if they were 31 passed to the dict constructor, including keyword arguments. 32 33 # (copied from class doc) 34 """ 35 pass 36 37 def __missing__(self, key): # real signature unknown; restored from __doc__ 38 """ 39 __missing__(key) # Called by __getitem__ for missing key; pseudo-code: 40 if self.default_factory is None: raise KeyError((key,)) 41 self[key] = value = self.default_factory() 42 return value 43 """ 44 pass 45 46 def __reduce__(self, *args, **kwargs): # real signature unknown 47 """ Return state information for pickling. """ 48 pass 49 50 def __repr__(self): # real signature unknown; restored from __doc__ 51 """ x.__repr__() <==> repr(x) """ 52 pass 53 54 default_factory = property(lambda self: object(), lambda self, v: None, lambda self: None) # default 55 """Factory for default value called by __missing__().""" 56 57 defaultdict
4、可命名元组(namedtuple)
创建一个扩展tuple的类,Mytuple——类名
1 #通过可命名元组创建一个类 2 >>> Mytuple = collections.namedtuple('Mytuple',['x','y']) 3 #通过这个类创建对象 4 >>> new_tuple = Mytuple(1,2) 5 >>> new_tuple 6 Mytuple(x=1, y=2) 7 #可以通过名称来调用 8 >>> new_tuple.x 9 1 10 >>> new_tuple.y 11 2 12 >>> old_tuple = ([1,2]) 13 >>> old_tuple 14 [1, 2] 15 >>>
1 class Mytuple(__builtin__.tuple) 2 | Mytuple(x, y) 3 | 4 | Method resolution order: 5 | Mytuple 6 | __builtin__.tuple 7 | __builtin__.object 8 | 9 | Methods defined here: 10 | 11 | __getnewargs__(self) 12 | Return self as a plain tuple. Used by copy and pickle. 13 | 14 | __getstate__(self) 15 | Exclude the OrderedDict from pickling 16 | 17 | __repr__(self) 18 | Return a nicely formatted representation string 19 | 20 | _asdict(self) 21 | Return a new OrderedDict which maps field names to their values 22 | 23 | _replace(_self, **kwds) 24 | Return a new Mytuple object replacing specified fields with new values 25 | 26 | ---------------------------------------------------------------------- 27 | Class methods defined here: 28 | 29 | _make(cls, iterable, new=in method __new__ of type object>, len= in function len>) from __builtin__.type 30 | Make a new Mytuple object from a sequence or iterable 31 | 32 | ---------------------------------------------------------------------- 33 | Static methods defined here: 34 | 35 | __new__(_cls, x, y) 36 | Create new instance of Mytuple(x, y) 37 | 38 | ---------------------------------------------------------------------- 39 | Data descriptors defined here: 40 | 41 | __dict__ 42 | Return a new OrderedDict which maps field names to their values 43 | 44 | x 45 | Alias for field number 0 46 | 47 | y 48 | Alias for field number 1 49 | 50 | ---------------------------------------------------------------------- 51 | Data and other attributes defined here: 52 | 53 | _fields = ('x', 'y') 54 | 55 | ---------------------------------------------------------------------- 56 | Methods inherited from __builtin__.tuple: 57 | 58 | __add__(...) 59 | x.__add__(y) <==> x+y 60 | 61 | __contains__(...) 62 | x.__contains__(y) <==> y in x 63 | 64 | __eq__(...) 65 | x.__eq__(y) <==> x==y 66 | 67 | __ge__(...) 68 | x.__ge__(y) <==> x>=y 69 | 70 | __getattribute__(...) 71 | x.__getattribute__('name') <==> x.name 72 | 73 | __getitem__(...) 74 | x.__getitem__(y) <==> x[y] 75 | 76 | __getslice__(...) 77 | x.__getslice__(i, j) <==> x[i:j] 78 | 79 | Use of negative indices is not supported. 80 | 81 | __gt__(...) 82 | x.__gt__(y) <==> x>y 83 | 84 | __hash__(...) 85 | x.__hash__() <==> hash(x) 86 | 87 | __iter__(...) 88 | x.__iter__() <==> iter(x) 89 | 90 | __le__(...) 91 | x.__le__(y) <==> x<=y 92 | 93 | __len__(...) 94 | x.__len__() <==> len(x) 95 | 96 | __lt__(...) 97 | x.__lt__(y) <==> x<y 98 | 99 | __mul__(...) 100 | x.__mul__(n) <==> x*n 101 | 102 | __ne__(...) 103 | x.__ne__(y) <==> x!=y 104 | 105 | __rmul__(...) 106 | x.__rmul__(n) <==> n*x 107 | 108 | __sizeof__(...) 109 | T.__sizeof__() -- size of T in memory, in bytes 110 | 111 | count(...) 112 | T.count(value) -> integer -- return number of occurrences of value 113 | 114 | index(...) 115 | T.index(value, [start, [stop]]) -> integer -- return first index of value. 116 | Raises ValueError if the value is not present.
5、双向队列(deque)
两边都可以取,两边都可以插入,这就有一个线程安全的问题,谁先得到就会有一个线程锁,防止抢占资源
一个线程安全的双向队列
1 class deque(object): 2 """ 3 deque([iterable[, maxlen]]) --> deque object 4 5 Build an ordered collection with optimized access from its endpoints. 6 """ 7 def append(self, *args, **kwargs): # real signature unknown 8 """ 追加元素到队列 9 >>> q = collections.deque() 10 >>> q.append(1) 11 >>> q.append(11) 12 >>> q.append(111) 13 >>> q.append(1111) 14 >>> q 15 deque([1, 11, 111, 1111]) 16 >>> 17 """ 18 """ Add an element to the right side of the deque. """ 19 pass 20 21 def appendleft(self, *args, **kwargs): # real signature unknown 22 """ 加入元素到队列的左边 23 >>> q 24 deque([1, 11, 111]) 25 >>> q.appendleft(2) 26 >>> q 27 deque([2, 1, 11, 111]) 28 >>> 29 """ 30 """ Add an element to the left side of the deque. """ 31 pass 32 33 def clear(self, *args, **kwargs): # real signature unknown 34 """ 清除队列中所有元素 35 >>> q 36 deque([2, 2, 1, 11, 111]) 37 >>> q.clear() 38 >>> q 39 deque([]) 40 >>> 41 """ 42 """ Remove all elements from the deque. """ 43 pass 44 45 def count(self, value): # real signature unknown; restored from __doc__ 46 """ 计算元素的个数 47 >>> q 48 deque([2, 1, 11, 111]) 49 >>> q.count(2) 50 1 51 >>> q.appendleft(2) 52 >>> q.count(2) 53 2 54 >>> q 55 deque([2, 2, 1, 11, 111]) 56 >>> 57 """ 58 """ D.count(value) -> integer -- return number of occurrences of value """ 59 return 0 60 61 def extend(self, *args, **kwargs): # real signature unknown 62 """ 扩展队列从一个迭代器中 63 >>> q 64 deque([]) 65 >>> li = [11,22,33,44,55] 66 >>> q.extend(li) 67 >>> q 68 deque([11, 22, 33, 44, 55]) 69 >>> 70 """ 71 """ Extend the right side of the deque with elements from the iterable """ 72 pass 73 74 def extendleft(self, *args, **kwargs): # real signature unknown 75 """ 从队列左边扩展元素 76 >>> q 77 deque([11, 22, 33, 44, 55]) 78 >>> lileft = (1,2,3,4,5) 79 >>> q.extendleft(lileft) 80 >>> q 81 deque([5, 4, 3, 2, 1, 11, 22, 33, 44, 55]) 82 >>> 83 """ 84 """ Extend the left side of the deque with elements from the iterable """ 85 pass 86 87 def pop(self, *args, **kwargs): # real signature unknown 88 """移除队列最后一个元素并取得 89 >>> q = collections.deque() 90 >>> q.append(1) 91 >>> q.append(11) 92 >>> q.append(111) 93 >>> q.append(1111) 94 >>> q 95 deque([1, 11, 111, 1111]) 96 >>> a = q.pop() 97 >>> a 98 1111 99 >>> q 100 deque([1, 11, 111]) 101 >>> 102 """ 103 """ Remove and return the rightmost element. """ 104 pass 105 106 def popleft(self, *args, **kwargs): # real signature unknown 107 """ 从队列左边移除一个元素并取得 108 >>> q 109 deque([5, 4, 3, 2, 1, 11, 22, 33, 44, 55]) 110 >>> b = q.popleft() 111 >>> b 112 5 113 >>> 114 """ 115 """ Remove and return the leftmost element. """ 116 pass 117 118 def remove(self, value): # real signature unknown; restored from __doc__ 119 """ 移除第一个被找到的值,如果没有,会抛出异常 120 >>> q 121 deque([4, 3, 2, 1, 11, 22, 33, 44, 55]) 122 >>> q.remove(5) 123 Traceback (most recent call last): 124 File "", line 1, in 125 ValueError: deque.remove(x): x not in deque 126 >>> q.remove(4) 127 >>> q 128 deque([3, 2, 1, 11, 22, 33, 44, 55]) 129 >>> 130 """ 131 """ D.remove(value) -- remove first occurrence of value. """ 132 pass 133 134 def reverse(self): # real signature unknown; restored from __doc__ 135 """ 反转队列 136 >>> q 137 deque([3, 2, 1, 11, 22, 33, 44, 55]) 138 >>> q.reverse() 139 >>> q 140 deque([55, 44, 33, 22, 11, 1, 2, 3]) 141 >>> 142 """ 143 """ D.reverse() -- reverse *IN PLACE* """ 144 pass 145 146 def rotate(self, *args, **kwargs): # real signature unknown 147 """ 从右边移动值到左边,默认移动一个 148 >>> q 149 deque([55, 44, 33, 22, 11, 1, 2, 3]) 150 >>> q.rotate() 151 >>> q 152 deque([3, 55, 44, 33, 22, 11, 1, 2]) 153 >>> q.rotate(2) 154 >>> q 155 deque([1, 2, 3, 55, 44, 33, 22, 11]) 156 >>> q.rotate(2) 157 >>> q 158 deque([22, 11, 1, 2, 3, 55, 44, 33]) 159 >>> 160 """ 161 """ Rotate the deque n steps to the right (default n=1). If n is negative, rotates left. """ 162 pass 163 164 def __copy__(self, *args, **kwargs): # real signature unknown 165 """ Return a shallow copy of a deque. """ 166 pass 167 168 def __delitem__(self, y): # real signature unknown; restored from __doc__ 169 """ x.__delitem__(y) <==> del x[y] """ 170 pass 171 172 def __eq__(self, y): # real signature unknown; restored from __doc__ 173 """ x.__eq__(y) <==> x==y """ 174 pass 175 176 def __getattribute__(self, name): # real signature unknown; restored from __doc__ 177 """ x.__getattribute__('name') <==> x.name """ 178 pass 179 180 def __getitem__(self, y): # real signature unknown; restored from __doc__ 181 """ x.__getitem__(y) <==> x[y] """ 182 pass 183 184 def __ge__(self, y): # real signature unknown; restored from __doc__ 185 """ x.__ge__(y) <==> x>=y """ 186 pass 187 188 def __gt__(self, y): # real signature unknown; restored from __doc__ 189 """ x.__gt__(y) <==> x>y """ 190 pass 191 192 def __iadd__(self, y): # real signature unknown; restored from __doc__ 193 """ x.__iadd__(y) <==> x+=y """ 194 pass 195 196 def __init__(self, iterable=(), maxlen=None): # known case of _collections.deque.__init__ 197 """ 198 deque([iterable[, maxlen]]) --> deque object 199 200 Build an ordered collection with optimized access from its endpoints. 201 # (copied from class doc) 202 """ 203 pass 204 205 def __iter__(self): # real signature unknown; restored from __doc__ 206 """ x.__iter__() <==> iter(x) """ 207 pass 208 209 def __len__(self): # real signature unknown; restored from __doc__ 210 """ x.__len__() <==> len(x) """ 211 pass 212 213 def __le__(self, y): # real signature unknown; restored from __doc__ 214 """ x.__le__(y) <==> x<=y """ 215 pass 216 217 def __lt__(self, y): # real signature unknown; restored from __doc__ 218 """ x.__lt__(y) <==> x""" 219 pass 220 221 @staticmethod # known case of __new__ 222 def __new__(S, *more): # real signature unknown; restored from __doc__ 223 """ T.__new__(S, ...) -> a new object with type S, a subtype of T """ 224 pass 225 226 def __ne__(self, y): # real signature unknown; restored from __doc__ 227 """ x.__ne__(y) <==> x!=y """ 228 pass 229 230 def __reduce__(self, *args, **kwargs): # real signature unknown 231 """ Return state information for pickling. """ 232 pass 233 234 def __repr__(self): # real signature unknown; restored from __doc__ 235 """ x.__repr__() <==> repr(x) """ 236 pass 237 238 def __reversed__(self): # real signature unknown; restored from __doc__ 239 """ D.__reversed__() -- return a reverse iterator over the deque """ 240 pass 241 242 def __setitem__(self, i, y): # real signature unknown; restored from __doc__ 243 """ x.__setitem__(i, y) <==> x[i]=y """ 244 pass 245 246 def __sizeof__(self): # real signature unknown; restored from __doc__ 247 """ D.__sizeof__() -- size of D in memory, in bytes """ 248 pass 249 250 maxlen = property(lambda self: object(), lambda self, v: None, lambda self: None) # default 251 """maximum size of a deque or None if unbounded""" 252 253 254 __hash__ = None
6、单向队列(Queue.Queue)——先进先出(FIFO(First In First Out))
队列:先进先出 FIFO
栈:先进后出 弹夹
1 #创建一个最多十个内容的队列 2 >>> q = Queue.Queue(10) 3 >>> q 45 #给队列放值,用put 6 >>> q.put(1) 7 >>> q.put(2) 8 >>> q.put(3) 9 #取值用get,get取值是阻塞的 10 >>> q.get() 11 1 12 >>> q.get() 13 2 14 >>> q.get() 15 3 16 #当取完后,再取就会阻塞住,直到队列中有值才继续 17 >>> q.get()
1 class Queue: 2 """Create a queue object with a given maximum size. 3 4 If maxsize is <= 0, the queue size is infinite. 5 """ 6 def __init__(self, maxsize=0): 7 self.maxsize = maxsize 8 self._init(maxsize) 9 # mutex must be held whenever the queue is mutating. All methods 10 # that acquire mutex must release it before returning. mutex 11 # is shared between the three conditions, so acquiring and 12 # releasing the conditions also acquires and releases mutex. 13 self.mutex = _threading.Lock() 14 # Notify not_empty whenever an item is added to the queue; a 15 # thread waiting to get is notified then. 16 self.not_empty = _threading.Condition(self.mutex) 17 # Notify not_full whenever an item is removed from the queue; 18 # a thread waiting to put is notified then. 19 self.not_full = _threading.Condition(self.mutex) 20 # Notify all_tasks_done whenever the number of unfinished tasks 21 # drops to zero; thread waiting to join() is notified to resume 22 self.all_tasks_done = _threading.Condition(self.mutex) 23 self.unfinished_tasks = 0 24 25 def task_done(self): 26 """Indicate that a formerly enqueued task is complete. 27 28 Used by Queue consumer threads. For each get() used to fetch a task, 29 a subsequent call to task_done() tells the queue that the processing 30 on the task is complete. 31 32 If a join() is currently blocking, it will resume when all items 33 have been processed (meaning that a task_done() call was received 34 for every item that had been put() into the queue). 35 36 Raises a ValueError if called more times than there were items 37 placed in the queue. 38 """ 39 self.all_tasks_done.acquire() 40 try: 41 unfinished = self.unfinished_tasks - 1 42 if unfinished <= 0: 43 if unfinished < 0: 44 raise ValueError('task_done() called too many times') 45 self.all_tasks_done.notify_all() 46 self.unfinished_tasks = unfinished 47 finally: 48 self.all_tasks_done.release() 49 50 def join(self): 51 """Blocks until all items in the Queue have been gotten and processed. 52 53 The count of unfinished tasks goes up whenever an item is added to the 54 queue. The count goes down whenever a consumer thread calls task_done() 55 to indicate the item was retrieved and all work on it is complete. 56 57 When the count of unfinished tasks drops to zero, join() unblocks. 58 """ 59 self.all_tasks_done.acquire() 60 try: 61 while self.unfinished_tasks: 62 self.all_tasks_done.wait() 63 finally: 64 self.all_tasks_done.release() 65 66 def qsize(self): 67 """Return the approximate size of the queue (not reliable!).""" 68 self.mutex.acquire() 69 n = self._qsize() 70 self.mutex.release() 71 return n 72 73 def empty(self): 74 """Return True if the queue is empty, False otherwise (not reliable!).""" 75 self.mutex.acquire() 76 n = not self._qsize() 77 self.mutex.release() 78 return n 79 80 def full(self): 81 """Return True if the queue is full, False otherwise (not reliable!).""" 82 self.mutex.acquire() 83 n = 0 < self.maxsize == self._qsize() 84 self.mutex.release() 85 return n 86 87 def put(self, item, block=True, timeout=None): 88 """Put an item into the queue. 89 90 If optional args 'block' is true and 'timeout' is None (the default), 91 block if necessary until a free slot is available. If 'timeout' is 92 a non-negative number, it blocks at most 'timeout' seconds and raises 93 the Full exception if no free slot was available within that time. 94 Otherwise ('block' is false), put an item on the queue if a free slot 95 is immediately available, else raise the Full exception ('timeout' 96 is ignored in that case). 97 """ 98 self.not_full.acquire() 99 try: 100 if self.maxsize > 0: 101 if not block: 102 if self._qsize() == self.maxsize: 103 raise Full 104 elif timeout is None: 105 while self._qsize() == self.maxsize: 106 self.not_full.wait() 107 elif timeout < 0: 108 raise ValueError("'timeout' must be a non-negative number") 109 else: 110 endtime = _time() + timeout 111 while self._qsize() == self.maxsize: 112 remaining = endtime - _time() 113 if remaining <= 0.0: 114 raise Full 115 self.not_full.wait(remaining) 116 self._put(item) 117 self.unfinished_tasks += 1 118 self.not_empty.notify() 119 finally: 120 self.not_full.release() 121 122 def put_nowait(self, item): 123 """Put an item into the queue without blocking. 124 125 Only enqueue the item if a free slot is immediately available. 126 Otherwise raise the Full exception. 127 """ 128 return self.put(item, False) 129 130 def get(self, block=True, timeout=None): 131 """Remove and return an item from the queue. 132 133 If optional args 'block' is true and 'timeout' is None (the default), 134 block if necessary until an item is available. If 'timeout' is 135 a non-negative number, it blocks at most 'timeout' seconds and raises 136 the Empty exception if no item was available within that time. 137 Otherwise ('block' is false), return an item if one is immediately 138 available, else raise the Empty exception ('timeout' is ignored 139 in that case). 140 """ 141 self.not_empty.acquire() 142 try: 143 if not block: 144 if not self._qsize(): 145 raise Empty 146 elif timeout is None: 147 while not self._qsize(): 148 self.not_empty.wait() 149 elif timeout < 0: 150 raise ValueError("'timeout' must be a non-negative number") 151 else: 152 endtime = _time() + timeout 153 while not self._qsize(): 154 remaining = endtime - _time() 155 if remaining <= 0.0: 156 raise Empty 157 self.not_empty.wait(remaining) 158 item = self._get() 159 self.not_full.notify() 160 return item 161 finally: 162 self.not_empty.release() 163 164 def get_nowait(self): 165 """Remove and return an item from the queue without blocking. 166 167 Only get an item if one is immediately available. Otherwise 168 raise the Empty exception. 169 """ 170 return self.get(False) 171 172 # Override these methods to implement other queue organizations 173 # (e.g. stack or priority queue). 174 # These will only be called with appropriate locks held 175 176 # Initialize the queue representation 177 def _init(self, maxsize): 178 self.queue = deque() 179 180 def _qsize(self, len=len): 181 return len(self.queue) 182 183 # Put a new item in the queue 184 def _put(self, item): 185 self.queue.append(item) 186 187 # Get an item from the queue 188 def _get(self): 189 return self.queue.popleft()
双向队列和单向队列的区别
双向队列是两边都可以插入数据和读取数据,单向队列只能从一边取和插
双向队列是在collections模块中,单向队列是在Queue模块中
都是线程安全的
会通过help方法找到collections,大致知道计算器、有序字典、默认字典、可命名元组和双向队列
迭代器和生成器
一、迭代器
对于python列表的for循环,他的内部原理:查看下一个元素是否存在,如果存在,则取出,如果不存在,则报异常StopIteration。(python内部对异常已处理)
1 >>> c 2 Counter({'d': 4, 's': 4, 'a': 2, 'c': 2, 'b': 2, 'e': 2, 'f': 2, 'g': 1}) 3 >>> c.elements() 45 >>>
迭代器的内容要用循环取出来
1 class listiterator(object) 2 | Methods defined here: 3 | 4 | __getattribute__(...) 5 | x.__getattribute__('name') <==> x.name 6 | 7 | __iter__(...) 8 | x.__iter__() <==> iter(x) 9 | 10 | __length_hint__(...) 11 | Private method returning an estimate of len(list(it)). 12 | 13 | next(...) 14 | x.next() -> the next value, or raise StopIteration
二、生成器
range不是生成器 xrange是生成器
redlines不是生成器 xreadlines是生成器
1 >>> print range(10) 2 [0, 1, 2, 3, 4, 5, 6, 7, 8, 9] 3 >>> print xrange(10) 4 xrange(10) 5 >>>
xrange(10)创建时只是一个对象,只有在循环或使用时才会在内存中开辟空间
生成器内部基于yield创建,即:对于生成器只有使用时才创建,从而避免内存浪费
练习:有如下列表:
[13, 22, 6, 99, 11]
利用列表的下标进行循环
>>> li
[13, 22, 6, 99, 11]
>>> i = 0
>>> while i < len(li):
... print li[i]
... i += 1
...
13
22
6
99
11
练习:有如下列表:
[13, 22, 6, 99, 11]
请按照一下规则计算:
13 和 22 比较,将大的值放在右侧,即:[13, 22, 6, 99, 11]
22 和 6 比较,将大的值放在右侧,即:[13, 6, 22, 99, 11]
22 和 99 比较,将大的值放在右侧,即:[13, 6, 22, 99, 11]
99 和 42 比较,将大的值放在右侧,即:[13, 6, 22, 11, 99,]
13 和 6 比较,将大的值放在右侧,即:[6, 13, 22, 11, 99,]
...
1 #!/usr/bin/env python 2 # _*_ coding:utf-8 _*_ 3 li = [12, 33, 6, 99, 11] 4 ''' 5 方法一:第一种方法是固定一个数a与后面的数b相比,如果a大于b,就把a\b对调,再用a和下面的一个数比,全部比完后会得到一个最小的数放在最左面,然后用第二个数继续往下比,以此类推就得到了从小到大的排序 6 ''' 7 for i in range(len(li) - 1): 8 for j in range(i+1,len(li)): 9 if li[i] > li[j]: 10 temp = li[i]; 11 li[i] = li[j] 12 li[j] = temp 13 14 print li 15 16 ''' 17 方法二:两个相邻的数比较,如果左边的数比右边的大,就调换位置,一个循环后会把最大的数放在最右边,以此类推,所有数字都循环完后会得到从小到大的排序 18 ''' 19 for x in range(len(li)): 20 for i in range(len(li)-1): 21 if li[i] > li[i+1]: 22 t = li[i]; 23 li[i] = li[i+1]; 24 li[i+1] = t 25 print li;
函数
函数分为内置函数、自定义函数、导入函数。函数就是按功能划分的代码块
一、内置函数
内置函数就是python为用户提供的快捷方法
先看几个常用的
help()函数可以得到方法的一些帮助
1 >>> help(list) 2 Help on class list in module __builtin__: 3 4 class list(object) 5 | list() -> new empty list 6 | list(iterable) -> new list initialized from iterable's items 7 | 8 | Methods defined here: 9 | 10 | __add__(...) 11 | x.__add__(y) <==> x+y 12 | 13 | __contains__(...) 14 | x.__contains__(y) <==> y in x 15 | 16 | __delitem__(...) 17 | x.__delitem__(y) <==> del x[y] 18 | 19 | __delslice__(...) 20 | x.__delslice__(i, j) <==> del x[i:j] 21 | 22 | Use of negative indices is not supported.
dir()可以把一个类的方法全部打印出来
1 >>> dir(list) 2 ['__add__', '__class__', '__contains__', '__delattr__', '__delitem__', '__delslice__', '__doc__', '__eq__', '__format__', '__ge__', '__getattribute__', '__getitem__', '__getslice__', '__gt__', '__hash__', '__iadd__', '__imul__', '__init__', '__iter__', '__le__', '__len__', '__lt__', '__mul__', '__ne__', '__new__', '__reduce__', '__reduce_ex__', '__repr__', '__reversed__', '__rmul__', '__setattr__', '__setitem__', '__setslice__', '__sizeof__', '__str__', '__subclasshook__', 'append', 'count', 'extend', 'index', 'insert', 'pop', 'remove', 'reverse', 'sort'] 3 >>>
vars()可以显示出所有的变量
1 >>> vars() 2 {'a': xrange(10), 'c': Counter({'d': 4, 's': 4, 'a': 2, 'c': 2, 'b': 2, 'e': 2, 'f': 2, 'g': 1}), '__builtins__':'__builtin__' (built-in)>, '__package__': None, 'i': 1, 'collections': 'collections' from '/usr/lib/python2.7/collections.pyc'>, 'tab': 'tab' from '/usr/lib/python2.7/dist-packages/tab.pyc'>, '__name__': '__main__', 'li': [13, 22, 6, 99, 11], '__doc__': None} 3 >>>
type()查看变量的类型
>>> type(li)'list'> >>>
abc()取绝对值
>>> abs(-9) 9 >>> abs(0) 0 >>> abs(33) 33 >>>
divmod()输入两个数字,得到一个元组(商、余数)
>>> divmod(10,3)
(3, 1)
>>> divmod(10,2)
(5, 0)
>>>
ord()输入一个字符,返回ASCII
>>> ord('a')
97
>>>
chr()输入ASCII,返回字符
>>> chr(100)
'd'
>>>
cmp()比较两个数大小,大于返回1,小于返回-1,等于返回0
>>> cmp(20,2)
1
>>> cmp(20,20)
0
>>> cmp(20,21)
-1
>>>
eval()可以计算一个字符串的值
>>> eval('200/4+4')
54
>>>
format()格式化输出字符串
>>> a = 'I am a {0},hello {1}'
>>> print a.format('techer','world')
I am a techer,hello world
>>>
hex(x)转换成十六进制
>>> hex(255)
'0xff'
>>>
id()返回对象的内存地址
>>> a = 20
>>> id(a)
22802320
>>>
input()输入内容
1 #input接收到的是输入的是什么就是什么类型,比如输入22,那么a类型就是数值类型 2 >>> a = input() 3 22 4 >>> type(a) 5'int'> 6 #输入一个hello,接收到的就是一个变量名,根据下面的异常提示也可以知道 7 >>> a = input() 8 hello 9 Traceback (most recent call last): 10 File " ", line 1, in 11 File " ", line 1, in 12 NameError: name 'hello' is not defined 13 #如果想得到一个字符串,输入的时候要加引号 14 >>> a = input() 15 'hello' 16 >>> type(a) 17 'str'> 18 >>>
int()输入一个数字,转换成整型,字符串不能是小数形式的
>>> a = '22'
>>> type(a)
>>> b = int(a)
>>> type(b)
>>> b
22
>>>
len()计算长度
>>> li
[13, 22, 6, 99, 11]
>>> len(li)
5
>>> s = 'hello world'
>>> len(s)
11
>>>
max()找出最大值
>>> a = 22
>>> b = 33
>>> c = 21
>>> max(a,b,c)
33
>>>
min()找出最小值
>>> a,b,c
(22, 33, 21)
>>> min(a,b,c)
21
>>> t = (11,111,1111)
>>> min(t)
11
>>>
oct()转换成八进制
>>> a = 100
>>> oct(a)
'0144'
>>>
pow()求幂
>>> pow(2,2)
4
>>> pow(2,10)
1024
>>>
range()生成一个连续的数字序列
>>> range(5)
[0, 1, 2, 3, 4]
>>> range(2,8)
[2, 3, 4, 5, 6, 7]
>>>
raw_input()接收终端输入的内容
>>> a = raw_input()
hello
>>> a
'hello'
>>> a = raw_input()
33
>>> a
'33'
>>>
reload(module)重新导入模块
如果一个模块已经导入,修改过这个模块后需要重新导入,就需要用reload重新导入
sum()计算一个数字序列的和
>>> sum([1,2,3])
6
>>>
all()如果里面有空值,就返回False
>>> a = [1,2,3,'']
>>> all(a)
False
>>> a = [1,2,3,'a']
>>> all(a)
True
>>>
any()只要有一个是真就是真
>>> a = []
>>> any(a)
False
>>> a = [1,2,'']
>>> any(a)
True
>>>
enumerate()循环序列,前面加一个序号,默认从0开始,可以指定起始值
>>> a = [11,22,33,44,55]
>>> for k,v in enumerate(a,1):
... print k,v
...
1 11
2 22
3 33
4 44
5 55
>>>
二、自定义函数
一、在学习函数之前,一直遵循:面向过程编程,即:根据业务逻辑从上到下实现功能,其往往用一长段代码来实现指定功能,开发过程中最常见的操作就是粘贴复制,也就是将之前实现的代码块复制到现需要功能处。
while True:
if cpu利用率 > 90%:
#发送邮件提醒
连接邮箱服务器
发送邮件
关闭连接
if 硬盘使用空间 > 90%:
#发送邮件提醒
连接邮箱服务器
发送邮件
关闭连接
if 内存占用 > 80%:
#发送邮件提醒
连接邮箱服务器
发送邮件
关闭连接
如上述代码,if条件语句下的内容可以被提取出来公用,如下:
def 发送邮件(内容)
#发送邮件提醒
连接邮箱服务器
发送邮件
关闭连接
while True:
if cpu利用率 > 90%:
发送邮件('CPU报警')
if 硬盘使用空间 > 90%:
发送邮件('硬盘报警')
if 内存占用 > 80%:
对于上述的两种实现方式,第二次必然比第一次的重用性和可读性要好,其实这就是函数式编程和面向过程编程的区别:
- 函数式:将某功能代码封装到函数中,日后便无需重复编写,仅调用函数即可
- 面向对象:对函数进行分类和封装,让开始“更快更好更强……”
函数式编程最重要的是增强代码的重用性和可读性
二、函数的定义和使用
def 函数名(参数):
...
函数体
...
函数的定义主要有如下要点:
- def:表示函数的关键字
- 函数名:函数的名称,日后根据函数名调用函数
- 函数体:函数中进行一系列的逻辑计算,如:发送邮件、计算出 [11,22,38,888,2]中的最大数等...
- 参数:为函数体提供数据
- 返回值:当函数执行完毕后,可以给调用者返回数据。
以上要点中,比较重要有参数和返回值:
1、返回值
函数是一个功能块,该功能到底执行成功与否,需要通过返回值来告知调用者。
def 发送短信():
发送短信的代码...
if 发送成功:
return True
else:
return False
while True:
# 每次执行发送短信函数,都会将返回值自动赋值给result
# 之后,可以根据result来写日志,或重发等操作
result = 发送短信()
if result == False:
记录日志,短信发送失败...
2、参数
函数中有三种不同的参数
- 普通参数
- 默认参数
- 动态参数
1 # ######### 定义函数 ######### 2 3 # name 叫做函数func的形式参数,简称:形参 4 def func(name): 5 print name 6 7 # ######### 执行函数 ######### 8 # 'wangwei' 叫做函数func的实际参数,简称:实参 9 func('wangwei')
1 def func(name, age = 18): 2 3 print "%s:%s" %(name,age) 4 5 # 指定参数 6 func('wupeiqi', 19) 7 # 使用默认参数 8 func('alex') 9 10 注:默认参数需要放在参数列表最后
1 def func(**kwargs): 2 3 print args 4 5 6 # 执行方式一 7 func(name='wupeiqi',age=18) 8 9 # 执行方式二 10 li = {'name':'wupeiqi', age:18, 'gender':'male'} 11 func(**li) 12 #传入字典时前面要加两个星
1 def func(*args, **kwargs): 2 3 print args 4 print kwargs
1 >>> def func(*args,**kwargs): 2 ... print args 3 ... print kwargs 4 ... 5 >>> func(11,22,33) 6 (11, 22, 33) 7 {} 8 >>> func(k1=123,k2=321) 9 () 10 {'k2': 321, 'k1': 123} 11 >>> func(1,2,3,4,k1=123,k2=321) 12 (1, 2, 3, 4) 13 {'k2': 321, 'k1': 123} 14 >>> func([1,2,3],k1=123,k2=321) 15 ([1, 2, 3],) 16 {'k2': 321, 'k1': 123} 17 >>>
文件操作
操作文件时,一般需要经历如下步骤:
- 打开文件
- 操作文件
一、打开文件
文件句柄 = file('文件路径','模式')
注:python中打开文件有两种方式,即:open(...)和file(...),本质上前者在内部会调用后者来进行文件操作,推荐使用open
打开文件时,需要指定文件路径和以何种方式打开文件,打开后,即可获取该文件句柄,日后通过此文件句柄对该文件操作。
打开文件的模式有:
- r,只读模式(默认)
- w,只写模式。——不可读,不存在则创建,存在则删除内容。
- a,追加模式。——可读,不存在则创建,存在则只追加内容。
“+”表示可以同时读写某个文件。“+”只有在r+有意思,w+和a+和w、a的效果是一样的
- r+,可读写文件——可读,可写,可追加
- w+,写读
- a+,同a
“U”表示在读取时,可以将\r \n \r\n自动转换成\n(与r或r+模式同时使用)
- rU
- r+U
“b”表示处理二进制文件(如:FTP发送上传ISO去镜像文件,linux可忽略,windows处理二进制文件时需标注)
- rb
- wb
- ab
二、操作文件
1 class file(object): 2 3 def close(self): # real signature unknown; restored from __doc__ 4 #关闭文件 5 """ 6 close() -> None or (perhaps) an integer. Close the file. 7 8 Sets data attribute .closed to True. A closed file cannot be used for 9 further I/O operations. close() may be called more than once without 10 error. Some kinds of file objects (for example, opened by popen()) 11 may return an exit status upon closing. 12 """ 13 14 def fileno(self): # real signature unknown; restored from __doc__ 15 #文件描述符 16 """ 17 fileno() -> integer "file descriptor". 18 19 This is needed for lower-level file interfaces, such os.read(). 20 """ 21 return 0 22 23 def flush(self): # real signature unknown; restored from __doc__ 24 #刷新文件内部缓冲区 25 """ flush() -> None. Flush the internal I/O buffer. """ 26 pass 27 28 29 def isatty(self): # real signature unknown; restored from __doc__ 30 #判断文件是否是同意tty设备 31 """ isatty() -> true or false. True if the file is connected to a tty device. """ 32 return False 33 34 35 def next(self): # real signature unknown; restored from __doc__ 36 #获取下一行数据,不存在,则报错 37 """ x.next() -> the next value, or raise StopIteration """ 38 pass 39 40 def read(self, size=None): # real signature unknown; restored from __doc__ 41 #读取指定字节数据 42 """ 43 read([size]) -> read at most size bytes, returned as a string. 44 45 If the size argument is negative or omitted, read until EOF is reached. 46 Notice that when in non-blocking mode, less data than what was requested 47 may be returned, even if no size parameter was given. 48 """ 49 pass 50 51 def readinto(self): # real signature unknown; restored from __doc__ 52 #读取到缓冲区,不要用,将被遗弃 53 """ readinto() -> Undocumented. Don't use this; it may go away. """ 54 pass 55 56 def readline(self, size=None): # real signature unknown; restored from __doc__ 57 #仅读取一行数据 58 """ 59 readline([size]) -> next line from the file, as a string. 60 61 Retain newline. A non-negative size argument limits the maximum 62 number of bytes to return (an incomplete line may be returned then). 63 Return an empty string at EOF. 64 """ 65 pass 66 67 def readlines(self, size=None): # real signature unknown; restored from __doc__ 68 #读取所有数据,并根据换行保存值列表 69 """ 70 readlines([size]) -> list of strings, each a line from the file. 71 72 Call readline() repeatedly and return a list of the lines so read. 73 The optional size argument, if given, is an approximate bound on the 74 total number of bytes in the lines returned. 75 """ 76 return [] 77 78 def seek(self, offset, whence=None): # real signature unknown; restored from __doc__ 79 #指定文件中指针位置 80 """ 81 seek(offset[, whence]) -> None. Move to new file position. 82 83 Argument offset is a byte count. Optional argument whence defaults to 84 0 (offset from start of file, offset should be >= 0); other values are 1 85 (move relative to current position, positive or negative), and 2 (move 86 relative to end of file, usually negative, although many platforms allow 87 seeking beyond the end of a file). If the file is opened in text mode, 88 only offsets returned by tell() are legal. Use of other offsets causes 89 undefined behavior. 90 Note that not all file objects are seekable. 91 """ 92 pass 93 94 def tell(self): # real signature unknown; restored from __doc__ 95 #获取当前指针位置 96 """ tell() -> current file position, an integer (may be a long integer). """ 97 pass 98 99 def truncate(self, size=None): # real signature unknown; restored from __doc__ 100 #截断数据,仅保留指定之前数据 101 """ 102 truncate([size]) -> None. Truncate the file to at most size bytes. 103 104 Size defaults to the current file position, as returned by tell(). 105 """ 106 pass 107 108 def write(self, p_str): # real signature unknown; restored from __doc__ 109 #写内容 110 """ 111 write(str) -> None. Write string str to file. 112 113 Note that due to buffering, flush() or close() may be needed before 114 the file on disk reflects the data written. 115 """ 116 pass 117 118 def writelines(self, sequence_of_strings): # real signature unknown; restored from __doc__ 119 #将一个字符串列表写入文件 120 """ 121 writelines(sequence_of_strings) -> None. Write the strings to the file. 122 123 Note that newlines are not added. The sequence can be any iterable object 124 producing strings. This is equivalent to calling write() for each string. 125 """ 126 pass 127 128 def xreadlines(self): # real signature unknown; restored from __doc__ 129 #可用于逐行读取文件,非全部 130 """ 131 将弃用,可以用下面的方法 132 for line in f: 133 print line.strip(); 134 """ 135 """ 136 xreadlines() -> returns self. 137 138 For backward compatibility. File objects now include the performance 139 optimizations previously implemented in the xreadlines module. 140 """ 141 pass
三、with
为了避免打开文件后忘记关闭,可以通过管理上下文,即:
with open('log','r') as f:
......
如此方式,当with代码块执行完毕时,内部会自动关闭并释放文件资源。
在python2.7后,with又支持同时对多个文件的上下文进行管理,即:
with open('log1') as obj1,open('log2') as obj2:
pass