Python处理MLDonkey 下载中文文件乱码问题 (2)

上次写了一篇关于mldonkey转码的东西,最近作了一次修改,不过仍然需要Python2.4版本的支持,代码如下:

mldonkey.py

# -*- coding: cp936 -*-

############################################################

# convert mldonkey's chinese

# Version: 0.1

# Author: kongxx

# Email: [email protected]

############################################################

import os ,sys ,string ,urllib ,telnetlib ,operator

# define the mldonkey incoming dir

sdir='/usr/local/mldonkey/incoming/'

#flag the num

sNum='0123456789'

#length

len8 = 8

len12 = 12

lengths = [len8 ,len12]

def convert():

filenames=os.listdir(sdir)

for filename in filenames :

for length in lengths :

s1 = filename

s2 = convertName(filename ,length)

try :

if s1 != s2 :

print '############################################################'

print 'The source name is:' + s1

print 'The target name is:' + s2

print ''

confirm = raw_input('Do you confirm rename the file[yes or no]? ')

if confirm == 'yes' :

os.rename(sdir + s1 ,sdir + s2)

break

except UnicodeDecodeError:

print ''

# convert ths file name

# param s the filename

# param length

def convertName(s ,length) :

location = 0

ret = ''

if length not in lengths:

return s

while True :

if location + length <= len(s) :

subStr = s[location:location + length]

if check(subStr) :

if length == len8 :

ret += "%" + hex((int)(subStr[1:4]))[2:4] + "%" + hex((int)(subStr[5:8]))[2:4]

if length == len12 :

ret += "%" + hex((int)(subStr[1:4]))[2:4] + "%" + hex((int)(subStr[5:8]))[2:4] + "%" + hex((int)(subStr[9:12]))[2:4]

location = location + length

else :

ret += s[location :location + 1]

location = location + 1

else :

ret += s[location:]

break

ret = urllib.unquote(ret)

if ret == s : return s

try :

if length == len8 :

return ret.decode('GBK')

if length == len12 :

return ret.decode('UTF-8')

except UnicodeDecodeError:

return ret

def check(s):

if len(s) != len8 and len(s) != len12:

return False

if s[0] != '_' or s[4] != '_' :

return False

if len(s) == len12 and s[8] != '_':

return False

s = s.replace('_','')

for c in s :

if (c not in sNum) :return False

return True

convert()

在命令行输入python mldonkey.py即可以转换。

在命令行输入python mldonkey.py即可以转换。

你可能感兴趣的:(python)