def _unquote_and_decode(string):
    """Percent-decode ``string`` and decode the resulting bytes to text.

    Raises whatever the last decoding attempt raises, so the caller can
    apply its own fallback.
    """
    # Encodings whose detection result is trusted.  Kept lower-case because
    # the detected name is lower-cased before the membership test.
    trusted = ('utf-8', 'utf8', 'gb18030', 'gb2312', 'gbk', 'iso-8859-2')

    raw = urllib.unquote(str(string))
    # The detected encoding may be None when chardet cannot make a guess.
    detected = chardet.detect(raw)['encoding']

    if detected and detected.lower() in trusted:
        try:
            return raw.decode(detected)
        except (UnicodeDecodeError, LookupError):
            # Detection was wrong or the codec is unavailable: fall through
            # to the fixed UTF-8 / GB18030 attempts below.
            pass

    try:
        return raw.decode('utf8')
    except UnicodeDecodeError:
        # Last attempt; a failure here propagates to the caller.
        return raw.decode('gb18030')


def URLtoUTF8(string):
    """Return the percent-decoded form of ``string`` as text.

    The value is unquoted with ``urllib.unquote`` and decoded with the
    encoding reported by ``chardet`` when that encoding is one of the trusted
    ones (UTF-8, GB18030, GB2312, GBK, ISO-8859-2); otherwise UTF-8 and then
    GB18030 are tried.  If any step fails, the JSON-escaped form of ``string``
    with its double quotes removed is used instead.  Non-breaking spaces
    (U+00A0) in the result are replaced by ordinary spaces.

    NOTE: relies on the Python 2 API (``urllib.unquote``, ``str.decode``).

    :param string: URL-encoded value; it is passed through ``str()`` first.
    :return: the decoded text.
    """
    try:
        tmp = _unquote_and_decode(string)
    except Exception:
        # Deliberate best-effort fallback: never fail on undecodable input,
        # but (unlike a bare ``except``) let KeyboardInterrupt/SystemExit pass.
        tmp = json.dumps(string).replace(u'"', u'')
    # Normalise non-breaking spaces.  The escape must be ``\xa0``; the literal
    # text "/xa0" is ordinary URL content and must be left untouched.
    return tmp.replace(u'\xa0', u' ')
# Original article by Maggie-Hunter. If you republish it, please credit the source: https://blog.ytso.com/tech/pnotes/8476.html