# Fetch the page at `url`, giving up after 10 seconds instead of blocking
# indefinitely on an unresponsive host.
f = urllib2.urlopen(url, timeout=10)
try:
    data = f.read()
    # The Content-Type header may be missing; fall back to an empty string so
    # the charset check below never operates on None.
    contentType = f.headers.get('Content-Type') or ''
finally:
    # Release the underlying connection even if reading the body fails.
    f.close()

# decode the html
# Re-encode GBK pages as UTF-8 so `data` is UTF-8 bytes for those pages.
# A substring test is used instead of str.find(): find() returns -1 (truthy)
# when the text is absent and 0 (falsy) when it sits at index 0, so using its
# result as a boolean selects the wrong branch. The header is lower-cased
# because servers send the charset in either case (e.g. "charset=GBK").
# Responses declared as UTF-8, or with any other/unknown charset, are left
# untouched.
if 'gbk' in contentType.lower():
    data = unicode(data, "GBK").encode("utf-8")