"""Show how a Python 3 ``str`` is converted to GBK and UTF-8 bytes.

The script prints the interpreter's default string codec, then encodes one
Chinese greeting with two different charsets and finally converts the GBK
bytes into UTF-8 bytes by going through ``str`` (Unicode) in between.
"""
# Author: lei
#
# NOTE(review): the original header declared GBK as the charset of this
# source file.  This version carries no such declaration and therefore
# assumes the file is saved as UTF-8 (the Python 3 default) - confirm the
# on-disk charset before merging.
import sys

# Name of the default codec used by str.encode() / bytes.decode().
print(sys.getdefaultencoding())

s = "你好"
print(s)

# Encoding always yields a bytes object, whichever charset is chosen.
gbk_bytes = s.encode("gbk")
print(gbk_bytes)
print(s.encode("utf-8"))

# Unicode is the universal character set every charset maps to, so the way
# from GBK to UTF-8 is: GBK bytes -> str (Unicode) -> UTF-8 bytes.
gbk_to_utf8 = gbk_bytes.decode("gbk").encode("utf-8")
print(gbk_to_utf8)
# Demo: round-trip a str through UTF-8 bytes and GB2312 bytes.
# The statements below were fused onto one physical line, which Python
# rejects as a syntax error; they are restored to one statement per line.
import sys

# Name of the default codec used by str.encode() / bytes.decode().
print(sys.getdefaultencoding())

s = "你哈"
print(s.encode("gbk"))
print(s.encode("utf-8"))

# In Python 3, encoding to utf-8, gb2312 or gbk always produces bytes;
# only decoding those bytes gives a str (Unicode text) back.
utf8_bytes = s.encode("utf-8")
unicode_text = utf8_bytes.decode("utf-8")

# GBK is a superset of GB2312, so text that fits in GB2312 encodes to the
# same bytes under either codec.
gb2312_bytes = unicode_text.encode("gb2312")
round_tripped = gb2312_bytes.decode("gb2312")
print(round_tripped)