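# ASCII can only represent English (Latin) characters; each one is stored in 8 bits (one byte).
# UTF-8 is a variable-length character encoding: every English character takes one byte, exactly as in ASCII, while common Chinese characters take 3 bytes.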
#-*- coding:gbk -*-
import sys
# Read the file through a `with` statement so that it is managed as a
# context manager: the file is closed automatically when the block exits,
# which means no explicit close() call is needed (and none can be forgotten).
with open("yesterday", "r", encoding="utf-8") as f:
    # Iterate over the file object directly to read one line at a time.
    for line in f:
        # strip() drops surrounding whitespace, including the trailing newline,
        # so print() does not emit a blank line after every line.
        print(line.strip())
# Look up the interpreter's default string encoding, then display it.
default_encoding = sys.getdefaultencoding()
print(default_encoding)
# ---------------------- Python 2 transcoding ----------------------
# NOTE: the triple-quoted string below is a bare string expression, so none
# of the code inside it is executed; it only preserves a Python 2 example
# for reference. The example decodes a UTF-8 byte string to unicode, encodes
# that to GBK, and then goes back from GBK to UTF-8 via unicode.
# ("uft-8" and "uniconde" inside the string are typos for "utf-8" and
# "unicode"; they are left as-is because they are part of the string literal.)
'''
s="你好"
# uft-8 -->uniconde -->gbk
s_to_unicode=s.decode("utf-8") #UTF-8轉換爲unicode 告訴Uuniconde 我原來是UTF-8
print(s_to_unicode)
s_to_gbk=s_to_unicode.encode("gbk")#uniconde轉換爲gbk
print(s_to_gbk)
#gbk --> uniconde -->utf-8
#gbk轉爲uniconde ,uniconde轉爲utf-8
gbk_to_utf=s_to_gbk.decode("gbk").encode("utf-8")
'''
# ---------------------- Python 3 transcoding ----------------------
# A Python 3 str is already Unicode text, so it can be encoded straight to
# GBK without a prior decode step.
s = "你好"
s_gbk = s.encode("gbk")

# Show the GBK bytes first, then the UTF-8 bytes (UTF-8 is what a bare
# encode() call produces by default).
print(s_gbk, s.encode("utf-8"), sep="\n")

# GBK bytes -> Unicode text -> UTF-8 bytes.
unicode_text = s_gbk.decode("gbk")
gbk_to_utf8 = unicode_text.encode("utf-8")
print(gbk_to_utf8)
print("utf-8", gbk_to_utf8)