with open('contacts.txt', 'r', encoding='utf-8') as f:
data = f.read()
二进制模式读
使用场景:网络传输(视频、图片或进行网络传输的文本)
with open('contacts.txt', 'rb') as f:
data = f.read()
print(data) # 打印出16进制的编码格式
检测编码的工具
import chardet
with open('contacts.txt', 'rb') as f:
data = f.read()
print(data)
print(chardet.detect(data)) # {'encoding': 'utf-8', 'confidence': 0.99, 'language': ''} confidence是自信程度print(data.decode('utf-8')) # 文本的内容
循环文件和写模式操作文件
with open('contacts.txt', 'r', encoding='utf-8') as f:
for line in f:
print(line) # 会多出很多空格'''
因为print()打印时默认加了换行,所以加上,如果出现文件输出有空行的情况直接将print的换行取消即可。
给print()加一个取消自动换行的end=""参数即可:print(line,end=""),跟windows,unix没有关系。就是这么简单。
'''
with open('兼职.txt', 'w', encoding='utf-8') as f: # w是创建,会清空以前的内容,慎用。
f.write('好好学编程')
with open('兼职.txt', 'wb') as f:
f.write('好好学编程'.encode('utf-8'))
追加模式操作文件
with open('contacts.txt', 'a', encoding='utf-8') as f:
f.write('
小胖 河北 182 100 13222222222')
with open('contacts.txt', 'ab') as f:
f.write('
小胖 河北 182 100 13222222222'.encode('utf-8')) # 把二进制用utf-8编码
读写混合模式
with open('contacts.txt', 'r+', encoding='utf-8') as f:
data = f.read()
print('content', data)
f.write('
newline 1哈哈')
f.write('
newline 2哈哈')
f.write('
newline 3哈哈')
f.write('
newline 4哈哈') # 在后面追加写的内容print('new content', f.read()) # 不显示新写的内容,因为写完后光标在最后的位置,后面是空的,所以读出来是空的。
写读模式 ---> 先写后读(几乎没有应用场景)
with open('contacts.txt', 'w+', encoding='utf-8') as f:
data = f.read()
print('content', data)
f.write('
newline 1哈哈')
f.write('
newline 2哈哈')
f.write('
newline 3哈哈')
f.write('
newline 4哈哈') # 重新创建,把之前的清空掉在写print('new content', f.read())
import os
f_name = 'contacts.txt'
f_new_name = "%s.new" % f_name
old_str = '马纤羽'
new_str = 'new马纤羽'
f = open(f_name, 'r', encoding='utf-8')
f_new = open(f_new_name, 'w', encoding='utf-8')
for line in f:
if old_str in line:
line = line.replace(old_str, new_str)
f_new.write(line)
with open(f_name, 'r', encoding='utf-8') as f:
for line in f:
if old_str in line:
line = line.replace(old_str, new_str)
with open(f_new_name, 'a', encoding='utf-8') as f_new:
f_new.write(line)
os.rename(f_new_name, f_name) # 把新文件名替换成旧文件名,这样就替换了旧文件# 完成后contacts.txt文件里之前是马纤羽的都变成了new马纤羽
下面是用占内存的方式来修改
with open('contacts.txt', 'r+', encoding='utf-8') as f:
data = f.read()
data = data.replace('杜姗姗', 'Alex')
f.seek(0)
f.write(data) # 如果是减内容的话(比如以前是1个G,改完后就剩800MB了),可以用truncate截取到800MB那个点。