赞
踩
实际应用中,我们绝大多数的数据都是通过文件的交互完成的
with open("文件路径", "打开模式", encoding="操作文件的字符编码") as f:
"对文件进行相应的读写操作"
# 使用with块的好处:执行完毕后,自动对文件进行close操作
【例1】 一个简单的文件读取
with open("E:/python/测试文件.txt", "t", encoding="gbk") as f: # 第一步:打开文件
text = f.read() # 第二步:读取文件
print(text)
with open("测试文件.txt", "r", encoding="gbk") as f: # 第一步:打开文件
text = f.read() # 第二步:读取文件
print(text)
with open("三国演义片头曲_utf.txt", encoding="utf-8") as f:
text = f.read()
print(text)
with open("三国演义片头曲_utf.txt", encoding="gbk") as f:
text = f.read()
print(text)
with open("三国演义片头曲_utf.txt", encoding="gbk") as f:
text = f.readline() # 每次读取一行
print(text)
with open("三国演义片头曲_utf.txt", encoding="utf-8") as f:
while True:
text = f.readline()
if not text:
# print(text is "")
break
else:
# print(text == "\n")
print(text, end="") # 保留原文的换行,使print()的换行不起作用
with open("三国演义片头曲_utf.txt", encoding="utf-8") as f:
text = f.readlines() # 注意每行末尾有换行符
print(text)
with open("三国演义片头曲_utf.txt", encoding="utf-8") as f:
for text in f.readlines():
print(text) # 不想换行则用print(text, end="")
文件比较大时,read()和readlines()占用内存过大,不建议使用
readline()用起来又不太方便
with open("三国演义片头曲_utf.txt", encoding="utf-8") as f:
for text in f: # f本身就是可迭代对象,每次迭代读取一行内容
print(text)
图片:二进制文件
with open("text.jpg", "rb") as f:
print(len(f.readlines())) # 读取行数
with open("恋曲1980.txt", "w", encoding="utf-8") as f:
f.write("你曾经对我说\n") # 文件不存在则立刻创建一个
f.write("你永远爱着我\n") # 如需换行,末尾加换行符\n
f.write("爱情这东西我明白\n")
f.write("但永远是什么\n")
# 若文件存在,新写入的内容会覆盖掉原内容,一定要注意!!
with open("恋曲1980.txt", "a", encoding="utf-8") as f:
f.write("姑娘你别哭泣\n") # 若文件存在,新写入的内容会追加内容
f.write("我俩还在一起\n")
f.write("今天的欢乐\n")
f.write("将是明天创痛的回忆\n")
ls = ["春天刮着风\n", "秋天下着雨\n", "春风秋雨多少海誓山盟随风远去\n"]
with open("恋曲1980.txt", "a", encoding="utf-8") as f:
f.writelines(ls)
with open("浪淘沙_北戴河.txt", "r+", encoding="utf-8") as f:
# for line in f:
# print(line) # 全部读一遍后,指针到达末尾
f.seek(0, 2) # 或者可以将指针移到末尾f.seek(偏移字节数,偏移起点位置(0:开始;1:当前位置;2:结尾))
text = ["萧瑟秋风今又是,\n", "换了人间。\n"]
f.writelines(text)
with open("浪淘沙_北戴河.txt", "w+", encoding="utf-8") as f:
text = ["萧瑟秋风今又是,\n", "换了人间。\n"] # 清空原内容
f.writelines(text)
f.seek(0, 0) # 指针移到开始
print(f.read()) # 读取内容
with open("浪淘沙_北戴河.txt", "a+", encoding="utf-8") as f:
text = ["萧瑟秋风今又是,\n", "换了人间。\n"]
f.writelines(text) # 指针在最后,追加新内容
f.seek(0, 0) # 指针移到开始
print(f.read()) # 读取内容
通用的数据格式,可以在不同语言中加载和存储
本节简单了解两种数据存储结构csv和json
由逗号将数据分开的字符序列,可以由excel打开
with open("成绩.csv", "r", encoding="gbk") as f:
ls = []
for line in f: # 逐行提取
ls.append(line.strip("\n").split(",")) # 去掉每行的换行符,然后用","进行分割
for res in ls:
print(res)
示例如图:
运行结果为:
[‘编号’, ‘数学成绩’, ‘语文成绩’]
[‘1’, ‘100’, ‘98’]
[‘2’, ‘96’, ‘99’]
[‘3’, ‘97’, ‘95’]
with open("成绩.csv", "w", encoding="gbk") as f:
ls = [['编号', '数学成绩', '语文成绩'], ['1', '100', '98'], ['2', '96', '99'], ['3', '97', '95']] # encoding= "utf-8"中文出现乱码
for row in ls: # 逐行写入
f.write(",".join(row)+"\n") # 用逗号组合成字符串形式,末尾加换行符
也可以借助csv模块完成上述操作
常用来存储字典类型
import json
scores = {"Petter": {"math": 96, "physics": 98},
"Paul": {"math": 92, "physics": 99},
"Mary": {"math": 98, "physics": 97}}
with open("score.json", "w", encoding="utf-8") as f: # 写入整个对象
# indent 表示字符串换行+缩进 ensure_ascii=False 显示中文
json.dump(scores, f, indent=4, ensure_ascii=False)
运行结果:
{
"Petter": {
"math": 96,
"physics": 98
},
"Paul": {
"math": 92,
"physics": 99
},
"Mary": {
"math": 98,
"physics": 97
}
}
import json
with open("score.json", "r", encoding="utf-8") as f:
scores = json.load(f) # 加载整个对象
for k, v in scores.items():
print(k, v)
运行结果为:
Petter {‘math’: 96, ‘physics’: 98}
Paul {‘math’: 92, ‘physics’: 99}
Mary {‘math’: 98, ‘physics’: 97}
1 / 0
with open("nobody.csv") as f:
pass
传入一个调用者不期望的值,即使这个值的类型是正确的
s = "1.3"
n = int(s)
下标超出序列边界
ls = [1, 2, 3]
ls[5]
传入对象类型与要求不符
1 + "3"
NameError 使用一个还未被赋予对象的变量
KeyError 试图访问字典里不存在的键
当异常发生的时候,如果不预先设定处理方法,程序就会中断
提高程序的稳定性和可靠性
x = 10
y = 0
try:
z = x / y
except ZeroDivisionError: # 一般来说会预判出现什么错误
# z = x/(y+le-7)
# print(z)
print("0不可以被整除!")
结果:
0不可以被整除!
ls = []
d = {"name": "DoubleS"}
try:
# y = x
# ls[3]
d["age"]
except NameError:
print("变量名不存在")
except IndexError:
print("索引超出界限")
except KeyError:
print("键不存在")
结果:
键不存在
ls = []
d = {"name": "DoubleS"}
try:
# y = x
# ls[3]
d["age"]
except Exception:
print("出错啦!")
结果:
出错啦!
ls = []
d = {"name": "DoubleS"}
try:
y = m
except Exception as e:
print(e)
结果:
name ‘m’ is not defined
try:
with open("浪淘沙_北戴河.txt", encoding="utf-8") as f:
text = f.read()
except FileNotFoundError:
print("找不到该文件")
else:
for s in ["\n", ",", "。", "?"]: # 去掉换行符和标点符号
text = text.replace(s, "")
print("毛主席名作《浪淘沙_北戴河》共由{}个字组成".format(len(text)))
ls = []
d = {"name": "DoubleS"}
# y = x
try:
y = x
# ls[3]
# d["age"]
except Exception as e: # 虽不能获得错误具体类型,但可以获得错误的值
print(e)
finally:
print("不论触不触发异常,都将执行")
结果:
name ‘x’ is not defined
不论触不触发异常,都将执行
已经被封装好
无需再自己“造轮子”
声明导入后,拿来即用
时间库time
随机库random
容器数据类型collection
迭代器函数itertools
数据分析numpy、pandas
数据可视化matplotlib
机器学习scikit-learn
深度学习Tensorflow
文件夹内多个py文件,再加一个__init__.py文件(内容可为空)
import time
start = time.time() # 调用time模块中的time()
time.sleep(3) # 调用time模块中的sleep 休息3秒钟
end = time.time()
print("程序运行用时:{:.2f}秒".format(end-start))
运行结果为:
程序运行用时:3.00秒
from itertools import product
ls = list(product("AB", "123"))
print(ls)
运行结果为:
[(‘A’, ‘1’), (‘A’, ‘2’), (‘A’, ‘3’), (‘B’, ‘1’), (‘B’, ‘2’), (‘B’, ‘3’)]
一次导入多个
from function import fun1, fun2
fun1.f1()
fun2.f2()
from random import *
print(randint(1, 100)) # 产生一个[1, 100]之间的随机整数
print(random()) # 产生一个[0, 1)之间的随机小数
模块搜索查找顺序:
import sys
sys.path.append("C:\\xxxxx") # 注意是双斜杠
以上,为第7节全部内容。
Copyright © 2003-2013 www.wpsshop.cn 版权所有,并保留所有权利。