Python 文件操作深度解析与避坑指南

Python 文件操作深度解析与避坑指南 | 极客日志

# 打开文件（模式：'r' 读取，'w' 写入，'a' 追加，'b' 二进制）
file = open('example.txt', 'r')  # 默认模式是 'r'

# 读取文件内容
content = file.read()      # 读取全部内容
content = file.readline()  # 读取一行
content = file.readlines() # 读取所有行，返回列表

# 写入文件
file.write("Hello, World!\n")           # 写入字符串
file.writelines(["Line 1\n", "Line 2\n"]) # 写入多行

# 关闭文件（重要！）
file.close()

# ✅ 最佳实践：使用 with 语句
with open('example.txt', 'r') as file:
    content = file.read()
    # 文件在代码块结束时自动关闭

模式	说明	适用场景
`'r'`	读取（默认）	读取现有文件
`'w'`	写入（覆盖）	创建新文件或覆盖现有文件
`'a'`	追加	在文件末尾添加内容（不覆盖）
`'b'`	二进制模式	处理图片、音频等二进制文件
`'+'`	读写模式	同时读写（如 `'r+'`）
`'t'`	文本模式（默认）	处理文本文件
`'x'`	独占创建	仅当文件不存在时创建

# ✅ 正确：逐行读取大文件
with open('big_file.txt', 'r') as file:
    for line in file:
        # 处理每一行（避免内存溢出）
        process_line(line.strip())

import csv

# 写入 CSV
data = [['Name', 'Age'], ['Alice', 30], ['Bob', 25]]
with open('users.csv', 'w', newline='') as file:
    writer = csv.writer(file)
    writer.writerows(data)

# 读取 CSV
with open('users.csv', 'r') as file:
    reader = csv.reader(file)
    for row in reader:
        print(row)  # 输出：['Name', 'Age'], ['Alice', '30'], ...

import json

# 写入 JSON
data = {"name": "Alice", "age": 30}
with open('data.json', 'w') as file:
    json.dump(data, file, indent=2)  # 格式化输出

# 读取 JSON
with open('data.json', 'r') as file:
    loaded_data = json.load(file)
    print(loaded_data['name'])  # Alice

# 读取二进制文件
with open('image.jpg', 'rb') as file:
    image_data = file.read()

# 写入二进制文件
with open('copy.jpg', 'wb') as file:
    file.write(image_data)

import os

# 获取当前脚本目录
BASE_DIR = os.path.dirname(os.path.abspath(__file__))

# 安全构建路径
file_path = os.path.join(BASE_DIR, 'data', 'file.txt')

# 创建目录（如果不存在）
os.makedirs(os.path.dirname(file_path), exist_ok=True)

# 写入文件
with open(file_path, 'w') as file:
    file.write("Hello")

# ❌ 错误：忘记关闭文件
file = open('data.txt', 'r')
content = file.read()
# 没有 file.close()，可能造成资源泄漏

# ❌ 错误：使用 'w' 模式追加内容
with open('log.txt', 'w') as file:
    file.write("New log entry\n")  # 会覆盖原有内容

# ✅ 正确：使用 'a' 模式追加
with open('log.txt', 'a') as file:
    file.write("New log entry\n")

# ❌ 错误：未指定编码
with open('chinese.txt', 'r') as file:
    content = file.read()

# ✅ 正确：指定编码
with open('chinese.txt', 'r', encoding='utf-8') as file:
    content = file.read()

# ❌ 错误：大文件一次性读取
with open('huge_file.txt', 'r') as file:
    content = file.read()  # 如果文件很大，会内存溢出

# ✅ 正确：逐行处理
with open('huge_file.txt', 'r') as file:
    for line in file:
        # 处理每一行

# ❌ 错误：相对路径
with open('data.csv', 'r') as file:
    # 如果当前工作目录不是代码所在目录，会找不到文件

# ✅ 正确：使用 os.path
import os
BASE_DIR = os.path.dirname(os.path.abspath(__file__))
file_path = os.path.join(BASE_DIR, 'data.csv')
with open(file_path, 'r') as file:
    content = file.read()

# ❌ 错误：未处理异常
with open('missing_file.txt', 'r') as file:
    content = file.read()

# ✅ 正确：处理异常
try:
    with open('missing_file.txt', 'r') as file:
        content = file.read()
except FileNotFoundError:
    print("File not found")

# ❌ 错误：未刷新缓冲区
with open('data.txt', 'w') as file:
    file.write("Hello")  # 数据可能还在缓冲区，未写入磁盘

# ✅ 正确：使用 flush()
with open('data.txt', 'w') as file:
    file.write("Hello")
    file.flush()  # 强制刷新到磁盘

最佳实践	说明	示例
始终使用 `with` 语句	自动管理文件关闭，避免泄漏	`with open(...):`
指定编码	避免乱码	`open(..., encoding='utf-8')`
大文件用逐行处理	避免内存溢出	`for line in file:`
使用 `os.path` 处理路径	确保跨平台兼容	`os.path.join(BASE_DIR, 'file')`
处理文件不存在异常	防止程序崩溃	`try/except FileNotFoundError`
使用标准库模块	避免手动解析	`csv`, `json`, `pickle`

import datetime

def log_message(message):
    """记录日志到文件（安全追加）"""
    with open('app.log', 'a', encoding='utf-8') as log_file:
        log_file.write(f"{datetime.datetime.now()}: {message}\n")

# 使用 log_message("Application started")
log_message("User logged in")

import csv
import os

def process_csv(input_file, output_file):
    """处理 CSV 文件：添加一列"""
    # 确保输出目录存在
    os.makedirs(os.path.dirname(os.path.abspath(output_file)), exist_ok=True)
    
    with open(input_file, 'r', encoding='utf-8') as infile, \
         open(output_file, 'w', encoding='utf-8', newline='') as outfile:
        reader = csv.reader(infile)
        writer = csv.writer(outfile)
        
        # 读取标题行
        header = next(reader)
        header.append('processed')
        writer.writerow(header)
        
        for row in reader:
            row.append('yes')
            writer.writerow(row)

# 使用 process_csv('input.csv', 'output/processed.csv')

import json
import os

def load_config(config_path):
    """安全加载 JSON 配置文件"""
    if not os.path.exists(config_path):
        raise FileNotFoundError(f"Config file not found: {config_path}")
    try:
        with open(config_path, 'r', encoding='utf-8') as config_file:
            return json.load(config_file)
    except json.JSONDecodeError as e:
        raise ValueError(f"Invalid JSON format in {config_path}: {e}")

# 使用
try:
    config = load_config('config.json')
    print(config['database'])
except FileNotFoundError as e:
    print(f"Error: {e}")

陷阱	问题	解决方案
忘记关闭文件	资源泄漏	使用 `with` 语句
错误模式（覆盖）	丢失数据	用 `'a'` 模式追加
大文件一次性读取	内存溢出	逐行读取
未指定编码	乱码	指定 `encoding='utf-8'`
相对路径问题	文件找不到	使用 `os.path`
未处理文件不存在	程序崩溃	添加 `FileNotFoundError` 处理
未刷新缓冲区	数据未写入磁盘	`file.flush()`

import os
import json
from datetime import datetime

def safe_write_file(file_path, content, encoding='utf-8'):
    """安全写入文件（带异常处理）"""
    try:
        # 确保目录存在
        os.makedirs(os.path.dirname(os.path.abspath(file_path)), exist_ok=True)
        with open(file_path, 'w', encoding=encoding) as file:
            file.write(content)
        print(f"Successfully wrote to {file_path}")
    except IOError as e:
        print(f"IO error writing to {file_path}: {e}")
        raise

def safe_read_file(file_path, encoding='utf-8'):
    """安全读取文件（带异常处理）"""
    try:
        with open(file_path, 'r', encoding=encoding) as file:
            return file.read()
    except IOError as e:
        print(f"IO error reading from {file_path}: {e}")
        raise

def process_data():
    """处理数据并保存为 JSON"""
    data = {
        "timestamp": datetime.now().isoformat(),
        "content": "Processed data"
    }
    # 生成安全的文件路径
    output_dir = "data"
    output_file = os.path.join(output_dir, "processed_data.json")
    # 安全写入
    safe_write_file(output_file, json.dumps(data, indent=2))

if __name__ == "__main__":
    try:
        process_data()
        print("Data processing completed successfully")
    except Exception as e:
        print(f"Critical error: {e}")

Python 文件操作深度解析与避坑指南

📌 一、文件操作的基本语法结构

1. 基础语法：打开、读取、写入、关闭

2. 推荐方式：使用 `with` 语句（自动管理文件关闭）

3. 文件模式速查表

🔧 二、进阶使用与实际场景

场景 1：处理大文件（逐行读取）

场景 2：CSV 文件操作（使用 `csv` 模块）

场景 3：JSON 文件操作（使用 `json` 模块）

场景 4：二进制文件操作

场景 5：文件路径安全处理（使用 `os.path`）

⚠️ 三、致命陷阱与避坑指南

陷阱 1：忘记关闭文件（资源泄漏）

陷阱 2：错误的文件模式（覆盖数据）

陷阱 3：未处理编码问题（乱码）

陷阱 4：大文件一次性读取（内存溢出）

陷阱 5：相对路径问题（文件找不到）

陷阱 6：未处理文件不存在异常

陷阱 7：在写入后未刷新缓冲区

📌 四、文件操作最佳实践

🌟 五、实际场景实例

实例 1：日志记录（安全追加）

实例 2：批量处理 CSV 文件

实例 3：安全读取配置文件

📊 六、文件操作陷阱速查表

💡 七、总结：文件操作的 Pythonic 哲学

✅ 八、实践示例：完整文件处理流程

🏆 九、推荐：文件操作的 5 个黄金法则

更多推荐文章

相关免费在线工具

Python 文件操作深度解析与避坑指南

📌 一、文件操作的基本语法结构

1. 基础语法：打开、读取、写入、关闭

2. 推荐方式：使用 with 语句（自动管理文件关闭）

3. 文件模式速查表

🔧 二、进阶使用与实际场景

场景 1：处理大文件（逐行读取）

场景 2：CSV 文件操作（使用 csv 模块）

场景 3：JSON 文件操作（使用 json 模块）

场景 4：二进制文件操作

场景 5：文件路径安全处理（使用 os.path）

⚠️ 三、致命陷阱与避坑指南

陷阱 1：忘记关闭文件（资源泄漏）

陷阱 2：错误的文件模式（覆盖数据）

陷阱 3：未处理编码问题（乱码）

陷阱 4：大文件一次性读取（内存溢出）

陷阱 5：相对路径问题（文件找不到）

陷阱 6：未处理文件不存在异常

陷阱 7：在写入后未刷新缓冲区

📌 四、文件操作最佳实践

🌟 五、实际场景实例

实例 1：日志记录（安全追加）

实例 2：批量处理 CSV 文件

实例 3：安全读取配置文件

📊 六、文件操作陷阱速查表

💡 七、总结：文件操作的 Pythonic 哲学

✅ 八、实践示例：完整文件处理流程

🏆 九、推荐：文件操作的 5 个黄金法则

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

2. 推荐方式：使用 `with` 语句（自动管理文件关闭）

场景 2：CSV 文件操作（使用 `csv` 模块）

场景 3：JSON 文件操作（使用 `json` 模块）

场景 5：文件路径安全处理（使用 `os.path`）