Python架构知识点大全（一）

2026-04-02 48

版权

本文内容由阿里云实名注册用户自发贡献，版权归原作者所有，阿里云开发者社区不拥有其著作权，亦不承担相应法律责任。具体规则请查看《阿里云开发者社区用户服务协议》和《阿里云开发者社区知识产权保护指引》。如果您发现本社区中有涉嫌抄袭的内容，填写侵权投诉表单进行举报，一经查实，本社区将立刻删除涉嫌侵权内容。

简介： 教程来源 https://htnus.cn/category/artificial-intelligence.html 本文系统解析Python架构核心：从三层架构（用户代码→核心层→内置库→C扩展）、CPython等五大解释器，到对象模型、引用计数与分代GC、内存池机制等底层原理，助开发者深入理解运行机制，提升代码性能与可靠性。

Python作为一门高级编程语言，其架构设计体现了“优雅、明确、简单”的哲学思想。从解释器的核心实现到内存管理机制，从字节码执行到垃圾回收，Python的架构设计融合了多种经典的设计模式和技术方案。本文将系统全面地梳理Python架构的核心知识点，从解释器原理到并发模型，从内存管理到性能优化，帮助开发者深入理解Python的内部工作机制，写出更高效、更可靠的Python程序。

一、Python架构概述

1.1 Python的整体架构
Python的架构可以分为三个主要层次：

┌─────────────────────────────────────────────────────────────┐
│                    Python层（用户代码）                       │
│  ┌─────────────┐ ┌─────────────┐ ┌─────────────────────┐    │
│  │  .py文件    │ │  模块/包    │ │  用户定义的类/函数   │    │
│  └─────────────┘ └─────────────┘ └─────────────────────┘    │
├─────────────────────────────────────────────────────────────┤
│                    核心层（Core）                            │
│  ┌─────────────────────────────────────────────────────┐    │
│  │                  编译器（Compiler）                   │    │
│  │  词法分析 → 语法分析 → 抽象语法树 → 字节码生成        │    │
│  └─────────────────────────────────────────────────────┘    │
│  ┌─────────────────────────────────────────────────────┐    │
│  │                  虚拟机（VM）                        │    │
│  │  字节码解释器 | 帧栈管理 | 异常处理 | 协程支持       │    │
│  └─────────────────────────────────────────────────────┘    │
│  ┌─────────────────────────────────────────────────────┐    │
│  │                  运行时（Runtime）                   │    │
│  │  对象模型 | 类型系统 | 内存管理 | 垃圾回收           │    │
│  └─────────────────────────────────────────────────────┘    │
├─────────────────────────────────────────────────────────────┤
│                     内置库层（Built-ins）                     │
│  ┌──────────┐ ┌──────────┐ ┌──────────┐ ┌──────────┐       │
│  │ 内置类型 │ │ 内置函数 │ │ 异常系统 │ │ 核心模块 │       │
│  └──────────┘ └──────────┘ └──────────┘ └──────────┘       │
├─────────────────────────────────────────────────────────────┤
│                    C语言扩展层（Extension）                   │
│  ┌─────────────────────────────────────────────────────┐    │
│  │         C API | Cython | ctypes | CFFI               │    │
│  └─────────────────────────────────────────────────────┘    │
└─────────────────────────────────────────────────────────────┘

1.2 Python解释器的类型

# Python有多种解释器实现

# 1. CPython - 官方参考实现（C语言编写）
# 最常用的Python解释器

# 2. PyPy - JIT编译实现（RPython编写）
# 适合长时间运行的程序
def heavy_computation():
    total = 0
    for i in range(10000000):
        total += i
    return total

# 3. Jython - Java平台实现
# 可以无缝调用Java库

# 4. IronPython - .NET平台实现
# 可以无缝调用.NET库

# 5. MicroPython - 嵌入式设备实现
# 适合资源受限的环境

1.3 Python的执行模型

# Python执行流程：源代码 → 字节码 → 虚拟机执行

import dis

def example_function(x, y):
    result = x + y
    return result

# 查看字节码
print("字节码:")
dis.dis(example_function)

# 编译为字节码
code = compile('print("Hello")', '<string>', 'exec')
print(f"\n代码对象类型: {type(code)}")
print(f"字节码: {code.co_code}")

# 执行字节码
exec(code)

# Python字节码指令示例
def loop_example(n):
    total = 0
    for i in range(n):
        total += i
    return total

print("\n循环的字节码:")
dis.dis(loop_example)

二、对象模型

2.1 Python对象体系

# Python中一切皆对象
print("对象类型层次结构:")

# 类型对象
print(f"int的类型: {type(int)}")
print(f"str的类型: {type(str)}")
print(f"list的类型: {type(list)}")

# 元类（metaclass）
class Meta(type):
    pass

class MyClass(metaclass=Meta):
    pass

print(f"MyClass的类型: {type(MyClass)}")  # <class '__main__.Meta'>

# 对象的基本结构
class Demo:
    pass

obj = Demo()
print(f"对象ID: {id(obj)}")
print(f"对象类型: {type(obj)}")
print(f"对象属性: {dir(obj)}")

# PyObject结构（C层面）
# typedef struct _object {
#     Py_ssize_t ob_refcnt;  // 引用计数
#     PyTypeObject *ob_type; // 类型指针
# } PyObject;

2.2 可变对象与不可变对象

# 不可变对象：int, float, str, tuple, frozenset
# 可变对象：list, dict, set, bytearray

# 不可变对象的行为
a = 10
b = a
print(f"a = {a}, b = {b}, a is b: {a is b}")

a += 5
print(f"a = {a}, b = {b}, a is b: {a is b}")  # a改变，b不变

# 可变对象的行为
list1 = [1, 2, 3]
list2 = list1
print(f"list1 = {list1}, list2 = {list2}, list1 is list2: {list1 is list2}")

list1.append(4)
print(f"list1 = {list1}, list2 = {list2}")  # list2也跟着改变

# 小整数缓存（-5到256）
a = 256
b = 256
print(f"256的地址相同: {a is b}")  # True

c = 257
d = 257
print(f"257的地址相同: {c is d}")  # False（CPython特性）

2.3 类型系统

# Python的鸭子类型（Duck Typing）
class Duck:
    def quack(self):
        return "嘎嘎"

    def swim(self):
        return "游泳"

class Person:
    def quack(self):
        return "模仿鸭子叫"

    def swim(self):
        return "学游泳"

def make_it_quack(obj):
    # 不检查类型，只检查行为
    return obj.quack()

duck = Duck()
person = Person()
print(make_it_quack(duck))    # 嘎嘎
print(make_it_quack(person))  # 模仿鸭子叫

# 抽象基类（ABC）
from abc import ABC, abstractmethod

class Animal(ABC):
    @abstractmethod
    def make_sound(self):
        pass

class Dog(Animal):
    def make_sound(self):
        return "汪汪"

class Cat(Animal):
    def make_sound(self):
        return "喵喵"

# Animal()  # TypeError: 不能实例化抽象类

# 类型注解（Type Hints）
from typing import List, Dict, Optional

def process_items(items: List[str]) -> Dict[str, int]:
    return {item: len(item) for item in items}

def find_user(user_id: int) -> Optional[Dict[str, str]]:
    if user_id == 1:
        return {"name": "张三"}
    return None

三、内存管理

3.1 引用计数

import sys

# 引用计数机制
class RefCounter:
    pass

obj = RefCounter()
print(f"初始引用计数: {sys.getrefcount(obj) - 1}")  # 减去临时引用

# 增加引用计数
ref1 = obj
ref2 = obj
print(f"添加引用后: {sys.getrefcount(obj) - 1}")

# 删除引用
del ref1
print(f"删除一个引用后: {sys.getrefcount(obj) - 1}")

# 循环引用问题
class Node:
    def __init__(self, value):
        self.value = value
        self.next = None

# 创建循环引用
a = Node(1)
b = Node(2)
a.next = b
b.next = a

# 引用计数无法回收循环引用
del a
del b
# Node对象仍在内存中，需要垃圾回收

3.2 垃圾回收

import gc

# 分代垃圾回收
# 三代：0代（年轻代）、1代、2代（老年代）

# 查看垃圾回收阈值
print(f"垃圾回收阈值: {gc.get_threshold()}")  # (700, 10, 10)

# 手动触发垃圾回收
gc.collect()

# 监控垃圾回收
gc.set_debug(gc.DEBUG_STATS)

class WithFinalizer:
    def __del__(self):
        print(f"对象 {id(self)} 被销毁")

# 创建大量对象触发垃圾回收
objects = []
for i in range(10000):
    objects.append(WithFinalizer())

objects.clear()
gc.collect()

# 禁用垃圾回收（不推荐）
gc.disable()
# 执行代码
gc.enable()

# 查看无法回收的对象
import gc

class Circular:
    def __init__(self):
        self.self = self

circular = Circular()
circular_ref = circular
del circular

# 查看垃圾回收器中的对象
print(f"垃圾回收器中的对象数: {len(gc.get_objects())}")

3.3 内存池机制

# Python的内存管理层次：
# 1. 小块内存（< 256字节）：使用内存池（arena）
# 2. 大块内存（>= 256字节）：使用系统malloc

import sys
import tracemalloc

# 查看对象内存大小
small_list = [1, 2, 3]
large_list = list(range(1000))

print(f"小列表内存: {sys.getsizeof(small_list)} 字节")
print(f"大列表内存: {sys.getsizeof(large_list)} 字节")

# 内存跟踪
tracemalloc.start()

# 分配内存
data = [bytearray(1000) for _ in range(100)]

# 获取内存快照
snapshot = tracemalloc.take_snapshot()
top_stats = snapshot.statistics('lineno')

print("\n内存分配统计:")
for stat in top_stats[:5]:
    print(stat)

tracemalloc.stop()

# 对象内存布局
class Point:
    __slots__ = ('x', 'y')  # 减少内存占用
    def __init__(self, x, y):
        self.x = x
        self.y = y

class PointRegular:
    def __init__(self, x, y):
        self.x = x
        self.y = y

p1 = PointRegular(1, 2)
p2 = Point(1, 2)
print(f"普通类内存: {sys.getsizeof(p1)} 字节")
print(f"__slots__类内存: {sys.getsizeof(p2)} 字节")

来源：
https://htnus.cn/

Python架构知识点大全（一）

一、Python架构概述

二、对象模型

三、内存管理

热门文章

最新文章

相关电子书

探索云世界

热门

云计算

大数据

云原生

人工智能

数据库

开发与运维

活动广场

任务中心

训练营

直播

乘风者计划

下载

镜像站

技术资料

Python架构知识点大全（一）

一、Python架构概述

二、对象模型

三、内存管理

热门文章

最新文章

相关电子书