Linux poll 多路复用：select 的改良版及其局限

导读：在理解了 select 之后，我们来看看它的改进版本——poll。它通过更合理的数据结构解决了 fd 数量上限和接口混乱的问题，但核心的性能瓶颈依然存在。本文将深入解析 poll 的设计细节、对比分析以及完整服务器实现。

一、select 的痛点回顾

学习 poll 之前，有必要再次明确 select 的缺陷，因为 poll 的设计初衷就是为了解决这些问题：

1. fd 数量上限 1024

select 使用位图（bitmap）表示 fd 集合，fd_set 的大小在编译期固定。大多数系统下 FD_SETSIZE = 1024，数值大于等于 1024 的 fd 无法放入 fd_set，也就无法被监控。

2. 接口设计不友好

select 需要三个独立的位图分别管理读、写和异常事件。这些位图既是输入参数又是输出参数：select 返回时会就地修改它们，因此每次调用前都必须重新构建集合，导致逻辑复杂。

// select takes three separate sets, and they have to be rebuilt before every call
fd_set readfds, writefds;
FD_ZERO(&readfds);
FD_SET(fd, &readfds);
// ... select modifies readfds before returning, so it must be re-initialized before the next loop iteration

3. 核心性能问题未解决

select 每次调用都要把整个 fd_set 从用户态拷贝到内核态，内核再以 O(n) 的代价遍历所有被监控的 fd。poll 主要解决了问题 1 和 2，但问题 3（每次全量拷贝 + O(n) 遍历）依然保留，这需要等到 epoll 来解决。

二、poll 函数接口详解

1. 函数原型

#include <poll.h>
// fds: array of pollfd entries to monitor; nfds: number of entries in that array;
// timeout: in milliseconds (-1 blocks indefinitely, 0 returns immediately).
int poll(struct pollfd *fds, nfds_t nfds, int timeout);

相比 select，poll 的参数更少，不需要分开传递三个集合，接口更加简洁。

2. 核心数据结构：pollfd

poll 的关键在于 pollfd 结构体，它将文件描述符与关注的事件封装在一起：

struct pollfd {
    int fd;       /* file descriptor to monitor */
    short events; /* events of interest (input parameter) */
    short revents;/* events that actually occurred (output parameter) */
};

events 和 revents 的取值

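宏名	值（Linux）	含义
`POLLIN`	0x0001	有数据可读（监听 socket 上表示有新连接）
`POLLPRI`	0x0002	有紧急数据可读（如 TCP 带外数据）
`POLLOUT`	0x0004	可以写入而不阻塞
`POLLERR`	0x0008	发生错误（仅出现在 revents 中，无需在 events 中设置）
`POLLHUP`	0x0010	连接被挂断（仅出现在 revents 中）
`POLLNVAL`	0x0020	fd 未打开，请求无效（仅出现在 revents 中）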

timeout 值	行为
`-1`	无限等待（永远阻塞）
`0`	立即返回，只检查当前状态
`> 0`	等待最多 timeout 毫秒

改进项	select	poll
fd 数量限制	1024（固定）	无固定上限（数组大小可动态扩展，实际受进程可打开 fd 数 RLIMIT_NOFILE 限制）
接口设计	三个位图，输入输出混用	pollfd 结构体，events/revents 分离
重建集合	每次必须重建	events 保持不变，revents 由内核在每次调用时重写，无需重建
事件表达	三个集合（读/写/异常）	单结构体内用 events/revents 标志

问题	select	poll
用户态到内核态拷贝	每次拷贝整个 fd_set	每次拷贝整个 pollfd 数组
内核查找就绪 fd	遍历所有 fd，O(n)	遍历所有 pollfd，O(n)

#pragma once

#include <arpa/inet.h>
#include <netinet/in.h>
#include <poll.h>
#include <sys/socket.h>
#include <sys/types.h>
#include <unistd.h>

#include <cerrno>
#include <cstddef>
#include <cstdint>
#include <cstdio>
#include <cstdlib>
#include <cstring>
#include <iostream>
#include <memory>
#include <string>
#include <vector>

const static int g_default_port = 8888;
const static int g_backlog = 8;
const static int g_max_fds = 1024;  // number of pollfd slots allocated by InitServer()

/**
 * Thin wrapper around a TCP socket descriptor.
 *
 * The wrapper only stores the descriptor number; it never closes it. Whoever
 * created or adopted the descriptor remains responsible for closing it.
 */
class TcpSocket {
public:
    /// Wraps an existing descriptor, or -1 for "no socket yet".
    TcpSocket(int fd = -1) : fd_(fd) {}

    /// Returns the wrapped descriptor (-1 if none).
    int GetFd() const { return fd_; }

    /**
     * Creates an IPv4 TCP socket, binds it to INADDR_ANY:port and starts listening.
     *
     * @param port TCP port in the range [0, 65535].
     * @return true on success. On failure returns false with errno describing the
     *         cause; the stored descriptor is left untouched and any socket created
     *         by this call has been closed again.
     */
    bool Build(int port) {
        if (port < 0 || port > 65535) {
            errno = EINVAL;  // htons() would otherwise silently truncate the value
            return false;
        }

        const int sock = socket(AF_INET, SOCK_STREAM, 0);
        if (sock < 0) return false;

        // Best effort: a failure here only affects quick restarts on the same port.
        int opt = 1;
        static_cast<void>(setsockopt(sock, SOL_SOCKET, SO_REUSEADDR, &opt, sizeof(opt)));

        sockaddr_in addr{};  // zero-initialise every field, including padding
        addr.sin_family = AF_INET;
        addr.sin_port = htons(static_cast<uint16_t>(port));
        addr.sin_addr.s_addr = htonl(INADDR_ANY);

        if (bind(sock, reinterpret_cast<sockaddr*>(&addr), sizeof(addr)) < 0 ||
            listen(sock, g_backlog) < 0) {
            const int saved_errno = errno;  // close() may overwrite errno
            close(sock);
            errno = saved_errno;
            return false;
        }

        fd_ = sock;
        return true;
    }

    /**
     * Accepts one pending connection on the wrapped listening socket.
     *
     * @param ip   If non-null, receives the peer address in dotted-decimal form.
     * @param port If non-null, receives the peer port in host byte order.
     * @return the connected descriptor, or -1 on failure (errno set by accept()).
     */
    int AcceptConnection(std::string* ip = nullptr, uint16_t* port = nullptr) {
        sockaddr_in peer{};
        socklen_t len = sizeof(peer);
        const int sock = accept(fd_, reinterpret_cast<sockaddr*>(&peer), &len);
        if (sock < 0) return -1;

        if (ip) {
            // inet_ntop writes into a caller-provided buffer instead of the
            // static storage used by inet_ntoa.
            char text[INET_ADDRSTRLEN] = {0};
            const char* res = inet_ntop(AF_INET, &peer.sin_addr, text, sizeof(text));
            *ip = res ? res : "";
        }
        if (port) *port = ntohs(peer.sin_port);
        return sock;
    }

    /// Same as GetFd(); kept for existing callers.
    int GetSockFd() const { return fd_; }

private:
    int fd_;
};

/**
 * Single-threaded TCP echo server multiplexed with poll().
 *
 * Usage: construct, call InitServer() once, then Loop(). Slot 0 of the pollfd
 * table always holds the listening socket; every other slot holds either a
 * client descriptor or -1 (free). The destructor closes every descriptor that
 * is still registered in the table.
 */
class PollServer {
public:
    PollServer(int port = g_default_port)
        : _port(port),
          _listen_sock(std::make_unique<TcpSocket>()),
          _is_running(false),
          _num(g_max_fds) {}

    // The server owns open descriptors, so copying it would double-close them.
    PollServer(const PollServer&) = delete;
    PollServer& operator=(const PollServer&) = delete;

    /**
     * Creates the listening socket and allocates the pollfd table.
     * Terminates the process with exit(1) if the listening socket cannot be set up.
     */
    void InitServer() {
        // Release descriptors left over from an earlier InitServer() call.
        CloseAllFds();

        if (!_listen_sock->Build(_port)) {
            perror("build listen socket failed");
            exit(1);
        }
        printf("[PollServer] 服务器初始化完成，监听端口 %d\n", _port);

        pollfd idle{};
        idle.fd = -1;  // poll() ignores entries whose fd is negative
        _rfds.assign(static_cast<std::size_t>(_num), idle);

        // The listening socket always lives in slot 0.
        _rfds[0].fd = _listen_sock->GetSockFd();
        _rfds[0].events = POLLIN;
    }

    /**
     * Runs the event loop until Stop() is called, the listening socket fails,
     * or poll() reports an unrecoverable error. Returns immediately if
     * InitServer() has not been called.
     */
    void Loop() {
        if (_rfds.empty()) {
            fprintf(stderr, "[PollServer] Loop() called before InitServer()\n");
            return;
        }

        _is_running = true;
        while (_is_running) {
            PrintDebug();
            const int timeout = -1;  // block until something happens
            const int n = poll(_rfds.data(), static_cast<nfds_t>(_rfds.size()), timeout);

            if (n > 0) {
                HandleEvent(n);
            } else if (n == 0) {
                printf("[PollServer] poll 超时\n");
            } else if (errno == EINTR || errno == EAGAIN) {
                continue;  // interrupted or transient: retry (re-checks _is_running)
            } else {
                // Errors such as EINVAL/EFAULT will not go away; retrying would spin.
                perror("poll error");
                break;
            }
        }
        _is_running = false;
    }

    /// Requests the loop to exit; takes effect the next time poll() returns.
    void Stop() { _is_running = false; }

    ~PollServer() { CloseAllFds(); }

private:
    /**
     * Dispatches the events reported by the last poll() call.
     *
     * @param ready_count Return value of poll(): number of entries whose
     *                    revents is non-zero. Scanning stops once that many
     *                    entries have been handled.
     */
    void HandleEvent(int ready_count) {
        int remaining = ready_count;
        for (std::size_t i = 0; i < _rfds.size() && remaining > 0; ++i) {
            const int fd = _rfds[i].fd;
            const short revents = _rfds[i].revents;
            if (fd < 0 || revents == 0) continue;  // free slot or nothing reported
            --remaining;

            if (fd == _listen_sock->GetSockFd()) {
                if (revents & POLLIN) {
                    HandleNewConnection();
                } else {
                    // Only error flags are set: the listener is unusable and would
                    // make poll() return immediately forever.
                    printf("[PollServer] 监听 socket 异常 (revents=0x%x)，停止服务\n",
                           static_cast<unsigned>(revents));
                    _is_running = false;
                    return;
                }
                continue;
            }

            if (revents & POLLNVAL) {
                // The descriptor is not open; just free the slot, do not close().
                printf("[PollServer] fd=%d 无效，移除\n", fd);
                _rfds[i].fd = -1;
                _rfds[i].events = 0;
                _rfds[i].revents = 0;
            } else if (revents & POLLIN) {
                // recv() inside reports EOF or errors that accompany POLLIN.
                HandleData(static_cast<int>(i), fd);
            } else if (revents & (POLLERR | POLLHUP)) {
                printf("[PollServer] fd=%d 连接异常，关闭\n", fd);
                CloseConnection(static_cast<int>(i));
            }
            // No manual reset of revents: poll() rewrites it on every call.
        }
    }

    /**
     * Accepts one pending connection and registers it in a free slot.
     * The connection is closed immediately if the table is full.
     */
    void HandleNewConnection() {
        std::string client_ip;
        uint16_t client_port = 0;
        const int sock = _listen_sock->AcceptConnection(&client_ip, &client_port);
        if (sock == -1) {
            perror("accept error");
            return;
        }
        printf("[PollServer] 新连接：%s:%d, fd=%d\n", client_ip.c_str(), client_port, sock);

        const int pos = FindEmptySlot();
        if (pos == -1) {
            printf("[PollServer] 服务器已满，拒绝连接 fd=%d\n", sock);
            close(sock);
            return;
        }

        _rfds[pos].fd = sock;
        _rfds[pos].events = POLLIN;
        _rfds[pos].revents = 0;
        printf("[PollServer] fd=%d 加入监控，位置 pos=%d\n", sock, pos);
    }

    /**
     * Reads once from a client and echoes the data back with a prefix.
     * Closes the connection on EOF, on a receive error other than EINTR,
     * or when the reply cannot be sent.
     *
     * @param pos Slot index of the client in the pollfd table.
     * @param fd  Client descriptor stored in that slot.
     */
    void HandleData(int pos, int fd) {
        char buffer[1024] = {0};
        const ssize_t n = recv(fd, buffer, sizeof(buffer) - 1, 0);

        if (n > 0) {
            buffer[n] = '\0';
            printf("[PollServer] fd=%d 收到：%s\n", fd, buffer);

            const std::string response = std::string("服务器收到：") + buffer;
            if (!SendAll(fd, response)) {
                perror("send error");
                printf("[PollServer] fd=%d 发送失败，关闭\n", fd);
                CloseConnection(pos);
            }
        } else if (n == 0) {
            printf("[PollServer] fd=%d 正常断开\n", fd);
            CloseConnection(pos);
        } else if (errno != EINTR) {
            perror("recv error");
            printf("[PollServer] fd=%d 出错，关闭\n", fd);
            CloseConnection(pos);
        }
    }

    /**
     * Sends the whole buffer, retrying after EINTR and after partial writes.
     * @return false if send() fails (errno set by send()).
     */
    static bool SendAll(int fd, const std::string& data) {
        int flags = 0;
#ifdef MSG_NOSIGNAL
        // Report a closed peer as EPIPE instead of raising SIGPIPE, which would
        // terminate the whole server by default.
        flags = MSG_NOSIGNAL;
#endif
        std::size_t sent = 0;
        while (sent < data.size()) {
            const ssize_t n = send(fd, data.data() + sent, data.size() - sent, flags);
            if (n < 0 && errno == EINTR) continue;
            if (n <= 0) return false;
            sent += static_cast<std::size_t>(n);
        }
        return true;
    }

    /// Closes the descriptor in slot `pos` (if any) and marks the slot free.
    void CloseConnection(int pos) {
        if (_rfds[pos].fd >= 0) close(_rfds[pos].fd);
        _rfds[pos].fd = -1;
        _rfds[pos].events = 0;
        _rfds[pos].revents = 0;
    }

    /// Closes every registered descriptor, including the listener in slot 0.
    void CloseAllFds() {
        for (pollfd& slot : _rfds) {
            if (slot.fd >= 0) close(slot.fd);
            slot.fd = -1;
            slot.events = 0;
            slot.revents = 0;
        }
    }

    /// Returns the index of the first free client slot, or -1 if the table is full.
    int FindEmptySlot() {
        // Slot 0 is reserved for the listening socket.
        for (std::size_t i = 1; i < _rfds.size(); ++i) {
            if (_rfds[i].fd == -1) return static_cast<int>(i);
        }
        return -1;
    }

    /// Prints every descriptor currently registered in the table (debug aid).
    void PrintDebug() {
        printf("[PollServer] 当前监控的 fd：");
        for (const pollfd& slot : _rfds) {
            if (slot.fd != -1) printf("%d ", slot.fd);
        }
        printf("\n");
    }

private:
    int _port;
    std::unique_ptr<TcpSocket> _listen_sock;
    bool _is_running;            // plain flag, not synchronised across threads
    std::vector<pollfd> _rfds;   // pollfd table; empty until InitServer()
    int _num;                    // number of slots InitServer() allocates
};

比较项	select	poll	epoll
fd 数量限制	1024（FD_SETSIZE）	无限制	无限制
数据结构	三个位图（fd_set）	pollfd 数组	红黑树 + 就绪队列
用户到内核拷贝	每次全量拷贝	每次全量拷贝	只在 ctl 时拷贝
查找就绪 fd	遍历所有，O(n)	遍历所有，O(n)	回调机制，O(k)
集合重建	每次必须重建	events 保留，revents 由内核每次重写	内核维护，无需重建
工作模式	LT 模式	LT 模式	LT + ET 模式
跨平台	所有平台支持	类 Unix 平台支持	Linux 专属
适用场景	连接数少（<100）	连接数中等	高并发（万级以上）

#	要点	关键点
1	pollfd 结构体	fd + events（输入）+ revents（输出），设计比 select 清晰
2	无数量限制	数组大小由用户决定，可动态扩容
3	-1 标记空闲	poll 自动忽略 fd < 0 的条目
4	revents 由内核重写	每次 poll 返回时内核都会重新填写每个条目的 revents（无事件则为 0），无需手动清零
5	仍是 O(n)	全量拷贝 + 全量遍历的问题未解决

Linux poll 多路复用：select 的改良版及其局限