Linux 基础 IO 详解：从 C 标准库到系统调用的底层逻辑

Linux 基础 IO 详解：从 C 标准库到系统调用的底层逻辑 | 极客日志

#include <stdio.h>
#include <stdlib.h>

/*
 * Write a small array of ints to "data.bin" in binary mode and report how
 * many elements were actually written.
 *
 * Returns 0 on success, 1 if the file cannot be opened, is only partially
 * written, or cannot be closed cleanly.
 */
int main() {
    int numbers[] = {1, 2, 3, 4, 5};
    /* Derive the element count from the array so the two cannot drift apart. */
    size_t count = sizeof numbers / sizeof numbers[0];

    FILE *file = fopen("data.bin", "wb");
    if (file == NULL) {
        perror("fopen");
        return 1;
    }

    /* fwrite returns the number of complete elements written. */
    size_t written = fwrite(numbers, sizeof numbers[0], count, file);
    printf("写入了 %zu 个整数\n", written);

    /* fclose flushes the stream buffer, so a failure here means lost data. */
    if (fclose(file) != 0) {
        perror("fclose");
        return 1;
    }
    return written == count ? 0 : 1;
}

#include <stdio.h>
#include <stdlib.h>

/*
 * Read up to five ints from "data.bin" in binary mode and print them.
 *
 * Returns 0 on success, 1 if the file cannot be opened.
 */
int main() {
    int read_numbers[5];
    size_t capacity = sizeof read_numbers / sizeof read_numbers[0];

    FILE *file = fopen("data.bin", "rb");
    if (file == NULL) {
        perror("fopen");
        return 1;
    }

    /* fread returns the number of complete elements read, possibly < capacity. */
    size_t nread = fread(read_numbers, sizeof read_numbers[0], capacity, file);
    printf("读取了 %zu 个整数\n", nread);

    /* Index with size_t so the comparison against nread is not signed/unsigned. */
    for (size_t i = 0; i < nread; i++) {
        printf("%d ", read_numbers[i]);
    }
    printf("\n");

    fclose(file);
    return 0;
}

/*
 * Set the file position of a stream.
 *
 * stream: the stream whose position is being set
 * offset: displacement in bytes
 * whence: the base position the offset is measured from
 *
 * Returns 0 on success and a non-zero value on failure.
 */
int fseek(FILE *stream, long offset, int whence);

常量	含义
`SEEK_SET`	从文件开头开始偏移
`SEEK_CUR`	从当前位置偏移
`SEEK_END`	从文件末尾开始偏移

/*
 * Reset the file position of a stream to the beginning of the file.
 *
 * stream: the stream to reset
 *
 * Returns nothing.
 */
void rewind(FILE *stream);

名称	类型	默认连接的设备	用途
`stdin`	输入流	键盘	接收输入
`stdout`	输出流	屏幕（终端）	打印正常输出内容
`stderr`	输出流	屏幕（终端）	打印错误或调试信息

#include <stdio.h>
#include <string.h>

/*
 * Emit three greeting lines on stdout, each through a different stdio
 * call: fwrite, printf and fprintf.
 */
int main() {
    const char *greeting = "hello fwrite\n";
    size_t greeting_len = strlen(greeting);

    /* One element of greeting_len bytes, written straight to stdout. */
    fwrite(greeting, greeting_len, 1, stdout);

    printf("hello printf\n");

    fprintf(stdout, "hello fprintf\n");

    return 0;
}

#include <stdio.h>
// Flag values; each one occupies a distinct bit so they can be OR-ed together.
#define ONE 0x01 // 0000 0001
#define TWO 0x02 // 0000 0010
#define THREE 0x04 // 0000 0100

/*
 * Print one message for every flag bit (ONE, TWO, THREE) that is set in
 * `flags`, followed by a newline.
 */
void func(int flags) {
    static const struct {
        int bit;
        const char *text;
    } table[] = {
        {ONE, "flags has ONE! "},
        {TWO, "flags has TWO! "},
        {THREE, "flags has THREE! "},
    };

    /* Entries are tested in the order ONE, TWO, THREE. */
    for (size_t i = 0; i < sizeof table / sizeof table[0]; i++) {
        if ((flags & table[i].bit) != 0) {
            fputs(table[i].text, stdout);
        }
    }
    fputs("\n", stdout);
}

/*
 * Call func() with several flag combinations: a single flag, another single
 * flag, two flags OR-ed together, and all three flags.
 */
int main() {
    const int combos[] = {
        ONE,
        THREE,
        ONE | TWO,
        ONE | THREE | TWO,
    };

    for (size_t i = 0; i < sizeof combos / sizeof combos[0]; i++) {
        func(combos[i]);
    }
    return 0;
}

宏名	含义
`O_RDONLY`	只读
`O_WRONLY`	只写
`O_RDWR`	读写
`O_CREAT`	文件不存在则创建
`O_TRUNC`	文件存在则清空内容
`O_APPEND`	每次写入都追加到文件末尾
`O_EXCL`	与 `O_CREAT` 一起使用；若文件已存在则 open 失败（返回 -1，errno 为 EEXIST），从而确保文件由本次调用创建
`O_NONBLOCK`	非阻塞打开（如设备或管道）

// Example call: open "log.txt" write-only, with O_CREAT and permission bits 0644.
open("log.txt", O_WRONLY | O_CREAT, 0644);

#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <unistd.h>
#include <string.h>

/*
 * Copy the contents of "myfile" to stdout using the read() system call.
 *
 * Returns 0 on success, 1 if the file cannot be opened or a read fails.
 */
int main() {
    int fd = open("myfile", O_RDONLY);
    if (fd < 0) {
        perror("open");
        return 1;
    }

    char buf[1024];
    int status = 0;
    for (;;) {
        ssize_t s = read(fd, buf, sizeof(buf));
        if (s < 0) {
            perror("read");
            status = 1;
            break;
        }
        if (s == 0) {
            break; /* end of file */
        }
        /*
         * read() does not NUL-terminate the buffer, so print exactly the
         * s bytes that were read instead of treating buf as a C string.
         */
        fwrite(buf, 1, (size_t)s, stdout);
    }

    close(fd);
    return status;
}

#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <unistd.h>
#include <string.h>

/*
 * Write the line "hello bit!" five times to "myfile" using the write()
 * system call, creating the file with mode 0644 if needed.
 *
 * Returns 0 on success, 1 if the file cannot be opened or a write fails
 * or is short.
 */
int main() {
    /* Clear the umask so the requested mode 0644 is applied unchanged. */
    umask(0);
    int fd = open("myfile", O_WRONLY | O_CREAT, 0644);
    if (fd < 0) {
        perror("open");
        return 1;
    }

    const char *msg = "hello bit!\n";
    size_t len = strlen(msg);
    int status = 0;

    for (int count = 5; count > 0; count--) {
        /*
         * write(fd, buf, n): buf is the start of the data, n is the number
         * of bytes we want written; the return value is the number of bytes
         * actually written, or -1 on error.
         */
        ssize_t n = write(fd, msg, len);
        if (n < 0) {
            perror("write");
            status = 1;
            break;
        }
        if ((size_t)n != len) {
            fprintf(stderr, "write: short write (%zd of %zu bytes)\n", n, len);
            status = 1;
            break;
        }
    }

    close(fd);
    return status;
}

#include <stdio.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <stdlib.h>

/*
 * Close descriptor 1, open "myfile", then print the descriptor returned by
 * open() with printf and flush stdout before closing it.
 *
 * NOTE(review): close() is declared in <unistd.h>, which is not in the
 * include list above this snippet.
 */
int main() {
    // Presumably done so that the open() below is handed descriptor 1 — confirm.
    close(1);
    int fd = open("myfile", O_WRONLY | O_CREAT, 00644);
    if (fd < 0) {
        perror("open");
        return 1;
    }
    printf("fd: %d\n", fd);
    // Flush explicitly before the descriptor is closed on the next line.
    fflush(stdout);
    close(fd);
    exit(0);
}

#include <fcntl.h>
#include <unistd.h>
#include <stdio.h>

/*
 * Redirect standard output to "out.txt" with dup2() and print one line,
 * which therefore ends up in the file.
 *
 * Returns 0 on success, 1 if the file cannot be opened or the redirection
 * fails.
 */
int main() {
    int fd = open("out.txt", O_WRONLY | O_CREAT | O_TRUNC, 0644);
    if (fd < 0) {
        perror("open");
        return 1;
    }

    /* Make descriptor 1 (stdout) refer to out.txt. */
    if (dup2(fd, 1) < 0) {
        perror("dup2");
        close(fd);
        return 1;
    }
    close(fd); /* the original descriptor is no longer needed */

    printf("Hello, world!\n"); /* goes to out.txt */
    return 0;
}

#include <fcntl.h>
#include <unistd.h>
#include <stdio.h>

/*
 * Redirect standard input to "input.txt" with dup2(), read one line from
 * stdin and echo it.
 *
 * Returns 0 on success, 1 if the file cannot be opened, the redirection
 * fails, or no line can be read.
 */
int main() {
    int fd = open("input.txt", O_RDONLY);
    if (fd < 0) {
        perror("open");
        return 1;
    }

    /* Make descriptor 0 (stdin) refer to input.txt. */
    if (dup2(fd, 0) < 0) {
        perror("dup2");
        close(fd);
        return 1;
    }
    close(fd);

    char buf[128];
    /*
     * fgets returns NULL on EOF or error and leaves buf unset in that case,
     * so buf must only be printed after a successful read.
     */
    if (fgets(buf, sizeof(buf), stdin) == NULL) {
        if (ferror(stdin)) {
            perror("fgets");
        } else {
            fprintf(stderr, "fgets: no input available\n");
        }
        return 1;
    }
    printf("Read: %s", buf);
    return 0;
}

#include <fcntl.h>
#include <unistd.h>
#include <stdio.h>

/*
 * Redirect standard output to "log.txt" opened in append mode and print one
 * line, which is appended to the file instead of overwriting it.
 *
 * Returns 0 on success, 1 if the file cannot be opened or the redirection
 * fails.
 */
int main() {
    int fd = open("log.txt", O_WRONLY | O_CREAT | O_APPEND, 0644);
    if (fd < 0) {
        perror("open");
        return 1;
    }

    /*
     * Redirect stdout (descriptor 1). The original redirected descriptor 2
     * (stderr), so the printf below never reached log.txt.
     */
    if (dup2(fd, STDOUT_FILENO) < 0) {
        perror("dup2");
        close(fd);
        return 1;
    }
    close(fd);

    printf("Appended line\n"); /* appended, not overwritten */
    return 0;
}

#include <iostream>
#include <cstdio>

// Print two lines on standard output (C stdio, then C++ iostream) and two
// lines on standard error (C stdio, then C++ iostream).
int main() {
    // Standard output.
    std::fputs("hello printf\n", stdout);
    std::cout << "hello cout";
    std::cout << std::endl;

    // Standard error.
    std::fputs("hello perror\n", stderr);
    std::cerr << "hello cerr";
    std::cerr << std::endl;

    return 0;
}

// Selected fields of an open-file object (excerpt; the enclosing struct is not shown here).
atomic_long_t f_count; // Reference count of the open file; it grows when several file pointers refer to it.
unsigned int f_flags; // Described by the article as the permissions of the open file. NOTE(review): presumably these are the open flags (O_*) — confirm.
fmode_t f_mode; // Access mode of the file, e.g. read-only or write-only. The article says all flags are defined in <fcntl.h> — NOTE(review): that remark may belong to f_flags; confirm.
loff_t f_pos; // Current read/write position in the file.

// Table of function pointers through which operations on an open file are dispatched.
struct file_operations {
    struct module *owner; // Pointer to the module that owns this structure.
    loff_t (*llseek)(struct file *, loff_t, int); // Changes the current read/write position in the file; the new position is returned as a (positive) value.
    ssize_t (*read)(struct file *, char __user *, size_t, loff_t *); // Retrieves data from the device. A NULL pointer here makes the read system call fail with -EINVAL ("Invalid argument"). A non-negative return value is the number of bytes successfully read (the return type is a "signed size" type, usually the native integer type of the target platform).
    ssize_t (*write)(struct file *, const char __user *, size_t, loff_t *); // Sends data to the device. If NULL, -EINVAL is returned to the program calling the write system call. A non-negative return value is the number of bytes successfully written.
    ssize_t (*aio_read)(struct kiocb *, const struct iovec *, unsigned long, loff_t *); // Initiates an asynchronous read -- a read that may not have finished when the function returns.
    ssize_t (*aio_write)(struct kiocb *, const struct iovec *, unsigned long, loff_t *); // Initiates an asynchronous write on the device.
    int (*readdir)(struct file *, void *, filldir_t); // Should be NULL for device files; it reads directories and is only useful to file systems.
    unsigned int (*poll)(struct file *, struct poll_table_struct *);
    int (*ioctl)(struct inode *, struct file *, unsigned int, unsigned long);
    long (*unlocked_ioctl)(struct file *, unsigned int, unsigned long);
    long (*compat_ioctl)(struct file *, unsigned int, unsigned long);
    int (*mmap)(struct file *, struct vm_area_struct *); // Requests that device memory be mapped into the process address space. If this method is NULL, the mmap system call returns -ENODEV.
    int (*open)(struct inode *, struct file *); // Opens a file.
    int (*flush)(struct file *, fl_owner_t id); // Called when a process closes its copy of the device's file descriptor.
    int (*release)(struct inode *, struct file *); // Invoked when the file structure is being released. Like open, release may be NULL.
    int (*fsync)(struct file *, struct dentry *, int datasync); // Called on behalf of the user to flush any pending data.
    int (*aio_fsync)(struct kiocb *, int datasync);
    int (*fasync)(int, struct file *, int);
    int (*lock)(struct file *, int, struct file_lock *); // Implements file locking; locking is an essential feature for regular files, but device drivers almost never implement it.
    ssize_t (*sendpage)(struct file *, struct page *, int, size_t, loff_t *, int);
    unsigned long (*get_unmapped_area)(struct file *, unsigned long, unsigned long, unsigned long, unsigned long);
    int (*check_flags)(int);
    int (*flock)(struct file *, int, struct file_lock *);
    ssize_t (*splice_write)(struct pipe_inode_info *, struct file *, loff_t *, size_t, unsigned int);
    ssize_t (*splice_read)(struct file *, loff_t *, struct pipe_inode_info *, size_t, unsigned int);
    int (*setlease)(struct file *, long, struct file_lock **);
};

用户空间：open(), read(), write(), close()
↓ VFS 层：统一的文件操作接口
↓ 具体文件系统：ext4, proc, sysfs, devfs, tmpfs...
↓ 硬件层：磁盘、内存、设备等

// Without a buffer: every iteration is a system call.
for (int i = 0; i < 1000; i++) {
    write(fd, &i, sizeof(int)); // 1000 system calls!
}
// With a buffer: data is accumulated and written in batches,
// so only a few system calls may be needed.
for (int i = 0; i < 1000; i++) {
    fprintf(fp, "%d ", i); // the data is stored in the buffer first
}
// The real write happens only when the buffer is full or the program ends.

#include <stdio.h>
#include <string.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <unistd.h>

/*
 * Close descriptor 1, open "log.txt", print one line with printf and close
 * the descriptor without flushing stdout first.
 *
 * NOTE(review): presumably a deliberate demonstration of what happens when
 * buffered output is not flushed before close(fd); the next snippet in this
 * file is identical except for an added fflush(stdout). Confirm before
 * "fixing" it.
 */
int main() {
    // Presumably done so that the open() below is handed descriptor 1 — confirm.
    close(1);
    int fd = open("log.txt", O_WRONLY | O_CREAT | O_TRUNC, 0666);
    if (fd < 0) {
        perror("open");
        return 0;
    }
    printf("hello world: %d\n", fd);
    // No fflush(stdout) here before the descriptor is closed.
    close(fd);
    return 0;
}

#include <stdio.h>
#include <string.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <unistd.h>

/*
 * Close descriptor 1, open "log.txt", print one line with printf and flush
 * stdout explicitly before closing the descriptor.
 *
 * Returns 0 on success, 1 if the file cannot be opened.
 */
int main() {
    /* Presumably done so that the open() below is handed descriptor 1 — confirm. */
    close(1);
    int fd = open("log.txt", O_WRONLY | O_CREAT | O_TRUNC, 0666);
    if (fd < 0) {
        perror("open");
        return 1; /* report the failure through the exit status */
    }

    printf("hello world: %d\n", fd);
    /* Push the buffered text out while the descriptor is still open. */
    fflush(stdout);

    close(fd);
    return 0;
}

#include <stdio.h>
#include <string.h>
#include <unistd.h>

/*
 * Emit one line through each of printf, fwrite and write(), then call
 * fork() just before returning.
 *
 * Returns 0 on success, 1 if fork() fails.
 */
int main() {
    const char *msg0 = "hello printf\n";
    const char *msg1 = "hello fwrite\n";
    const char *msg2 = "hello write\n";

    printf("%s", msg0);
    /* Use msg1's own length; the original passed strlen(msg0). */
    fwrite(msg1, strlen(msg1), 1, stdout);
    /* write() goes straight to descriptor 1, bypassing the stdio buffer. */
    write(1, msg2, strlen(msg2));

    /* Both parent and child continue to the return below. */
    if (fork() < 0) {
        perror("fork");
        return 1;
    }
    return 0;
}

// From /usr/include/libio.h (excerpt).
// NOTE(review): the excerpt ends inside an unterminated `#ifdef _IO_USE_OLD_IO_FILE`,
// and `_IO_file_flags` expands to `flags` while the member is named `_flags` — check against the real header.
struct _IO_FILE {
    int _flags; /* High-order word is _IO_MAGIC; rest is flags. */
#define _IO_file_flags flags
    /* Buffer-related fields */
    /* The following pointers correspond to the C++ streambuf protocol. */
    /* Note: Tk uses the _IO_read_ptr and _IO_read_end fields directly. */
    char *_IO_read_ptr; /* Current read pointer */
    char *_IO_read_end; /* End of get area. */
    char *_IO_read_base; /* Start of putback+get area. */
    char *_IO_write_base; /* Start of put area. */
    char *_IO_write_ptr; /* Current put pointer. */
    char *_IO_write_end; /* End of put area. */
    char *_IO_buf_base; /* Start of reserve area. */
    char *_IO_buf_end; /* End of reserve area. */
    /* The following fields are used to support backing up and undo. */
    char *_IO_save_base; /* Pointer to start of non-current get area. */
    char *_IO_backup_base; /* Pointer to first valid character of backup area */
    char *_IO_save_end; /* Pointer to end of non-current get area. */
    struct _IO_marker *_markers;
    struct _IO_FILE *_chain; // Links the files opened by the process
    int _fileno; // The wrapped file descriptor
#if 0
    int _blksize;
#else
    int _flags2;
#endif
    _IO_off_t _old_offset; /* This used to be _offset but it's too small. */
#define __HAVE_COLUMN
    /* temporary */
    /* 1+column number of pbase(); 0 is unknown. */
    unsigned short _cur_column;
    signed char _vtable_offset;
    char _shortbuf[1];
    /* char* _save_gptr; char* _save_egptr; */
    _IO_lock_t *_lock;
#ifdef _IO_USE_OLD_IO_FILE
};

// From /usr/include/stdio.h: FILE is an alias for struct _IO_FILE.
typedef struct _IO_FILE FILE;

#pragma once
// Size in bytes of the outbuffer array inside struct IO_FILE.
#define SIZE 1024
// Values for the `flag` member of struct IO_FILE (the flush mode).
#define FLUSH_NONE 0
#define FLUSH_LINE 1
#define FLUSH_FULL 2

// Minimal user-space stream: a file descriptor plus an output buffer.
struct IO_FILE {
    int flag; // flush mode (one of the FLUSH_* values)
    int fileno; // file descriptor
    char outbuffer[SIZE]; // output buffer
    int cap; // capacity of outbuffer; mfopen sets it to SIZE
    int size; // number of bytes currently held in outbuffer
};
typedef struct IO_FILE mFILE;

// Open `filename` with mode "r", "w" or "a"; returns a new stream, or NULL on failure.
mFILE *mfopen(const char *filename, const char *mode);
// Append `num` bytes starting at `ptr` to the stream's buffer; returns `num`.
int mfwrite(const void *ptr, int num, mFILE *stream);
// Write any buffered bytes to the stream's file descriptor and fsync it.
void mfflush(mFILE *stream);
// Flush pending data and close the stream's file descriptor.
void mfclose(mFILE *stream);

#include "my_stdio.h"
#include <string.h>
#include <stdlib.h>
#include <sys/stat.h>
#include <sys/types.h>
#include <fcntl.h>
#include <unistd.h>

/*
 * Open `filename` and wrap the descriptor in a newly allocated mFILE.
 *
 * mode: "r" (read-only), "w" (create/truncate, write-only) or
 *       "a" (create/append, write-only); any other string fails.
 *
 * Returns the new stream, line-flushed with an empty buffer of capacity
 * SIZE, or NULL if the mode is unknown, open() fails or allocation fails.
 */
mFILE *mfopen(const char *filename, const char *mode) {
    static const struct {
        const char *name;
        int oflags;
    } known_modes[] = {
        {"r", O_RDONLY},
        {"w", O_CREAT | O_WRONLY | O_TRUNC},
        {"a", O_CREAT | O_WRONLY | O_APPEND},
    };

    int fd = -1;
    for (size_t i = 0; i < sizeof known_modes / sizeof known_modes[0]; i++) {
        if (strcmp(mode, known_modes[i].name) != 0) {
            continue;
        }
        int oflags = known_modes[i].oflags;
        /* Only the creating modes pass permission bits to open(). */
        fd = (oflags & O_CREAT) ? open(filename, oflags, 0666)
                                : open(filename, oflags);
        break;
    }
    if (fd < 0) {
        return NULL;
    }

    mFILE *stream = malloc(sizeof *stream);
    if (stream == NULL) {
        close(fd); /* do not leak the descriptor */
        return NULL;
    }

    stream->flag = FLUSH_LINE;
    stream->fileno = fd;
    stream->cap = SIZE;
    stream->size = 0;
    return stream;
}

/*
 * Write every byte currently held in the stream's buffer to its file
 * descriptor, then fsync the descriptor and mark the buffer empty.
 *
 * write() may accept fewer bytes than requested, so the call is repeated
 * until the whole buffer has been handed over or write() stops making
 * progress. The function returns void, so a write error cannot be reported;
 * as before, the buffer is emptied in that case too.
 *
 * A NULL stream or an empty buffer is a no-op.
 */
void mfflush(mFILE *stream) {
    if (stream == NULL || stream->size <= 0) {
        return;
    }

    const char *cursor = stream->outbuffer;
    int pending = stream->size;
    while (pending > 0) {
        /* Hands the data to the kernel's file buffer. */
        ssize_t n = write(stream->fileno, cursor, (size_t)pending);
        if (n <= 0) {
            break; /* error or no progress: give up on the remainder */
        }
        cursor += n;
        pending -= (int)n;
    }

    /* Ask the kernel to push the data out to the device. */
    fsync(stream->fileno);
    stream->size = 0;
}

/*
 * Append `num` bytes starting at `ptr` to the stream's buffer.
 *
 * The data is copied in chunks that fit the free space of the buffer
 * (cap - size); whenever the buffer is full it is flushed first, so the
 * copy never runs past the end of outbuffer. After copying, a line-flushed
 * stream (FLUSH_LINE) is flushed if the last buffered byte is '\n'.
 *
 * Returns the number of bytes accepted: `num` in the normal case, 0 for a
 * NULL argument or non-positive `num`, and less than `num` only if the
 * buffer cannot be drained.
 */
int mfwrite(const void *ptr, int num, mFILE *stream) {
    if (ptr == NULL || stream == NULL || num <= 0) {
        return 0;
    }

    const char *src = ptr;
    int remaining = num;

    /* 1. Copy, never exceeding the buffer capacity. */
    while (remaining > 0) {
        int room = stream->cap - stream->size;
        if (room <= 0) {
            mfflush(stream);
            room = stream->cap - stream->size;
            if (room <= 0) {
                break; /* flushing freed nothing; avoid spinning forever */
            }
        }
        int chunk = remaining < room ? remaining : room;
        memcpy(stream->outbuffer + stream->size, src, (size_t)chunk);
        stream->size += chunk;
        src += chunk;
        remaining -= chunk;
    }

    /* 2. Decide whether a line flush is due. */
    if (stream->flag == FLUSH_LINE && stream->size > 0 &&
        stream->outbuffer[stream->size - 1] == '\n') {
        mfflush(stream);
    }
    return num - remaining;
}

/*
 * Flush any buffered data, close the stream's file descriptor and release
 * the mFILE itself (it was obtained with malloc in mfopen).
 *
 * The stream must not be used after this call. A NULL stream is a no-op.
 */
void mfclose(mFILE *stream) {
    if (stream == NULL) {
        return;
    }
    if (stream->size > 0) {
        mfflush(stream);
    }
    close(stream->fileno);
    free(stream); /* the original leaked this allocation */
}

#include "my_stdio.h"
#include <stdio.h>
#include <string.h>
#include <unistd.h>

/*
 * Driver for the mFILE API: opens "./log.txt" in append mode and, once per
 * second, writes a numbered message (counting down from 10 to 1), flushing
 * after each one.
 *
 * Returns 1 if the stream cannot be opened.
 */
int main() {
    mFILE *log = mfopen("./log.txt", "a");
    if (!log) {
        return 1;
    }

    for (int remaining = 10; remaining != 0; remaining--) {
        char line[64];

        printf("write %d\n", remaining);
        snprintf(line, sizeof(line), "hello message, number is : %d", remaining);

        mfwrite(line, strlen(line), log);
        /* The message has no trailing newline, so flush explicitly. */
        mfflush(log);
        sleep(1);
    }

    mfclose(log);
}

Linux 基础 IO 详解：从 C 标准库到系统调用的底层逻辑

前言

一. 理解'文件'

1.1 一般角度

1.2 系统角度

二. 回顾 C 语言文件接口

2.1 C 中的读写操作

更多推荐文章

相关免费在线工具

2.2 标准输入输出流

三. 系统文件 IO

3.1 标志位

3.2 文件系统调用

3.2.1 open

3.2.2 close

3.2.3 read

3.2.4 write

3.3 文件描述符

四. 重定向

五. 理解标准错误

六. 理解'一切皆文件'

七. 缓冲区

7.1 什么是缓冲区

7.2 缓冲区的作用

7.3 简单设计一下 libc 库

八. 总结：基础 IO 的核心脉络

更多推荐文章

相关免费在线工具

Linux 基础 IO 详解：从 C 标准库到系统调用的底层逻辑

前言

一. 理解'文件'

1.1 一般角度

1.2 系统角度

二. 回顾 C 语言文件接口

2.1 C 中的读写操作

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

2.2 标准输入输出流

三. 系统文件 IO

3.1 标志位

3.2 文件系统调用

3.2.1 open

3.2.2 close

3.2.3 read

3.2.4 write

3.3 文件描述符

四. 重定向

五. 理解标准错误

六. 理解'一切皆文件'

七. 缓冲区

7.1 什么是缓冲区

7.2 缓冲区的作用

7.3 简单设计一下 libc 库

八. 总结：基础 IO 的核心脉络

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具