共识原理

文件 = 内容 + 属性
被打开的文件需要加载到内存中
内存中的文件需要被操作系统管理

用户级文件接口

详见C++文件操作

详见C语言文件操作

Linux系统调用接口

fd 文件描述符与访问文件的本质

fd(file descriptor),即文件描述符,下文的系统调用接口经常以fd命名变量。fd是整型变量，作为数组下标，用于管理打开的文件

可以看到,一个进程通过struct files_struct里的指针数组，管理多个同时打开的文件

且每个进程启动时，会默认打开三个文件,且默认fd固定

stdin(标准输入,fd为0)、stdout(标准输出,fd为1)、stderr(标准错误,fd为2)

read

所需头文件
#include <unistd.h>
声明
ssize_t read(int fd, void *buf, size_t count);

参数

fd即为目标文件的文件描述符
buf为要从文件读取字节到的内存地址
count为最大读取字节数

返回值

若成功，返回实际读取到的字节数(可能小于count;读到文件末尾时返回0),类型为ssize_t,是层层封装的long int
若失败，返回-1,并设置errno的值

write

所需头文件
#include <unistd.h>
声明
ssize_t write(int fd, const void *buf, size_t count);

参数

fd 为目标文件的文件描述符
buf为要写入文件的源内存地址,输入字节数量取决于count形参
count为要写入的字节数量,若要写入的是字符串，且要写入字符串的全部内容，建议使用strlen(buf)，避免把结尾的\0也写入文件:\0只是C语言字符串的结束标志,并不属于文本内容,写入文本文件后会成为多余的不可见字节

返回值

若成功，返回写入文件的字节数,类型为ssize_t,是层层封装的long int
若失败，返回-1,并设置errno的值

特别的
read函数从文件中读取的是字节内容，不把读取的内容看作字符串，因此，不会自动添加\0在写入buf内容的结尾

用法见后文对open的介绍

open

所需头文件

1
2
3

#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>

声明
int open(const char *pathname, int flags);
int open(const char *pathname, int flags, mode_t mode);

参数:

pathname为文件路径，若只有文件名，则默认在当前工作路径搜索
flags则是一个位图,而不应看作整型参数，传参时可用|位运算传递多个参数到位图中,例如O_CREAT | O_WRONLY
mode则是在创建文件时(即flags中带有O_CREAT时)传入的权限信息,这里使用八进制表示法，例如传入0666;文件最终的权限还会受到进程umask的影响
返回值:
若成功，返回打开文件的fd值
若失败，则返回-1

写入操作

打开已有文件并写入

#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>

/*
 * Overwrite the beginning of an existing log.txt with a short message.
 *
 * The file is opened write-only without O_CREAT or O_TRUNC, so it must
 * already exist, and any old bytes beyond the message length are kept.
 *
 * Returns 0 on success, 1 if the file cannot be opened or written.
 */
int main(void)
{
    // Without O_CREAT the mode argument is ignored, so it is not passed.
    int fd = open("log.txt", O_WRONLY);
    if (fd < 0)
    {
        perror("open"); // e.g. log.txt does not exist
        return 1;
    }

    char msg[] = "this is a msg";
    int status = 0;
    // strlen() excludes the terminating '\0', so only the text is written.
    if (write(fd, msg, strlen(msg)) < 0)
    {
        perror("write");
        status = 1;
    }

    close(fd);
    return status;
}

当原本log.txt为空文件时

1	this is a msg

当原log.txt不为空且内容长度大于程序输入的msg时，发生部分覆写

例如原内容为0000111100001111时，执行后为

1	this is a msg111

可以看到有一部分没有被覆盖

打开空文件或创建空文件

#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>

/*
 * Create log.txt (or empty it if it already exists) and write a message.
 *
 * Returns 0 on success, 1 if the file cannot be opened or written.
 */
int main(void)
{
    // O_CREAT creates the file when it is missing (permissions from 0666).
    // O_TRUNC discards the previous content when the file already exists.
    int fd = open("log.txt", O_CREAT | O_WRONLY | O_TRUNC, 0666);
    if (fd < 0)
    {
        perror("open");
        return 1;
    }

    char msg[] = "this is a msg";
    int status = 0;
    // strlen() excludes the terminating '\0', so only the text is written.
    if (write(fd, msg, strlen(msg)) < 0)
    {
        perror("write");
        status = 1;
    }

    close(fd);
    return status;
}

追加写入

追加写入只需把O_TRUNC改成O_APPEND即可

#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>

/*
 * Append a message to log.txt, creating the file if it does not exist.
 *
 * Returns 0 on success, 1 if the file cannot be opened or written.
 */
int main(void)
{
    // O_APPEND makes every write land at the current end of the file.
    int fd = open("log.txt", O_CREAT | O_WRONLY | O_APPEND, 0666);
    if (fd < 0)
    {
        perror("open");
        return 1;
    }

    char msg[] = "this is a msg";
    int status = 0;
    // strlen() excludes the terminating '\0', so only the text is written.
    if (write(fd, msg, strlen(msg)) < 0)
    {
        perror("write");
        status = 1;
    }

    close(fd);
    return status;
}

这里我们事先删除log.txt文件，然后运行两次编译出的程序,可以获得如下内容

1	this is a msgthis is a msg

可以看到内容追加了两次

读取操作

只读模式读取内容

#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>

/*
 * Read up to 1023 bytes from log.txt and print them as a string.
 *
 * Returns 0 on success, 1 if the file cannot be opened or read.
 */
int main(void)
{
    int fd = open("log.txt", O_RDONLY);
    if (fd < 0)
    {
        perror("open");
        return 1;
    }

    // A byte buffer (char, not char *): read() fills it with raw bytes.
    char buf[1024];
    // read() never appends '\0', so one byte is reserved for the terminator.
    ssize_t n = read(fd, buf, sizeof(buf) - 1);
    if (n < 0)
    {
        perror("read"); // the read failed; buf holds nothing printable
        close(fd);
        return 1;
    }

    buf[n] = '\0';       // terminate exactly after the bytes that were read
    printf("%s\n", buf); // print what was read
    close(fd);
    return 0;
}

事先准备内容为123456的log.txt文件

然后运行./mycmd

得到输出和文件内容

zzz456

关于read没读取到前面新写入的zzz(该现象出现在以O_RDWR打开文件、先write写入zzz再read的场景),是因为write和read共用同一个文件偏移量:write写完zzz后偏移量已经前进到3,随后的read从该位置继续读取,并不会回退到文件开头

close

int close(int fd);

用于关闭一个文件描述符,使该fd可以被重新分配;注意close不会冲刷C标准库(stdio)的用户级缓冲区,也不保证数据已经写入磁盘(需要落盘时应使用fsync)

dup2 文件重定向

int dup2(int oldfd, int newfd);

如图所示，dup2能将oldfd对应的数组元素覆盖到newfd对应的数组元素处，完成对newfd对应文件的重定向

图中就是完成了对标准输出的重定向,像printf之类的函数会直接输出内容到文件中,而不是显示器

#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>

/*
 * Redirect standard output to log.txt with dup2, then print two lines.
 *
 * After dup2(fd, 1) succeeds, descriptor 1 refers to log.txt, so printf
 * output ends up in the file instead of the terminal.
 *
 * Returns 0 on success, 1 if the file cannot be opened or redirected.
 */
int main(void)
{
    // Open a fresh, empty log.txt.
    int fd = open("log.txt", O_RDWR | O_CREAT | O_TRUNC, 0666);
    if (fd < 0)
    {
        perror("open");
        return 1;
    }

    // Make descriptor 1 (standard output) refer to the same open file as fd.
    if (dup2(fd, 1) < 0)
    {
        perror("dup2");
        close(fd);
        return 1;
    }

    printf("output1\n");
    printf("output2\n");

    return 0;
}

运行代码后，可以看到终端没有输出

而打开log.txt

1	output1
2	output2

子进程与父进程的文件关系

子进程对父进程的拷贝

先运行一段代码测试子进程是否继承父进程的打开文件

#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <sys/wait.h>

/*
 * Show that a child created by fork inherits the parent's redirection.
 *
 * Standard output is redirected to log.txt before fork, so the output of
 * both the child and the parent is written to the file.
 *
 * Returns 0 on success, 1 if open, dup2 or fork fails.
 */
int main(void)
{
    // O_CREAT requires the third (mode) argument; without it the new file's
    // permission bits are indeterminate.
    int fd = open("log.txt", O_RDWR | O_CREAT | O_TRUNC | O_APPEND, 0666);
    if (fd < 0)
    {
        perror("open");
        return 1;
    }

    // Redirect standard output before fork.
    if (dup2(fd, 1) < 0)
    {
        perror("dup2");
        return 1;
    }

    pid_t id = fork();
    if (id < 0)
    {
        perror("fork");
        return 1;
    }

    if (id == 0)
    {
        printf("child output\n");
        // Returning from main is equivalent to exit(0): stdio buffers are
        // flushed before the child terminates.
        return 0;
    }

    waitpid(id, NULL, 0); // block until the child has finished
    printf("parent output\n");

    return 0;
}

这段代码中，我们在fork之前完成了对标准输出的重定向,然后fork之后令父进程和子进程进行不同的标准输出

运行结果为父进程和子进程的标准输出都重定向到了文件

1	child output
2	parent output

子进程和父进程的独立性

接下来一段代码测试父进程和子进程的打开文件是否独立

#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <sys/wait.h>

/*
 * Show that a redirection done in the child does not affect the parent.
 *
 * log.txt is opened before fork, but only the child redirects its standard
 * output to it; the parent keeps writing to its original standard output.
 *
 * Returns 0 on success, 1 if open, dup2 or fork fails.
 */
int main(void)
{
    // O_CREAT requires the third (mode) argument; without it the new file's
    // permission bits are indeterminate.
    int fd = open("log.txt", O_RDWR | O_CREAT | O_TRUNC | O_APPEND, 0666);
    if (fd < 0)
    {
        perror("open");
        return 1;
    }

    pid_t id = fork();
    if (id < 0)
    {
        perror("fork");
        return 1;
    }

    if (id == 0)
    {
        // Only the child redirects its standard output.
        if (dup2(fd, 1) < 0)
        {
            perror("dup2");
            return 1;
        }
        printf("child output\n");
        // Returning from main is equivalent to exit(0): stdio buffers are
        // flushed before the child terminates.
        return 0;
    }

    waitpid(id, NULL, 0); // block until the child has finished
    printf("parent output\n");

    return 0;
}

这里我们在fork之前都不进行重定向，fork后仅对子进程进行了标准输出重定向，而父进程不作任何重定向

在运行后发现子进程的输出重定向不会影响父进程,二者有独立性

1	parent output

1	child output

进程替换

先在同级文件夹准备一个待替换的程序

execute.c

#include <stdio.h>

/* Target program for the exec demo: writes one line to standard output. */
int main(void)
{
    fputs("exe output\n", stdout);
    return 0;
}

然后运行gcc -o execute execute.c编译获得一个程序

然后准备主程序

mycmd.c

#include <stdio.h>
#include <string.h>
#include <unistd.h>
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <sys/wait.h>

/*
 * Show that a redirection survives process replacement (exec).
 *
 * The child redirects its standard output to log.txt and then replaces
 * itself with ./execute; the parent waits and reports on its own stdout.
 *
 * Returns 0 on success, 1 if open, fork, dup2 or execvp fails.
 */
int main(void)
{
    // O_CREAT requires the third (mode) argument; without it the new file's
    // permission bits are indeterminate.
    int fd = open("log.txt", O_RDWR | O_CREAT | O_TRUNC | O_APPEND, 0666);
    if (fd < 0)
    {
        perror("open");
        return 1;
    }

    pid_t id = fork();
    if (id < 0)
    {
        perror("fork");
        return 1;
    }

    if (id == 0)
    {
        // Only the child redirects its standard output.
        if (dup2(fd, 1) < 0)
        {
            perror("dup2");
            return 1;
        }

        // The argument vector must be a NULL-terminated array whose first
        // element is the program name; passing NULL itself is not portable.
        char *const child_argv[] = { "./execute", NULL };
        execvp(child_argv[0], child_argv);

        // execvp only returns when the replacement failed.
        perror("execvp");
        return 1;
    }

    waitpid(id, NULL, 0); // block until the child has finished
    printf("parent wait success\n");

    return 0;
}

这里我们使子进程先标准输出重定向，再进行进程替换，发现替换后的进程，也是标准输出重定向的状态

1	exe output

结论

进程替换不会改变原进程的文件打开状态和重定向关系