UNIX 环境高级编程 实验二 目录树的遍历

it2024-11-01  17

实验二 目录树的遍历

1. 实验内容




myfind <pathname> [-comp <filename> | -name <str>…]


myfind <pathname> 的功能:除了具有与程序4-7相同的功能外,还要输出在 <pathname> 目录子树之下,文件长度不大于4096字节的常规文件,在所有允许访问的普通文件中所占的百分比。程序不允许打印出任何路径名。myfind <pathname> -comp <filename> 的功能:<filename> 是常规文件的路径名(非目录名,但是其路径可以包含目录)。命令仅仅输出在 <pathname> 目录子树之下,所有与 <filename> 文件内容一致的文件的绝对路径名。不允许输出任何其它的路径名,包括不可访问的路径名。myfind <pathname> -name <str>… 的功能:<str>… 是一个以空格分隔的文件名序列(不带路径)。命令输出在 <pathname> 目录子树之下,所有与 <str>… 序列中文件名相同的文件的绝对路径名。不允许输出不可访问的或无关的路径名。

<pathname> 和 <filename> 均既可以是绝对路径名,也可以是相对路径名。<pathname> 既可以是目录,也可以是文件;当它是文件时,以当前工作目录作为要遍历的目录。

2. 实验设计与实现

2.1 前置知识掌握,课本程序理解

/* Forward declarations for the traversal routines shown below. */
static Myfunc myfunc;                           /* callback invoked for each file */
static int myftw(char *pathname, Myfunc *func);
static int dopath(Myfunc *func);


myftw:程序的主要功能封装,包括目录名的预处理,目录名存储空间的分配,以及调用dopath函数。dopath:深度优先遍历目录,并对每个文件调用myfunc函数进行计数。myfunc:使用lstat统计各类文件信息,以及相应打不开文件或未知文件类型出错处理。 int ret; if (argc != 2) err_quit("usage: ftw <starting-pathname>"); ret = myftw(argv[1], myfunc); /* does it all */ ntot = nreg + ndir + nblk + nchr + nfifo + nslink + nsock; if (ntot == 0) ntot = 1; /* avoid divide by 0; print 0 for all counts */ printf("regular files = %7ld, %5.2f %%\n", nreg, nreg*100.0/ntot); printf("directories = %7ld, %5.2f %%\n", ndir, ndir*100.0/ntot); printf("block special = %7ld, %5.2f %%\n", nblk, nblk*100.0/ntot); printf("char special = %7ld, %5.2f %%\n", nchr, nchr*100.0/ntot); printf("FIFOs = %7ld, %5.2f %%\n", nfifo, nfifo*100.0/ntot); printf("symbolic links = %7ld, %5.2f %%\n", nslink, nslink*100.0/ntot); printf("sockets = %7ld, %5.2f %%\n", nsock, nsock*100.0/ntot); exit(ret);


/*
 * Set up the global path buffer with the starting pathname and start the
 * traversal.  We return whatever dopath() (and therefore func()) returns.
 */
static int
myftw(char *pathname, Myfunc *func)
{
    int capacity;

    /* path_alloc() reports the size of the buffer it hands back */
    fullpath = path_alloc(&capacity);

    /* bounded copy, then force termination in case pathname was too long */
    strncpy(fullpath, pathname, capacity);
    fullpath[capacity - 1] = 0;

    return dopath(func);
}


/*
 * Walk the hierarchy rooted at the global "fullpath".
 *
 * Non-directories (and paths that cannot be lstat'ed) are reported to
 * func() once and we return its result.  A directory is reported first,
 * then every entry except "." and ".." is appended to fullpath and
 * visited recursively.  A non-zero result from func() stops the walk and
 * is passed back to the caller.
 */
static int
dopath(Myfunc *func)
{
    struct stat    info;
    struct dirent *entry;
    DIR           *dir;
    int            status;
    char          *tail;

    if (lstat(fullpath, &info) < 0)             /* stat error */
        return func(fullpath, &info, FTW_NS);
    if (!S_ISDIR(info.st_mode))                 /* not a directory */
        return func(fullpath, &info, FTW_F);

    /* It's a directory: report it before descending into it. */
    status = func(fullpath, &info, FTW_D);
    if (status != 0)
        return status;

    /* Append "/" and remember where the entry names will be written. */
    tail = fullpath + strlen(fullpath);
    tail[0] = '/';
    tail[1] = 0;
    tail++;

    dir = opendir(fullpath);
    if (dir == NULL)                            /* can't read directory */
        return func(fullpath, &info, FTW_DNR);

    for (;;) {
        entry = readdir(dir);
        if (entry == NULL)
            break;
        if (!strcmp(entry->d_name, ".") || !strcmp(entry->d_name, ".."))
            continue;                           /* ignore dot and dot-dot */

        strcpy(tail, entry->d_name);            /* append name after slash */
        status = dopath(func);                  /* recursive */
        if (status != 0)
            break;                              /* time to leave */
    }
    tail[-1] = 0;                               /* erase everything from slash onwards */

    if (closedir(dir) < 0)
        err_ret("can't close directory %s", fullpath);
    return status;
}


2.2 自写程序功能解析


#include <dirent.h> #include <fcntl.h> #include "apue.h" dirent.h:用到 opendir、closedir;apue.h:用到 malloc、stdio.h、printf、string.h、strcat、memcpy、strlen、sys/stat.h:lstat、unistd.h、lseek、getcwd、chdir、宏定义常量;fcntl.h:用到 open。 //Parameter: //Regular file //Directory file //Character file //Block file //FIFO file //Socket file //Symbol link file enum descrip{ S_REGULAR,S_DIR,S_CHAR,S_BLOCK,S_FIFO,S_LINK,S_SOCKET,S_SPE,S_TOT,S_LENGTH };


// find function void find(char *basename, void (*visit)(char *, struct stat *)) { if (chdir(basename) == -1) // use chdir and getcwd to obtain fullpath of argv[1] return; long int len_pathname_max = pathconf("/", _PC_PATH_MAX); //printf("%ld\n",len_pathname_max); if ((pathname = (char *) malloc(len_pathname_max)) == NULL) return; if (getcwd(pathname, len_pathname_max) == NULL)return; len_pathname = strlen(pathname); //printf("%ld\n",len_pathname); deep_first_search(visit); }


// myfunc for `-name` option void work_name(char *path_name, struct stat *st) { int i; for (i=0;i<len_filenames;i++) { //printf("%s %s\n",pathname,filenames[i]); if (strcmp(path_name, filenames[i]) == 0)printf("%s\n", pathname); } }


// myfunc for `-comp` option void work_comp(char *path_name, struct stat *st) { //printf("%s %d st->st_size:%d\n", pathname,filesize,st->st_size); if (st->st_size!=filesize)return; int fd2; if ((fd2=open(pathname,O_RDONLY)) == -1) return; if (~lseek(fd,0,SEEK_SET)) { //printf("%s ac\n", pathname); char buf1[buffer]="",buf2[buffer]=""; while (read(fd,buf1,buffer) > 0 && read(fd2,buf2,buffer)>0) if (memcmp(buf1, buf2, buffer) != 0) { close(fd2); return; } close(fd2); printf("%s\n", pathname); } }


// dopath function void deep_first_search(void (*visit)(char *, struct stat *)) { int len_filename; DIR *dp; struct dirent *dirp; struct stat st; //printf("%s\n",pathname); if ((dp = opendir(pathname)) == NULL) return; if (pathname[len_pathname - 1] == '/') // truncate redundant '/' { len_pathname -= 1; pathname[len_pathname] = '\0'; } //printf("%s\n",pathname); while ((dirp = readdir(dp)) != NULL) { if (strcmp(dirp->d_name, ".") == 0 || strcmp(dirp->d_name, "..") == 0) continue; // filter two special dirs len_filename = strlen(dirp->d_name); len_pathname += len_filename + 1; strcat(pathname, "/"); strcat(pathname, dirp->d_name); //printf("%s\n",pathname); if(~(lstat(pathname,&st))) { //printf("%s\n",pathname); visit(dirp->d_name, &st); if (S_ISDIR(st.st_mode)) deep_first_search(visit); // recursive if it's a dir } len_pathname -= len_filename + 1; pathname[len_pathname] = '\0'; } closedir(dp); }



gcc -o myfind myfind.c libapue.a

调用二参数模式 ./myfind /


调用四参数模式 ./myfind / -comp apue.h



调用多(>=4)参数模式 ./myfind / -name apue.h apue.2e string.h

从二参数模式的统计信息可以看出,这台服务器上的文件分布与课本上给出的文件分布示例大致相符,绝大部分还是常规文件,其次是目录,再其次是符号链接。而其他的字符文件、套接字等也都存在,但有个不完美的地方就是其实很多其他用户的目录文件都没有打开。从四参数模式 ./myfind / -comp apue.h 输出来看,程序成功比较了根目录下能成功打开的文件内容,输出了与用户提供的文件内容一致的文件绝对路径。从调用多(>=4)参数模式 ./myfind / -name apue.h apue.2e string.h 输出来看,程序可以找出同一目录树下多个文件名相同的文件,对输入多文件名也支持。




#include "apue.h"
#include <dirent.h>
#include <limits.h>

/* function type that is called for each filename */
typedef int Myfunc(const char *, const struct stat *, int);

static Myfunc myfunc;
static int myftw(char *, Myfunc *);
static int dopath(Myfunc *);

/* per-type file counters, filled in by myfunc(); ntot is their sum */
static long nreg, ndir, nblk, nchr, nfifo, nslink, nsock, ntot;

/*
 * Count the files of each type below the starting pathname given as the
 * only argument and print each count with its share of the total.
 */
int
main(int argc, char *argv[])
{
    int ret;

    if (argc != 2)
        err_quit("usage:  ftw  <starting-pathname>");

    ret = myftw(argv[1], myfunc);       /* does it all */

    ntot = nreg + ndir + nblk + nchr + nfifo + nslink + nsock;
    if (ntot == 0)
        ntot = 1;       /* avoid divide by 0; print 0 for all counts */
    printf("regular files  = %7ld, %5.2f %%\n", nreg, nreg*100.0/ntot);
    printf("directories    = %7ld, %5.2f %%\n", ndir, ndir*100.0/ntot);
    printf("block special  = %7ld, %5.2f %%\n", nblk, nblk*100.0/ntot);
    printf("char special   = %7ld, %5.2f %%\n", nchr, nchr*100.0/ntot);
    printf("FIFOs          = %7ld, %5.2f %%\n", nfifo, nfifo*100.0/ntot);
    printf("symbolic links = %7ld, %5.2f %%\n", nslink, nslink*100.0/ntot);
    printf("sockets        = %7ld, %5.2f %%\n", nsock, nsock*100.0/ntot);

    exit(ret);
}

/*
 * Descend through the hierarchy, starting at "pathname".
 * The caller's func() is called for every file.
 */
#define FTW_F   1       /* file other than directory */
#define FTW_D   2       /* directory */
#define FTW_DNR 3       /* directory that can't be read */
#define FTW_NS  4       /* file that we can't stat */

static char   *fullpath;    /* contains full pathname for every file */
static size_t  pathlen;     /* number of bytes currently allocated for fullpath */

/*
 * Make sure fullpath can hold at least "needed" bytes (terminator
 * included), at least doubling the buffer when it has to grow.
 * The address of fullpath may change, so callers must not keep
 * pointers into it across this call.  Terminates the program if
 * memory cannot be obtained.
 */
static void
grow_fullpath(size_t needed)
{
    size_t  newlen;
    char   *bigger;

    if (needed <= pathlen)
        return;

    newlen = pathlen * 2;
    if (newlen < needed)
        newlen = needed;

    if ((bigger = realloc(fullpath, newlen)) == NULL)
        err_quit("out of memory growing pathname buffer");
    fullpath = bigger;
    pathlen = newlen;
}

/*
 * Allocate the path buffer, copy the starting pathname into it and
 * start the traversal.  A starting pathname longer than the initial
 * buffer enlarges the buffer instead of being silently truncated.
 */
static int                  /* we return whatever func() returns */
myftw(char *pathname, Myfunc *func)
{
    int len = 0;

    fullpath = path_alloc(&len);        /* malloc's for PATH_MAX+1 bytes */
                                        /* ({Prog pathalloc}) */
    pathlen = (fullpath != NULL && len > 0) ? (size_t)len : 0;

    grow_fullpath(strlen(pathname) + 1);
    strcpy(fullpath, pathname);         /* fits: buffer was sized above */

    return(dopath(func));
}

/*
 * Descend through the hierarchy, starting at "fullpath".
 * If "fullpath" is anything other than a directory, we lstat() it,
 * call func(), and return.  For a directory, we call ourself
 * recursively for each name in the directory.
 */
static int                  /* we return whatever func() returns */
dopath(Myfunc *func)
{
    struct stat     statbuf;
    struct dirent  *dirp;
    DIR            *dp;
    int             ret;
    size_t          n;      /* index just past the '/', not a pointer: */
                            /* fullpath may be moved by realloc() */

    if (lstat(fullpath, &statbuf) < 0)  /* stat error */
        return(func(fullpath, &statbuf, FTW_NS));
    if (S_ISDIR(statbuf.st_mode) == 0)  /* not a directory */
        return(func(fullpath, &statbuf, FTW_F));

    /*
     * It's a directory.  First call func() for the directory,
     * then process each filename in the directory.
     */
    if ((ret = func(fullpath, &statbuf, FTW_D)) != 0)
        return(ret);

    n = strlen(fullpath);
    grow_fullpath(n + 2);               /* room for '/' and the terminator */
    fullpath[n++] = '/';
    fullpath[n] = 0;

    if ((dp = opendir(fullpath)) == NULL)   /* can't read directory */
        return(func(fullpath, &statbuf, FTW_DNR));

    while ((dirp = readdir(dp)) != NULL) {
        if (strcmp(dirp->d_name, ".") == 0 ||
            strcmp(dirp->d_name, "..") == 0)
            continue;       /* ignore dot and dot-dot */

        /* make room before appending so deep trees cannot overrun the buffer */
        grow_fullpath(n + strlen(dirp->d_name) + 1);
        strcpy(&fullpath[n], dirp->d_name); /* append name after slash */

        if ((ret = dopath(func)) != 0)      /* recursive */
            break;          /* time to leave */
    }
    fullpath[n-1] = 0;      /* erase everything from slash onwards */

    if (closedir(dp) < 0)
        err_ret("can't close directory %s", fullpath);

    return(ret);
}

/*
 * Callback for the traversal: bump the counter that matches the file's
 * type, or report directories that can't be read and files that can't
 * be stat'ed.  Always returns 0 so the traversal continues.
 */
static int
myfunc(const char *pathname, const struct stat *statptr, int type)
{
    switch (type) {
    case FTW_F:
        switch (statptr->st_mode & S_IFMT) {
        case S_IFREG:   nreg++;     break;
        case S_IFBLK:   nblk++;     break;
        case S_IFCHR:   nchr++;     break;
        case S_IFIFO:   nfifo++;    break;
        case S_IFLNK:   nslink++;   break;
        case S_IFSOCK:  nsock++;    break;
        case S_IFDIR:
            err_dump("for S_IFDIR for %s", pathname);
                    /* directories should have type = FTW_D */
        }
        break;

    case FTW_D:
        ndir++;
        break;

    case FTW_DNR:
        err_ret("can't read directory %s", pathname);
        break;

    case FTW_NS:
        err_ret("stat error for %s", pathname);
        break;

    default:
        err_dump("unknown type %d for pathname %s", type, pathname);
    }

    return(0);
}