ruby/dir.c

1003 строки
19 KiB
C

/**********************************************************************
dir.c -
$Author$
$Date$
created at: Wed Jan 5 09:51:01 JST 1994
Copyright (C) 1993-2001 Yukihiro Matsumoto
Copyright (C) 2000 Network Applied Communication Laboratory, Inc.
Copyright (C) 2000 Information-technology Promotion Agency, Japan
**********************************************************************/
#include "ruby.h"
#include <sys/types.h>
#include <sys/stat.h>
#ifdef HAVE_SYS_PARAM_H
# include <sys/param.h>
#else
# define MAXPATHLEN 1024
#endif
#ifdef HAVE_UNISTD_H
#include <unistd.h>
#endif
#if defined HAVE_DIRENT_H && !defined NT
# include <dirent.h>
# define NAMLEN(dirent) strlen((dirent)->d_name)
#elif defined HAVE_DIRECT_H && !defined NT
# include <direct.h>
# define NAMLEN(dirent) strlen((dirent)->d_name)
#else
# define dirent direct
# define NAMLEN(dirent) (dirent)->d_namlen
# if HAVE_SYS_NDIR_H
# include <sys/ndir.h>
# endif
# if HAVE_SYS_DIR_H
# include <sys/dir.h>
# endif
# if HAVE_NDIR_H
# include <ndir.h>
# endif
# if defined(NT)
# include "win32/dir.h"
# endif
#endif
#include <errno.h>
#ifndef HAVE_STDLIB_H
char *getenv();
#endif
#ifndef HAVE_STRING_H
char *strchr _((char*,char));
#endif
#include <ctype.h>
#ifndef HAVE_LSTAT
#define lstat(path,st) stat(path,st)
#endif
#define FNM_NOESCAPE 0x01
#define FNM_PATHNAME 0x02
#define FNM_PERIOD 0x04
#define FNM_CASEFOLD 0x08
#define FNM_NOMATCH 1
#define FNM_ERROR 2
#define downcase(c) (nocase && ISUPPER(c) ? tolower(c) : (c))
#if defined DOSISH
#define isdirsep(c) ((c) == '/' || (c) == '\\')
static char *
find_dirsep(s)
char *s;
{
while (*s) {
if (isdirsep(*s))
return s;
s++;
}
return 0;
}
#else
#define isdirsep(c) ((c) == '/')
#define find_dirsep(s) strchr(s, '/')
#endif
static char *
range(pat, test, flags)
char *pat;
char test;
int flags;
{
int not, ok = 0;
int nocase = flags & FNM_CASEFOLD;
int escape = !(flags & FNM_NOESCAPE);
not = *pat == '!' || *pat == '^';
if (not)
pat++;
test = downcase(test);
while (*pat) {
int cstart, cend;
cstart = cend = *pat++;
if (cstart == ']')
return ok == not ? 0 : pat;
else if (escape && cstart == '\\')
cstart = cend = *pat++;
if (*pat == '-' && pat[1] != ']') {
if (escape && pat[1] == '\\')
pat++;
cend = pat[1];
if (!cend)
return 0;
pat += 2;
}
if (downcase(cstart) <= test && test <= downcase(cend))
ok = 1;
}
return 0;
}
#define ISDIRSEP(c) (pathname && isdirsep(c))
#define PERIOD(s) (period && *(s) == '.' && \
((s) == string || ISDIRSEP((s)[-1])))
static int
fnmatch(pat, string, flags)
const char *pat;
const char *string;
int flags;
{
int c;
int test;
const char *s = string;
int escape = !(flags & FNM_NOESCAPE);
int pathname = flags & FNM_PATHNAME;
int period = flags & FNM_PERIOD;
int nocase = flags & FNM_CASEFOLD;
while (c = *pat++) {
switch (c) {
case '?':
if (!*s || ISDIRSEP(*s) || PERIOD(s))
return FNM_NOMATCH;
s++;
break;
case '*':
while ((c = *pat++) == '*')
;
if (PERIOD(s))
return FNM_NOMATCH;
if (!c) {
if (pathname && find_dirsep(s))
return FNM_NOMATCH;
else
return 0;
}
else if (ISDIRSEP(c)) {
s = find_dirsep(s);
if (s)
break;
return FNM_NOMATCH;
}
test = escape && c == '\\' ? *pat : c;
test = downcase(test);
pat--;
while (*s) {
if ((c == '[' || downcase(*s) == test) &&
!fnmatch(pat, s, flags & ~FNM_PERIOD))
return 0;
else if (ISDIRSEP(*s))
break;
s++;
}
return FNM_NOMATCH;
case '[':
if (!*s || ISDIRSEP(*s) || PERIOD(s))
return FNM_NOMATCH;
pat = range(pat, *s, flags);
if (!pat)
return FNM_NOMATCH;
s++;
break;
case '\\':
if (escape
#if defined DOSISH
&& *pat && strchr("*?[\\", *pat)
#endif
) {
c = *pat;
if (!c)
c = '\\';
else
pat++;
}
/* FALLTHROUGH */
default:
#if defined DOSISH
if (ISDIRSEP(c) && isdirsep(*s))
;
else
#endif
if(downcase(c) != downcase(*s))
return FNM_NOMATCH;
s++;
break;
}
}
return !*s ? 0 : FNM_NOMATCH;
}
VALUE rb_cDir;
static void
free_dir(dir)
DIR *dir;
{
if (dir) closedir(dir);
}
static VALUE dir_close _((VALUE));
static VALUE
dir_s_new(argc, argv, klass)
int argc;
VALUE *argv;
VALUE klass;
{
VALUE obj = Data_Wrap_Struct(klass, 0, free_dir, 0);
rb_obj_call_init(obj, argc, argv);
return obj;
}
static VALUE
dir_initialize(dir, dirname)
VALUE dir, dirname;
{
DIR *dirp;
SafeStringValue(dirname);
if (DATA_PTR(dir)) closedir(DATA_PTR(dir));
DATA_PTR(dir) = NULL;
dirp = opendir(RSTRING(dirname)->ptr);
if (dirp == NULL) {
if (errno == EMFILE || errno == ENFILE) {
rb_gc();
dirp = opendir(RSTRING(dirname)->ptr);
}
if (dirp == NULL) {
rb_sys_fail(RSTRING(dirname)->ptr);
}
}
DATA_PTR(dir) = dirp;
return dir;
}
static VALUE
dir_s_open(klass, dirname)
VALUE klass, dirname;
{
VALUE dir = Data_Wrap_Struct(klass, 0, free_dir, 0);
dir_initialize(dir, dirname);
if (rb_block_given_p()) {
return rb_ensure(rb_yield, dir, dir_close, dir);
}
return dir;
}
static void
dir_closed()
{
rb_raise(rb_eIOError, "closed directory");
}
#define GetDIR(obj, dirp) {\
Data_Get_Struct(obj, DIR, dirp);\
if (dirp == NULL) dir_closed();\
}
static VALUE
dir_read(dir)
VALUE dir;
{
DIR *dirp;
struct dirent *dp;
GetDIR(dir, dirp);
errno = 0;
dp = readdir(dirp);
if (dp)
return rb_tainted_str_new(dp->d_name, NAMLEN(dp));
else if (errno == 0) { /* end of stream */
return Qnil;
}
else {
rb_sys_fail(0);
}
return Qnil; /* not reached */
}
static VALUE
dir_each(dir)
VALUE dir;
{
DIR *dirp;
struct dirent *dp;
GetDIR(dir, dirp);
for (dp = readdir(dirp); dp != NULL; dp = readdir(dirp)) {
rb_yield(rb_tainted_str_new(dp->d_name, NAMLEN(dp)));
if (DATA_PTR(dir) == NULL) dir_closed();
}
return dir;
}
static VALUE
dir_tell(dir)
VALUE dir;
{
#ifdef HAVE_TELLDIR
DIR *dirp;
long pos;
GetDIR(dir, dirp);
pos = telldir(dirp);
return rb_int2inum(pos);
#else
rb_notimplement();
#endif
}
static VALUE
dir_seek(dir, pos)
VALUE dir, pos;
{
DIR *dirp;
#ifdef HAVE_SEEKDIR
GetDIR(dir, dirp);
seekdir(dirp, NUM2INT(pos));
return dir;
#else
rb_notimplement();
#endif
}
static VALUE
dir_rewind(dir)
VALUE dir;
{
DIR *dirp;
GetDIR(dir, dirp);
rewinddir(dirp);
return dir;
}
static VALUE
dir_close(dir)
VALUE dir;
{
DIR *dirp;
Data_Get_Struct(dir, DIR, dirp);
if (dirp == NULL) dir_closed();
closedir(dirp);
DATA_PTR(dir) = NULL;
return Qnil;
}
static void
dir_chdir(path)
const char *path;
{
if (chdir(path) < 0)
rb_sys_fail(path);
}
static int chdir_blocking = 0;
static VALUE chdir_thread = Qnil;
static VALUE
chdir_restore(path)
const char *path;
{
chdir_blocking--;
if (chdir_blocking == 0)
chdir_thread = Qnil;
dir_chdir(path);
return Qnil;
}
#ifdef HAVE_GETCWD
#define GETCWD(path) if (getcwd(path, sizeof(path)) == 0) rb_sys_fail(path)
#else
#define GETCWD(path) if (getwd(path) == 0) rb_sys_fail(path)
#endif
static VALUE
dir_s_chdir(argc, argv, obj)
int argc;
VALUE *argv;
VALUE obj;
{
VALUE path = Qnil;
char *dist = "";
rb_secure(2);
if (rb_scan_args(argc, argv, "01", &path) == 1) {
SafeStringValue(path);
dist = RSTRING(path)->ptr;
}
else {
dist = getenv("HOME");
if (!dist) {
dist = getenv("LOGDIR");
if (!dist) rb_raise(rb_eArgError, "HOME/LOGDIR not set");
}
}
if (chdir_blocking > 0) {
if (!rb_block_given_p() || rb_thread_current() != chdir_thread)
rb_warn("conflicting chdir during another chdir block");
}
if (rb_block_given_p()) {
char cwd[MAXPATHLEN];
GETCWD(cwd);
chdir_blocking++;
if (chdir_thread == Qnil)
chdir_thread = rb_thread_current();
dir_chdir(dist);
return rb_ensure(rb_yield, path, chdir_restore, (VALUE)cwd);
}
dir_chdir(dist);
return INT2FIX(0);
}
static VALUE
dir_s_getwd(dir)
VALUE dir;
{
char path[MAXPATHLEN];
GETCWD(path);
return rb_tainted_str_new2(path);
}
static VALUE
dir_s_chroot(dir, path)
VALUE dir, path;
{
#if defined(HAVE_CHROOT) && !defined(__CHECKER__)
rb_secure(2);
SafeStringValue(path);
if (chroot(RSTRING(path)->ptr) == -1)
rb_sys_fail(RSTRING(path)->ptr);
return INT2FIX(0);
#else
rb_notimplement();
return Qnil; /* not reached */
#endif
}
static VALUE
dir_s_mkdir(argc, argv, obj)
int argc;
VALUE *argv;
VALUE obj;
{
VALUE path, vmode;
int mode;
if (rb_scan_args(argc, argv, "11", &path, &vmode) == 2) {
mode = NUM2INT(vmode);
}
else {
mode = 0777;
}
SafeStringValue(path);
rb_secure(2);
#if !defined(NT)
if (mkdir(RSTRING(path)->ptr, mode) == -1)
rb_sys_fail(RSTRING(path)->ptr);
#else
if (mkdir(RSTRING(path)->ptr) == -1)
rb_sys_fail(RSTRING(path)->ptr);
#endif
return INT2FIX(0);
}
static VALUE
dir_s_rmdir(obj, dir)
VALUE obj, dir;
{
SafeStringValue(dir);
rb_secure(2);
if (rmdir(RSTRING(dir)->ptr) < 0)
rb_sys_fail(RSTRING(dir)->ptr);
return INT2FIX(0);
}
/* Return nonzero if S has any special globbing chars in it. */
static int
has_magic(s, send, flags)
char *s, *send;
int flags;
{
register char *p = s;
register char c;
int open = 0;
int escape = !(flags & FNM_NOESCAPE);
while ((c = *p++) != '\0') {
switch (c) {
case '?':
case '*':
return Qtrue;
case '[': /* Only accept an open brace if there is a close */
open++; /* brace to match it. Bracket expressions must be */
continue; /* complete, according to Posix.2 */
case ']':
if (open)
return Qtrue;
continue;
case '\\':
if (escape && *p++ == '\0')
return Qfalse;
}
if (send && p >= send) break;
}
return Qfalse;
}
static char*
extract_path(p, pend)
char *p, *pend;
{
char *alloc;
int len;
len = pend - p;
alloc = ALLOC_N(char, len+1);
memcpy(alloc, p, len);
if (len > 1 && pend[-1] == '/'
#if defined DOSISH
&& pend[-2] != ':'
#endif
) {
alloc[len-1] = 0;
}
else {
alloc[len] = 0;
}
return alloc;
}
static char*
extract_elem(path)
char *path;
{
char *pend;
pend = strchr(path, '/');
if (!pend) pend = path + strlen(path);
return extract_path(path, pend);
}
static void
remove_backslashes(p)
char *p;
{
#if defined DOSISH
char *pend = p + strlen(p);
char *t = p;
while (p < pend) {
if (*p == '\\') {
if (++p == pend) break;
}
*t++ = *p++;
}
*t = '\0';
#endif
}
#ifndef S_ISDIR
# define S_ISDIR(m) ((m & S_IFMT) == S_IFDIR)
#endif
static void
glob_helper(path, sub, flags, func, arg)
char *path;
char *sub;
int flags;
void (*func) _((const char*, VALUE));
VALUE arg;
{
struct stat st;
char *p, *m;
p = sub ? sub : path;
if (!has_magic(p, 0, flags)) {
remove_backslashes(path);
if (stat(path, &st) == 0) {
(*func)(path, arg);
}
else if (errno != ENOENT) {
/* In case stat error is other than ENOENT and
we may want to know what is wrong. */
rb_sys_warning(path);
}
return;
}
while (p) {
if (*p == '/') p++;
m = strchr(p, '/');
if (has_magic(p, m, flags)) {
char *dir, *base, *magic, *buf;
DIR *dirp;
struct dirent *dp;
int recursive = 0;
struct d_link {
char *path;
struct d_link *next;
} *tmp, *link = 0;
base = extract_path(path, p);
if (path == p) dir = ".";
else dir = base;
magic = extract_elem(p);
if (stat(dir, &st) < 0) {
if (errno != ENOENT) rb_sys_warning(dir);
free(base);
break;
}
if (S_ISDIR(st.st_mode)) {
if (m && strcmp(magic, "**") == 0) {
int n = strlen(base);
recursive = 1;
buf = ALLOC_N(char, n+strlen(m)+3);
sprintf(buf, "%s%s", base, *base ? m : m+1);
glob_helper(buf, buf+n, flags, func, arg);
free(buf);
}
dirp = opendir(dir);
if (dirp == NULL) {
rb_sys_warning(dir);
free(base);
break;
}
}
else {
free(base);
break;
}
#if defined DOSISH
#define BASE (*base && !((isdirsep(*base) && !base[1]) || (base[1] == ':' && isdirsep(base[2]) && !base[3])))
#else
#define BASE (*base && !(*base == '/' && !base[1]))
#endif
for (dp = readdir(dirp); dp != NULL; dp = readdir(dirp)) {
if (recursive) {
if (strcmp(".", dp->d_name) == 0 || strcmp("..", dp->d_name) == 0)
continue;
buf = ALLOC_N(char, strlen(base)+NAMLEN(dp)+strlen(m)+6);
sprintf(buf, "%s%s%s", base, (BASE)?"/":"", dp->d_name);
if (lstat(buf, &st) < 0) {
if (errno != ENOENT) rb_sys_warning(buf);
continue;
}
if (S_ISDIR(st.st_mode)) {
char *t = buf+strlen(buf);
strcpy(t, "/**");
strcpy(t+3, m);
glob_helper(buf, t, flags, func, arg);
}
free(buf);
continue;
}
if (fnmatch(magic, dp->d_name, flags) == 0) {
buf = ALLOC_N(char, strlen(base)+NAMLEN(dp)+2);
sprintf(buf, "%s%s%s", base, (BASE)?"/":"", dp->d_name);
if (!m) {
(*func)(buf, arg);
free(buf);
continue;
}
tmp = ALLOC(struct d_link);
tmp->path = buf;
tmp->next = link;
link = tmp;
}
}
closedir(dirp);
free(base);
free(magic);
if (link) {
while (link) {
if (stat(link->path, &st) == 0) {
if (S_ISDIR(st.st_mode)) {
int len = strlen(link->path);
int mlen = strlen(m);
char *t = ALLOC_N(char, len+mlen+1);
sprintf(t, "%s%s", link->path, m);
glob_helper(t, t+len, flags, func, arg);
free(t);
}
tmp = link;
link = link->next;
free(tmp->path);
free(tmp);
}
else {
rb_sys_warning(link->path);
}
}
break;
}
}
p = m;
}
}
void
rb_glob(path, func, arg)
char *path;
void (*func) _((const char*, VALUE));
VALUE arg;
{
glob_helper(path, 0, FNM_PERIOD, func, arg);
}
void
rb_globi(path, func, arg)
char *path;
void (*func) _((const char*, VALUE));
VALUE arg;
{
glob_helper(path, 0, FNM_PERIOD|FNM_CASEFOLD, func, arg);
}
static void push_pattern _((const char *path, VALUE ary));
static void
push_pattern(path, ary)
const char *path;
VALUE ary;
{
VALUE str = rb_tainted_str_new2(path);
if (ary) {
rb_ary_push(ary, str);
}
else {
rb_yield(str);
}
}
static void
push_globs(ary, s)
VALUE ary;
char *s;
{
rb_glob(s, push_pattern, ary);
}
static void
push_braces(ary, s)
VALUE ary;
char *s;
{
char buffer[MAXPATHLEN], *buf = buffer;
char *p, *t, *b;
char *lbrace, *rbrace;
int nest = 0;
p = s;
lbrace = rbrace = 0;
while (*p) {
if (*p == '{') {
lbrace = p;
break;
}
p++;
}
while (*p) {
if (*p == '{') nest++;
if (*p == '}' && --nest == 0) {
rbrace = p;
break;
}
p++;
}
if (lbrace) {
int len = strlen(s);
if (len >= MAXPATHLEN)
buf = xmalloc(len + 1);
memcpy(buf, s, lbrace-s);
b = buf + (lbrace-s);
p = lbrace;
while (*p != '}') {
t = p + 1;
for (p = t; *p!='}' && *p!=','; p++) {
/* skip inner braces */
if (*p == '{') while (*p!='}') p++;
}
memcpy(b, t, p-t);
strcpy(b+(p-t), rbrace+1);
push_braces(ary, buf);
}
if (buf != buffer)
free(buf);
}
else {
push_globs(ary, s);
}
}
#define isdelim(c) ((c)=='\0')
static VALUE
dir_s_glob(dir, str)
VALUE dir, str;
{
char *p, *pend;
char buffer[MAXPATHLEN], *buf;
char *t;
int nest;
VALUE ary = 0;
SafeStringValue(str);
if (!rb_block_given_p()) {
ary = rb_ary_new();
}
if (RSTRING(str)->len >= MAXPATHLEN) {
buf = xmalloc(RSTRING(str)->len + 1);
} else {
buf = buffer;
}
p = RSTRING(str)->ptr;
pend = p + RSTRING(str)->len;
while (p < pend) {
t = buf;
nest = 0;
while (p < pend && isdelim(*p)) p++;
while (p < pend && !isdelim(*p)) {
if (*p == '{') nest+=2;
if (*p == '}') nest+=3;
if (*p == '\\') {
*t++ = *p++;
if (p == pend) break;
}
*t++ = *p++;
}
*t = '\0';
if (nest == 0) {
push_globs(ary, buf);
}
else if (nest % 5 == 0) {
push_braces(ary, buf);
}
/* else unmatched braces */
}
if (buf != buffer)
free(buf);
if (ary && RARRAY(ary)->len == 0) {
rb_warning("no matches found: %s", RSTRING(str)->ptr);
}
return ary;
}
static VALUE
dir_foreach(io, dirname)
VALUE io, dirname;
{
VALUE dir;
dir = rb_funcall(rb_cDir, rb_intern("open"), 1, dirname);
rb_ensure(dir_each, dir, dir_close, dir);
return Qnil;
}
static VALUE
dir_entries(io, dirname)
VALUE io, dirname;
{
VALUE dir;
dir = rb_funcall(rb_cDir, rb_intern("open"), 1, dirname);
return rb_ensure(rb_Array, dir, dir_close, dir);
}
static VALUE
file_s_fnmatch(argc, argv, obj)
int argc;
VALUE *argv;
VALUE obj;
{
VALUE pattern, path;
VALUE rflags;
int flags;
if (rb_scan_args(argc, argv, "21", &pattern, &path, &rflags) == 3)
flags = NUM2INT(rflags);
else
flags = 0;
StringValue(pattern);
StringValue(path);
if (fnmatch(RSTRING(pattern)->ptr, RSTRING(path)->ptr, flags) == 0)
return Qtrue;
return Qfalse;
}
void
Init_Dir()
{
rb_cDir = rb_define_class("Dir", rb_cObject);
rb_include_module(rb_cDir, rb_mEnumerable);
rb_define_singleton_method(rb_cDir, "new", dir_s_new, -1);
rb_define_singleton_method(rb_cDir, "open", dir_s_open, 1);
rb_define_singleton_method(rb_cDir, "foreach", dir_foreach, 1);
rb_define_singleton_method(rb_cDir, "entries", dir_entries, 1);
rb_define_method(rb_cDir,"initialize", dir_initialize, 1);
rb_define_method(rb_cDir,"read", dir_read, 0);
rb_define_method(rb_cDir,"each", dir_each, 0);
rb_define_method(rb_cDir,"rewind", dir_rewind, 0);
rb_define_method(rb_cDir,"tell", dir_tell, 0);
rb_define_method(rb_cDir,"seek", dir_seek, 1);
rb_define_method(rb_cDir,"pos", dir_tell, 0);
rb_define_method(rb_cDir,"pos=", dir_seek, 1);
rb_define_method(rb_cDir,"close", dir_close, 0);
rb_define_singleton_method(rb_cDir,"chdir", dir_s_chdir, -1);
rb_define_singleton_method(rb_cDir,"getwd", dir_s_getwd, 0);
rb_define_singleton_method(rb_cDir,"pwd", dir_s_getwd, 0);
rb_define_singleton_method(rb_cDir,"chroot", dir_s_chroot, 1);
rb_define_singleton_method(rb_cDir,"mkdir", dir_s_mkdir, -1);
rb_define_singleton_method(rb_cDir,"rmdir", dir_s_rmdir, 1);
rb_define_singleton_method(rb_cDir,"delete", dir_s_rmdir, 1);
rb_define_singleton_method(rb_cDir,"unlink", dir_s_rmdir, 1);
rb_define_singleton_method(rb_cDir,"glob", dir_s_glob, 1);
rb_define_singleton_method(rb_cDir,"[]", dir_s_glob, 1);
rb_define_singleton_method(rb_cFile,"fnmatch", file_s_fnmatch, -1);
rb_define_singleton_method(rb_cFile,"fnmatch?", file_s_fnmatch, -1);
rb_file_const("FNM_NOESCAPE", INT2FIX(FNM_NOESCAPE));
rb_file_const("FNM_PATHNAME", INT2FIX(FNM_PATHNAME));
rb_file_const("FNM_PERIOD", INT2FIX(FNM_PERIOD));
rb_file_const("FNM_CASEFOLD", INT2FIX(FNM_CASEFOLD));
}