12 changed files with 16 additions and 857 deletions
@ -1 +0,0 @@ |
|||
* text=auto |
@ -1,4 +0,0 @@ |
|||
*.pyc |
|||
*.pyd |
|||
benchtree |
|||
build |
@ -1,373 +0,0 @@ |
|||
// scandir C speedups
|
|||
//
|
|||
// TODO: this is a work in progress!
|
|||
//
|
|||
// There's a fair bit of PY_MAJOR_VERSION boilerplate to support both Python 2
|
|||
// and Python 3 -- the structure of this is taken from here:
|
|||
// http://docs.python.org/3.3/howto/cporting.html
|
|||
|
|||
#include <Python.h> |
|||
#include <structseq.h> |
|||
|
|||
#ifdef MS_WINDOWS |
|||
#include <windows.h> |
|||
#endif |
|||
|
|||
#if PY_MAJOR_VERSION >= 3 |
|||
#define INITERROR return NULL |
|||
#define FROM_LONG PyLong_FromLong |
|||
#define FROM_STRING PyUnicode_FromStringAndSize |
|||
#else |
|||
#define INITERROR return |
|||
#define FROM_LONG PyInt_FromLong |
|||
#define FROM_STRING PyString_FromStringAndSize |
|||
#endif |
|||
|
|||
#ifdef MS_WINDOWS |
|||
|
|||
static PyObject * |
|||
win32_error_unicode(char* function, Py_UNICODE* filename) |
|||
{ |
|||
errno = GetLastError(); |
|||
if (filename) |
|||
return PyErr_SetFromWindowsErrWithUnicodeFilename(errno, filename); |
|||
else |
|||
return PyErr_SetFromWindowsErr(errno); |
|||
} |
|||
|
|||
/* Below, we *know* that ugo+r is 0444 */ |
|||
#if _S_IREAD != 0400 |
|||
#error Unsupported C library |
|||
#endif |
|||
static int |
|||
attributes_to_mode(DWORD attr) |
|||
{ |
|||
int m = 0; |
|||
if (attr & FILE_ATTRIBUTE_DIRECTORY) |
|||
m |= _S_IFDIR | 0111; /* IFEXEC for user,group,other */ |
|||
else |
|||
m |= _S_IFREG; |
|||
if (attr & FILE_ATTRIBUTE_READONLY) |
|||
m |= 0444; |
|||
else |
|||
m |= 0666; |
|||
if (attr & FILE_ATTRIBUTE_REPARSE_POINT) |
|||
m |= 0120000; // S_IFLNK
|
|||
return m; |
|||
} |
|||
|
|||
double |
|||
filetime_to_time(FILETIME *filetime) |
|||
{ |
|||
const double SECONDS_BETWEEN_EPOCHS = 11644473600.0; |
|||
|
|||
unsigned long long total = (unsigned long long)filetime->dwHighDateTime << 32 | |
|||
(unsigned long long)filetime->dwLowDateTime; |
|||
return (double)total / 10000000.0 - SECONDS_BETWEEN_EPOCHS; |
|||
} |
|||
|
|||
static PyTypeObject StatResultType; |
|||
|
|||
static PyObject * |
|||
find_data_to_statresult(WIN32_FIND_DATAW *data) |
|||
{ |
|||
PY_LONG_LONG size; |
|||
PyObject *v = PyStructSequence_New(&StatResultType); |
|||
if (v == NULL) |
|||
return NULL; |
|||
|
|||
size = (PY_LONG_LONG)data->nFileSizeHigh << 32 | |
|||
(PY_LONG_LONG)data->nFileSizeLow; |
|||
|
|||
PyStructSequence_SET_ITEM(v, 0, FROM_LONG(attributes_to_mode(data->dwFileAttributes))); |
|||
PyStructSequence_SET_ITEM(v, 1, FROM_LONG(0)); |
|||
PyStructSequence_SET_ITEM(v, 2, FROM_LONG(0)); |
|||
PyStructSequence_SET_ITEM(v, 3, FROM_LONG(0)); |
|||
PyStructSequence_SET_ITEM(v, 4, FROM_LONG(0)); |
|||
PyStructSequence_SET_ITEM(v, 5, FROM_LONG(0)); |
|||
PyStructSequence_SET_ITEM(v, 6, PyLong_FromLongLong((PY_LONG_LONG)size)); |
|||
PyStructSequence_SET_ITEM(v, 7, PyFloat_FromDouble(filetime_to_time(&data->ftLastAccessTime))); |
|||
PyStructSequence_SET_ITEM(v, 8, PyFloat_FromDouble(filetime_to_time(&data->ftLastWriteTime))); |
|||
PyStructSequence_SET_ITEM(v, 9, PyFloat_FromDouble(filetime_to_time(&data->ftCreationTime))); |
|||
|
|||
if (PyErr_Occurred()) { |
|||
Py_DECREF(v); |
|||
return NULL; |
|||
} |
|||
|
|||
return v; |
|||
} |
|||
|
|||
static PyStructSequence_Field stat_result_fields[] = { |
|||
{"st_mode", "protection bits"}, |
|||
{"st_ino", "inode"}, |
|||
{"st_dev", "device"}, |
|||
{"st_nlink", "number of hard links"}, |
|||
{"st_uid", "user ID of owner"}, |
|||
{"st_gid", "group ID of owner"}, |
|||
{"st_size", "total size, in bytes"}, |
|||
{"st_atime", "time of last access"}, |
|||
{"st_mtime", "time of last modification"}, |
|||
{"st_ctime", "time of last change"}, |
|||
{0} |
|||
}; |
|||
|
|||
static PyStructSequence_Desc stat_result_desc = { |
|||
"stat_result", /* name */ |
|||
NULL, /* doc */ |
|||
stat_result_fields, |
|||
10 |
|||
}; |
|||
|
|||
static PyObject * |
|||
scandir_helper(PyObject *self, PyObject *args) |
|||
{ |
|||
PyObject *d, *v; |
|||
HANDLE hFindFile; |
|||
BOOL result; |
|||
WIN32_FIND_DATAW wFileData; |
|||
Py_UNICODE *wnamebuf; |
|||
Py_ssize_t len; |
|||
PyObject *po; |
|||
PyObject *name_stat; |
|||
|
|||
if (!PyArg_ParseTuple(args, "U:scandir_helper", &po)) |
|||
return NULL; |
|||
|
|||
/* Overallocate for \\*.*\0 */ |
|||
len = PyUnicode_GET_SIZE(po); |
|||
wnamebuf = malloc((len + 5) * sizeof(wchar_t)); |
|||
if (!wnamebuf) { |
|||
PyErr_NoMemory(); |
|||
return NULL; |
|||
} |
|||
wcscpy(wnamebuf, PyUnicode_AS_UNICODE(po)); |
|||
if (len > 0) { |
|||
Py_UNICODE wch = wnamebuf[len-1]; |
|||
if (wch != L'/' && wch != L'\\' && wch != L':') |
|||
wnamebuf[len++] = L'\\'; |
|||
wcscpy(wnamebuf + len, L"*.*"); |
|||
} |
|||
if ((d = PyList_New(0)) == NULL) { |
|||
free(wnamebuf); |
|||
return NULL; |
|||
} |
|||
Py_BEGIN_ALLOW_THREADS |
|||
hFindFile = FindFirstFileW(wnamebuf, &wFileData); |
|||
Py_END_ALLOW_THREADS |
|||
if (hFindFile == INVALID_HANDLE_VALUE) { |
|||
int error = GetLastError(); |
|||
if (error == ERROR_FILE_NOT_FOUND) { |
|||
free(wnamebuf); |
|||
return d; |
|||
} |
|||
Py_DECREF(d); |
|||
win32_error_unicode("FindFirstFileW", wnamebuf); |
|||
free(wnamebuf); |
|||
return NULL; |
|||
} |
|||
do { |
|||
/* Skip over . and .. */ |
|||
if (wcscmp(wFileData.cFileName, L".") != 0 && |
|||
wcscmp(wFileData.cFileName, L"..") != 0) { |
|||
v = PyUnicode_FromUnicode(wFileData.cFileName, wcslen(wFileData.cFileName)); |
|||
if (v == NULL) { |
|||
Py_DECREF(d); |
|||
d = NULL; |
|||
break; |
|||
} |
|||
name_stat = Py_BuildValue("ON", v, find_data_to_statresult(&wFileData)); |
|||
if (name_stat == NULL) { |
|||
Py_DECREF(v); |
|||
Py_DECREF(d); |
|||
d = NULL; |
|||
break; |
|||
} |
|||
if (PyList_Append(d, name_stat) != 0) { |
|||
Py_DECREF(v); |
|||
Py_DECREF(d); |
|||
Py_DECREF(name_stat); |
|||
d = NULL; |
|||
break; |
|||
} |
|||
Py_DECREF(name_stat); |
|||
Py_DECREF(v); |
|||
} |
|||
Py_BEGIN_ALLOW_THREADS |
|||
result = FindNextFileW(hFindFile, &wFileData); |
|||
Py_END_ALLOW_THREADS |
|||
/* FindNextFile sets error to ERROR_NO_MORE_FILES if
|
|||
it got to the end of the directory. */ |
|||
if (!result && GetLastError() != ERROR_NO_MORE_FILES) { |
|||
Py_DECREF(d); |
|||
win32_error_unicode("FindNextFileW", wnamebuf); |
|||
FindClose(hFindFile); |
|||
free(wnamebuf); |
|||
return NULL; |
|||
} |
|||
} while (result == TRUE); |
|||
|
|||
if (FindClose(hFindFile) == FALSE) { |
|||
Py_DECREF(d); |
|||
win32_error_unicode("FindClose", wnamebuf); |
|||
free(wnamebuf); |
|||
return NULL; |
|||
} |
|||
free(wnamebuf); |
|||
return d; |
|||
} |
|||
|
|||
#else // Linux / OS X
|
|||
|
|||
#include <dirent.h> |
|||
#define NAMLEN(dirent) strlen((dirent)->d_name) |
|||
|
|||
static PyObject * |
|||
posix_error_with_allocated_filename(char* name) |
|||
{ |
|||
PyObject *rc = PyErr_SetFromErrnoWithFilename(PyExc_OSError, name); |
|||
PyMem_Free(name); |
|||
return rc; |
|||
} |
|||
|
|||
static PyObject * |
|||
scandir_helper(PyObject *self, PyObject *args) |
|||
{ |
|||
char *name = NULL; |
|||
PyObject *d, *v, *name_type; |
|||
DIR *dirp; |
|||
struct dirent *ep; |
|||
int arg_is_unicode = 1; |
|||
|
|||
errno = 0; |
|||
if (!PyArg_ParseTuple(args, "U:scandir_helper", &v)) { |
|||
arg_is_unicode = 0; |
|||
PyErr_Clear(); |
|||
} |
|||
if (!PyArg_ParseTuple(args, "et:scandir_helper", Py_FileSystemDefaultEncoding, &name)) |
|||
return NULL; |
|||
Py_BEGIN_ALLOW_THREADS |
|||
dirp = opendir(name); |
|||
Py_END_ALLOW_THREADS |
|||
if (dirp == NULL) { |
|||
return posix_error_with_allocated_filename(name); |
|||
} |
|||
if ((d = PyList_New(0)) == NULL) { |
|||
Py_BEGIN_ALLOW_THREADS |
|||
closedir(dirp); |
|||
Py_END_ALLOW_THREADS |
|||
PyMem_Free(name); |
|||
return NULL; |
|||
} |
|||
for (;;) { |
|||
errno = 0; |
|||
Py_BEGIN_ALLOW_THREADS |
|||
ep = readdir(dirp); |
|||
Py_END_ALLOW_THREADS |
|||
if (ep == NULL) { |
|||
if (errno == 0) { |
|||
break; |
|||
} else { |
|||
Py_BEGIN_ALLOW_THREADS |
|||
closedir(dirp); |
|||
Py_END_ALLOW_THREADS |
|||
Py_DECREF(d); |
|||
return posix_error_with_allocated_filename(name); |
|||
} |
|||
} |
|||
if (ep->d_name[0] == '.' && |
|||
(NAMLEN(ep) == 1 || |
|||
(ep->d_name[1] == '.' && NAMLEN(ep) == 2))) |
|||
continue; |
|||
v = FROM_STRING(ep->d_name, NAMLEN(ep)); |
|||
if (v == NULL) { |
|||
Py_DECREF(d); |
|||
d = NULL; |
|||
break; |
|||
} |
|||
if (arg_is_unicode) { |
|||
PyObject *w; |
|||
|
|||
w = PyUnicode_FromEncodedObject(v, |
|||
Py_FileSystemDefaultEncoding, |
|||
"strict"); |
|||
if (w != NULL) { |
|||
Py_DECREF(v); |
|||
v = w; |
|||
} |
|||
else { |
|||
/* fall back to the original byte string, as
|
|||
discussed in patch #683592 */ |
|||
PyErr_Clear(); |
|||
} |
|||
} |
|||
name_type = Py_BuildValue("ON", v, FROM_LONG(ep->d_type)); |
|||
if (name_type == NULL) { |
|||
Py_DECREF(v); |
|||
Py_DECREF(d); |
|||
d = NULL; |
|||
break; |
|||
} |
|||
if (PyList_Append(d, name_type) != 0) { |
|||
Py_DECREF(v); |
|||
Py_DECREF(d); |
|||
Py_DECREF(name_type); |
|||
d = NULL; |
|||
break; |
|||
} |
|||
Py_DECREF(name_type); |
|||
Py_DECREF(v); |
|||
} |
|||
Py_BEGIN_ALLOW_THREADS |
|||
closedir(dirp); |
|||
Py_END_ALLOW_THREADS |
|||
PyMem_Free(name); |
|||
|
|||
return d; |
|||
} |
|||
|
|||
#endif |
|||
|
|||
static PyMethodDef scandir_methods[] = { |
|||
{"scandir_helper", (PyCFunction)scandir_helper, METH_VARARGS, NULL}, |
|||
{NULL, NULL}, |
|||
}; |
|||
|
|||
#if PY_MAJOR_VERSION >= 3 |
|||
static struct PyModuleDef moduledef = { |
|||
PyModuleDef_HEAD_INIT, |
|||
"_scandir", |
|||
NULL, |
|||
0, |
|||
scandir_methods, |
|||
NULL, |
|||
NULL, |
|||
NULL, |
|||
NULL, |
|||
}; |
|||
#endif |
|||
|
|||
#if PY_MAJOR_VERSION >= 3 |
|||
PyObject * |
|||
PyInit__scandir(void) |
|||
{ |
|||
PyObject *module = PyModule_Create(&moduledef); |
|||
#else |
|||
void |
|||
init_scandir(void) |
|||
{ |
|||
PyObject *module = Py_InitModule("_scandir", scandir_methods); |
|||
#endif |
|||
if (module == NULL) { |
|||
INITERROR; |
|||
} |
|||
|
|||
#ifdef MS_WINDOWS |
|||
stat_result_desc.name = "scandir.stat_result"; |
|||
PyStructSequence_InitType(&StatResultType, &stat_result_desc); |
|||
#endif |
|||
|
|||
#if PY_MAJOR_VERSION >= 3 |
|||
return module; |
|||
#endif |
|||
} |
@ -1,456 +0,0 @@ |
|||
"""scandir, a better directory iterator that exposes all file info OS provides |
|||
|
|||
scandir is a generator version of os.listdir() that returns an iterator over |
|||
files in a directory, and also exposes the extra information most OSes provide |
|||
while iterating files in a directory. |
|||
|
|||
See README.md or https://github.com/benhoyt/scandir for rationale and docs. |
|||
|
|||
scandir is released under the new BSD 3-clause license. See LICENSE.txt for |
|||
the full license text. |
|||
""" |
|||
|
|||
from __future__ import division |
|||
|
|||
import ctypes |
|||
import os |
|||
import stat |
|||
import sys |
|||
|
|||
__version__ = '0.3' |
|||
__all__ = ['scandir', 'walk'] |
|||
|
|||
# Shortcuts to these functions for speed and ease |
|||
join = os.path.join |
|||
lstat = os.lstat |
|||
|
|||
S_IFDIR = stat.S_IFDIR |
|||
S_IFREG = stat.S_IFREG |
|||
S_IFLNK = stat.S_IFLNK |
|||
|
|||
# 'unicode' isn't defined on Python 3 |
|||
try: |
|||
unicode |
|||
except NameError: |
|||
unicode = str |
|||
|
|||
_scandir = None |
|||
|
|||
|
|||
class GenericDirEntry(object): |
|||
__slots__ = ('name', '_lstat', '_path') |
|||
|
|||
def __init__(self, path, name): |
|||
self._path = path |
|||
self.name = name |
|||
self._lstat = None |
|||
|
|||
def lstat(self): |
|||
if self._lstat is None: |
|||
self._lstat = lstat(join(self._path, self.name)) |
|||
return self._lstat |
|||
|
|||
def is_dir(self): |
|||
try: |
|||
self.lstat() |
|||
except OSError: |
|||
return False |
|||
return self._lstat.st_mode & 0o170000 == S_IFDIR |
|||
|
|||
def is_file(self): |
|||
try: |
|||
self.lstat() |
|||
except OSError: |
|||
return False |
|||
return self._lstat.st_mode & 0o170000 == S_IFREG |
|||
|
|||
def is_symlink(self): |
|||
try: |
|||
self.lstat() |
|||
except OSError: |
|||
return False |
|||
return self._lstat.st_mode & 0o170000 == S_IFLNK |
|||
|
|||
def __str__(self): |
|||
return '<{0}: {1!r}>'.format(self.__class__.__name__, self.name) |
|||
|
|||
__repr__ = __str__ |
|||
|
|||
|
|||
if sys.platform == 'win32': |
|||
from ctypes import wintypes |
|||
|
|||
# Various constants from windows.h |
|||
INVALID_HANDLE_VALUE = ctypes.c_void_p(-1).value |
|||
ERROR_FILE_NOT_FOUND = 2 |
|||
ERROR_NO_MORE_FILES = 18 |
|||
FILE_ATTRIBUTE_READONLY = 1 |
|||
FILE_ATTRIBUTE_DIRECTORY = 16 |
|||
FILE_ATTRIBUTE_REPARSE_POINT = 1024 |
|||
|
|||
# Numer of seconds between 1601-01-01 and 1970-01-01 |
|||
SECONDS_BETWEEN_EPOCHS = 11644473600 |
|||
|
|||
kernel32 = ctypes.windll.kernel32 |
|||
|
|||
# ctypes wrappers for (wide string versions of) FindFirstFile, |
|||
# FindNextFile, and FindClose |
|||
FindFirstFile = kernel32.FindFirstFileW |
|||
FindFirstFile.argtypes = [ |
|||
wintypes.LPCWSTR, |
|||
ctypes.POINTER(wintypes.WIN32_FIND_DATAW), |
|||
] |
|||
FindFirstFile.restype = wintypes.HANDLE |
|||
|
|||
FindNextFile = kernel32.FindNextFileW |
|||
FindNextFile.argtypes = [ |
|||
wintypes.HANDLE, |
|||
ctypes.POINTER(wintypes.WIN32_FIND_DATAW), |
|||
] |
|||
FindNextFile.restype = wintypes.BOOL |
|||
|
|||
FindClose = kernel32.FindClose |
|||
FindClose.argtypes = [wintypes.HANDLE] |
|||
FindClose.restype = wintypes.BOOL |
|||
|
|||
def filetime_to_time(filetime): |
|||
"""Convert Win32 FILETIME to time since Unix epoch in seconds.""" |
|||
total = filetime.dwHighDateTime << 32 | filetime.dwLowDateTime |
|||
return total / 10000000 - SECONDS_BETWEEN_EPOCHS |
|||
|
|||
def find_data_to_stat(data): |
|||
"""Convert Win32 FIND_DATA struct to stat_result.""" |
|||
# First convert Win32 dwFileAttributes to st_mode |
|||
attributes = data.dwFileAttributes |
|||
st_mode = 0 |
|||
if attributes & FILE_ATTRIBUTE_DIRECTORY: |
|||
st_mode |= S_IFDIR | 0o111 |
|||
else: |
|||
st_mode |= S_IFREG |
|||
if attributes & FILE_ATTRIBUTE_READONLY: |
|||
st_mode |= 0o444 |
|||
else: |
|||
st_mode |= 0o666 |
|||
if attributes & FILE_ATTRIBUTE_REPARSE_POINT: |
|||
st_mode |= S_IFLNK |
|||
|
|||
st_size = data.nFileSizeHigh << 32 | data.nFileSizeLow |
|||
st_atime = filetime_to_time(data.ftLastAccessTime) |
|||
st_mtime = filetime_to_time(data.ftLastWriteTime) |
|||
st_ctime = filetime_to_time(data.ftCreationTime) |
|||
|
|||
# Some fields set to zero per CPython's posixmodule.c: st_ino, st_dev, |
|||
# st_nlink, st_uid, st_gid |
|||
return os.stat_result((st_mode, 0, 0, 0, 0, 0, st_size, st_atime, |
|||
st_mtime, st_ctime)) |
|||
|
|||
class Win32DirEntry(object): |
|||
__slots__ = ('name', '_lstat', '_find_data') |
|||
|
|||
def __init__(self, name, find_data): |
|||
self.name = name |
|||
self._lstat = None |
|||
self._find_data = find_data |
|||
|
|||
def lstat(self): |
|||
if self._lstat is None: |
|||
# Lazily convert to stat object, because it's slow, and often |
|||
# we only need is_dir() etc |
|||
self._lstat = find_data_to_stat(self._find_data) |
|||
return self._lstat |
|||
|
|||
def is_dir(self): |
|||
return (self._find_data.dwFileAttributes & |
|||
FILE_ATTRIBUTE_DIRECTORY != 0) |
|||
|
|||
def is_file(self): |
|||
return (self._find_data.dwFileAttributes & |
|||
FILE_ATTRIBUTE_DIRECTORY == 0) |
|||
|
|||
def is_symlink(self): |
|||
return (self._find_data.dwFileAttributes & |
|||
FILE_ATTRIBUTE_REPARSE_POINT != 0) |
|||
|
|||
def __str__(self): |
|||
return '<{0}: {1!r}>'.format(self.__class__.__name__, self.name) |
|||
|
|||
__repr__ = __str__ |
|||
|
|||
def win_error(error, filename): |
|||
exc = WindowsError(error, ctypes.FormatError(error)) |
|||
exc.filename = filename |
|||
return exc |
|||
|
|||
def scandir(path='.', windows_wildcard='*.*'): |
|||
"""Like os.listdir(), but yield DirEntry objects instead of returning |
|||
a list of names. |
|||
""" |
|||
# Call FindFirstFile and handle errors |
|||
data = wintypes.WIN32_FIND_DATAW() |
|||
data_p = ctypes.byref(data) |
|||
filename = join(path, windows_wildcard) |
|||
handle = FindFirstFile(filename, data_p) |
|||
if handle == INVALID_HANDLE_VALUE: |
|||
error = ctypes.GetLastError() |
|||
if error == ERROR_FILE_NOT_FOUND: |
|||
# No files, don't yield anything |
|||
return |
|||
raise win_error(error, path) |
|||
|
|||
# Call FindNextFile in a loop, stopping when no more files |
|||
try: |
|||
while True: |
|||
# Skip '.' and '..' (current and parent directory), but |
|||
# otherwise yield (filename, stat_result) tuple |
|||
name = data.cFileName |
|||
if name not in ('.', '..'): |
|||
yield Win32DirEntry(name, data) |
|||
|
|||
data = wintypes.WIN32_FIND_DATAW() |
|||
data_p = ctypes.byref(data) |
|||
success = FindNextFile(handle, data_p) |
|||
if not success: |
|||
error = ctypes.GetLastError() |
|||
if error == ERROR_NO_MORE_FILES: |
|||
break |
|||
raise win_error(error, path) |
|||
finally: |
|||
if not FindClose(handle): |
|||
raise win_error(ctypes.GetLastError(), path) |
|||
|
|||
try: |
|||
import _scandir |
|||
|
|||
scandir_helper = _scandir.scandir_helper |
|||
|
|||
class Win32DirEntry(object): |
|||
__slots__ = ('name', '_lstat') |
|||
|
|||
def __init__(self, name, lstat): |
|||
self.name = name |
|||
self._lstat = lstat |
|||
|
|||
def lstat(self): |
|||
return self._lstat |
|||
|
|||
def is_dir(self): |
|||
return self._lstat.st_mode & 0o170000 == S_IFDIR |
|||
|
|||
def is_file(self): |
|||
return self._lstat.st_mode & 0o170000 == S_IFREG |
|||
|
|||
def is_symlink(self): |
|||
return self._lstat.st_mode & 0o170000 == S_IFLNK |
|||
|
|||
def __str__(self): |
|||
return '<{0}: {1!r}>'.format(self.__class__.__name__, self.name) |
|||
|
|||
__repr__ = __str__ |
|||
|
|||
def scandir(path='.'): |
|||
for name, stat in scandir_helper(unicode(path)): |
|||
yield Win32DirEntry(name, stat) |
|||
|
|||
except ImportError: |
|||
pass |
|||
|
|||
|
|||
# Linux, OS X, and BSD implementation |
|||
elif sys.platform.startswith(('linux', 'darwin')) or 'bsd' in sys.platform: |
|||
import ctypes.util |
|||
|
|||
DIR_p = ctypes.c_void_p |
|||
|
|||
# Rather annoying how the dirent struct is slightly different on each |
|||
# platform. The only fields we care about are d_name and d_type. |
|||
class Dirent(ctypes.Structure): |
|||
if sys.platform.startswith('linux'): |
|||
_fields_ = ( |
|||
('d_ino', ctypes.c_ulong), |
|||
('d_off', ctypes.c_long), |
|||
('d_reclen', ctypes.c_ushort), |
|||
('d_type', ctypes.c_byte), |
|||
('d_name', ctypes.c_char * 256), |
|||
) |
|||
else: |
|||
_fields_ = ( |
|||
('d_ino', ctypes.c_uint32), # must be uint32, not ulong |
|||
('d_reclen', ctypes.c_ushort), |
|||
('d_type', ctypes.c_byte), |
|||
('d_namlen', ctypes.c_byte), |
|||
('d_name', ctypes.c_char * 256), |
|||
) |
|||
|
|||
DT_UNKNOWN = 0 |
|||
DT_DIR = 4 |
|||
DT_REG = 8 |
|||
DT_LNK = 10 |
|||
|
|||
Dirent_p = ctypes.POINTER(Dirent) |
|||
Dirent_pp = ctypes.POINTER(Dirent_p) |
|||
|
|||
libc = ctypes.CDLL(ctypes.util.find_library('c'), use_errno=True) |
|||
opendir = libc.opendir |
|||
opendir.argtypes = [ctypes.c_char_p] |
|||
opendir.restype = DIR_p |
|||
|
|||
readdir_r = libc.readdir_r |
|||
readdir_r.argtypes = [DIR_p, Dirent_p, Dirent_pp] |
|||
readdir_r.restype = ctypes.c_int |
|||
|
|||
closedir = libc.closedir |
|||
closedir.argtypes = [DIR_p] |
|||
closedir.restype = ctypes.c_int |
|||
|
|||
file_system_encoding = sys.getfilesystemencoding() |
|||
|
|||
class PosixDirEntry(object): |
|||
__slots__ = ('name', '_d_type', '_lstat', '_path') |
|||
|
|||
def __init__(self, path, name, d_type): |
|||
self._path = path |
|||
self.name = name |
|||
self._d_type = d_type |
|||
self._lstat = None |
|||
|
|||
def lstat(self): |
|||
if self._lstat is None: |
|||
self._lstat = lstat(join(self._path, self.name)) |
|||
return self._lstat |
|||
|
|||
# Ridiculous duplication between these is* functions -- helps a little |
|||
# bit with os.walk() performance compared to calling another function. |
|||
def is_dir(self): |
|||
d_type = self._d_type |
|||
if d_type != DT_UNKNOWN: |
|||
return d_type == DT_DIR |
|||
try: |
|||
self.lstat() |
|||
except OSError: |
|||
return False |
|||
return self._lstat.st_mode & 0o170000 == S_IFDIR |
|||
|
|||
def is_file(self): |
|||
d_type = self._d_type |
|||
if d_type != DT_UNKNOWN: |
|||
return d_type == DT_REG |
|||
try: |
|||
self.lstat() |
|||
except OSError: |
|||
return False |
|||
return self._lstat.st_mode & 0o170000 == S_IFREG |
|||
|
|||
def is_symlink(self): |
|||
d_type = self._d_type |
|||
if d_type != DT_UNKNOWN: |
|||
return d_type == DT_LNK |
|||
try: |
|||
self.lstat() |
|||
except OSError: |
|||
return False |
|||
return self._lstat.st_mode & 0o170000 == S_IFLNK |
|||
|
|||
def __str__(self): |
|||
return '<{0}: {1!r}>'.format(self.__class__.__name__, self.name) |
|||
|
|||
__repr__ = __str__ |
|||
|
|||
def posix_error(filename): |
|||
errno = ctypes.get_errno() |
|||
exc = OSError(errno, os.strerror(errno)) |
|||
exc.filename = filename |
|||
return exc |
|||
|
|||
def scandir(path='.'): |
|||
"""Like os.listdir(), but yield DirEntry objects instead of returning |
|||
a list of names. |
|||
""" |
|||
dir_p = opendir(path.encode(file_system_encoding)) |
|||
if not dir_p: |
|||
raise posix_error(path) |
|||
try: |
|||
result = Dirent_p() |
|||
while True: |
|||
entry = Dirent() |
|||
if readdir_r(dir_p, entry, result): |
|||
raise posix_error(path) |
|||
if not result: |
|||
break |
|||
name = entry.d_name.decode(file_system_encoding) |
|||
if name not in ('.', '..'): |
|||
yield PosixDirEntry(path, name, entry.d_type) |
|||
finally: |
|||
if closedir(dir_p): |
|||
raise posix_error(path) |
|||
|
|||
try: |
|||
import _scandir |
|||
|
|||
scandir_helper = _scandir.scandir_helper |
|||
|
|||
def scandir(path='.'): |
|||
for name, d_type in scandir_helper(unicode(path)): |
|||
yield PosixDirEntry(path, name, d_type) |
|||
|
|||
except ImportError: |
|||
pass |
|||
|
|||
|
|||
# Some other system -- no d_type or stat information |
|||
else: |
|||
def scandir(path='.'): |
|||
"""Like os.listdir(), but yield DirEntry objects instead of returning |
|||
a list of names. |
|||
""" |
|||
for name in os.listdir(path): |
|||
yield GenericDirEntry(path, name) |
|||
|
|||
|
|||
def walk(top, topdown=True, onerror=None, followlinks=False): |
|||
"""Like os.walk(), but faster, as it uses scandir() internally.""" |
|||
# Determine which are files and which are directories |
|||
dirs = [] |
|||
nondirs = [] |
|||
try: |
|||
for entry in scandir(top): |
|||
if entry.is_dir(): |
|||
dirs.append(entry) |
|||
else: |
|||
nondirs.append(entry) |
|||
except OSError as error: |
|||
if onerror is not None: |
|||
onerror(error) |
|||
return |
|||
|
|||
# Yield before recursion if going top down |
|||
if topdown: |
|||
# Need to do some fancy footwork here as caller is allowed to modify |
|||
# dir_names, and we really want them to modify dirs (list of DirEntry |
|||
# objects) instead. Keep a mapping of entries keyed by name. |
|||
dir_names = [] |
|||
entries_by_name = {} |
|||
for entry in dirs: |
|||
dir_names.append(entry.name) |
|||
entries_by_name[entry.name] = entry |
|||
|
|||
yield top, dir_names, [e.name for e in nondirs] |
|||
|
|||
dirs = [] |
|||
for dir_name in dir_names: |
|||
entry = entries_by_name.get(dir_name) |
|||
if entry is None: |
|||
# Only happens when caller creates a new directory and adds it |
|||
# to dir_names |
|||
entry = GenericDirEntry(top, dir_name) |
|||
dirs.append(entry) |
|||
|
|||
# Recurse into sub-directories, following symbolic links if "followlinks" |
|||
for entry in dirs: |
|||
if followlinks or not entry.is_symlink(): |
|||
new_path = join(top, entry.name) |
|||
for x in walk(new_path, topdown, onerror, followlinks): |
|||
yield x |
|||
|
|||
# Yield before recursion if going bottom up |
|||
if not topdown: |
|||
yield top, [e.name for e in dirs], [e.name for e in nondirs] |
Loading…
Reference in new issue