/* fhandler_disk_file.cc Copyright 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006, 2007 Red Hat, Inc. This file is part of Cygwin. This software is a copyrighted work licensed under the terms of the Cygwin license. Please consult the file "CYGWIN_LICENSE" for details. */ #include "winsup.h" #include #include #include #include #include #include #include "cygerrno.h" #include "perprocess.h" #include "security.h" #include "cygwin/version.h" #include "path.h" #include "fhandler.h" #include "dtable.h" #include "cygheap.h" #include "shared_info.h" #include "pinfo.h" #include #include "ntdll.h" #include #include #include #define _COMPILING_NEWLIB #include class __DIR_mounts { int count; const char *parent_dir; int parent_dir_len; char *mounts[MAX_MOUNTS]; bool found[MAX_MOUNTS + 2]; #define __DIR_PROC (MAX_MOUNTS) #define __DIR_CYGDRIVE (MAX_MOUNTS+1) __ino64_t eval_ino (int idx) { __ino64_t ino = 0; char fname[CYG_MAX_PATH]; struct __stat64 st; int len = parent_dir_len; strcpy (fname, parent_dir); if (fname[len - 1] != '/') fname[len++] = '/'; strcpy (fname + len, mounts[idx]); if (!lstat64 (fname, &st)) ino = st.st_ino; return ino; } public: __DIR_mounts (const char *posix_path) : parent_dir (posix_path) { parent_dir_len = strlen (parent_dir); count = mount_table->get_mounts_here (parent_dir, parent_dir_len, mounts); rewind (); } __ino64_t check_mount (const char *name, __ino64_t ino, bool eval = true) { if (parent_dir_len == 1) /* root dir */ { if (strcasematch (name, "proc")) { found[__DIR_PROC] = true; return hash_path_name (0, "/proc"); } if (strlen (name) == mount_table->cygdrive_len - 2 && strncasematch (name, mount_table->cygdrive + 1, mount_table->cygdrive_len - 2)) { found[__DIR_CYGDRIVE] = true; return 2; } } for (int i = 0; i < count; ++i) if (strcasematch (name, mounts[i])) { found[i] = true; return eval ? eval_ino (i) : 1; } return ino; } __ino64_t check_missing_mount (char *ret_name, bool eval = true) { for (int i = 0; i < count; ++i) if (!found[i]) { found[i] = true; strcpy (ret_name, mounts[i]); return eval ? eval_ino (i) : 1; } if (parent_dir_len == 1) /* root dir */ { if (!found[__DIR_PROC]) { found[__DIR_PROC] = true; strcpy (ret_name, "proc"); return hash_path_name (0, "/proc"); } if (!found[__DIR_CYGDRIVE]) { found[__DIR_CYGDRIVE] = true; if (mount_table->cygdrive_len > 1) { strncpy (ret_name, mount_table->cygdrive + 1, mount_table->cygdrive_len - 2); ret_name[mount_table->cygdrive_len - 2] = '\0'; return 2; } } } return 0; } void rewind () { memset (found, 0, sizeof found); } }; unsigned __stdcall path_conv::ndisk_links (DWORD nNumberOfLinks) { if (!isdir () || isremote ()) return nNumberOfLinks; int len = strlen (*this); char fn[len + 3]; strcpy (fn, *this); const char *s; unsigned count; __DIR_mounts *dir = new __DIR_mounts (normalized_path); if (nNumberOfLinks <= 1) { s = "\\*"; count = 0; } else { s = "\\.."; count = nNumberOfLinks; } if (len == 0 || isdirsep (fn[len - 1])) strcpy (fn + len, s + 1); else strcpy (fn + len, s); WIN32_FIND_DATA buf; HANDLE h = FindFirstFile (fn, &buf); int saw_dot = 2; if (h != INVALID_HANDLE_VALUE) { if (nNumberOfLinks > 1) saw_dot--; else do { if (buf.dwFileAttributes & FILE_ATTRIBUTE_DIRECTORY) count++; if (buf.cFileName[0] == '.' && (buf.cFileName[1] == '\0' || (buf.cFileName[1] == '.' && buf.cFileName[2] == '\0'))) saw_dot--; dir->check_mount (buf.cFileName, 0, false); } while (FindNextFileA (h, &buf)); FindClose (h); } if (nNumberOfLinks > 1) { fn[len + 2] = '\0'; h = FindFirstFile (fn, &buf); if (h) saw_dot--; FindClose (h); } while (dir->check_missing_mount (buf.cFileName, false)) ++count; delete dir; return count + saw_dot; } inline bool path_conv::isgood_inode (__ino64_t ino) const { /* We can't trust remote inode numbers of only 32 bit. That means, all remote inode numbers when running under NT4, as well as remote NT4 NTFS, as well as shares of Samba version < 3.0. The known exception are SFU NFS shares, which return the valid 32 bit inode number from the remote file system unchanged. */ return hasgood_inode () && (ino > UINT32_MAX || !isremote () || fs_is_nfs ()); } int __stdcall fhandler_base::fstat_by_handle (struct __stat64 *buf) { NTSTATUS status; IO_STATUS_BLOCK io; /* The entries potentially contain a name of MAX_PATH wide characters. */ const DWORD fvi_size = 2 * CYG_MAX_PATH + sizeof (FILE_FS_VOLUME_INFORMATION); const DWORD fai_size = 2 * CYG_MAX_PATH + sizeof (FILE_ALL_INFORMATION); PFILE_FS_VOLUME_INFORMATION pfvi = (PFILE_FS_VOLUME_INFORMATION) alloca (fvi_size); PFILE_ALL_INFORMATION pfai = (PFILE_ALL_INFORMATION) alloca (fai_size); status = NtQueryVolumeInformationFile (get_handle (), &io, pfvi, fvi_size, FileFsVolumeInformation); if (!NT_SUCCESS (status)) { debug_printf ("%u = NtQueryVolumeInformationFile)", RtlNtStatusToDosError (status)); pfvi->VolumeSerialNumber = 0; /* Set to pc.volser () in helper. */ } status = NtQueryInformationFile (get_handle (), &io, pfai, fai_size, FileAllInformation); if (NT_SUCCESS (status)) { /* If the change time is 0, it's a file system which doesn't support a change timestamp. In that case use the LastWriteTime entry, as in other calls to fstat_helper. */ if (pc.is_rep_symlink ()) pfai->BasicInformation.FileAttributes &= ~FILE_ATTRIBUTE_DIRECTORY; pc.file_attributes (pfai->BasicInformation.FileAttributes); return fstat_helper (buf, pfai->BasicInformation.ChangeTime.QuadPart ? *(FILETIME *) &pfai->BasicInformation.ChangeTime : *(FILETIME *) &pfai->BasicInformation.LastWriteTime, *(FILETIME *) &pfai->BasicInformation.LastAccessTime, *(FILETIME *) &pfai->BasicInformation.LastWriteTime, *(FILETIME *) &pfai->BasicInformation.CreationTime, pfvi->VolumeSerialNumber, pfai->StandardInformation.EndOfFile.QuadPart, pfai->StandardInformation.AllocationSize.QuadPart, pfai->InternalInformation.FileId.QuadPart, pfai->StandardInformation.NumberOfLinks, pfai->BasicInformation.FileAttributes); } debug_printf ("%u = NtQueryInformationFile)", RtlNtStatusToDosError (status)); /* Last resort */ FILETIME ft = { 0, 0 }; DWORD lowfs, highfs; lowfs = GetFileSize (get_handle (), &highfs); if (lowfs == 0xffffffff && GetLastError ()) lowfs = highfs = 0; return fstat_helper (buf, ft, ft, ft, ft, 0, (ULONGLONG) highfs << 32 | lowfs, -1LL, 0ULL, 1, DWORD (pc)); } int __stdcall fhandler_base::fstat_by_name (struct __stat64 *buf) { int res; HANDLE handle; WIN32_FIND_DATA local; if (!pc.exists ()) { debug_printf ("already determined that pc does not exist"); set_errno (ENOENT); res = -1; } else if ((handle = FindFirstFile (pc, &local)) != INVALID_HANDLE_VALUE) { FindClose (handle); if (pc.is_rep_symlink ()) local.dwFileAttributes &= ~FILE_ATTRIBUTE_DIRECTORY; pc.file_attributes (local.dwFileAttributes); res = fstat_helper (buf, local.ftLastWriteTime, /* see fstat_helper comment */ local.ftLastAccessTime, local.ftLastWriteTime, local.ftCreationTime, pc.volser (), (ULONGLONG) local.nFileSizeHigh << 32 | local.nFileSizeLow, -1LL, 0ULL, 1, local.dwFileAttributes); } else if (pc.isdir ()) { FILETIME ft = {}; res = fstat_helper (buf, ft, ft, ft, ft, pc.volser (), 0ULL, -1LL, 0ULL, 1, FILE_ATTRIBUTE_DIRECTORY); } else { debug_printf ("FindFirstFile failed for '%s', %E", (char *) pc); __seterrno (); res = -1; } return res; } int __stdcall fhandler_base::fstat_fs (struct __stat64 *buf) { int res = -1; int oret; int open_flags = O_RDONLY | O_BINARY; if (get_io_handle ()) { if (nohandle () || is_fs_special ()) return fstat_by_name (buf); else return fstat_by_handle (buf); } /* If we don't care if the file is executable or we already know if it is, then just do a "query open" as it is apparently much faster. */ if (pc.exec_state () != dont_know_if_executable) { if (pc.fs_is_fat () && !strpbrk (get_win32_name (), "?*|<>")) return fstat_by_name (buf); query_open (query_stat_control); } if (!(oret = open_fs (open_flags, 0)) && get_errno () == EACCES) { /* If we couldn't open the file, try a query open with no permissions. This allows us to determine *some* things about the file, at least. */ pc.set_exec (0); query_open (query_read_attributes); oret = open_fs (open_flags, 0); } if (oret) { /* We now have a valid handle, regardless of the "nohandle" state. Since fhandler_base::open only calls CloseHandle if !nohandle, we have to set it to false before calling close_fs and restore the state afterwards. */ res = fstat_by_handle (buf); bool no_handle = nohandle (); nohandle (false); close_fs (); nohandle (no_handle); set_io_handle (NULL); } else res = fstat_by_name (buf); return res; } /* The ftChangeTime is taken from the NTFS ChangeTime entry, if reading the file information using NtQueryInformationFile succeeded. If not, it's faked using the LastWriteTime entry from GetFileInformationByHandle or FindFirstFile. We're deliberatly not using the creation time anymore to simplify interaction with native Windows applications which choke on creation times >= access or write times. Note that the dwFileAttributes member of the file information evaluated in the calling function is used here, not the pc.fileattr member, since the latter might be old and not reflect the actual state of the file. */ int __stdcall fhandler_base::fstat_helper (struct __stat64 *buf, FILETIME ftChangeTime, FILETIME ftLastAccessTime, FILETIME ftLastWriteTime, FILETIME ftCreationTime, DWORD dwVolumeSerialNumber, ULONGLONG nFileSize, LONGLONG nAllocSize, ULONGLONG nFileIndex, DWORD nNumberOfLinks, DWORD dwFileAttributes) { IO_STATUS_BLOCK st; FILE_COMPRESSION_INFORMATION fci; to_timestruc_t (&ftLastAccessTime, &buf->st_atim); to_timestruc_t (&ftLastWriteTime, &buf->st_mtim); to_timestruc_t (&ftChangeTime, &buf->st_ctim); to_timestruc_t (&ftCreationTime, &buf->st_birthtim); buf->st_dev = dwVolumeSerialNumber ?: pc.volser (); buf->st_size = (_off64_t) nFileSize; /* The number of links to a directory includes the number of subdirectories in the directory, since all those subdirectories point to it. This is too slow on remote drives, so we do without it. Setting the count to 2 confuses `find (1)' command. So let's try it with `1' as link count. */ buf->st_nlink = pc.ndisk_links (nNumberOfLinks); /* Enforce namehash as inode number on untrusted file systems. */ if (pc.isgood_inode (nFileIndex)) buf->st_ino = (__ino64_t) nFileIndex; else buf->st_ino = get_namehash (); buf->st_blksize = PREFERRED_IO_BLKSIZE; if (nAllocSize >= 0LL) /* A successful NtQueryInformationFile returns the allocation size correctly for compressed and sparse files as well. */ buf->st_blocks = (nAllocSize + S_BLKSIZE - 1) / S_BLKSIZE; else if (::has_attribute (dwFileAttributes, FILE_ATTRIBUTE_COMPRESSED | FILE_ATTRIBUTE_SPARSE_FILE) && get_io_handle () && !is_fs_special () && !NtQueryInformationFile (get_io_handle (), &st, (PVOID) &fci, sizeof fci, FileCompressionInformation)) /* Otherwise we request the actual amount of bytes allocated for compressed and sparsed files. */ buf->st_blocks = (fci.CompressedSize.QuadPart + S_BLKSIZE - 1) / S_BLKSIZE; else /* Otherwise compute no. of blocks from file size. */ buf->st_blocks = (buf->st_size + S_BLKSIZE - 1) / S_BLKSIZE; buf->st_mode = 0; /* Using a side effect: get_file_attibutes checks for directory. This is used, to set S_ISVTX, if needed. */ if (pc.isdir ()) buf->st_mode = S_IFDIR; else if (pc.issymlink ()) { buf->st_size = pc.get_symlink_length (); /* symlinks are everything for everyone! */ buf->st_mode = S_IFLNK | S_IRWXU | S_IRWXG | S_IRWXO; get_file_attribute (pc.has_acls (), get_io_handle (), get_win32_name (), NULL, &buf->st_uid, &buf->st_gid); goto done; } else if (pc.issocket ()) buf->st_mode = S_IFSOCK; if (!get_file_attribute (pc.has_acls (), is_fs_special () ? NULL: get_io_handle (), get_win32_name (), &buf->st_mode, &buf->st_uid, &buf->st_gid)) { /* If read-only attribute is set, modify ntsec return value */ if (::has_attribute (dwFileAttributes, FILE_ATTRIBUTE_READONLY) && !pc.issymlink ()) buf->st_mode &= ~(S_IWUSR | S_IWGRP | S_IWOTH); if (buf->st_mode & S_IFMT) /* nothing */; else if (!is_fs_special ()) buf->st_mode |= S_IFREG; else { buf->st_dev = dev (); buf->st_mode = dev ().mode; buf->st_size = 0; } } else { buf->st_mode |= STD_RBITS; if (!::has_attribute (dwFileAttributes, FILE_ATTRIBUTE_READONLY) && !pc.issymlink ()) buf->st_mode |= STD_WBITS; /* | S_IWGRP | S_IWOTH; we don't give write to group etc */ if (S_ISDIR (buf->st_mode)) buf->st_mode |= S_IFDIR | STD_XBITS; else if (buf->st_mode & S_IFMT) /* nothing */; else if (is_fs_special ()) { buf->st_dev = dev (); buf->st_mode = dev ().mode; buf->st_size = 0; } else { buf->st_mode |= S_IFREG; if (pc.exec_state () == dont_know_if_executable) { DWORD cur, done; LONG curhigh = 0; char magic[3]; /* First retrieve current position, set to beginning of file if not already there. */ cur = SetFilePointer (get_handle (), 0, &curhigh, FILE_CURRENT); if ((cur != INVALID_SET_FILE_POINTER || GetLastError () == NO_ERROR) && ((!cur && !curhigh) || SetFilePointer (get_handle (), 0, NULL, FILE_BEGIN) != INVALID_SET_FILE_POINTER)) { /* FIXME should we use /etc/magic ? */ magic[0] = magic[1] = magic[2] = '\0'; if (ReadFile (get_handle (), magic, 3, &done, NULL) && has_exec_chars (magic, done)) { pc.set_exec (); buf->st_mode |= STD_XBITS; } SetFilePointer (get_handle (), cur, &curhigh, FILE_BEGIN); } } } if (pc.exec_state () == is_executable) buf->st_mode |= STD_XBITS; /* This fakes the permissions of all files to match the current umask. */ buf->st_mode &= ~(cygheap->umask); } done: syscall_printf ("0 = fstat (, %p) st_atime=%x st_size=%D, st_mode=%p, st_ino=%D, sizeof=%d", buf, buf->st_atime, buf->st_size, buf->st_mode, buf->st_ino, sizeof (*buf)); return 0; } int __stdcall fhandler_disk_file::fstat (struct __stat64 *buf) { return fstat_fs (buf); } int __stdcall fhandler_disk_file::fstatvfs (struct statvfs *sfs) { int ret = -1, oret = 0; NTSTATUS status; IO_STATUS_BLOCK io; const size_t fvi_size = sizeof (FILE_FS_VOLUME_INFORMATION) + 256 * sizeof (WCHAR); PFILE_FS_VOLUME_INFORMATION pfvi = (PFILE_FS_VOLUME_INFORMATION) alloca (fvi_size); const size_t fai_size = sizeof (FILE_FS_ATTRIBUTE_INFORMATION) + 256 * sizeof (WCHAR); PFILE_FS_ATTRIBUTE_INFORMATION pfai = (PFILE_FS_ATTRIBUTE_INFORMATION) alloca (fai_size); FILE_FS_FULL_SIZE_INFORMATION full_fsi; FILE_FS_SIZE_INFORMATION fsi; if (!get_io_handle ()) { query_open (query_read_control); oret = open_fs (O_RDONLY | O_BINARY, 0); if (!oret) { /* Can't open file. Try again with rootdir. */ char root[CYG_MAX_PATH]; if (!rootdir (get_win32_name (), root)) goto out; pc.check (root, PC_SYM_NOFOLLOW); oret = open_fs (O_RDONLY | O_BINARY, 0); if (!oret) goto out; } } /* Get basic volume information. */ status = NtQueryVolumeInformationFile (get_handle (), &io, pfvi, fvi_size, FileFsVolumeInformation); if (!NT_SUCCESS (status)) { __seterrno_from_nt_status (status); goto out; } status = NtQueryVolumeInformationFile (get_handle (), &io, pfai, fai_size, FileFsAttributeInformation); if (!NT_SUCCESS (status)) { __seterrno_from_nt_status (status); goto out; } sfs->f_files = ULONG_MAX; sfs->f_ffree = ULONG_MAX; sfs->f_favail = ULONG_MAX; sfs->f_fsid = pfvi->VolumeSerialNumber; sfs->f_flag = pfai->FileSystemAttributes; sfs->f_namemax = pfai->MaximumComponentNameLength; /* Get allocation related information. Try to get "full" information first, which is only available since W2K. If that fails, try to retrieve normal allocation information. */ status = NtQueryVolumeInformationFile (get_handle (), &io, &full_fsi, sizeof full_fsi, FileFsFullSizeInformation); if (NT_SUCCESS (status)) { sfs->f_bsize = full_fsi.BytesPerSector * full_fsi.SectorsPerAllocationUnit; sfs->f_frsize = sfs->f_bsize; sfs->f_blocks = full_fsi.TotalAllocationUnits.LowPart; sfs->f_bfree = full_fsi.ActualAvailableAllocationUnits.LowPart; sfs->f_bavail = full_fsi.CallerAvailableAllocationUnits.LowPart; if (sfs->f_bfree > sfs->f_bavail) { /* Quotas active. We can't trust TotalAllocationUnits. */ NTFS_VOLUME_DATA_BUFFER nvdb; DWORD bytes; if (!DeviceIoControl (get_handle (), FSCTL_GET_NTFS_VOLUME_DATA, NULL, 0, &nvdb, sizeof nvdb, &bytes, NULL)) debug_printf ("DeviceIoControl (%s) failed, %E", get_name ()); else sfs->f_blocks = nvdb.TotalClusters.QuadPart; } ret = 0; } else { status = NtQueryVolumeInformationFile (get_handle (), &io, &fsi, sizeof fsi, FileFsSizeInformation); if (!NT_SUCCESS (status)) { __seterrno_from_nt_status (status); goto out; } sfs->f_bsize = fsi.BytesPerSector * fsi.SectorsPerAllocationUnit; sfs->f_frsize = sfs->f_bsize; sfs->f_blocks = fsi.TotalAllocationUnits.LowPart; sfs->f_bfree = fsi.AvailableAllocationUnits.LowPart; sfs->f_bavail = sfs->f_bfree; ret = 0; } out: if (oret) close_fs (); syscall_printf ("%d = fstatvfs (%s, %p)", ret, get_name (), sfs); return ret; } int __stdcall fhandler_disk_file::fchmod (mode_t mode) { extern int chmod_device (path_conv& pc, mode_t mode); int res = -1; int oret = 0; if (pc.is_fs_special ()) return chmod_device (pc, mode); if (!get_io_handle ()) { query_open (query_write_control); if (!(oret = open (O_BINARY, 0))) { /* If the file couldn't be opened, that's really only a problem if ACLs or EAs should get written. */ if (allow_ntsec && pc.has_acls ()) return -1; } } if (allow_ntsec && pc.has_acls ()) { if (pc.isdir ()) mode |= S_IFDIR; if (!set_file_attribute (pc.has_acls (), get_io_handle (), pc, ILLEGAL_UID, ILLEGAL_GID, mode) && allow_ntsec) res = 0; } /* if the mode we want has any write bits set, we can't be read only. */ if (mode & (S_IWUSR | S_IWGRP | S_IWOTH)) pc &= (DWORD) ~FILE_ATTRIBUTE_READONLY; else pc |= (DWORD) FILE_ATTRIBUTE_READONLY; if (!SetFileAttributes (pc, pc)) __seterrno (); else if (!allow_ntsec || !pc.has_acls ()) /* Correct NTFS security attributes have higher priority */ res = 0; if (oret) close (); return res; } int __stdcall fhandler_disk_file::fchown (__uid32_t uid, __gid32_t gid) { int oret = 0; if (!pc.has_acls () || !allow_ntsec) { /* fake - if not supported, pretend we're like win95 where it just works */ return 0; } if (!get_io_handle ()) { query_open (query_write_control); if (!(oret = fhandler_disk_file::open (O_BINARY, 0))) return -1; } mode_t attrib = 0; if (pc.isdir ()) attrib |= S_IFDIR; int res = get_file_attribute (pc.has_acls (), get_io_handle (), pc, &attrib); if (!res) { /* Typical Windows default ACLs can contain permissions for one group, while being owned by another user/group. The permission bits returned above are pretty much useless then. Creating a new ACL with these useless permissions results in a potentially broken symlink. So what we do here is to set the underlying permissions of symlinks to a sensible value which allows the world to read the symlink and only the new owner to change it. */ if (pc.issymlink ()) attrib = S_IFLNK | STD_RBITS | STD_WBITS; res = set_file_attribute (pc.has_acls (), get_io_handle (), pc, uid, gid, attrib); } if (oret) close (); return res; } int _stdcall fhandler_disk_file::facl (int cmd, int nentries, __aclent32_t *aclbufp) { int res = -1; int oret = 0; if (!pc.has_acls () || !allow_ntsec) { switch (cmd) { struct __stat64 st; case SETACL: /* Open for writing required to be able to set ctime (even though setting the ACL is just pretended). */ if (!get_io_handle ()) oret = open (O_WRONLY | O_BINARY, 0); res = 0; break; case GETACL: if (!aclbufp) set_errno (EFAULT); else if (nentries < MIN_ACL_ENTRIES) set_errno (ENOSPC); else { if (!get_io_handle ()) { query_open (query_read_attributes); if (!(oret = open (O_BINARY, 0))) return -1; } if (!fstat_by_handle (&st)) { aclbufp[0].a_type = USER_OBJ; aclbufp[0].a_id = st.st_uid; aclbufp[0].a_perm = (st.st_mode & S_IRWXU) >> 6; aclbufp[1].a_type = GROUP_OBJ; aclbufp[1].a_id = st.st_gid; aclbufp[1].a_perm = (st.st_mode & S_IRWXG) >> 3; aclbufp[2].a_type = OTHER_OBJ; aclbufp[2].a_id = ILLEGAL_GID; aclbufp[2].a_perm = st.st_mode & S_IRWXO; aclbufp[3].a_type = CLASS_OBJ; aclbufp[3].a_id = ILLEGAL_GID; aclbufp[3].a_perm = S_IRWXU | S_IRWXG | S_IRWXO; res = MIN_ACL_ENTRIES; } } break; case GETACLCNT: res = MIN_ACL_ENTRIES; break; default: set_errno (EINVAL); break; } } else { if (!get_io_handle ()) { query_open (cmd == SETACL ? query_write_control : query_read_attributes); if (!(oret = open (O_BINARY, 0))) return -1; } switch (cmd) { case SETACL: if (!aclsort32 (nentries, 0, aclbufp)) { bool rw = false; res = setacl (get_io_handle (), pc, nentries, aclbufp, rw); if (rw) SetFileAttributes (pc, (DWORD) pc & ~FILE_ATTRIBUTE_READONLY); } break; case GETACL: if (!aclbufp) set_errno(EFAULT); else res = getacl (get_io_handle (), pc, pc, nentries, aclbufp); break; case GETACLCNT: res = getacl (get_io_handle (), pc, pc, 0, NULL); break; default: set_errno (EINVAL); break; } } if (oret) close (); return res; } int fhandler_disk_file::fadvise (_off64_t offset, _off64_t length, int advice) { if (advice < POSIX_FADV_NORMAL || advice > POSIX_FADV_NOREUSE) { set_errno (EINVAL); return -1; } /* Windows only supports advice flags for the whole file. We're using a simplified test here so that we don't have to ask for the actual file size. Length == 0 means all bytes starting at offset anyway. So we only actually follow the advice, if it's given for offset == 0. */ if (offset != 0) return 0; /* We only support normal and sequential mode for now. Everything which is not POSIX_FADV_SEQUENTIAL is treated like POSIX_FADV_NORMAL. */ if (advice != POSIX_FADV_SEQUENTIAL) advice = POSIX_FADV_NORMAL; IO_STATUS_BLOCK io; FILE_MODE_INFORMATION fmi; NTSTATUS status = NtQueryInformationFile (get_handle (), &io, &fmi, sizeof fmi, FileModeInformation); if (!NT_SUCCESS (status)) __seterrno_from_nt_status (status); else { fmi.Mode &= ~FILE_SEQUENTIAL_ONLY; if (advice == POSIX_FADV_SEQUENTIAL) fmi.Mode |= FILE_SEQUENTIAL_ONLY; status = NtSetInformationFile (get_handle (), &io, &fmi, sizeof fmi, FileModeInformation); if (NT_SUCCESS (status)) return 0; __seterrno_from_nt_status (status); } return -1; } int fhandler_disk_file::ftruncate (_off64_t length, bool allow_truncate) { int res = -1; if (length < 0 || !get_handle ()) set_errno (EINVAL); else if (pc.isdir ()) set_errno (EISDIR); else if (!(get_access () & GENERIC_WRITE)) set_errno (EBADF); else { _off64_t actual_length; DWORD size_high = 0; NTSTATUS status; IO_STATUS_BLOCK io; FILE_END_OF_FILE_INFORMATION feofi; actual_length = GetFileSize (get_handle (), &size_high); actual_length += ((_off64_t) size_high) << 32; /* If called through posix_fallocate, silently succeed if length is less than the file's actual length. */ if (!allow_truncate && length < actual_length) return 0; feofi.EndOfFile.QuadPart = length; /* Create sparse files only when called through ftruncate, not when called through posix_fallocate. */ if (allow_truncate && get_fs_flags (FILE_SUPPORTS_SPARSE_FILES) && length >= actual_length + (128 * 1024)) { DWORD dw; BOOL r = DeviceIoControl (get_handle (), FSCTL_SET_SPARSE, NULL, 0, NULL, 0, &dw, NULL); syscall_printf ("%d = DeviceIoControl(%p, FSCTL_SET_SPARSE)", r, get_handle ()); } status = NtSetInformationFile (get_handle (), &io, &feofi, sizeof feofi, FileEndOfFileInformation); if (!NT_SUCCESS (status)) __seterrno_from_nt_status (status); else res = 0; } return res; } int fhandler_disk_file::link (const char *newpath) { extern bool allow_winsymlinks; extern suffix_info stat_suffixes[]; path_conv newpc (newpath, PC_SYM_NOFOLLOW | PC_POSIX, transparent_exe ? stat_suffixes : NULL); if (newpc.error) { set_errno (newpc.case_clash ? ECASECLASH : newpc.error); return -1; } if (newpc.exists ()) { syscall_printf ("file '%s' exists?", (char *) newpc); set_errno (EEXIST); return -1; } if (newpc[strlen (newpc) - 1] == '.') { syscall_printf ("trailing dot, bailing out"); set_errno (EINVAL); return -1; } char new_buf[CYG_MAX_PATH + 5]; if (!newpc.error && !newpc.case_clash) { DWORD bintype; int len; if (allow_winsymlinks && pc.is_lnk_special ()) { /* Shortcut hack. */ strcpy (new_buf, newpath); strcat (new_buf, ".lnk"); newpath = new_buf; newpc.check (newpath, PC_SYM_NOFOLLOW); } else if (transparent_exe && !pc.isdir () && GetBinaryType (pc, &bintype) && (len = strlen (newpc)) > 4 && !strcasematch ((const char *) newpc + len - 4, ".exe")) { /* Executable hack. */ strcpy (new_buf, newpath); strcat (new_buf, ".exe"); newpath = new_buf; newpc.check (newpath, PC_SYM_NOFOLLOW); } } query_open (query_write_attributes); if (!open (O_BINARY, 0)) { syscall_printf ("Opening file failed"); __seterrno (); return -1; } if (CreateHardLinkA (newpc, pc, NULL)) goto success; /* There are two cases to consider: - The FS doesn't support hard links ==> ERROR_INVALID_FUNCTION We copy the file. - CreateHardLinkA is not supported ==> ERROR_PROC_NOT_FOUND In that case (<= NT4) we try the old-style method. Any other error should be taken seriously. */ if (GetLastError () == ERROR_INVALID_FUNCTION) { syscall_printf ("FS doesn't support hard links: Copy file"); goto docopy; } if (GetLastError () != ERROR_PROC_NOT_FOUND) { syscall_printf ("CreateHardLinkA failed"); __seterrno (); close (); return -1; } WIN32_STREAM_ID stream_id; LPVOID context; WCHAR wbuf[CYG_MAX_PATH]; BOOL ret; DWORD written, write_err, path_len, size; path_len = sys_mbstowcs (wbuf, newpc, CYG_MAX_PATH) * sizeof (WCHAR); stream_id.dwStreamId = BACKUP_LINK; stream_id.dwStreamAttributes = 0; stream_id.dwStreamNameSize = 0; stream_id.Size.HighPart = 0; stream_id.Size.LowPart = path_len; size = sizeof (WIN32_STREAM_ID) - sizeof (WCHAR**) + stream_id.dwStreamNameSize; context = NULL; write_err = 0; /* Write WIN32_STREAM_ID */ ret = BackupWrite (get_handle (), (LPBYTE) &stream_id, size, &written, FALSE, FALSE, &context); if (ret) { /* write the buffer containing the path */ /* FIXME: BackupWrite sometimes traps if linkname is invalid. Need to handle. */ ret = BackupWrite (get_handle (), (LPBYTE) wbuf, path_len, &written, FALSE, FALSE, &context); if (!ret) { write_err = GetLastError (); syscall_printf ("cannot write linkname, %E"); } /* Free context */ BackupWrite (get_handle (), NULL, 0, &written, TRUE, FALSE, &context); } else { write_err = GetLastError (); syscall_printf ("cannot write stream_id, %E"); } if (!ret) { /* Only copy file if FS doesn't support hard links */ if (write_err == ERROR_INVALID_FUNCTION) { syscall_printf ("FS doesn't support hard links: Copy file"); goto docopy; } close (); __seterrno_from_win_error (write_err); return -1; } success: close (); if (!allow_winsymlinks && pc.is_lnk_special ()) SetFileAttributes (newpc, (DWORD) pc | FILE_ATTRIBUTE_SYSTEM | FILE_ATTRIBUTE_READONLY); return 0; docopy: /* do this with a copy */ if (!CopyFileA (pc, newpc, 1)) { __seterrno (); return -1; } close (); fhandler_disk_file fh (newpc); fh.query_open (query_write_attributes); if (fh.open (O_BINARY, 0)) fh.close (); return 0; } int fhandler_disk_file::utimes (const struct timeval *tvp) { return utimes_fs (tvp); } int fhandler_base::utimes_fs (const struct timeval *tvp) { FILETIME lastaccess, lastwrite; struct timeval tmp[2]; bool closeit; if (get_handle ()) closeit = false; else { query_open (query_write_attributes); if (!open_fs (O_BINARY, 0)) { /* It's documented in MSDN that FILE_WRITE_ATTRIBUTES is sufficient to change the timestamps. Unfortunately it's not sufficient for a remote HPFS which requires GENERIC_WRITE, so we just retry to open for writing, though this fails for R/O files of course. */ query_open (no_query); if (!open_fs (O_WRONLY | O_BINARY, 0)) { syscall_printf ("Opening file failed"); return -1; } } closeit = true; } if (nohandle ()) /* Directory query_open on 9x. */ return 0; gettimeofday (&tmp[0], 0); if (!tvp) { tmp[1] = tmp[0]; tvp = tmp; } timeval_to_filetime (&tvp[0], &lastaccess); timeval_to_filetime (&tvp[1], &lastwrite); debug_printf ("incoming lastaccess %08x %08x", tvp[0].tv_sec, tvp[0].tv_usec); if (is_fs_special ()) SetFileAttributes (pc, (DWORD) pc & ~FILE_ATTRIBUTE_READONLY); BOOL res = SetFileTime (get_handle (), NULL, &lastaccess, &lastwrite); DWORD errcode = GetLastError (); if (is_fs_special ()) SetFileAttributes (pc, pc); /* Opening a directory on a 9x share from a NT machine works(!), but then the SetFileTimes fails with ERROR_NOT_SUPPORTED. Oh well... */ if (!res && errcode != ERROR_NOT_SUPPORTED) { close (); __seterrno_from_win_error (errcode); return -1; } if (closeit) close (); return 0; } fhandler_disk_file::fhandler_disk_file () : fhandler_base () { } fhandler_disk_file::fhandler_disk_file (path_conv &pc) : fhandler_base () { set_name (pc); } int fhandler_disk_file::open (int flags, mode_t mode) { return open_fs (flags, mode); } int fhandler_base::open_fs (int flags, mode_t mode) { if (pc.case_clash && flags & O_CREAT) { debug_printf ("case clash detected"); set_errno (ECASECLASH); return 0; } /* Unfortunately NT allows to open directories for writing, but that's disallowed according to SUSv3. */ if (pc.isdir () && (flags & O_ACCMODE) != O_RDONLY) { set_errno (EISDIR); return 0; } int res = fhandler_base::open (flags | O_DIROPEN, mode); if (!res) goto out; /* This is for file systems known for having a buggy CreateFile call which might return a valid HANDLE without having actually opened the file. The only known file system to date is the SUN NFS Solstice Client 3.1 which returns a valid handle when trying to open a file in a nonexistent directory. */ if (pc.has_buggy_open () && !pc.exists ()) { debug_printf ("Buggy open detected."); close_fs (); set_errno (ENOENT); return 0; } set_fs_flags (pc.fs_flags ()); out: syscall_printf ("%d = fhandler_disk_file::open (%s, %p)", res, get_win32_name (), flags); return res; } int fhandler_disk_file::close () { return close_fs (); } int fhandler_base::close_fs () { int res = fhandler_base::close (); if (!res) user_shared->delqueue.process_queue (); return res; } ssize_t __stdcall fhandler_disk_file::pread (void *buf, size_t count, _off64_t offset) { ssize_t res; _off64_t curpos = lseek (0, SEEK_CUR); if (curpos < 0 || lseek (offset, SEEK_SET) < 0) res = -1; else { size_t tmp_count = count; read (buf, tmp_count); if (lseek (curpos, SEEK_SET) >= 0) res = (ssize_t) tmp_count; else res = -1; } debug_printf ("%d = pread (%p, %d, %d)\n", res, buf, count, offset); return res; } ssize_t __stdcall fhandler_disk_file::pwrite (void *buf, size_t count, _off64_t offset) { int res; _off64_t curpos = lseek (0, SEEK_CUR); if (curpos < 0 || lseek (offset, SEEK_SET) < 0) res = curpos; else { res = (ssize_t) write (buf, count); if (lseek (curpos, SEEK_SET) < 0) res = -1; } debug_printf ("%d = pwrite (%p, %d, %d)\n", res, buf, count, offset); return res; } /* FIXME: The correct way to do this to get POSIX locking semantics is to keep a linked list of posix lock requests and map them into Win32 locks. he problem is that Win32 does not deal correctly with overlapping lock requests. Also another pain is that Win95 doesn't do non-blocking or non-exclusive locks at all. For '95 just convert all lock requests into blocking,exclusive locks. This shouldn't break many apps but denying all locking would. For now just convert to Win32 locks and hope for the best. */ int fhandler_disk_file::lock (int cmd, struct __flock64 *fl) { _off64_t win32_start; _off64_t win32_len; _off64_t startpos; /* * We don't do getlck calls yet. */ if (cmd == F_GETLK) { set_errno (ENOSYS); return -1; } /* * Calculate where in the file to start from, * then adjust this by fl->l_start. */ switch (fl->l_whence) { case SEEK_SET: startpos = 0; break; case SEEK_CUR: if ((startpos = lseek (0, SEEK_CUR)) == ILLEGAL_SEEK) return -1; break; case SEEK_END: { BY_HANDLE_FILE_INFORMATION finfo; if (GetFileInformationByHandle (get_handle (), &finfo) == 0) { __seterrno (); return -1; } startpos = ((_off64_t)finfo.nFileSizeHigh << 32) + finfo.nFileSizeLow; break; } default: set_errno (EINVAL); return -1; } /* * Now the fun starts. Adjust the start and length * fields until they make sense. */ win32_start = startpos + fl->l_start; if (fl->l_len < 0) { win32_start -= fl->l_len; win32_len = -fl->l_len; } else win32_len = fl->l_len; if (win32_start < 0) { /* watch the signs! */ win32_len -= -win32_start; if (win32_len <= 0) { /* Failure ! */ set_errno (EINVAL); return -1; } win32_start = 0; } DWORD off_high, off_low, len_high, len_low; off_low = (DWORD)(win32_start & UINT32_MAX); off_high = (DWORD)(win32_start >> 32); if (win32_len == 0) { /* Special case if len == 0 for POSIX means lock to the end of the entire file (and all future extensions). */ len_low = len_high = UINT32_MAX; } else { len_low = (DWORD)(win32_len & UINT32_MAX); len_high = (DWORD)(win32_len >> 32); } BOOL res; DWORD lock_flags = (cmd == F_SETLK) ? LOCKFILE_FAIL_IMMEDIATELY : 0; lock_flags |= (fl->l_type == F_WRLCK) ? LOCKFILE_EXCLUSIVE_LOCK : 0; OVERLAPPED ov; ov.Internal = 0; ov.InternalHigh = 0; ov.Offset = off_low; ov.OffsetHigh = off_high; ov.hEvent = (HANDLE) 0; if (fl->l_type == F_UNLCK) { res = UnlockFileEx (get_handle (), 0, len_low, len_high, &ov); if (res == 0 && GetLastError () == ERROR_NOT_LOCKED) res = 1; } else { res = LockFileEx (get_handle (), lock_flags, 0, len_low, len_high, &ov); /* Deal with the fail immediately case. */ /* * FIXME !! I think this is the right error to check for * but I must admit I haven't checked.... */ if ((res == 0) && (lock_flags & LOCKFILE_FAIL_IMMEDIATELY) && (GetLastError () == ERROR_LOCK_FAILED)) { set_errno (EAGAIN); return -1; } } if (res == 0) { __seterrno (); return -1; } return 0; } int fhandler_disk_file::mkdir (mode_t mode) { int res = -1; SECURITY_ATTRIBUTES sa = sec_none_nih; security_descriptor sd; if (allow_ntsec && has_acls ()) set_security_attribute (S_IFDIR | ((mode & 07777) & ~cygheap->umask), &sa, sd); if (CreateDirectoryA (get_win32_name (), &sa)) { #ifdef HIDDEN_DOT_FILES char *c = strrchr (real_dir.get_win32 (), '\\'); if ((c && c[1] == '.') || *get_win32_name () == '.') SetFileAttributes (get_win32_name (), FILE_ATTRIBUTE_HIDDEN); #endif res = 0; } else __seterrno (); return res; } int fhandler_disk_file::rmdir () { extern DWORD unlink_nt (path_conv &win32_name, bool setattrs); int res = -1; if (!pc.isdir ()) { set_errno (ENOTDIR); return -1; } /* Even own directories can't be removed if R/O attribute is set. */ if (pc.has_attribute (FILE_ATTRIBUTE_READONLY)) SetFileAttributes (get_win32_name (), (DWORD) pc & ~FILE_ATTRIBUTE_READONLY); DWORD err, att = 0; int rc = !(err = unlink_nt (pc, pc.has_attribute (FILE_ATTRIBUTE_READONLY))); if (err) SetLastError (err); if (isremote () && exists ()) att = GetFileAttributes (get_win32_name ()); /* Sometimes smb indicates failure when it really succeeds, so check for this case specifically. */ if (rc || att == INVALID_FILE_ATTRIBUTES) { /* RemoveDirectory on a samba drive doesn't return an error if the directory can't be removed because it's not empty. Checking for existence afterwards keeps us informed about success. */ if (!isremote () || att == INVALID_FILE_ATTRIBUTES) return 0; err = ERROR_DIR_NOT_EMPTY; } else err = GetLastError (); __seterrno_from_win_error (err); return res; } /* This is the minimal number of entries which fit into the readdir cache. The number of bytes allocated by the cache is determined by this number, To tune caching, just tweak this number. To get a feeling for the size, the size of the readdir cache is DIR_NUM_ENTRIES * 632 + 264 bytes. */ #define DIR_NUM_ENTRIES 100 /* Cache size 63464 bytes */ #define DIR_BUF_SIZE (DIR_NUM_ENTRIES \ * (sizeof (FILE_ID_BOTH_DIR_INFORMATION) \ + 2 * CYG_MAX_PATH)) struct __DIR_cache { char __name[CYG_MAX_PATH]; ULONG __pos; char __cache[DIR_BUF_SIZE]; }; #define d_dirname(d) (((__DIR_cache *) (d)->__d_dirname)->__name) #define d_cachepos(d) (((__DIR_cache *) (d)->__d_dirname)->__pos) #define d_cache(d) (((__DIR_cache *) (d)->__d_dirname)->__cache) #define d_mounts(d) ((__DIR_mounts *) (d)->__d_internal) DIR * fhandler_disk_file::opendir () { DIR *dir; DIR *res = NULL; size_t len; if (!pc.isdir ()) set_errno (ENOTDIR); else if ((len = strlen (pc)) > CYG_MAX_PATH - 3) set_errno (ENAMETOOLONG); else if ((dir = (DIR *) malloc (sizeof (DIR))) == NULL) set_errno (ENOMEM); else if ((dir->__d_dirname = (char *) malloc ( sizeof (struct __DIR_cache))) == NULL) { set_errno (ENOMEM); goto free_dir; } else if ((dir->__d_dirent = (struct dirent *) malloc (sizeof (struct dirent))) == NULL) { set_errno (ENOMEM); goto free_dirname; } else { strcpy (d_dirname (dir), get_win32_name ()); dir->__d_dirent->__d_version = __DIRENT_VERSION; cygheap_fdnew fd; if (fd < 0) goto free_dirent; /* FindFirstFile doesn't seem to like duplicate /'s. The dirname is generated with trailing backslash here which simplifies later usage of dirname for checking symlinks. Appending a "*" is moved right before calling FindFirstFile. Since FindFirstFile is only called once, this should even be a teeny little bit faster. */ len = strlen (d_dirname (dir)); if (len && !isdirsep (d_dirname (dir)[len - 1])) strcpy (d_dirname (dir) + len, "\\"); dir->__d_cookie = __DIRENT_COOKIE; dir->__handle = INVALID_HANDLE_VALUE; dir->__d_position = 0; dir->__flags = (pc.normalized_path[0] == '/' && pc.normalized_path[1] == '\0') ? dirent_isroot : 0; dir->__d_internal = (unsigned) new __DIR_mounts (pc.normalized_path); d_cachepos (dir) = 0; if (!pc.iscygdrive ()) { OBJECT_ATTRIBUTES attr; WCHAR wpath[CYG_MAX_PATH + 10]; UNICODE_STRING upath = {0, sizeof (wpath), wpath}; IO_STATUS_BLOCK io; NTSTATUS status; SECURITY_ATTRIBUTES sa = sec_none; pc.get_nt_native_path (upath); InitializeObjectAttributes (&attr, &upath, OBJ_CASE_INSENSITIVE | OBJ_INHERIT, NULL, sa.lpSecurityDescriptor); status = NtOpenFile (&dir->__handle, SYNCHRONIZE | FILE_LIST_DIRECTORY, &attr, &io, FILE_SHARE_VALID_FLAGS, FILE_SYNCHRONOUS_IO_NONALERT | FILE_OPEN_FOR_BACKUP_INTENT | FILE_DIRECTORY_FILE); if (!NT_SUCCESS (status)) { __seterrno_from_nt_status (status); goto free_mounts; } /* FileIdBothDirectoryInformation is apparently unsupported on XP when accessing directories on UDF. When trying to use it so, NtQueryDirectoryFile returns with STATUS_ACCESS_VIOLATION. It's not clear if the call isn't also unsupported on other OS/FS combinations (say, Win2K/CDFS or so). Instead of testing in readdir for yet another error code, let's use FileIdBothDirectoryInformation only on filesystems supporting persistent ACLs, FileBothDirectoryInformation otherwise. */ if (pc.hasgood_inode ()) { dir->__flags |= dirent_set_d_ino; if (wincap.has_fileid_dirinfo ()) dir->__flags |= dirent_get_d_ino; } } /* Filling fd with `this' (aka storing this in the file descriptor table should only happen after it's clear that opendir doesn't fail, otherwise we end up cfree'ing the fhandler twice, once in opendir() in dir.cc, the second time on exit. Nasty, nasty... */ fd = this; fd->nohandle (true); dir->__d_fd = fd; dir->__fh = this; res = dir; } syscall_printf ("%p = opendir (%s)", res, get_name ()); return res; free_mounts: delete d_mounts (dir); free_dirent: free (dir->__d_dirent); free_dirname: free (dir->__d_dirname); free_dir: free (dir); return res; } int fhandler_disk_file::readdir_helper (DIR *dir, dirent *de, DWORD w32_err, DWORD attr, char *fname) { if (w32_err) { bool added = false; if ((de->d_ino = d_mounts (dir)->check_missing_mount (fname))) added = true; if (!added) return geterrno_from_win_error (w32_err); attr = 0; dir->__flags &= ~dirent_set_d_ino; } /* Check for Windows shortcut. If it's a Cygwin or U/WIN symlink, drop the .lnk suffix. */ if (attr & FILE_ATTRIBUTE_READONLY) { char *c = fname; char *e = strchr (fname, '\0') - 4; if (e > c && strcasematch (e, ".lnk")) { char fbuf[CYG_MAX_PATH]; strcpy (fbuf, d_dirname (dir)); strcat (fbuf, c); path_conv fpath (fbuf, PC_SYM_NOFOLLOW); if (fpath.issymlink () || fpath.is_fs_special ()) *e = '\0'; } } if (pc.isencoded ()) fnunmunge (de->d_name, fname); else strcpy (de->d_name, fname); if (dir->__d_position == 0 && !strcmp (fname, ".")) dir->__flags |= dirent_saw_dot; else if (dir->__d_position == 1 && !strcmp (fname, "..")) dir->__flags |= dirent_saw_dot_dot; return 0; } static inline __ino64_t readdir_get_ino_by_handle (HANDLE hdl) { IO_STATUS_BLOCK io; FILE_INTERNAL_INFORMATION pfai; if (!NtQueryInformationFile (hdl, &io, &pfai, sizeof pfai, FileInternalInformation)) return pfai.FileId.QuadPart; return 0; } __ino64_t __stdcall readdir_get_ino (DIR *dir, const char *path, bool dot_dot) { char fname[CYG_MAX_PATH]; struct __stat64 st; HANDLE hdl; __ino64_t ino = 0; if (!(dir->__flags & dirent_isroot)) { strcpy (fname, path); if (dot_dot) strcat (fname, (*fname && fname[strlen (fname) - 1] == '/') ? ".." : "/.."); path_conv pc (fname, PC_SYM_NOFOLLOW); if (pc.isspecial ()) { if (!lstat64 (fname, &st)) ino = st.st_ino; } else if (!pc.hasgood_inode ()) ino = hash_path_name (0, pc); else if ((hdl = CreateFile (pc, GENERIC_READ, FILE_SHARE_VALID_FLAGS, NULL, OPEN_EXISTING, FILE_FLAG_BACKUP_SEMANTICS, NULL)) != INVALID_HANDLE_VALUE) { ino = readdir_get_ino_by_handle (hdl); CloseHandle (hdl); } } else ino = readdir_get_ino_by_handle (dir->__handle); return ino; } int fhandler_disk_file::readdir (DIR *dir, dirent *de) { int res = 0; NTSTATUS status = STATUS_SUCCESS; PFILE_ID_BOTH_DIR_INFORMATION buf = NULL; wchar_t *FileName; char fname[CYG_MAX_PATH]; IO_STATUS_BLOCK io; /* d_cachepos always refers to the next cache entry to use. If it's 0 we must reload the cache. */ if (d_cachepos (dir) == 0) { if ((dir->__flags & dirent_get_d_ino)) { status = NtQueryDirectoryFile (dir->__handle, NULL, NULL, 0, &io, d_cache (dir), DIR_BUF_SIZE, FileIdBothDirectoryInformation, FALSE, NULL, dir->__d_position == 0); /* FileIdBothDirectoryInformation isn't supported for remote drives on NT4 and 2K systems, and it's also not supported on 2K at all, when accessing network drives on any remote OS. We just fall back to using a standard directory query in this case and note this case using the dirent_get_d_ino flag. */ if (status == STATUS_INVALID_LEVEL || status == STATUS_INVALID_PARAMETER || status == STATUS_INVALID_INFO_CLASS) dir->__flags &= ~dirent_get_d_ino; /* Something weird happens on Samba up to version 3.0.21c, which is fixed in 3.0.22. FileIdBothDirectoryInformation seems to work nicely, but only up to the 128th entry in the directory. After reaching this entry, the next call to NtQueryDirectoryFile (FileIdBothDirectoryInformation) returns STATUS_INVALID_LEVEL. Why should we care, we can just switch to FileBothDirectoryInformation, isn't it? Nope! The next call to NtQueryDirectoryFile(FileBothDirectoryInformation) actually returns STATUS_NO_MORE_FILES, regardless how many files are left unread in the directory. This does not happen when using FileBothDirectoryInformation right from the start, but since we can't decide whether the server we're talking with has this bug or not, we end up serving Samba shares always in the slow mode using FileBothDirectoryInformation. So, what we do here is to implement the solution suggested by Andrew Tridgell, we just reread all entries up to dir->d_position using FileBothDirectoryInformation. However, We do *not* mark this server as broken and fall back to using FileBothDirectoryInformation further on. This would slow down every access to such a server, even for directories under 128 entries. Also, bigger dirs only suffer from one additional call per full directory scan, which shouldn't be too big a hit. This can easily be changed if necessary. */ if (status == STATUS_INVALID_LEVEL && dir->__d_position) { d_cachepos (dir) = 0; for (int cnt = 0; cnt < dir->__d_position; ++cnt) { if (d_cachepos (dir) == 0) { status = NtQueryDirectoryFile (dir->__handle, NULL, NULL, 0, &io, d_cache (dir), DIR_BUF_SIZE, FileBothDirectoryInformation, FALSE, NULL, cnt == 0); if (!NT_SUCCESS (status)) goto go_ahead; } buf = (PFILE_ID_BOTH_DIR_INFORMATION) (d_cache (dir) + d_cachepos (dir)); if (buf->NextEntryOffset == 0) d_cachepos (dir) = 0; else d_cachepos (dir) += buf->NextEntryOffset; } goto go_ahead; } } if (!(dir->__flags & dirent_get_d_ino)) status = NtQueryDirectoryFile (dir->__handle, NULL, NULL, 0, &io, d_cache (dir), DIR_BUF_SIZE, FileBothDirectoryInformation, FALSE, NULL, dir->__d_position == 0); } go_ahead: if (!NT_SUCCESS (status)) debug_printf ("NtQueryDirectoryFile failed, status %p, win32 error %lu", status, RtlNtStatusToDosError (status)); else { buf = (PFILE_ID_BOTH_DIR_INFORMATION) (d_cache (dir) + d_cachepos (dir)); if (buf->NextEntryOffset == 0) d_cachepos (dir) = 0; else d_cachepos (dir) += buf->NextEntryOffset; if ((dir->__flags & dirent_get_d_ino)) { FileName = buf->FileName; if ((dir->__flags & dirent_set_d_ino)) de->d_ino = buf->FileId.QuadPart; } else FileName = ((PFILE_BOTH_DIR_INFORMATION) buf)->FileName; sys_wcstombs (fname, CYG_MAX_PATH - 1, FileName, buf->FileNameLength / 2); de->d_ino = d_mounts (dir)->check_mount (fname, de->d_ino); if (de->d_ino == 0 && (dir->__flags & dirent_set_d_ino)) { OBJECT_ATTRIBUTES attr; if (dir->__d_position == 0 && buf->FileNameLength == 2 && FileName[0] == '.') de->d_ino = readdir_get_ino_by_handle (dir->__handle); else if (dir->__d_position == 1 && buf->FileNameLength == 4 && FileName[0] == '.' && FileName[1] == '.') de->d_ino = readdir_get_ino (dir, pc.normalized_path, true); else { HANDLE hdl; UNICODE_STRING upath = {buf->FileNameLength, CYG_MAX_PATH * 2, FileName}; InitializeObjectAttributes (&attr, &upath, OBJ_CASE_INSENSITIVE, dir->__handle , NULL); if (!NtOpenFile (&hdl, READ_CONTROL, &attr, &io, FILE_SHARE_VALID_FLAGS, FILE_OPEN_FOR_BACKUP_INTENT)) { de->d_ino = readdir_get_ino_by_handle (hdl); CloseHandle (hdl); } } /* Enforce namehash as inode number on untrusted file systems. */ if (!pc.isgood_inode (de->d_ino)) { dir->__flags &= ~dirent_set_d_ino; de->d_ino = 0; } } } if (!(res = readdir_helper (dir, de, RtlNtStatusToDosError (status), buf ? buf->FileAttributes : 0, fname))) dir->__d_position++; else if (!(dir->__flags & dirent_saw_dot)) { strcpy (de->d_name , "."); de->d_ino = readdir_get_ino_by_handle (dir->__handle); dir->__d_position++; dir->__flags |= dirent_saw_dot; res = 0; } else if (!(dir->__flags & dirent_saw_dot_dot)) { strcpy (de->d_name , ".."); de->d_ino = readdir_get_ino (dir, pc.normalized_path, true); dir->__d_position++; dir->__flags |= dirent_saw_dot_dot; res = 0; } syscall_printf ("%d = readdir (%p, %p) (%s)", res, dir, &de, res ? "***" : de->d_name); return res; } _off64_t fhandler_disk_file::telldir (DIR *dir) { return dir->__d_position; } void fhandler_disk_file::seekdir (DIR *dir, _off64_t loc) { rewinddir (dir); while (loc > dir->__d_position) if (!::readdir (dir)) break; } void fhandler_disk_file::rewinddir (DIR *dir) { d_cachepos (dir) = 0; if (wincap.has_buggy_restart_scan () && isremote ()) { /* This works around a W2K bug. The RestartScan parameter in calls to NtQueryDirectoryFile on remote shares is ignored, thus resulting in not being able to rewind on remote shares. By reopening the directory, we get a fresh new directory pointer. */ UNICODE_STRING fname = {0, CYG_MAX_PATH * 2, (WCHAR *) L""}; OBJECT_ATTRIBUTES attr; NTSTATUS status; IO_STATUS_BLOCK io; HANDLE new_dir; InitializeObjectAttributes (&attr, &fname, OBJ_CASE_INSENSITIVE, dir->__handle, NULL); status = NtOpenFile (&new_dir, SYNCHRONIZE | FILE_LIST_DIRECTORY, &attr, &io, FILE_SHARE_VALID_FLAGS, FILE_SYNCHRONOUS_IO_NONALERT | FILE_OPEN_FOR_BACKUP_INTENT | FILE_DIRECTORY_FILE); if (!NT_SUCCESS (stat)) debug_printf ("Unable to reopen dir %s, NT error: 0x%08x, " "win32: %lu", get_name (), status, RtlNtStatusToDosError (status)); else { CloseHandle (dir->__handle); dir->__handle = new_dir; } } dir->__d_position = 0; d_mounts (dir)->rewind (); } int fhandler_disk_file::closedir (DIR *dir) { int res = 0; NTSTATUS status; delete d_mounts (dir); if (!dir->__handle) /* ignore */; else if (dir->__handle == INVALID_HANDLE_VALUE) { set_errno (EBADF); res = -1; } else if (!NT_SUCCESS (status = NtClose (dir->__handle))) { __seterrno_from_nt_status (status); res = -1; } syscall_printf ("%d = closedir (%p, %s)", res, dir, get_name ()); return res; } fhandler_cygdrive::fhandler_cygdrive () : fhandler_disk_file (), ndrives (0), pdrive (NULL) { } int fhandler_cygdrive::open (int flags, mode_t mode) { if ((flags & (O_CREAT | O_EXCL)) == (O_CREAT | O_EXCL)) { set_errno (EEXIST); return 0; } if (flags & O_WRONLY) { set_errno (EISDIR); return 0; } flags |= O_DIROPEN; set_flags (flags); nohandle (true); return 1; } int fhandler_cygdrive::close () { return 0; } #define DRVSZ sizeof ("x:\\") void fhandler_cygdrive::set_drives () { const int len = 2 + 26 * DRVSZ; char *p = const_cast (get_win32_name ()); pdrive = p; ndrives = GetLogicalDriveStrings (len, p) / DRVSZ; } int fhandler_cygdrive::fstat (struct __stat64 *buf) { buf->st_mode = S_IFDIR | 0555; buf->st_ino = 2; buf->st_nlink = 1; return 0; } DIR * fhandler_cygdrive::opendir () { DIR *dir; dir = fhandler_disk_file::opendir (); if (dir && !ndrives) set_drives (); return dir; } int fhandler_cygdrive::readdir (DIR *dir, dirent *de) { while (true) { if (!pdrive || !*pdrive) { if (!(dir->__flags & dirent_saw_dot)) { de->d_name[0] = '.'; de->d_name[1] = '\0'; de->d_ino = 2; } return ENMFILE; } if (GetFileAttributes (pdrive) != INVALID_FILE_ATTRIBUTES) break; pdrive = strchr (pdrive, '\0') + 1; } *de->d_name = cyg_tolower (*pdrive); de->d_name[1] = '\0'; de->d_ino = readdir_get_ino (dir, pdrive, false); dir->__d_position++; pdrive = strchr (pdrive, '\0') + 1; syscall_printf ("%p = readdir (%p) (%s)", &de, dir, de->d_name); return 0; } void fhandler_cygdrive::rewinddir (DIR *dir) { pdrive = get_win32_name (); dir->__d_position = 0; } int fhandler_cygdrive::closedir (DIR *dir) { pdrive = get_win32_name (); return 0; }