Skip to content

Commit 73265df

Browse files
benpeartGit for Windows Build Agent
authored andcommitted
fscache: teach fscache to use NtQueryDirectoryFile
Using FindFirstFileExW() requires the OS to allocate a 64K buffer for each directory and then free it when we call FindClose(). Update fscache to call the underlying kernel API NtQueryDirectoryFile so that we can do the buffer management ourselves. That allows us to allocate a single buffer for the lifetime of the cache and reuse it for each directory. This change improves performance of 'git status' by 18% in a repo with ~200K files and 30k folders. Documentation for NtQueryDirectoryFile can be found at: https://docs.microsoft.com/en-us/windows-hardware/drivers/ddi/content/ntifs/nf-ntifs-ntquerydirectoryfile https://docs.microsoft.com/en-us/windows/desktop/FileIO/file-attribute-constants https://docs.microsoft.com/en-us/windows/desktop/fileio/reparse-point-tags To determine if the specified directory is a symbolic link, inspect the FileAttributes member to see if the FILE_ATTRIBUTE_REPARSE_POINT flag is set. If so, EaSize will contain the reparse tag (this is a so far undocumented feature, but confirmed by the NTFS developers). To determine if the reparse point is a symbolic link (and not some other form of reparse point), test whether the tag value equals the value IO_REPARSE_TAG_SYMLINK. The NtQueryDirectoryFile() call works best (and on Windows 8.1 and earlier, it works *only*) with buffer sizes up to 64kB. Which is 32k wide characters, so let's use that as our buffer size. Signed-off-by: Ben Peart <[email protected]> Signed-off-by: Johannes Schindelin <[email protected]>
1 parent 1de83ad commit 73265df

File tree

2 files changed

+224
-30
lines changed

2 files changed

+224
-30
lines changed

compat/win32/fscache.c

Lines changed: 93 additions & 30 deletions
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@
77
#include "../../trace.h"
88
#include "config.h"
99
#include "../../mem-pool.h"
10+
#include "ntifs.h"
1011

1112
static volatile long initialized;
1213
static DWORD dwTlsIndex;
@@ -26,6 +27,13 @@ struct fscache {
2627
unsigned int opendir_requests;
2728
unsigned int fscache_requests;
2829
unsigned int fscache_misses;
30+
/*
31+
* 32k wide characters translates to 64kB, which is the maximum that
32+
* Windows 8.1 and earlier can handle. On network drives, not only
33+
* the client's Windows version matters, but also the server's,
34+
* therefore we need to keep this to 64kB.
35+
*/
36+
WCHAR buffer[32 * 1024];
2937
};
3038
static struct trace_key trace_fscache = TRACE_KEY_INIT(FSCACHE);
3139

@@ -166,27 +174,44 @@ static void fsentry_release(struct fsentry *fse)
166174
InterlockedDecrement(&(fse->u.refcnt));
167175
}
168176

177+
static int xwcstoutfn(char *utf, int utflen, const wchar_t *wcs, int wcslen)
178+
{
179+
if (!wcs || !utf || utflen < 1) {
180+
errno = EINVAL;
181+
return -1;
182+
}
183+
utflen = WideCharToMultiByte(CP_UTF8, 0, wcs, wcslen, utf, utflen, NULL, NULL);
184+
if (utflen)
185+
return utflen;
186+
errno = ERANGE;
187+
return -1;
188+
}
189+
169190
/*
170-
* Allocate and initialize an fsentry from a WIN32_FIND_DATA structure.
191+
* Allocate and initialize an fsentry from a FILE_FULL_DIR_INFORMATION structure.
171192
*/
172193
static struct fsentry *fseentry_create_entry(struct fscache *cache,
173194
struct fsentry *list,
174-
const WIN32_FIND_DATAW *fdata)
195+
PFILE_FULL_DIR_INFORMATION fdata)
175196
{
176197
char buf[MAX_PATH * 3];
177198
int len;
178199
struct fsentry *fse;
179-
len = xwcstoutf(buf, fdata->cFileName, ARRAY_SIZE(buf));
200+
201+
len = xwcstoutfn(buf, ARRAY_SIZE(buf), fdata->FileName, fdata->FileNameLength / sizeof(wchar_t));
180202

181203
fse = fsentry_alloc(cache, list, buf, len);
182204

183-
fse->st_mode = file_attr_to_st_mode(fdata->dwFileAttributes);
205+
fse->st_mode = file_attr_to_st_mode(fdata->FileAttributes);
184206
fse->dirent.d_type = S_ISDIR(fse->st_mode) ? DT_DIR : DT_REG;
185-
fse->u.s.st_size = (((off64_t) (fdata->nFileSizeHigh)) << 32)
186-
| fdata->nFileSizeLow;
187-
filetime_to_timespec(&(fdata->ftLastAccessTime), &(fse->u.s.st_atim));
188-
filetime_to_timespec(&(fdata->ftLastWriteTime), &(fse->u.s.st_mtim));
189-
filetime_to_timespec(&(fdata->ftCreationTime), &(fse->u.s.st_ctim));
207+
fse->u.s.st_size = fdata->EndOfFile.LowPart |
208+
(((off_t)fdata->EndOfFile.HighPart) << 32);
209+
filetime_to_timespec((FILETIME *)&(fdata->LastAccessTime),
210+
&(fse->u.s.st_atim));
211+
filetime_to_timespec((FILETIME *)&(fdata->LastWriteTime),
212+
&(fse->u.s.st_mtim));
213+
filetime_to_timespec((FILETIME *)&(fdata->CreationTime),
214+
&(fse->u.s.st_ctim));
190215

191216
return fse;
192217
}
@@ -199,8 +224,10 @@ static struct fsentry *fseentry_create_entry(struct fscache *cache,
199224
static struct fsentry *fsentry_create_list(struct fscache *cache, const struct fsentry *dir,
200225
int *dir_not_found)
201226
{
202-
wchar_t pattern[MAX_PATH + 2]; /* + 2 for '/' '*' */
203-
WIN32_FIND_DATAW fdata;
227+
wchar_t pattern[MAX_PATH];
228+
NTSTATUS status;
229+
IO_STATUS_BLOCK iosb;
230+
PFILE_FULL_DIR_INFORMATION di;
204231
HANDLE h;
205232
int wlen;
206233
struct fsentry *list, **phead;
@@ -216,15 +243,18 @@ static struct fsentry *fsentry_create_list(struct fscache *cache, const struct f
216243
return NULL;
217244
}
218245

219-
/* append optional '/' and wildcard '*' */
220-
if (wlen)
221-
pattern[wlen++] = '/';
222-
pattern[wlen++] = '*';
223-
pattern[wlen] = 0;
246+
/* handle CWD */
247+
if (!wlen) {
248+
wlen = GetCurrentDirectoryW(ARRAY_SIZE(pattern), pattern);
249+
if (!wlen || wlen >= (ssize_t)ARRAY_SIZE(pattern)) {
250+
errno = wlen ? ENAMETOOLONG : err_win_to_posix(GetLastError());
251+
return NULL;
252+
}
253+
}
224254

225-
/* open find handle */
226-
h = FindFirstFileExW(pattern, FindExInfoBasic, &fdata, FindExSearchNameMatch,
227-
NULL, FIND_FIRST_EX_LARGE_FETCH);
255+
h = CreateFileW(pattern, FILE_LIST_DIRECTORY,
256+
FILE_SHARE_READ | FILE_SHARE_WRITE | FILE_SHARE_DELETE,
257+
NULL, OPEN_EXISTING, FILE_FLAG_BACKUP_SEMANTICS, NULL);
228258
if (h == INVALID_HANDLE_VALUE) {
229259
err = GetLastError();
230260
*dir_not_found = 1; /* or empty directory */
@@ -241,22 +271,55 @@ static struct fsentry *fsentry_create_list(struct fscache *cache, const struct f
241271

242272
/* walk directory and build linked list of fsentry structures */
243273
phead = &list->next;
244-
do {
245-
*phead = fseentry_create_entry(cache, list, &fdata);
274+
status = NtQueryDirectoryFile(h, NULL, 0, 0, &iosb, cache->buffer,
275+
sizeof(cache->buffer), FileFullDirectoryInformation, FALSE, NULL, FALSE);
276+
if (!NT_SUCCESS(status)) {
277+
/*
278+
* NtQueryDirectoryFile returns STATUS_INVALID_PARAMETER when
279+
* asked to enumerate an invalid directory (ie it is a file
280+
* instead of a directory). Verify that is the actual cause
281+
* of the error.
282+
*/
283+
if (status == (NTSTATUS)STATUS_INVALID_PARAMETER) {
284+
DWORD attributes = GetFileAttributesW(pattern);
285+
if (!(attributes & FILE_ATTRIBUTE_DIRECTORY))
286+
status = ERROR_DIRECTORY;
287+
}
288+
goto Error;
289+
}
290+
di = (PFILE_FULL_DIR_INFORMATION)(cache->buffer);
291+
for (;;) {
292+
293+
*phead = fseentry_create_entry(cache, list, di);
246294
phead = &(*phead)->next;
247-
} while (FindNextFileW(h, &fdata));
248295

249-
/* remember result of last FindNextFile, then close find handle */
250-
err = GetLastError();
251-
FindClose(h);
296+
/* If there is no offset in the entry, the buffer has been exhausted. */
297+
if (di->NextEntryOffset == 0) {
298+
status = NtQueryDirectoryFile(h, NULL, 0, 0, &iosb, cache->buffer,
299+
sizeof(cache->buffer), FileFullDirectoryInformation, FALSE, NULL, FALSE);
300+
if (!NT_SUCCESS(status)) {
301+
if (status == STATUS_NO_MORE_FILES)
302+
break;
303+
goto Error;
304+
}
305+
306+
di = (PFILE_FULL_DIR_INFORMATION)(cache->buffer);
307+
continue;
308+
}
309+
310+
/* Advance to the next entry. */
311+
di = (PFILE_FULL_DIR_INFORMATION)(((PUCHAR)di) + di->NextEntryOffset);
312+
}
252313

253-
/* return the list if we've got all the files */
254-
if (err == ERROR_NO_MORE_FILES)
255-
return list;
314+
CloseHandle(h);
315+
return list;
256316

257-
/* otherwise release the list and return error */
317+
Error:
318+
trace_printf_key(&trace_fscache,
319+
"fscache: status(%ld) unable to query directory "
320+
"contents '%s'\n", status, dir->dirent.d_name);
321+
CloseHandle(h);
258322
fsentry_release(list);
259-
errno = err_win_to_posix(err);
260323
return NULL;
261324
}
262325

compat/win32/ntifs.h

Lines changed: 131 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,131 @@
1+
#ifndef _NTIFS_
2+
#define _NTIFS_
3+
4+
/*
5+
* Copy necessary structures and definitions out of the Windows DDK
6+
* to enable calling NtQueryDirectoryFile()
7+
*/
8+
9+
typedef _Return_type_success_(return >= 0) LONG NTSTATUS;
10+
#define NT_SUCCESS(Status) (((NTSTATUS)(Status)) >= 0)
11+
12+
#if !defined(_NTSECAPI_) && !defined(_WINTERNL_) && \
13+
!defined(__UNICODE_STRING_DEFINED)
14+
#define __UNICODE_STRING_DEFINED
15+
typedef struct _UNICODE_STRING {
16+
USHORT Length;
17+
USHORT MaximumLength;
18+
PWSTR Buffer;
19+
} UNICODE_STRING;
20+
typedef UNICODE_STRING *PUNICODE_STRING;
21+
typedef const UNICODE_STRING *PCUNICODE_STRING;
22+
#endif /* !_NTSECAPI_ && !_WINTERNL_ && !__UNICODE_STRING_DEFINED */
23+
24+
typedef enum _FILE_INFORMATION_CLASS {
25+
FileDirectoryInformation = 1,
26+
FileFullDirectoryInformation,
27+
FileBothDirectoryInformation,
28+
FileBasicInformation,
29+
FileStandardInformation,
30+
FileInternalInformation,
31+
FileEaInformation,
32+
FileAccessInformation,
33+
FileNameInformation,
34+
FileRenameInformation,
35+
FileLinkInformation,
36+
FileNamesInformation,
37+
FileDispositionInformation,
38+
FilePositionInformation,
39+
FileFullEaInformation,
40+
FileModeInformation,
41+
FileAlignmentInformation,
42+
FileAllInformation,
43+
FileAllocationInformation,
44+
FileEndOfFileInformation,
45+
FileAlternateNameInformation,
46+
FileStreamInformation,
47+
FilePipeInformation,
48+
FilePipeLocalInformation,
49+
FilePipeRemoteInformation,
50+
FileMailslotQueryInformation,
51+
FileMailslotSetInformation,
52+
FileCompressionInformation,
53+
FileObjectIdInformation,
54+
FileCompletionInformation,
55+
FileMoveClusterInformation,
56+
FileQuotaInformation,
57+
FileReparsePointInformation,
58+
FileNetworkOpenInformation,
59+
FileAttributeTagInformation,
60+
FileTrackingInformation,
61+
FileIdBothDirectoryInformation,
62+
FileIdFullDirectoryInformation,
63+
FileValidDataLengthInformation,
64+
FileShortNameInformation,
65+
FileIoCompletionNotificationInformation,
66+
FileIoStatusBlockRangeInformation,
67+
FileIoPriorityHintInformation,
68+
FileSfioReserveInformation,
69+
FileSfioVolumeInformation,
70+
FileHardLinkInformation,
71+
FileProcessIdsUsingFileInformation,
72+
FileNormalizedNameInformation,
73+
FileNetworkPhysicalNameInformation,
74+
FileIdGlobalTxDirectoryInformation,
75+
FileIsRemoteDeviceInformation,
76+
FileAttributeCacheInformation,
77+
FileNumaNodeInformation,
78+
FileStandardLinkInformation,
79+
FileRemoteProtocolInformation,
80+
FileMaximumInformation
81+
} FILE_INFORMATION_CLASS, *PFILE_INFORMATION_CLASS;
82+
83+
typedef struct _FILE_FULL_DIR_INFORMATION {
84+
ULONG NextEntryOffset;
85+
ULONG FileIndex;
86+
LARGE_INTEGER CreationTime;
87+
LARGE_INTEGER LastAccessTime;
88+
LARGE_INTEGER LastWriteTime;
89+
LARGE_INTEGER ChangeTime;
90+
LARGE_INTEGER EndOfFile;
91+
LARGE_INTEGER AllocationSize;
92+
ULONG FileAttributes;
93+
ULONG FileNameLength;
94+
ULONG EaSize;
95+
WCHAR FileName[1];
96+
} FILE_FULL_DIR_INFORMATION, *PFILE_FULL_DIR_INFORMATION;
97+
98+
typedef struct _IO_STATUS_BLOCK {
99+
union {
100+
NTSTATUS Status;
101+
PVOID Pointer;
102+
} u;
103+
ULONG_PTR Information;
104+
} IO_STATUS_BLOCK, *PIO_STATUS_BLOCK;
105+
106+
typedef VOID
107+
(NTAPI *PIO_APC_ROUTINE)(
108+
IN PVOID ApcContext,
109+
IN PIO_STATUS_BLOCK IoStatusBlock,
110+
IN ULONG Reserved);
111+
112+
NTSYSCALLAPI
113+
NTSTATUS
114+
NTAPI
115+
NtQueryDirectoryFile(
116+
_In_ HANDLE FileHandle,
117+
_In_opt_ HANDLE Event,
118+
_In_opt_ PIO_APC_ROUTINE ApcRoutine,
119+
_In_opt_ PVOID ApcContext,
120+
_Out_ PIO_STATUS_BLOCK IoStatusBlock,
121+
_Out_writes_bytes_(Length) PVOID FileInformation,
122+
_In_ ULONG Length,
123+
_In_ FILE_INFORMATION_CLASS FileInformationClass,
124+
_In_ BOOLEAN ReturnSingleEntry,
125+
_In_opt_ PUNICODE_STRING FileName,
126+
_In_ BOOLEAN RestartScan
127+
);
128+
129+
#define STATUS_NO_MORE_FILES ((NTSTATUS)0x80000006L)
130+
131+
#endif

0 commit comments

Comments
 (0)