]> git.ipfire.org Git - thirdparty/git.git/blame - fsmonitor.c
fsm-listen-darwin: shutdown daemon if worktree root is moved/renamed
[thirdparty/git.git] / fsmonitor.c
CommitLineData
883e248b
BP
1#include "cache.h"
2#include "config.h"
3#include "dir.h"
4#include "ewah/ewok.h"
5#include "fsmonitor.h"
1e0ea5c4 6#include "fsmonitor-ipc.h"
883e248b
BP
7#include "run-command.h"
8#include "strbuf.h"
9
56c69100
KW
/*
 * Versions of the on-disk fsmonitor index extension understood by
 * read_fsmonitor_extension(): version 1 carries a 64-bit timestamp,
 * version 2 carries a NUL-terminated token string.
 */
#define INDEX_EXTENSION_VERSION1 1
#define INDEX_EXTENSION_VERSION2 2

/*
 * Protocol versions of the fsmonitor hook; the chosen version is passed
 * to the hook as its first argument.
 */
#define HOOK_INTERFACE_VERSION1 1
#define HOOK_INTERFACE_VERSION2 2
883e248b
BP
14
15struct trace_key trace_fsmonitor = TRACE_KEY_INIT(FSMONITOR);
16
cae70acf
DS
17static void assert_index_minimum(struct index_state *istate, size_t pos)
18{
19 if (pos > istate->cache_nr)
20 BUG("fsmonitor_dirty has more entries than the index (%"PRIuMAX" > %u)",
21 (uintmax_t)pos, istate->cache_nr);
22}
23
883e248b
BP
24static void fsmonitor_ewah_callback(size_t pos, void *is)
25{
26 struct index_state *istate = (struct index_state *)is;
3444ec2e 27 struct cache_entry *ce;
883e248b 28
cae70acf 29 assert_index_minimum(istate, pos + 1);
3444ec2e
WB
30
31 ce = istate->cache[pos];
883e248b
BP
32 ce->ce_flags &= ~CE_FSMONITOR_VALID;
33}
34
8da2c576
KW
35static int fsmonitor_hook_version(void)
36{
37 int hook_version;
38
39 if (git_config_get_int("core.fsmonitorhookversion", &hook_version))
40 return -1;
41
42 if (hook_version == HOOK_INTERFACE_VERSION1 ||
43 hook_version == HOOK_INTERFACE_VERSION2)
44 return hook_version;
45
46 warning("Invalid hook version '%i' in core.fsmonitorhookversion. "
47 "Must be 1 or 2.", hook_version);
48 return -1;
49}
50
883e248b
BP
51int read_fsmonitor_extension(struct index_state *istate, const void *data,
52 unsigned long sz)
53{
54 const char *index = data;
55 uint32_t hdr_version;
56 uint32_t ewah_size;
57 struct ewah_bitmap *fsmonitor_dirty;
883e248b 58 int ret;
56c69100
KW
59 uint64_t timestamp;
60 struct strbuf last_update = STRBUF_INIT;
883e248b 61
56c69100 62 if (sz < sizeof(uint32_t) + 1 + sizeof(uint32_t))
883e248b
BP
63 return error("corrupt fsmonitor extension (too short)");
64
65 hdr_version = get_be32(index);
66 index += sizeof(uint32_t);
56c69100
KW
67 if (hdr_version == INDEX_EXTENSION_VERSION1) {
68 timestamp = get_be64(index);
69 strbuf_addf(&last_update, "%"PRIu64"", timestamp);
70 index += sizeof(uint64_t);
71 } else if (hdr_version == INDEX_EXTENSION_VERSION2) {
72 strbuf_addstr(&last_update, index);
73 index += last_update.len + 1;
74 } else {
883e248b 75 return error("bad fsmonitor version %d", hdr_version);
56c69100 76 }
883e248b 77
56c69100 78 istate->fsmonitor_last_update = strbuf_detach(&last_update, NULL);
883e248b
BP
79
80 ewah_size = get_be32(index);
81 index += sizeof(uint32_t);
82
83 fsmonitor_dirty = ewah_new();
84 ret = ewah_read_mmap(fsmonitor_dirty, index, ewah_size);
85 if (ret != ewah_size) {
86 ewah_free(fsmonitor_dirty);
87 return error("failed to parse ewah bitmap reading fsmonitor index extension");
88 }
ba1b9cac 89 istate->fsmonitor_dirty = fsmonitor_dirty;
883e248b 90
cae70acf
DS
91 if (!istate->split_index)
92 assert_index_minimum(istate, istate->fsmonitor_dirty->bit_size);
3444ec2e 93
29fbbf43
JH
94 trace2_data_string("index", NULL, "extension/fsmn/read/token",
95 istate->fsmonitor_last_update);
96 trace_printf_key(&trace_fsmonitor,
97 "read fsmonitor extension successful '%s'",
98 istate->fsmonitor_last_update);
883e248b
BP
99 return 0;
100}
101
3bd28eb2
AV
102void fill_fsmonitor_bitmap(struct index_state *istate)
103{
3444ec2e 104 unsigned int i, skipped = 0;
3bd28eb2 105 istate->fsmonitor_dirty = ewah_new();
3444ec2e
WB
106 for (i = 0; i < istate->cache_nr; i++) {
107 if (istate->cache[i]->ce_flags & CE_REMOVE)
108 skipped++;
109 else if (!(istate->cache[i]->ce_flags & CE_FSMONITOR_VALID))
110 ewah_set(istate->fsmonitor_dirty, i - skipped);
111 }
3bd28eb2
AV
112}
113
883e248b
BP
114void write_fsmonitor_extension(struct strbuf *sb, struct index_state *istate)
115{
116 uint32_t hdr_version;
883e248b
BP
117 uint32_t ewah_start;
118 uint32_t ewah_size = 0;
119 int fixup = 0;
120
cae70acf
DS
121 if (!istate->split_index)
122 assert_index_minimum(istate, istate->fsmonitor_dirty->bit_size);
3444ec2e 123
56c69100 124 put_be32(&hdr_version, INDEX_EXTENSION_VERSION2);
883e248b
BP
125 strbuf_add(sb, &hdr_version, sizeof(uint32_t));
126
56c69100
KW
127 strbuf_addstr(sb, istate->fsmonitor_last_update);
128 strbuf_addch(sb, 0); /* Want to keep a NUL */
129
883e248b
BP
130 fixup = sb->len;
131 strbuf_add(sb, &ewah_size, sizeof(uint32_t)); /* we'll fix this up later */
132
133 ewah_start = sb->len;
3bd28eb2
AV
134 ewah_serialize_strbuf(istate->fsmonitor_dirty, sb);
135 ewah_free(istate->fsmonitor_dirty);
136 istate->fsmonitor_dirty = NULL;
883e248b
BP
137
138 /* fix up size field */
139 put_be32(&ewah_size, sb->len - ewah_start);
140 memcpy(sb->buf + fixup, &ewah_size, sizeof(uint32_t));
141
29fbbf43
JH
142 trace2_data_string("index", NULL, "extension/fsmn/write/token",
143 istate->fsmonitor_last_update);
144 trace_printf_key(&trace_fsmonitor,
145 "write fsmonitor extension successful '%s'",
146 istate->fsmonitor_last_update);
883e248b
BP
147}
148
149/*
56c69100 150 * Call the query-fsmonitor hook passing the last update token of the saved results.
883e248b 151 */
1e0ea5c4
JH
152static int query_fsmonitor_hook(struct repository *r,
153 int version,
154 const char *last_update,
155 struct strbuf *query_result)
883e248b
BP
156{
157 struct child_process cp = CHILD_PROCESS_INIT;
940b94f3 158 int result;
883e248b 159
1e0ea5c4 160 if (fsm_settings__get_mode(r) != FSMONITOR_MODE_HOOK)
883e248b
BP
161 return -1;
162
1e0ea5c4 163 strvec_push(&cp.args, fsm_settings__get_hook_path(r));
ef8d7ac4
JK
164 strvec_pushf(&cp.args, "%d", version);
165 strvec_pushf(&cp.args, "%s", last_update);
883e248b 166 cp.use_shell = 1;
11cf33be 167 cp.dir = get_git_work_tree();
883e248b 168
940b94f3
JH
169 trace2_region_enter("fsm_hook", "query", NULL);
170
171 result = capture_command(&cp, query_result, 1024);
172
173 if (result)
174 trace2_data_intmax("fsm_hook", NULL, "query/failed", result);
974c1b39 175 else
940b94f3
JH
176 trace2_data_intmax("fsm_hook", NULL, "query/response-length",
177 query_result->len);
178
940b94f3
JH
179 trace2_region_leave("fsm_hook", "query", NULL);
180
181 return result;
883e248b
BP
182}
183
ff03836b 184static void fsmonitor_refresh_callback(struct index_state *istate, char *name)
883e248b 185{
ff03836b
KW
186 int i, len = strlen(name);
187 if (name[len - 1] == '/') {
188
189 /*
190 * TODO We should binary search to find the first path with
191 * TODO this directory prefix. Then linearly update entries
192 * TODO while the prefix matches. Taking care to search without
193 * TODO the trailing slash -- because '/' sorts after a few
194 * TODO interesting special chars, like '.' and ' '.
195 */
196
197 /* Mark all entries for the folder invalid */
198 for (i = 0; i < istate->cache_nr; i++) {
199 if (istate->cache[i]->ce_flags & CE_FSMONITOR_VALID &&
200 starts_with(istate->cache[i]->name, name))
201 istate->cache[i]->ce_flags &= ~CE_FSMONITOR_VALID;
202 }
203 /* Need to remove the / from the path for the untracked cache */
204 name[len - 1] = '\0';
205 } else {
206 int pos = index_name_pos(istate, name, strlen(name));
883e248b 207
ff03836b
KW
208 if (pos >= 0) {
209 struct cache_entry *ce = istate->cache[pos];
210 ce->ce_flags &= ~CE_FSMONITOR_VALID;
211 }
883e248b
BP
212 }
213
214 /*
215 * Mark the untracked cache dirty even if it wasn't found in the index
216 * as it could be a new untracked file.
217 */
218 trace_printf_key(&trace_fsmonitor, "fsmonitor_refresh_callback '%s'", name);
0cacebf0 219 untracked_cache_invalidate_path(istate, name, 0);
883e248b
BP
220}
221
26b9f34a
JH
/*
 * When a single FSMonitor response names more pathnames than this,
 * refresh_fsmonitor() forces the index to be written back to disk.
 *
 * Any received pathname MAY cause cache-entry or istate flag bits to
 * change and thereby cause the index to be rewritten.  But a response
 * can also consist largely of paths (ignored paths, for instance) that
 * change no flag bits at all.  Then the index is not rewritten (which
 * is fine and normal), and so the token stored in the FSMonitor index
 * extension is not refreshed either.  The next Git command finds the
 * same token, makes the same token-relative request, and receives the
 * same response plus whatever changed since.  If that response is
 * large and keeps growing, performance can suffer.
 *
 * Example: a build writes 100K object files without touching any
 * source file.  The index does not need updating, yet the response
 * relative to the pre-build token might be 5MB.  Every subsequent Git
 * command receives that same 100K/5MB response, and
 * `refresh_fsmonitor()` has to walk those 100K paths each time, until
 * something finally causes the index to be rewritten.
 *
 * Forcing an index update after a very large response stores a newer
 * token in the extension, so later commands should get smaller and
 * more current responses.
 *
 * The exact value is not critical.  The index is rewritten anyway the
 * first time the user touches a tracked file and a command such as
 * `git status` refreshes an mtime and/or sets a flag bit.
 */
static int fsmonitor_force_update_threshold = 100;
258
883e248b
BP
259void refresh_fsmonitor(struct index_state *istate)
260{
883e248b 261 struct strbuf query_result = STRBUF_INIT;
8da2c576
KW
262 int query_success = 0, hook_version = -1;
263 size_t bol = 0; /* beginning of line */
883e248b 264 uint64_t last_update;
56c69100 265 struct strbuf last_update_token = STRBUF_INIT;
883e248b 266 char *buf;
5d137fc2 267 unsigned int i;
974c1b39 268 int is_trivial = 0;
1e0ea5c4
JH
269 struct repository *r = istate->repo ? istate->repo : the_repository;
270 enum fsmonitor_mode fsm_mode = fsm_settings__get_mode(r);
883e248b 271
1e0ea5c4
JH
272 if (fsm_mode <= FSMONITOR_MODE_DISABLED ||
273 istate->fsmonitor_has_run_once)
883e248b 274 return;
8da2c576 275
398a3b08 276 istate->fsmonitor_has_run_once = 1;
883e248b
BP
277
278 trace_printf_key(&trace_fsmonitor, "refresh fsmonitor");
1e0ea5c4
JH
279
280 if (fsm_mode == FSMONITOR_MODE_IPC) {
9c307e8a
JH
281 query_success = !fsmonitor_ipc__send_query(
282 istate->fsmonitor_last_update ?
283 istate->fsmonitor_last_update : "builtin:fake",
284 &query_result);
285 if (query_success) {
286 /*
287 * The response contains a series of nul terminated
288 * strings. The first is the new token.
289 *
290 * Use `char *buf` as an interlude to trick the CI
291 * static analysis to let us use `strbuf_addstr()`
292 * here (and only copy the token) rather than
293 * `strbuf_addbuf()`.
294 */
295 buf = query_result.buf;
296 strbuf_addstr(&last_update_token, buf);
297 bol = last_update_token.len + 1;
298 is_trivial = query_result.buf[bol] == '/';
299 if (is_trivial)
300 trace2_data_intmax("fsm_client", NULL,
301 "query/trivial-response", 1);
302 } else {
303 /*
304 * The builtin daemon is not available on this
305 * platform -OR- we failed to get a response.
306 *
307 * Generate a fake token (rather than a V1
308 * timestamp) for the index extension. (If
309 * they switch back to the hook API, we don't
310 * want ambiguous state.)
311 */
312 strbuf_addstr(&last_update_token, "builtin:fake");
313 }
314
315 goto apply_results;
1e0ea5c4
JH
316 }
317
318 assert(fsm_mode == FSMONITOR_MODE_HOOK);
319
320 hook_version = fsmonitor_hook_version();
321
883e248b 322 /*
1e0ea5c4 323 * This could be racy so save the date/time now and query_fsmonitor_hook
883e248b
BP
324 * should be inclusive to ensure we don't miss potential changes.
325 */
326 last_update = getnanotime();
8da2c576
KW
327 if (hook_version == HOOK_INTERFACE_VERSION1)
328 strbuf_addf(&last_update_token, "%"PRIu64"", last_update);
883e248b
BP
329
330 /*
1e0ea5c4 331 * If we have a last update token, call query_fsmonitor_hook for the set of
8da2c576 332 * changes since that token, else assume everything is possibly dirty
883e248b
BP
333 * and check it all.
334 */
335 if (istate->fsmonitor_last_update) {
8da2c576 336 if (hook_version == -1 || hook_version == HOOK_INTERFACE_VERSION2) {
1e0ea5c4
JH
337 query_success = !query_fsmonitor_hook(
338 r, HOOK_INTERFACE_VERSION2,
8da2c576
KW
339 istate->fsmonitor_last_update, &query_result);
340
341 if (query_success) {
342 if (hook_version < 0)
343 hook_version = HOOK_INTERFACE_VERSION2;
344
345 /*
346 * First entry will be the last update token
347 * Need to use a char * variable because static
348 * analysis was suggesting to use strbuf_addbuf
349 * but we don't want to copy the entire strbuf
6d12b533 350 * only the chars up to the first NUL
8da2c576
KW
351 */
352 buf = query_result.buf;
353 strbuf_addstr(&last_update_token, buf);
354 if (!last_update_token.len) {
355 warning("Empty last update token.");
356 query_success = 0;
357 } else {
358 bol = last_update_token.len + 1;
974c1b39 359 is_trivial = query_result.buf[bol] == '/';
8da2c576
KW
360 }
361 } else if (hook_version < 0) {
362 hook_version = HOOK_INTERFACE_VERSION1;
363 if (!last_update_token.len)
364 strbuf_addf(&last_update_token, "%"PRIu64"", last_update);
365 }
366 }
367
368 if (hook_version == HOOK_INTERFACE_VERSION1) {
1e0ea5c4
JH
369 query_success = !query_fsmonitor_hook(
370 r, HOOK_INTERFACE_VERSION1,
8da2c576 371 istate->fsmonitor_last_update, &query_result);
974c1b39
JH
372 if (query_success)
373 is_trivial = query_result.buf[0] == '/';
8da2c576
KW
374 }
375
974c1b39
JH
376 if (is_trivial)
377 trace2_data_intmax("fsm_hook", NULL,
378 "query/trivial-response", 1);
379
1e0ea5c4
JH
380 trace_performance_since(last_update, "fsmonitor process '%s'",
381 fsm_settings__get_hook_path(r));
382 trace_printf_key(&trace_fsmonitor,
383 "fsmonitor process '%s' returned %s",
384 fsm_settings__get_hook_path(r),
385 query_success ? "success" : "failure");
883e248b
BP
386 }
387
9c307e8a 388apply_results:
974c1b39
JH
389 /*
390 * The response from FSMonitor (excluding the header token) is
391 * either:
392 *
393 * [a] a (possibly empty) list of NUL delimited relative
394 * pathnames of changed paths. This list can contain
395 * files and directories. Directories have a trailing
396 * slash.
397 *
398 * [b] a single '/' to indicate the provider had no
399 * information and that we should consider everything
400 * invalid. We call this a trivial response.
401 */
26b9f34a
JH
402 trace2_region_enter("fsmonitor", "apply_results", istate->repo);
403
974c1b39
JH
404 if (query_success && !is_trivial) {
405 /*
406 * Mark all pathnames returned by the monitor as dirty.
407 *
408 * This updates both the cache-entries and the untracked-cache.
409 */
26b9f34a
JH
410 int count = 0;
411
883e248b 412 buf = query_result.buf;
8da2c576 413 for (i = bol; i < query_result.len; i++) {
883e248b
BP
414 if (buf[i] != '\0')
415 continue;
416 fsmonitor_refresh_callback(istate, buf + bol);
417 bol = i + 1;
26b9f34a 418 count++;
883e248b 419 }
26b9f34a 420 if (bol < query_result.len) {
883e248b 421 fsmonitor_refresh_callback(istate, buf + bol);
26b9f34a
JH
422 count++;
423 }
679f2f9f
US
424
425 /* Now mark the untracked cache for fsmonitor usage */
426 if (istate->untracked)
427 istate->untracked->use_fsmonitor = 1;
26b9f34a
JH
428
429 if (count > fsmonitor_force_update_threshold)
430 istate->cache_changed |= FSMONITOR_CHANGED;
431
432 trace2_data_intmax("fsmonitor", istate->repo, "apply_count",
433 count);
434
883e248b 435 } else {
974c1b39
JH
436 /*
437 * We failed to get a response or received a trivial response,
438 * so invalidate everything.
439 *
440 * We only want to run the post index changed hook if
441 * we've actually changed entries, so keep track if we
442 * actually changed entries or not.
443 */
679f2f9f 444 int is_cache_changed = 0;
974c1b39 445
679f2f9f
US
446 for (i = 0; i < istate->cache_nr; i++) {
447 if (istate->cache[i]->ce_flags & CE_FSMONITOR_VALID) {
448 is_cache_changed = 1;
449 istate->cache[i]->ce_flags &= ~CE_FSMONITOR_VALID;
450 }
451 }
883e248b 452
974c1b39
JH
453 /*
454 * If we're going to check every file, ensure we save
455 * the results.
456 */
679f2f9f
US
457 if (is_cache_changed)
458 istate->cache_changed |= FSMONITOR_CHANGED;
ca598d5f 459
883e248b
BP
460 if (istate->untracked)
461 istate->untracked->use_fsmonitor = 0;
462 }
26b9f34a
JH
463 trace2_region_leave("fsmonitor", "apply_results", istate->repo);
464
883e248b
BP
465 strbuf_release(&query_result);
466
56c69100
KW
467 /* Now that we've updated istate, save the last_update_token */
468 FREE_AND_NULL(istate->fsmonitor_last_update);
469 istate->fsmonitor_last_update = strbuf_detach(&last_update_token, NULL);
883e248b
BP
470}
471
fcd19b09
JH
472/*
473 * The caller wants to turn on FSMonitor. And when the caller writes
474 * the index to disk, a FSMonitor extension should be included. This
475 * requires that `istate->fsmonitor_last_update` not be NULL. But we
476 * have not actually talked to a FSMonitor process yet, so we don't
477 * have an initial value for this field.
478 *
479 * For a protocol V1 FSMonitor process, this field is a formatted
480 * "nanoseconds since epoch" field. However, for a protocol V2
481 * FSMonitor process, this field is an opaque token.
482 *
483 * Historically, `add_fsmonitor()` has initialized this field to the
484 * current time for protocol V1 processes. There are lots of race
485 * conditions here, but that code has shipped...
486 *
487 * The only true solution is to use a V2 FSMonitor and get a current
488 * or default token value (that it understands), but we cannot do that
489 * until we have actually talked to an instance of the FSMonitor process
490 * (but the protocol requires that we send a token first...).
491 *
492 * For simplicity, just initialize like we have a V1 process and require
493 * that V2 processes adapt.
494 */
495static void initialize_fsmonitor_last_update(struct index_state *istate)
496{
497 struct strbuf last_update = STRBUF_INIT;
498
499 strbuf_addf(&last_update, "%"PRIu64"", getnanotime());
500 istate->fsmonitor_last_update = strbuf_detach(&last_update, NULL);
501}
502
883e248b
BP
503void add_fsmonitor(struct index_state *istate)
504{
5d137fc2 505 unsigned int i;
883e248b
BP
506
507 if (!istate->fsmonitor_last_update) {
508 trace_printf_key(&trace_fsmonitor, "add fsmonitor");
509 istate->cache_changed |= FSMONITOR_CHANGED;
fcd19b09 510 initialize_fsmonitor_last_update(istate);
883e248b
BP
511
512 /* reset the fsmonitor state */
513 for (i = 0; i < istate->cache_nr; i++)
514 istate->cache[i]->ce_flags &= ~CE_FSMONITOR_VALID;
515
516 /* reset the untracked cache */
517 if (istate->untracked) {
518 add_untracked_cache(istate);
519 istate->untracked->use_fsmonitor = 1;
520 }
521
522 /* Update the fsmonitor state */
523 refresh_fsmonitor(istate);
524 }
525}
526
527void remove_fsmonitor(struct index_state *istate)
528{
529 if (istate->fsmonitor_last_update) {
530 trace_printf_key(&trace_fsmonitor, "remove fsmonitor");
531 istate->cache_changed |= FSMONITOR_CHANGED;
56c69100 532 FREE_AND_NULL(istate->fsmonitor_last_update);
883e248b
BP
533 }
534}
535
536void tweak_fsmonitor(struct index_state *istate)
537{
5d137fc2 538 unsigned int i;
1e0ea5c4
JH
539 int fsmonitor_enabled = (fsm_settings__get_mode(istate->repo)
540 > FSMONITOR_MODE_DISABLED);
ba1b9cac
AV
541
542 if (istate->fsmonitor_dirty) {
543 if (fsmonitor_enabled) {
544 /* Mark all entries valid */
545 for (i = 0; i < istate->cache_nr; i++) {
546 istate->cache[i]->ce_flags |= CE_FSMONITOR_VALID;
547 }
548
549 /* Mark all previously saved entries as dirty */
cae70acf 550 assert_index_minimum(istate, istate->fsmonitor_dirty->bit_size);
ba1b9cac
AV
551 ewah_each_bit(istate->fsmonitor_dirty, fsmonitor_ewah_callback, istate);
552
679f2f9f 553 refresh_fsmonitor(istate);
ba1b9cac
AV
554 }
555
556 ewah_free(istate->fsmonitor_dirty);
557 istate->fsmonitor_dirty = NULL;
558 }
559
1e0ea5c4 560 if (fsmonitor_enabled)
883e248b 561 add_fsmonitor(istate);
1e0ea5c4
JH
562 else
563 remove_fsmonitor(istate);
883e248b 564}