Skip to content

Commit 38a323e

Browse files
committed
Merge branch 'pt/fsmonitor-linux' into seen
The fsmonitor daemon has been implemented for Linux. * pt/fsmonitor-linux: fsmonitor: fix split-index bitmap bounds in tweak_fsmonitor() fsmonitor: convert shown khash to strset in do_handle_client fsmonitor: add tests for Linux fsmonitor: add timeout to daemon stop command fsmonitor: close inherited file descriptors and detach in daemon run-command: add close_fd_above_stderr option fsmonitor: implement filesystem change listener for Linux fsmonitor: rename fsm-settings-darwin.c to fsm-settings-unix.c fsmonitor: rename fsm-ipc-darwin.c to fsm-ipc-unix.c fsmonitor: use pthread_cond_timedwait for cookie wait compat/win32: add pthread_cond_timedwait fsmonitor: fix hashmap memory leak in fsmonitor_run_daemon fsmonitor: fix khash memory leak in do_handle_client
2 parents 6517afb + a155ee6 commit 38a323e

19 files changed

+1266
-65
lines changed

Documentation/config/fsmonitor--daemon.adoc

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,8 +4,8 @@ fsmonitor.allowRemote::
44
behavior. Only respected when `core.fsmonitor` is set to `true`.
55

66
fsmonitor.socketDir::
7-
This Mac OS-specific option, if set, specifies the directory in
7+
This Mac OS and Linux-specific option, if set, specifies the directory in
88
which to create the Unix domain socket used for communication
99
between the fsmonitor daemon and various Git commands. The directory must
10-
reside on a native Mac OS filesystem. Only respected when `core.fsmonitor`
10+
reside on a native filesystem. Only respected when `core.fsmonitor`
1111
is set to `true`.

Documentation/git-fsmonitor--daemon.adoc

Lines changed: 24 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -76,9 +76,9 @@ repositories; this may be overridden by setting `fsmonitor.allowRemote` to
7676
correctly with all network-mounted repositories, so such use is considered
7777
experimental.
7878

79-
On Mac OS, the inter-process communication (IPC) between various Git
79+
On Mac OS and Linux, the inter-process communication (IPC) between various Git
8080
commands and the fsmonitor daemon is done via a Unix domain socket (UDS) -- a
81-
special type of file -- which is supported by native Mac OS filesystems,
81+
special type of file -- which is supported by native Mac OS and Linux filesystems,
8282
but not on network-mounted filesystems, NTFS, or FAT32. Other filesystems
8383
may or may not have the needed support; the fsmonitor daemon is not guaranteed
8484
to work with these filesystems and such use is considered experimental.
@@ -87,13 +87,33 @@ By default, the socket is created in the `.git` directory. However, if the
8787
`.git` directory is on a network-mounted filesystem, it will instead be
8888
created at `$HOME/.git-fsmonitor-*` unless `$HOME` itself is on a
8989
network-mounted filesystem, in which case you must set the configuration
90-
variable `fsmonitor.socketDir` to the path of a directory on a Mac OS native
90+
variable `fsmonitor.socketDir` to the path of a directory on a native
9191
filesystem in which to create the socket file.
9292

9393
If none of the above directories (`.git`, `$HOME`, or `fsmonitor.socketDir`)
94-
is on a native Mac OS file filesystem the fsmonitor daemon will report an
94+
is on a native filesystem the fsmonitor daemon will report an
9595
error that will cause the daemon and the currently running command to exit.
9696

97+
LINUX CAVEATS
98+
~~~~~~~~~~~~~
99+
100+
On Linux, the fsmonitor daemon uses inotify to monitor filesystem events.
101+
The inotify system has per-user limits on the number of watches that can
102+
be created. The default limit is typically 8192 watches per user.
103+
104+
For large repositories with many directories, you may need to increase
105+
this limit. Check the current limit with:
106+
107+
cat /proc/sys/fs/inotify/max_user_watches
108+
109+
To temporarily increase the limit:
110+
111+
sudo sysctl fs.inotify.max_user_watches=65536
112+
113+
To make the change permanent, add to `/etc/sysctl.conf`:
114+
115+
fs.inotify.max_user_watches=65536
116+
97117
CONFIGURATION
98118
-------------
99119

Makefile

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -420,7 +420,7 @@ include shared.mak
420420
# If your platform has OS-specific ways to tell if a repo is incompatible with
421421
# fsmonitor (whether the hook or IPC daemon version), set FSMONITOR_OS_SETTINGS
422422
# to the "<name>" of the corresponding `compat/fsmonitor/fsm-settings-<name>.c`
423-
# that implements the `fsm_os_settings__*()` routines.
423+
# and `compat/fsmonitor/fsm-ipc-<name>.c` files.
424424
#
425425
# Define LINK_FUZZ_PROGRAMS if you want `make all` to also build the fuzz test
426426
# programs in oss-fuzz/.
@@ -2385,13 +2385,13 @@ ifdef FSMONITOR_DAEMON_BACKEND
23852385
COMPAT_CFLAGS += -DHAVE_FSMONITOR_DAEMON_BACKEND
23862386
COMPAT_OBJS += compat/fsmonitor/fsm-listen-$(FSMONITOR_DAEMON_BACKEND).o
23872387
COMPAT_OBJS += compat/fsmonitor/fsm-health-$(FSMONITOR_DAEMON_BACKEND).o
2388-
COMPAT_OBJS += compat/fsmonitor/fsm-ipc-$(FSMONITOR_DAEMON_BACKEND).o
23892388
endif
23902389

23912390
ifdef FSMONITOR_OS_SETTINGS
23922391
COMPAT_CFLAGS += -DHAVE_FSMONITOR_OS_SETTINGS
2392+
COMPAT_OBJS += compat/fsmonitor/fsm-ipc-$(FSMONITOR_OS_SETTINGS).o
23932393
COMPAT_OBJS += compat/fsmonitor/fsm-settings-$(FSMONITOR_OS_SETTINGS).o
2394-
COMPAT_OBJS += compat/fsmonitor/fsm-path-utils-$(FSMONITOR_OS_SETTINGS).o
2394+
COMPAT_OBJS += compat/fsmonitor/fsm-path-utils-$(FSMONITOR_DAEMON_BACKEND).o
23952395
endif
23962396

23972397
ifdef WITH_BREAKING_CHANGES

builtin/fsmonitor--daemon.c

Lines changed: 64 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@
1616
#include "fsmonitor--daemon.h"
1717

1818
#include "simple-ipc.h"
19-
#include "khash.h"
19+
#include "strmap.h"
2020
#include "run-command.h"
2121
#include "trace.h"
2222
#include "trace2.h"
@@ -86,6 +86,8 @@ static int do_as_client__send_stop(void)
8686
{
8787
struct strbuf answer = STRBUF_INIT;
8888
int ret;
89+
int max_wait_ms = 30000;
90+
int elapsed_ms = 0;
8991

9092
ret = fsmonitor_ipc__send_command("quit", &answer);
9193

@@ -96,8 +98,16 @@ static int do_as_client__send_stop(void)
9698
return ret;
9799

98100
trace2_region_enter("fsm_client", "polling-for-daemon-exit", NULL);
99-
while (fsmonitor_ipc__get_state() == IPC_STATE__LISTENING)
101+
while (fsmonitor_ipc__get_state() == IPC_STATE__LISTENING) {
102+
if (elapsed_ms >= max_wait_ms) {
103+
trace2_region_leave("fsm_client",
104+
"polling-for-daemon-exit", NULL);
105+
return error(_("daemon did not stop within %d seconds"),
106+
max_wait_ms / 1000);
107+
}
100108
sleep_millisec(50);
109+
elapsed_ms += 50;
110+
}
101111
trace2_region_leave("fsm_client", "polling-for-daemon-exit", NULL);
102112

103113
return 0;
@@ -197,20 +207,31 @@ static enum fsmonitor_cookie_item_result with_lock__wait_for_cookie(
197207
unlink(cookie_pathname.buf);
198208

199209
/*
200-
* Technically, this is an infinite wait (well, unless another
201-
* thread sends us an abort). I'd like to change this to
202-
* use `pthread_cond_timedwait()` and return an error/timeout
203-
* and let the caller do the trivial response thing, but we
204-
* don't have that routine in our thread-utils.
205-
*
206-
* After extensive beta testing I'm not really worried about
207-
* this. Also note that the above open() and unlink() calls
208-
* will cause at least two FS events on that path, so the odds
209-
* of getting stuck are pretty slim.
210+
* Wait for the listener thread to observe the cookie file.
211+
* Time out after a short interval so that the client
212+
* does not hang forever if the filesystem does not deliver
213+
* events (e.g., on certain container/overlay filesystems
214+
* where inotify watches succeed but events never arrive).
210215
*/
211-
while (cookie->result == FCIR_INIT)
212-
pthread_cond_wait(&state->cookies_cond,
213-
&state->main_lock);
216+
{
217+
struct timeval now;
218+
struct timespec ts;
219+
int err = 0;
220+
221+
gettimeofday(&now, NULL);
222+
ts.tv_sec = now.tv_sec + 1;
223+
ts.tv_nsec = now.tv_usec * 1000;
224+
225+
while (cookie->result == FCIR_INIT && !err)
226+
err = pthread_cond_timedwait(&state->cookies_cond,
227+
&state->main_lock,
228+
&ts);
229+
if (err == ETIMEDOUT && cookie->result == FCIR_INIT) {
230+
trace_printf_key(&trace_fsmonitor,
231+
"cookie_wait timed out");
232+
cookie->result = FCIR_ERROR;
233+
}
234+
}
214235

215236
done:
216237
hashmap_remove(&state->cookies, &cookie->entry, NULL);
@@ -653,8 +674,6 @@ static int fsmonitor_parse_client_token(const char *buf_token,
653674
return 0;
654675
}
655676

656-
KHASH_INIT(str, const char *, int, 0, kh_str_hash_func, kh_str_hash_equal)
657-
658677
static int do_handle_client(struct fsmonitor_daemon_state *state,
659678
const char *command,
660679
ipc_server_reply_cb *reply,
@@ -671,8 +690,7 @@ static int do_handle_client(struct fsmonitor_daemon_state *state,
671690
const struct fsmonitor_batch *batch;
672691
struct fsmonitor_batch *remainder = NULL;
673692
intmax_t count = 0, duplicates = 0;
674-
kh_str_t *shown;
675-
int hash_ret;
693+
struct strset shown = STRSET_INIT;
676694
int do_trivial = 0;
677695
int do_flush = 0;
678696
int do_cookie = 0;
@@ -861,14 +879,14 @@ static int do_handle_client(struct fsmonitor_daemon_state *state,
861879
* so walk the batch list backwards from the current head back
862880
* to the batch (sequence number) they named.
863881
*
864-
* We use khash to de-dup the list of pathnames.
882+
* We use a strset to de-dup the list of pathnames.
865883
*
866884
* NEEDSWORK: each batch contains a list of interned strings,
867885
* so we only need to do pointer comparisons here to build the
868886
* hash table. Currently, we're still comparing the string
869887
* values.
870888
*/
871-
shown = kh_init_str();
889+
strset_init_with_options(&shown, NULL, 0);
872890
for (batch = batch_head;
873891
batch && batch->batch_seq_nr > requested_oldest_seq_nr;
874892
batch = batch->next) {
@@ -878,11 +896,9 @@ static int do_handle_client(struct fsmonitor_daemon_state *state,
878896
const char *s = batch->interned_paths[k];
879897
size_t s_len;
880898

881-
if (kh_get_str(shown, s) != kh_end(shown))
899+
if (!strset_add(&shown, s))
882900
duplicates++;
883901
else {
884-
kh_put_str(shown, s, &hash_ret);
885-
886902
trace_printf_key(&trace_fsmonitor,
887903
"send[%"PRIuMAX"]: %s",
888904
count, s);
@@ -909,8 +925,6 @@ static int do_handle_client(struct fsmonitor_daemon_state *state,
909925
total_response_len += payload.len;
910926
}
911927

912-
kh_release_str(shown);
913-
914928
pthread_mutex_lock(&state->main_lock);
915929

916930
if (token_data->client_ref_count > 0)
@@ -954,6 +968,7 @@ static int do_handle_client(struct fsmonitor_daemon_state *state,
954968
trace2_data_intmax("fsmonitor", the_repository, "response/count/duplicates", duplicates);
955969

956970
cleanup:
971+
strset_clear(&shown);
957972
strbuf_release(&response_token);
958973
strbuf_release(&requested_token_id);
959974
strbuf_release(&payload);
@@ -1405,6 +1420,15 @@ static int fsmonitor_run_daemon(void)
14051420
done:
14061421
pthread_cond_destroy(&state.cookies_cond);
14071422
pthread_mutex_destroy(&state.main_lock);
1423+
{
1424+
struct hashmap_iter iter;
1425+
struct fsmonitor_cookie_item *cookie;
1426+
1427+
hashmap_for_each_entry(&state.cookies, &iter, cookie, entry)
1428+
free(cookie->name);
1429+
hashmap_clear_and_free(&state.cookies,
1430+
struct fsmonitor_cookie_item, entry);
1431+
}
14081432
fsm_listen__dtor(&state);
14091433
fsm_health__dtor(&state);
14101434

@@ -1420,7 +1444,7 @@ static int fsmonitor_run_daemon(void)
14201444
return err;
14211445
}
14221446

1423-
static int try_to_run_foreground_daemon(int detach_console MAYBE_UNUSED)
1447+
static int try_to_run_foreground_daemon(int detach_console)
14241448
{
14251449
/*
14261450
* Technically, we don't need to probe for an existing daemon
@@ -1440,10 +1464,21 @@ static int try_to_run_foreground_daemon(int detach_console MAYBE_UNUSED)
14401464
fflush(stderr);
14411465
}
14421466

1467+
if (detach_console) {
14431468
#ifdef GIT_WINDOWS_NATIVE
1444-
if (detach_console)
14451469
FreeConsole();
1470+
#else
1471+
/*
1472+
* Create a new session so that the daemon is detached
1473+
* from the parent's process group. This prevents
1474+
* shells with job control (e.g. bash with "set -m")
1475+
* from waiting on the daemon when they wait for a
1476+
* foreground command that implicitly spawned it.
1477+
*/
1478+
if (setsid() == -1)
1479+
warning_errno(_("setsid failed"));
14461480
#endif
1481+
}
14471482

14481483
return !!fsmonitor_run_daemon();
14491484
}
@@ -1506,6 +1541,7 @@ static int try_to_start_background_daemon(void)
15061541
cp.no_stdin = 1;
15071542
cp.no_stdout = 1;
15081543
cp.no_stderr = 1;
1544+
cp.close_fd_above_stderr = 1;
15091545

15101546
sbgr = start_bg_command(&cp, bg_wait_cb, NULL,
15111547
fsmonitor__start_timeout_sec);
Lines changed: 33 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,33 @@
1+
#include "git-compat-util.h"
2+
#include "config.h"
3+
#include "fsmonitor-ll.h"
4+
#include "fsm-health.h"
5+
#include "fsmonitor--daemon.h"
6+
7+
/*
8+
* The Linux fsmonitor implementation uses inotify which has its own
9+
* mechanisms for detecting filesystem unmount and other events that
10+
* would require the daemon to shutdown. Therefore, we don't need
11+
* a separate health thread like Windows does.
12+
*
13+
* These stub functions satisfy the interface requirements.
14+
*/
15+
16+
int fsm_health__ctor(struct fsmonitor_daemon_state *state UNUSED)
17+
{
18+
return 0;
19+
}
20+
21+
void fsm_health__dtor(struct fsmonitor_daemon_state *state UNUSED)
22+
{
23+
return;
24+
}
25+
26+
void fsm_health__loop(struct fsmonitor_daemon_state *state UNUSED)
27+
{
28+
return;
29+
}
30+
31+
void fsm_health__stop_async(struct fsmonitor_daemon_state *state UNUSED)
32+
{
33+
}

0 commit comments

Comments
 (0)