3 provide API to do non-blocking locks for single or all databases
5 Copyright (C) Amitay Isaacs 2012
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3 of the License, or
10 (at your option) any later version.
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with this program; if not, see <http://www.gnu.org/licenses/>.
21 #include "include/ctdb_private.h"
22 #include "include/ctdb_protocol.h"
26 #include "system/filesys.h"
27 #include "lib/util/dlinklist.h"
30 * Non-blocking Locking API
32 * 1. Create a child process to do blocking locks.
33 * 2. Once the locks are obtained, signal parent process via fd.
34 * 3. Invoke registered callback routine with locking status.
35 * 4. If the child process cannot get locks within certain time,
36 * diagnose using /proc/locks and log warning message
38 * ctdb_lock_record() - get a lock on a record
39 * ctdb_lock_db() - get a lock on a DB
40 * ctdb_lock_alldb_prio() - get a lock on all DBs with given priority
41 * ctdb_lock_alldb() - get a lock on all DBs
43 * auto_mark - whether to mark/unmark DBs in before/after callback
46 /* FIXME: Add a tunable max_lock_processes_per_db */
47 #define MAX_LOCK_PROCESSES_PER_DB (100)
56 static const char * const lock_type_str[] = {
65 /* lock_context is the common part for a lock request */
67 struct lock_context *next, *prev;
69 struct ctdb_context *ctdb;
70 struct ctdb_db_context *ctdb_db;
74 struct lock_request *req_queue;
77 struct tevent_fd *tfd;
78 struct tevent_timer *ttimer;
81 struct timeval start_time;
84 /* lock_request is the client specific part for a lock request */
86 struct lock_request *next, *prev;
87 struct lock_context *lctx;
88 void (*callback)(void *, bool);
94 * Support samba 3.6.x (and older) versions which do not set db priority.
96 * By default, all databases are set to priority 1. So only when priority
97 * is set to 1, check for databases that need higher priority.
99 static bool later_db(struct ctdb_context *ctdb, const char *name)
101 if (ctdb->tunable.samba3_hack == 0) {
105 if (strstr(name, "brlock") ||
106 strstr(name, "g_lock") ||
107 strstr(name, "notify_onelevel") ||
108 strstr(name, "serverid") ||
109 strstr(name, "xattr_tdb")) {
119 int ctdb_lockall_prio(struct ctdb_context *ctdb, uint32_t priority)
121 struct ctdb_db_context *ctdb_db;
123 for (ctdb_db = ctdb->db_list; ctdb_db; ctdb_db = ctdb_db->next) {
124 if (ctdb_db->priority != priority) {
127 if (later_db(ctdb, ctdb_db->db_name)) {
130 DEBUG(DEBUG_INFO, ("locking database %s, priority:%u\n",
131 ctdb_db->db_name, priority));
132 if (tdb_lockall(ctdb_db->ltdb->tdb) != 0) {
133 DEBUG(DEBUG_ERR, ("Failed to lock database %s\n",
139 /* If priority != 1, later_db check is not required and can return */
144 for (ctdb_db = ctdb->db_list; ctdb_db; ctdb_db = ctdb_db->next) {
145 if (!later_db(ctdb, ctdb_db->db_name)) {
148 DEBUG(DEBUG_INFO, ("locking database %s, priority:%u\n",
149 ctdb_db->db_name, priority));
150 if (tdb_lockall(ctdb_db->ltdb->tdb) != 0) {
151 DEBUG(DEBUG_ERR, ("Failed to lock database %s\n",
160 static int ctdb_lockall(struct ctdb_context *ctdb)
164 for (priority=1; priority<=NUM_DB_PRIORITIES; priority++) {
165 if (ctdb_lockall_prio(ctdb, priority) != 0) {
175 * unlock all databases
177 int ctdb_unlockall_prio(struct ctdb_context *ctdb, uint32_t priority)
179 struct ctdb_db_context *ctdb_db;
181 for (ctdb_db = ctdb->db_list; ctdb_db; ctdb_db = ctdb_db->next) {
182 if (ctdb_db->priority != priority) {
185 DEBUG(DEBUG_INFO, ("unlocking database %s, priority:%u\n",
186 ctdb_db->db_name, priority));
187 if (tdb_unlockall(ctdb_db->ltdb->tdb) != 0) {
188 DEBUG(DEBUG_ERR, ("Failed to unlock database %s\n",
197 static int ctdb_unlockall(struct ctdb_context *ctdb)
201 for (priority=NUM_DB_PRIORITIES; priority>=0; priority--) {
202 if (ctdb_unlockall_prio(ctdb, priority) != 0) {
212 * lock all databases - mark only
214 int ctdb_lockall_mark_prio(struct ctdb_context *ctdb, uint32_t priority)
216 struct ctdb_db_context *ctdb_db;
217 int tdb_transaction_write_lock_mark(struct tdb_context *);
220 * This function is only used by the main dameon during recovery.
221 * At this stage, the databases have already been locked, by a
222 * dedicated child process. The freeze_mode variable is used to track
223 * whether the actual locks are held by the child process or not.
226 if (ctdb->freeze_mode[priority] != CTDB_FREEZE_FROZEN) {
227 DEBUG(DEBUG_ERR, ("Attempt to mark all databases locked when not frozen\n"));
231 for (ctdb_db = ctdb->db_list; ctdb_db; ctdb_db = ctdb_db->next) {
232 if (ctdb_db->priority != priority) {
235 if (later_db(ctdb, ctdb_db->db_name)) {
238 if (tdb_transaction_write_lock_mark(ctdb_db->ltdb->tdb) != 0) {
241 if (tdb_lockall_mark(ctdb_db->ltdb->tdb) != 0) {
242 /* FIXME: Shouldn't we unmark here? */
247 /* If priority != 1, later_db check is not required and can return */
252 for (ctdb_db = ctdb->db_list; ctdb_db; ctdb_db = ctdb_db->next) {
253 if (!later_db(ctdb, ctdb_db->db_name)) {
256 if (tdb_transaction_write_lock_mark(ctdb_db->ltdb->tdb) != 0) {
259 if (tdb_lockall_mark(ctdb_db->ltdb->tdb) != 0) {
260 /* FIXME: Shouldn't we unmark here? */
268 static int ctdb_lockall_mark(struct ctdb_context *ctdb)
272 for (priority=1; priority<=NUM_DB_PRIORITIES; priority++) {
273 if (ctdb_lockall_mark_prio(ctdb, priority) != 0) {
283 * lock all databases - unmark only
285 int ctdb_lockall_unmark_prio(struct ctdb_context *ctdb, uint32_t priority)
287 struct ctdb_db_context *ctdb_db;
288 int tdb_transaction_write_lock_unmark(struct tdb_context *);
291 * This function is only used by the main dameon during recovery.
292 * At this stage, the databases have already been locked, by a
293 * dedicated child process. The freeze_mode variable is used to track
294 * whether the actual locks are held by the child process or not.
297 if (ctdb->freeze_mode[priority] != CTDB_FREEZE_FROZEN) {
298 DEBUG(DEBUG_ERR, ("Attempt to unmark all databases locked when not frozen\n"));
302 for (ctdb_db = ctdb->db_list; ctdb_db; ctdb_db = ctdb_db->next) {
303 if (ctdb_db->priority != priority) {
306 if (tdb_transaction_write_lock_unmark(ctdb_db->ltdb->tdb) != 0) {
309 if (tdb_lockall_unmark(ctdb_db->ltdb->tdb) != 0) {
317 static int ctdb_lockall_unmark(struct ctdb_context *ctdb)
321 for (priority=NUM_DB_PRIORITIES; priority>=0; priority--) {
322 if (ctdb_lockall_unmark_prio(ctdb, priority) != 0) {
332 * Lock record / db depending on lock_ctx->type
333 * Called from child context.
335 static bool ctdb_lock_item(struct lock_context *lock_ctx)
339 switch (lock_ctx->type) {
341 if (tdb_chainlock(lock_ctx->ctdb_db->ltdb->tdb, lock_ctx->key) == 0) {
347 if (tdb_lockall(lock_ctx->ctdb_db->ltdb->tdb) == 0) {
352 case LOCK_ALLDB_PRIO:
353 if (ctdb_lockall_prio(lock_ctx->ctdb, lock_ctx->priority) == 0) {
359 if (ctdb_lockall(lock_ctx->ctdb) == 0) {
370 * Unlock record / db depending on lock_ctx->type
372 void ctdb_unlock_item(struct lock_context *lock_ctx)
374 switch (lock_ctx->type) {
376 tdb_chainunlock(lock_ctx->ctdb_db->ltdb->tdb, lock_ctx->key);
380 tdb_unlockall(lock_ctx->ctdb_db->ltdb->tdb);
383 case LOCK_ALLDB_PRIO:
384 ctdb_unlockall_prio(lock_ctx->ctdb, lock_ctx->priority);
388 ctdb_unlockall(lock_ctx->ctdb);
393 static void ctdb_lock_schedule(struct ctdb_context *ctdb);
396 * Destructor to kill the child locking process
398 static int ctdb_lock_context_destructor(struct lock_context *lock_ctx)
400 if (lock_ctx->child > 0) {
401 ctdb_kill(lock_ctx->ctdb, lock_ctx->child, SIGKILL);
402 DLIST_REMOVE(lock_ctx->ctdb->lock_current, lock_ctx);
403 lock_ctx->ctdb->lock_num_current--;
404 CTDB_DECREMENT_STAT(lock_ctx->ctdb, locks.num_current);
405 if (lock_ctx->type == LOCK_RECORD || lock_ctx->type == LOCK_DB) {
406 CTDB_DECREMENT_DB_STAT(lock_ctx->ctdb_db, locks.num_current);
409 DLIST_REMOVE(lock_ctx->ctdb->lock_pending, lock_ctx);
410 lock_ctx->ctdb->lock_num_pending--;
411 CTDB_DECREMENT_STAT(lock_ctx->ctdb, locks.num_pending);
412 if (lock_ctx->type == LOCK_RECORD || lock_ctx->type == LOCK_DB) {
413 CTDB_DECREMENT_DB_STAT(lock_ctx->ctdb_db, locks.num_pending);
417 ctdb_lock_schedule(lock_ctx->ctdb);
424 * Destructor to remove lock request
426 static int ctdb_lock_request_destructor(struct lock_request *lock_request)
428 DLIST_REMOVE(lock_request->lctx->req_queue, lock_request);
433 void ctdb_lock_free_request_context(struct lock_request *lock_req)
435 struct lock_context *lock_ctx;
437 lock_ctx = lock_req->lctx;
438 talloc_free(lock_req);
439 talloc_free(lock_ctx);
444 * Process all the callbacks waiting for lock
446 * If lock has failed, callback is executed with locked=false
448 static void process_callbacks(struct lock_context *lock_ctx, bool locked)
450 struct lock_request *request, *next;
452 if (lock_ctx->auto_mark && locked) {
453 switch (lock_ctx->type) {
455 tdb_chainlock_mark(lock_ctx->ctdb_db->ltdb->tdb, lock_ctx->key);
459 tdb_lockall_mark(lock_ctx->ctdb_db->ltdb->tdb);
462 case LOCK_ALLDB_PRIO:
463 ctdb_lockall_mark_prio(lock_ctx->ctdb, lock_ctx->priority);
467 ctdb_lockall_mark(lock_ctx->ctdb);
472 /* Iterate through all callbacks */
473 request = lock_ctx->req_queue;
475 if (lock_ctx->auto_mark) {
476 /* Reset the destructor, so request is not removed from the list */
477 talloc_set_destructor(request, NULL);
480 /* In case, callback frees the request, store next */
481 next = request->next;
482 request->callback(request->private_data, locked);
486 if (lock_ctx->auto_mark && locked) {
487 switch (lock_ctx->type) {
489 tdb_chainlock_unmark(lock_ctx->ctdb_db->ltdb->tdb, lock_ctx->key);
493 tdb_lockall_unmark(lock_ctx->ctdb_db->ltdb->tdb);
496 case LOCK_ALLDB_PRIO:
497 ctdb_lockall_unmark_prio(lock_ctx->ctdb, lock_ctx->priority);
501 ctdb_lockall_unmark(lock_ctx->ctdb);
508 static int lock_bucket_id(double t)
510 double us = 1.e-6, ms = 1.e-3, s = 1;
515 } else if (t < 10*us) {
517 } else if (t < 100*us) {
519 } else if (t < 1*ms) {
521 } else if (t < 10*ms) {
523 } else if (t < 100*ms) {
525 } else if (t < 1*s) {
527 } else if (t < 10*s) {
537 * Callback routine when the required locks are obtained.
538 * Called from parent context
540 static void ctdb_lock_handler(struct tevent_context *ev,
541 struct tevent_fd *tfd,
545 struct lock_context *lock_ctx;
552 lock_ctx = talloc_get_type_abort(private_data, struct lock_context);
554 /* cancel the timeout event */
555 if (lock_ctx->ttimer) {
556 TALLOC_FREE(lock_ctx->ttimer);
559 t = timeval_elapsed(&lock_ctx->start_time);
560 id = lock_bucket_id(t);
562 if (lock_ctx->auto_mark) {
563 tmp_ctx = talloc_new(ev);
564 talloc_steal(tmp_ctx, lock_ctx);
567 /* Read the status from the child process */
568 read(lock_ctx->fd[0], &c, 1);
569 locked = (c == 0 ? true : false);
571 /* Update statistics */
572 CTDB_DECREMENT_STAT(lock_ctx->ctdb, locks.num_pending);
573 CTDB_INCREMENT_STAT(lock_ctx->ctdb, locks.num_calls);
574 if (lock_ctx->ctdb_db) {
575 CTDB_DECREMENT_DB_STAT(lock_ctx->ctdb_db, locks.num_pending);
576 CTDB_INCREMENT_DB_STAT(lock_ctx->ctdb_db, locks.num_calls);
580 CTDB_INCREMENT_STAT(lock_ctx->ctdb, locks.num_current);
581 CTDB_INCREMENT_STAT(lock_ctx->ctdb, locks.buckets[id]);
582 if (lock_ctx->ctdb_db) {
583 CTDB_INCREMENT_DB_STAT(lock_ctx->ctdb_db, locks.num_current);
584 CTDB_UPDATE_DB_LATENCY(lock_ctx->ctdb_db, lock_type_str[lock_ctx->type], locks.latency, t);
585 CTDB_INCREMENT_DB_STAT(lock_ctx->ctdb_db, locks.buckets[id]);
588 CTDB_INCREMENT_STAT(lock_ctx->ctdb, locks.num_failed);
589 if (lock_ctx->ctdb_db) {
590 CTDB_INCREMENT_DB_STAT(lock_ctx->ctdb_db, locks.num_failed);
594 process_callbacks(lock_ctx, locked);
596 if (lock_ctx->auto_mark) {
597 talloc_free(tmp_ctx);
602 static void ctdb_lock_find_blocker(struct lock_context *lock_ctx);
605 * Callback routine when required locks are not obtained within timeout
606 * Called from parent context
608 static void ctdb_lock_timeout_handler(struct tevent_context *ev,
609 struct tevent_timer *ttimer,
610 struct timeval current_time,
613 struct lock_context *lock_ctx;
614 struct ctdb_context *ctdb;
616 lock_ctx = talloc_get_type_abort(private_data, struct lock_context);
617 ctdb = lock_ctx->ctdb;
619 /* fire a child process to find the blocking process */
620 if (lock_ctx->block_child == -1) {
621 ctdb_lock_find_blocker(lock_ctx);
624 /* reset the timeout timer */
625 // talloc_free(lock_ctx->ttimer);
626 lock_ctx->ttimer = tevent_add_timer(ctdb->ev,
628 timeval_current_ofs(10, 0),
629 ctdb_lock_timeout_handler,
634 static char *lock_child_log_prefix(struct lock_context *lock_ctx)
641 switch (lock_ctx->type) {
643 prefix = talloc_asprintf(NULL, "lockR(%d): ", pid);
647 prefix = talloc_asprintf(NULL, "lockD(%d): ", pid);
650 case LOCK_ALLDB_PRIO:
651 prefix = talloc_asprintf(NULL, "lockP(%d): ", pid);
655 prefix = talloc_asprintf(NULL, "lockA(%d): ", pid);
664 * Schedule a new lock child process
665 * Set up callback handler and timeout handler
667 static void ctdb_lock_schedule(struct ctdb_context *ctdb)
669 struct lock_context *lock_ctx, *next_ctx;
673 if (ctdb->lock_num_current >= MAX_LOCK_PROCESSES_PER_DB) {
677 if (ctdb->lock_pending == NULL) {
681 /* Find a lock context with requests */
682 lock_ctx = ctdb->lock_pending;
683 while (lock_ctx != NULL) {
684 if (! lock_ctx->req_queue) {
685 next_ctx = lock_ctx->next;
686 DEBUG(DEBUG_INFO, ("Removing lock context without lock requests\n"));
687 DLIST_REMOVE(ctdb->lock_pending, lock_ctx);
688 ctdb->lock_num_pending--;
689 CTDB_DECREMENT_STAT(ctdb, locks.num_pending);
690 if (lock_ctx->ctdb_db) {
691 CTDB_DECREMENT_DB_STAT(lock_ctx->ctdb_db, locks.num_pending);
693 talloc_free(lock_ctx);
697 /* Found a lock context with lock requests */
702 if (lock_ctx == NULL) {
706 lock_ctx->child = -1;
707 ret = pipe(lock_ctx->fd);
709 DEBUG(DEBUG_ERR, ("Failed to create pipe in ctdb_lock_schedule\n"));
714 lock_ctx->child = ctdb_fork(ctdb);
716 if (lock_ctx->child == (pid_t)-1) {
717 DEBUG(DEBUG_ERR, ("Failed to create a child in ctdb_lock_schedule\n"));
718 close(lock_ctx->fd[0]);
719 close(lock_ctx->fd[1]);
724 if (lock_ctx->child == 0) {
726 close(lock_ctx->fd[0]);
727 debug_extra = lock_child_log_prefix(lock_ctx);
728 if (ctdb_lock_item(lock_ctx)) {
733 write(lock_ctx->fd[1], &c, 1);
735 /* Hang around, but if parent dies, terminate */
736 while (kill(parent, 0) == 0 || errno != ESRCH) {
743 close(lock_ctx->fd[1]);
744 set_close_on_exec(lock_ctx->fd[0]);
746 talloc_set_destructor(lock_ctx, ctdb_lock_context_destructor);
748 /* Set up timeout handler */
749 lock_ctx->ttimer = tevent_add_timer(ctdb->ev,
751 timeval_current_ofs(10, 0),
752 ctdb_lock_timeout_handler,
754 if (lock_ctx->ttimer == NULL) {
755 ctdb_kill(ctdb, lock_ctx->child, SIGKILL);
756 lock_ctx->child = -1;
757 talloc_set_destructor(lock_ctx, NULL);
758 close(lock_ctx->fd[0]);
762 /* Set up callback */
763 lock_ctx->tfd = tevent_add_fd(ctdb->ev,
769 if (lock_ctx->tfd == NULL) {
770 TALLOC_FREE(lock_ctx->ttimer);
771 ctdb_kill(ctdb, lock_ctx->child, SIGKILL);
772 lock_ctx->child = -1;
773 talloc_set_destructor(lock_ctx, NULL);
774 close(lock_ctx->fd[0]);
777 tevent_fd_set_auto_close(lock_ctx->tfd);
779 /* Move the context from pending to current */
780 DLIST_REMOVE(ctdb->lock_pending, lock_ctx);
781 ctdb->lock_num_pending--;
782 DLIST_ADD_END(ctdb->lock_current, lock_ctx, NULL);
783 ctdb->lock_num_current++;
788 * Find the lock context of a given type
790 static struct lock_context *find_lock_context(struct lock_context *lock_list,
791 struct ctdb_db_context *ctdb_db,
796 struct lock_context *lock_ctx;
798 /* Search active locks */
799 for (lock_ctx=lock_list; lock_ctx; lock_ctx=lock_ctx->next) {
800 if (lock_ctx->type != type) {
804 switch (lock_ctx->type) {
806 if (ctdb_db == lock_ctx->ctdb_db &&
807 key.dsize == lock_ctx->key.dsize &&
808 memcmp(key.dptr, lock_ctx->key.dptr, key.dsize) == 0) {
814 if (ctdb_db == lock_ctx->ctdb_db) {
819 case LOCK_ALLDB_PRIO:
820 if (priority == lock_ctx->priority) {
831 /* Did not find the lock context we are searching for */
841 * Lock record / db depending on type
843 static struct lock_request *ctdb_lock_internal(struct ctdb_context *ctdb,
844 struct ctdb_db_context *ctdb_db,
847 void (*callback)(void *, bool),
852 struct lock_context *lock_ctx;
853 struct lock_request *request;
855 if (callback == NULL) {
856 DEBUG(DEBUG_WARNING, ("No callback function specified, not locking"));
860 /* get a context for this key - search only the pending contexts,
861 * current contexts might in the middle of processing callbacks */
862 lock_ctx = find_lock_context(ctdb->lock_pending, ctdb_db, key, priority, type);
864 /* No existing context, create one */
865 if (lock_ctx == NULL) {
866 lock_ctx = talloc_zero(ctdb, struct lock_context);
867 if (lock_ctx == NULL) {
868 DEBUG(DEBUG_ERR, ("Failed to create a new lock context"));
872 lock_ctx->type = type;
873 lock_ctx->ctdb = ctdb;
874 lock_ctx->ctdb_db = ctdb_db;
875 lock_ctx->key.dsize = key.dsize;
877 lock_ctx->key.dptr = talloc_memdup(lock_ctx, key.dptr, key.dsize);
879 lock_ctx->key.dptr = NULL;
881 lock_ctx->priority = priority;
882 lock_ctx->auto_mark = auto_mark;
884 lock_ctx->child = -1;
885 lock_ctx->block_child = -1;
887 DLIST_ADD_END(ctdb->lock_pending, lock_ctx, NULL);
888 ctdb->lock_num_pending++;
889 CTDB_INCREMENT_STAT(ctdb, locks.num_pending);
891 CTDB_INCREMENT_DB_STAT(ctdb_db, locks.num_pending);
894 /* Start the timer when we activate the context */
895 lock_ctx->start_time = timeval_current();
898 if ((request = talloc_zero(lock_ctx, struct lock_request)) == NULL) {
902 request->lctx = lock_ctx;
903 request->callback = callback;
904 request->private_data = private_data;
906 talloc_set_destructor(request, ctdb_lock_request_destructor);
907 DLIST_ADD_END(lock_ctx->req_queue, request, NULL);
909 ctdb_lock_schedule(ctdb);
916 * obtain a lock on a record in a database
918 struct lock_request *ctdb_lock_record(struct ctdb_db_context *ctdb_db,
921 void (*callback)(void *, bool),
924 return ctdb_lock_internal(ctdb_db->ctdb,
936 * obtain a lock on a database
938 struct lock_request *ctdb_lock_db(struct ctdb_db_context *ctdb_db,
940 void (*callback)(void *, bool),
943 return ctdb_lock_internal(ctdb_db->ctdb,
955 * obtain locks on all databases of specified priority
957 struct lock_request *ctdb_lock_alldb_prio(struct ctdb_context *ctdb,
960 void (*callback)(void *, bool),
963 if (priority < 0 || priority > NUM_DB_PRIORITIES) {
964 DEBUG(DEBUG_ERR, ("Invalid db priority: %u\n", priority));
968 return ctdb_lock_internal(ctdb,
980 * obtain locks on all databases
982 struct lock_request *ctdb_lock_alldb(struct ctdb_context *ctdb,
984 void (*callback)(void *, bool),
987 return ctdb_lock_internal(ctdb,
998 * Callback routine to read the PID of blocking process from the child and log
1001 void ctdb_lock_blocked_handler(struct tevent_context *ev,
1002 struct tevent_fd *tfd,
1006 struct lock_context *lock_ctx;
1007 pid_t blocker_pid = -1;
1008 char *process_name = NULL;
1009 const char *db_name = NULL;
1011 struct ctdb_db_context *ctdb_db;
1013 struct stat stat_buf;
1015 lock_ctx = talloc_get_type_abort(private_data, struct lock_context);
1017 if (read(lock_ctx->block_fd[0], &blocker_pid, sizeof(blocker_pid)) != sizeof(blocker_pid)) {
1018 DEBUG(DEBUG_ERR, ("Error reading blocker process pid from child\n"));
1021 if (read(lock_ctx->block_fd[0], &inode, sizeof(inode)) != sizeof(inode)) {
1022 DEBUG(DEBUG_ERR, ("Error reading blocked inode from child\n"));
1026 if (blocker_pid < 0) {
1030 process_name = ctdb_get_process_name(blocker_pid);
1032 if (lock_ctx->type == LOCK_RECORD || lock_ctx->type == LOCK_DB) {
1033 db_name = lock_ctx->ctdb_db->ltdb->name;
1035 for (ctdb_db = lock_ctx->ctdb->db_list; ctdb_db; ctdb_db = ctdb_db->next) {
1036 fd = tdb_fd(ctdb_db->ltdb->tdb);
1037 if (fstat(fd, &stat_buf) == 0) {
1038 if (stat_buf.st_ino == inode) {
1039 db_name = ctdb_db->ltdb->name;
1047 DEBUG(DEBUG_WARNING,
1048 ("Process (pid=%d) blocked in locking\n", lock_ctx->child));
1049 DEBUG(DEBUG_WARNING,
1050 ("Process %s (pid=%d) locked database %s (inode %lu) for %.0lf seconds\n",
1051 (process_name ? process_name : "unknown"),
1052 blocker_pid, db_name, (unsigned long)inode,
1053 timeval_elapsed(&lock_ctx->start_time)));
1055 DEBUG(DEBUG_WARNING,
1056 ("Process %s (pid=%d) locked database (inode %lu) for %.0lf seconds\n",
1057 (process_name ? process_name : "unknown"),
1058 blocker_pid, (unsigned long)inode,
1059 timeval_elapsed(&lock_ctx->start_time)));
1063 * If ctdb is blocked by smbd for deadlock_interval, detect it as a deadlock
1064 * and kill smbd process.
1066 if (lock_ctx->ctdb->tunable.deadlock_timeout > 0 &&
1067 timeval_elapsed(&lock_ctx->start_time) > lock_ctx->ctdb->tunable.deadlock_timeout &&
1068 process_name && strstr(process_name, "smbd")) {
1069 DEBUG(DEBUG_WARNING,
1070 ("Deadlock detected. Killing smbd process (pid=%d)", blocker_pid));
1071 kill(blocker_pid, SIGKILL);
1077 if (lock_ctx->block_child > 0) {
1078 ctdb_kill(lock_ctx->ctdb, lock_ctx->block_child, SIGKILL);
1080 lock_ctx->block_child = -1;
1086 * Find processes that holds lock we are interested in
1088 void ctdb_lock_find_blocker(struct lock_context *lock_ctx)
1090 struct tevent_fd *tfd;
1093 if (pipe(lock_ctx->block_fd) < 0) {
1099 lock_ctx->block_child = ctdb_fork(lock_ctx->ctdb);
1100 if (lock_ctx->block_child == -1) {
1101 close(lock_ctx->block_fd[0]);
1102 close(lock_ctx->block_fd[1]);
1107 if (lock_ctx->block_child == 0) {
1108 struct ctdb_lock_info reqlock;
1109 pid_t blocker_pid = -1;
1112 close(lock_ctx->block_fd[0]);
1113 if (ctdb_get_lock_info(lock_ctx->child, &reqlock)) {
1114 status = ctdb_get_blocker_pid(&reqlock, &blocker_pid);
1116 /* Could not find blocker pid */
1120 write(lock_ctx->block_fd[1], &blocker_pid, sizeof(blocker_pid));
1121 write(lock_ctx->block_fd[1], &reqlock.inode, sizeof(reqlock.inode));
1123 /* Hang around till parent dies */
1124 while (kill(parent, 0) == 0 || errno != ESRCH) {
1130 /* Parent process */
1131 close(lock_ctx->block_fd[1]);
1132 set_close_on_exec(lock_ctx->block_fd[0]);
1134 tfd = tevent_add_fd(lock_ctx->ctdb->ev,
1136 lock_ctx->block_fd[0],
1138 ctdb_lock_blocked_handler,
1141 ctdb_kill(lock_ctx->ctdb, lock_ctx->block_child, SIGKILL);
1142 close(lock_ctx->block_fd[0]);