4 Copyright (C) Andrew Tridgell 2006
6 This program is free software; you can redistribute it and/or modify
7 it under the terms of the GNU General Public License as published by
8 the Free Software Foundation; either version 3 of the License, or
9 (at your option) any later version.
11 This program is distributed in the hope that it will be useful,
12 but WITHOUT ANY WARRANTY; without even the implied warranty of
13 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 GNU General Public License for more details.
16 You should have received a copy of the GNU General Public License
17 along with this program; if not, see <http://www.gnu.org/licenses/>.
21 #include "lib/tevent/tevent.h"
22 #include "system/filesys.h"
24 #include "system/time.h"
25 #include "system/wait.h"
26 #include "system/network.h"
28 #include "../include/ctdb_private.h"
/*
 * Members and initial values of the file-scope options object.
 * The popt table in main() stores parsed command-line values directly
 * into these fields; the designated initializers further down give the
 * values present before parsing.
 * NOTE(review): the lines that open and close this declaration are not
 * present in this listing, and some fields used elsewhere in the file
 * (options.nlist, options.logfile, options.db_dir, ...) have no visible
 * member declaration here.
 */
32 const char *transport; /* --transport: protocol transport */
33 const char *myaddress; /* --listen: address to listen on */
34 const char *public_address_list; /* --public-addresses: public address list file */
35 const char *event_script_dir; /* --event-script-dir: event script directory */
36 const char *notification_script; /* --notification-script: notification script file */
38 const char *recovery_lock_file; /* --reclock: location of recovery lock file */
40 const char *db_dir_persistent; /* --dbdir-persistent: directory for persistent tdb files */
41 const char *db_dir_state; /* --dbdir-state: directory for internal state tdb files */
42 const char *public_interface; /* --public-interface: public interface */
43 const char *single_public_ip; /* --single-public-ip: single public ip */
47 int start_as_disabled; /* --start-as-disabled: node starts in disabled state */
/* --max-persistent-check-errors; main() stores a negative value as 0xFFFFFFFFFFFFFFFFLL */
54 int max_persistent_check_errors;
/* initial values, built from the ETCDIR, LOGDIR and VARDIR prefixes */
56 .nlist = ETCDIR "/ctdb/nodes",
58 .event_script_dir = ETCDIR "/ctdb/events.d",
59 .logfile = LOGDIR "/log.ctdb",
60 .db_dir = VARDIR "/ctdb",
61 .db_dir_persistent = VARDIR "/ctdb/persistent",
62 .db_dir_state = VARDIR "/ctdb/state",
/* initial log level of event script output (see --script-log-level) */
63 .script_log_level = DEBUG_ERR,
70 called by the transport layer when a packet comes in
/*
 * Packet upcall; installed as .recv_pkt in ctdb_upcalls.
 *
 * ctdb   - daemon context; the node_packets_recv statistic and the
 *          rx_cnt of the sending node are updated here
 * data   - packet bytes, treated as starting with a struct ctdb_req_header
 * length - packet length; not referenced in the lines visible here
 *
 * NOTE(review): header fields are read without consulting length in this
 * function - presumably the transport checks the header size before
 * calling; confirm against the transport code.
 */
72 static void ctdb_recv_pkt(struct ctdb_context *ctdb, uint8_t *data, uint32_t length)
74 struct ctdb_req_header *hdr = (struct ctdb_req_header *)data;
76 CTDB_INCREMENT_STAT(ctdb, node_packets_recv);
78 /* bump the rx counter for this source node, so we know it is alive */
79 if (ctdb_validate_pnn(ctdb, hdr->srcnode)) {
80 /* as a special case, redirected calls (CTDB_REQ_CALL with a non-zero hopcount) do not increment the rx_cnt */
81 if (hdr->operation != CTDB_REQ_CALL ||
82 ((struct ctdb_req_call *)hdr)->hopcount == 0) {
83 ctdb->nodes[hdr->srcnode]->rx_cnt++;
/* pass the packet on for processing */
87 ctdb_input_pkt(ctdb, hdr);
/*
 * Load the node list named by options.nlist into the context via
 * ctdb_set_nlist(), logging at DEBUG_ALERT with ctdb_errstr() on failure.
 * NOTE(review): the failure test and whatever follows the log call are
 * not visible in this listing - confirm whether the process exits here.
 */
90 void ctdb_load_nodes_file(struct ctdb_context *ctdb)
94 ret = ctdb_set_nlist(ctdb, options.nlist);
96 DEBUG(DEBUG_ALERT,("ctdb_set_nlist failed - %s\n", ctdb_errstr(ctdb)));
/*
 * Callback table that main() installs as ctdb->upcalls.
 * recv_pkt is the packet handler defined in this file; node_dead and
 * node_connected are not defined in the visible part of this file.
 */
101 static const struct ctdb_upcalls ctdb_upcalls = {
102 .recv_pkt = ctdb_recv_pkt,
103 .node_dead = ctdb_node_dead,
104 .node_connected = ctdb_node_connected
/*
 * Daemon entry point.
 *
 * Parses the command line with popt into the options object (plus
 * interactive, log_ringbuf_size and fast_start), creates the event
 * context and the ctdb context, copies the option values onto the
 * context through the ctdb_set_*() helpers, and returns the result of
 * ctdb_start_daemon().
 *
 * Details visible in this listing:
 *  - the LMASTER and RECMASTER capabilities are set unless --no-lmaster
 *    or --no-recmaster was given; LVS is set only when --lvs was given
 *  - --single-public-ip without --public-interface logs an alert whose
 *    text says the daemon is exiting
 *  - a negative --max-persistent-check-errors is stored as
 *    0xFFFFFFFFFFFFFFFFLL; any other value is cast to uint64_t
 *  - CTDB_BASE is set only when it is not already in the environment
 *  - ctdb_start_daemon() gets False as its second argument when
 *    --interactive was given, True otherwise
 *
 * NOTE(review): this listing omits lines (local declarations, the tests
 * after each ret = ... call, closing braces), so the exact error handling
 * cannot be confirmed from here. The comment that starts with
 * if a node-ip was specified also has no visible terminator.
 */
112 int main(int argc, const char *argv[])
114 struct ctdb_context *ctdb;
/* option table: each entry names the variable that popt fills in */
117 struct poptOption popt_options[] = {
120 { "interactive", 'i', POPT_ARG_NONE, &interactive, 0, "don't fork", NULL },
121 { "public-addresses", 0, POPT_ARG_STRING, &options.public_address_list, 0, "public address list file", "filename" },
122 { "public-interface", 0, POPT_ARG_STRING, &options.public_interface, 0, "public interface", "interface"},
123 { "single-public-ip", 0, POPT_ARG_STRING, &options.single_public_ip, 0, "single public ip", "ip-address"},
124 { "event-script-dir", 0, POPT_ARG_STRING, &options.event_script_dir, 0, "event script directory", "dirname" },
125 { "logfile", 0, POPT_ARG_STRING, &options.logfile, 0, "log file location", "filename" },
126 { "nlist", 0, POPT_ARG_STRING, &options.nlist, 0, "node list file", "filename" },
127 { "node-ip", 0, POPT_ARG_STRING, &options.node_ip, 0, "node ip", "ip-address"},
128 { "notification-script", 0, POPT_ARG_STRING, &options.notification_script, 0, "notification script", "filename" },
129 { "listen", 0, POPT_ARG_STRING, &options.myaddress, 0, "address to listen on", "address" },
130 { "transport", 0, POPT_ARG_STRING, &options.transport, 0, "protocol transport", NULL },
131 { "dbdir", 0, POPT_ARG_STRING, &options.db_dir, 0, "directory for the tdb files", NULL },
132 { "dbdir-persistent", 0, POPT_ARG_STRING, &options.db_dir_persistent, 0, "directory for persistent tdb files", NULL },
133 { "dbdir-state", 0, POPT_ARG_STRING, &options.db_dir_state, 0, "directory for internal state tdb files", NULL },
134 { "reclock", 0, POPT_ARG_STRING, &options.recovery_lock_file, 0, "location of recovery lock file", "filename" },
135 { "valgrinding", 0, POPT_ARG_NONE, &options.valgrinding, 0, "disable setscheduler SCHED_FIFO call, use mmap for tdbs", NULL },
136 { "syslog", 0, POPT_ARG_NONE, &options.use_syslog, 0, "log messages to syslog", NULL },
137 { "start-as-disabled", 0, POPT_ARG_NONE, &options.start_as_disabled, 0, "Node starts in disabled state", NULL },
138 { "start-as-stopped", 0, POPT_ARG_NONE, &options.start_as_stopped, 0, "Node starts in stopped state", NULL },
139 { "no-lmaster", 0, POPT_ARG_NONE, &options.no_lmaster, 0, "disable lmaster role on this node", NULL },
140 { "no-recmaster", 0, POPT_ARG_NONE, &options.no_recmaster, 0, "disable recmaster role on this node", NULL },
141 { "lvs", 0, POPT_ARG_NONE, &options.lvs, 0, "lvs is enabled on this node", NULL },
/* NOTE(review): the fifth member of a poptOption is val (returned by poptGetNextOpt when non-zero), not a default; DEBUG_ERR here and on log-ringbuf-size below is presumably 0 - confirm */
142 { "script-log-level", 0, POPT_ARG_INT, &options.script_log_level, DEBUG_ERR, "log level of event script output", NULL },
143 { "nopublicipcheck", 0, POPT_ARG_NONE, &options.no_publicipcheck, 0, "don't check we have/don't have the correct public ip addresses", NULL },
144 { "max-persistent-check-errors", 0, POPT_ARG_INT,
145 &options.max_persistent_check_errors, 0,
146 "max allowed persistent check errors (default 0)", NULL },
147 { "log-ringbuf-size", 0, POPT_ARG_INT, &log_ringbuf_size, DEBUG_ERR, "Number of log messages we can store in the memory ringbuffer", NULL },
148 { "sloppy-start", 0, POPT_ARG_NONE, &fast_start, 0, "Do not perform full recovery on start", NULL },
152 const char **extra_argv;
155 struct event_context *ev;
/* parse the command line; poptGetNextOpt returns -1 once all options are consumed */
157 pc = poptGetContext(argv[0], argc, argv, popt_options, POPT_CONTEXT_KEEP_FIRST);
159 while ((opt = poptGetNextOpt(pc)) != -1) {
162 fprintf(stderr, "Invalid option %s: %s\n",
163 poptBadOption(pc, 0), poptStrerror(opt));
168 /* set up the remaining options for the main program to use */
169 extra_argv = poptGetArgs(pc);
/* count the leftover arguments. NOTE(review): poptGetArgs may return NULL; any guard is not visible in this listing */
172 while (extra_argv[extra_argc]) extra_argc++;
/* process-wide setup before the context exists */
175 talloc_enable_null_tracking();
177 ctdb_block_signal(SIGPIPE);
178 fault_setup("ctdbd");
/* create the event context and allow nested event loops on it */
180 ev = event_context_init(NULL);
181 tevent_loop_allow_nesting(ev);
183 ctdb = ctdb_cmdline_init(ev);
185 ctdb->start_as_disabled = options.start_as_disabled;
186 ctdb->start_as_stopped = options.start_as_stopped;
188 script_log_level = options.script_log_level;
/* select the log destination; a failure is reported with printf */
190 ret = ctdb_set_logfile(ctdb, options.logfile, options.use_syslog);
192 printf("ctdb_set_logfile to %s failed - %s\n",
193 options.use_syslog?"syslog":options.logfile, ctdb_errstr(ctdb));
197 DEBUG(DEBUG_NOTICE,("Starting CTDB daemon\n"));
/* initial runtime state: three timestamps set to now, recovery_master set to (uint32_t)-1, recovery_lock_fd set to -1 */
199 gettimeofday(&ctdb->ctdbd_start_time, NULL);
200 gettimeofday(&ctdb->last_recovery_started, NULL);
201 gettimeofday(&ctdb->last_recovery_finished, NULL);
202 ctdb->recovery_mode = CTDB_RECOVERY_NORMAL;
203 ctdb->recovery_master = (uint32_t)-1;
204 ctdb->upcalls = &ctdb_upcalls;
205 ctdb->idr = idr_init(ctdb);
206 ctdb->recovery_lock_fd = -1;
/* load tunable defaults, then copy --nopublicipcheck into disable_ip_failover */
208 ctdb_tunables_set_defaults(ctdb);
210 ctdb->tunable.disable_ip_failover = options.no_publicipcheck;
212 ret = ctdb_set_recovery_lock_file(ctdb, options.recovery_lock_file);
214 DEBUG(DEBUG_ALERT,("ctdb_set_recovery_lock_file failed - %s\n", ctdb_errstr(ctdb)));
218 ret = ctdb_set_transport(ctdb, options.transport);
220 DEBUG(DEBUG_ALERT,("ctdb_set_transport failed - %s\n", ctdb_errstr(ctdb)));
224 /* tell ctdb what address to listen on */
225 if (options.myaddress) {
226 ret = ctdb_set_address(ctdb, options.myaddress);
228 DEBUG(DEBUG_ALERT,("ctdb_set_address failed - %s\n", ctdb_errstr(ctdb)));
233 /* set ctdbd capabilities */
234 ctdb->capabilities = 0;
235 if (options.no_lmaster == 0) {
236 ctdb->capabilities |= CTDB_CAP_LMASTER;
238 if (options.no_recmaster == 0) {
239 ctdb->capabilities |= CTDB_CAP_RECMASTER;
241 if (options.lvs != 0) {
242 ctdb->capabilities |= CTDB_CAP_LVS;
245 /* tell ctdb what nodes are available */
246 ctdb_load_nodes_file(ctdb);
248 /* if a node-ip was specified, verify that it exists in the
251 if (options.node_ip != NULL) {
252 DEBUG(DEBUG_NOTICE,("IP for this node is %s\n", options.node_ip));
253 ret = ctdb_ip_to_nodeid(ctdb, options.node_ip);
255 DEBUG(DEBUG_ALERT,("The specified node-ip:%s is not a valid node address. Exiting.\n", options.node_ip));
258 ctdb->node_ip = options.node_ip;
259 DEBUG(DEBUG_NOTICE,("This is node %d\n", ret));
262 if (options.db_dir) {
263 ret = ctdb_set_tdb_dir(ctdb, options.db_dir);
265 DEBUG(DEBUG_ALERT,("ctdb_set_tdb_dir failed - %s\n", ctdb_errstr(ctdb)));
269 if (options.db_dir_persistent) {
270 ret = ctdb_set_tdb_dir_persistent(ctdb, options.db_dir_persistent);
272 DEBUG(DEBUG_ALERT,("ctdb_set_tdb_dir_persistent failed - %s\n", ctdb_errstr(ctdb)));
276 if (options.db_dir_state) {
277 ret = ctdb_set_tdb_dir_state(ctdb, options.db_dir_state);
279 DEBUG(DEBUG_ALERT,("ctdb_set_tdb_dir_state failed - %s\n", ctdb_errstr(ctdb)));
284 if (options.public_interface) {
285 ctdb->default_public_interface = talloc_strdup(ctdb, options.public_interface);
286 CTDB_NO_MEMORY(ctdb, ctdb->default_public_interface);
289 if (options.single_public_ip) {
290 if (options.public_interface == NULL) {
291 DEBUG(DEBUG_ALERT,("--single_public_ip used but --public_interface is not specified. You must specify the public interface when using single public ip. Exiting\n"));
295 ret = ctdb_set_single_public_ip(ctdb, options.public_interface,
296 options.single_public_ip);
298 DEBUG(DEBUG_ALERT,("Invalid --single-public-ip argument : %s . This is not a valid ip address. Exiting.\n", options.single_public_ip));
303 ret = ctdb_set_event_script_dir(ctdb, options.event_script_dir);
305 DEBUG(DEBUG_ALERT,("Unable to setup event script directory\n"));
309 if (options.notification_script != NULL) {
310 ret = ctdb_set_notification_script(ctdb, options.notification_script);
312 DEBUG(DEBUG_ALERT,("Unable to setup notification script\n"));
317 ctdb->valgrinding = options.valgrinding;
318 ctdb->do_setsched = !ctdb->valgrinding;
320 if (options.max_persistent_check_errors < 0) {
321 ctdb->max_persistent_check_errors = 0xFFFFFFFFFFFFFFFFLL;
323 ctdb->max_persistent_check_errors = (uint64_t)options.max_persistent_check_errors;
326 if (getenv("CTDB_BASE") == NULL) {
327 /* set up an environment variable for the event scripts to use
328 to find the installation directory */
329 setenv("CTDB_BASE", ETCDIR "/ctdb", 1);
332 /* start the protocol running (as a child) */
333 return ctdb_start_daemon(ctdb, interactive?False:True, options.use_syslog, options.public_address_list);