4 Copyright (C) Ronnie Sahlberg 2007
5 Copyright (C) Andrew Tridgell 2007
6 Copyright (C) Martin Schwenke 2011
8 This program is free software; you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation; either version 3 of the License, or
11 (at your option) any later version.
13 This program is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with this program; if not, see <http://www.gnu.org/licenses/>.
25 #include "system/network.h"
27 #include "lib/util/debug.h"
29 #include "common/logging.h"
30 #include "common/rb_tree.h"
32 #include "server/ipalloc_private.h"
34 /* Initialise main ipalloc state and sub-structures.
 *
 * Allocates a zeroed struct ipalloc_state on mem_ctx, records num_nodes
 * in ->num, allocates the zeroed ->noiptakeover and ->noiphost arrays
 * using the new state as their talloc context, and stores algorithm,
 * no_ip_failback and force_rebalance_nodes in the state.
 *
 * force_rebalance_nodes is stored by pointer; it is not copied here.
 *
 * Every allocation is checked for NULL and a failure is logged at
 * DEBUG_ERR.
 *
 * NOTE(review): the return statements are not visible in this excerpt;
 * presumably the new state is returned on success and NULL on failure -
 * confirm.
 */
35 struct ipalloc_state *
36 ipalloc_state_init(TALLOC_CTX *mem_ctx,
38 enum ipalloc_algorithm algorithm,
40 uint32_t *force_rebalance_nodes)
42 struct ipalloc_state *ipalloc_state =
43 talloc_zero(mem_ctx, struct ipalloc_state);
44 if (ipalloc_state == NULL) {
45 DEBUG(DEBUG_ERR, (__location__ " Out of memory\n"));
49 ipalloc_state->num = num_nodes;
/* Per-node flag arrays hang off the state itself, so they share its
 * talloc lifetime. */
51 ipalloc_state->noiptakeover =
52 talloc_zero_array(ipalloc_state,
55 if (ipalloc_state->noiptakeover == NULL) {
56 DEBUG(DEBUG_ERR, (__location__ " Out of memory\n"));
59 ipalloc_state->noiphost =
60 talloc_zero_array(ipalloc_state,
63 if (ipalloc_state->noiphost == NULL) {
64 DEBUG(DEBUG_ERR, (__location__ " Out of memory\n"));
68 ipalloc_state->algorithm = algorithm;
69 ipalloc_state->no_ip_failback = no_ip_failback;
70 ipalloc_state->force_rebalance_nodes = force_rebalance_nodes;
/* NOTE(review): presumably the shared failure path - freeing the state
 * also releases the arrays allocated with it as context. Confirm. */
74 talloc_free(ipalloc_state);
/* Callback that reconciles a new address entry with an existing one.
 *
 * parm is the new struct public_ip_list entry and data is the entry that
 * was previously stored, which may be NULL.  When a previous entry
 * exists and the new entry has pnn == -1, the new entry takes over the
 * pnn of the previous entry.
 *
 * NOTE(review): presumably passed to trbt_insertarray32_callback() when
 * building the merged IP list; the return statements are not visible in
 * this excerpt - confirm.
 */
78 static void *add_ip_callback(void *parm, void *data)
80 struct public_ip_list *this_ip = parm;
81 struct public_ip_list *prev_ip = data;
/* Nothing stored before: there is no older pnn to inherit */
83 if (prev_ip == NULL) {
/* Only an unassigned new entry inherits the older assignment */
86 if (this_ip->pnn == -1) {
87 this_ip->pnn = prev_ip->pnn;
/* Tree traversal callback used to chain entries into a linked list.
 *
 * param is the address of the list head (struct public_ip_list **) and
 * data is the entry being visited.  The visited entry is linked in
 * front of the current head by pointing its ->next at *ip_list.
 *
 * NOTE(review): the update of the head pointer and the return value are
 * not visible in this excerpt - confirm.
 */
93 static int getips_count_callback(void *param, void *data)
95 struct public_ip_list **ip_list = (struct public_ip_list **)param;
96 struct public_ip_list *new_ip = (struct public_ip_list *)data;
98 new_ip->next = *ip_list;
103 /* Nodes only know about those public addresses that they are
104 * configured to serve and no individual node has a full list of all
105 * public addresses configured across the cluster. Therefore, a
106 * merged list of all public addresses needs to be built so that IP
107 * allocation can be done.
 *
 * For every node index i below ipalloc_state->num, each address in
 * known_public_ips[i] gets a newly allocated struct public_ip_list
 * entry (talloc child of ipalloc_state) that is inserted into a
 * temporary tree keyed by ip_key() of the address.  The tree is then
 * traversed with getips_count_callback() to build the returned list,
 * and the tree is freed.
 *
 * An error is logged if known_public_ips is NULL or if an entry can
 * not be allocated.
 * NOTE(review): the return statements are not visible in this excerpt;
 * presumably NULL is returned on those errors - confirm.
 */
108 static struct public_ip_list *
109 create_merged_ip_list(struct ipalloc_state *ipalloc_state)
112 struct public_ip_list *ip_list;
113 struct ctdb_public_ip_list *public_ips;
114 struct trbt_tree *ip_tree;
/* Temporary tree; it is freed again before this function finishes */
116 ip_tree = trbt_create(ipalloc_state, 0);
118 if (ipalloc_state->known_public_ips == NULL) {
119 DEBUG(DEBUG_ERR, ("Known public IPs not set\n"));
/* Outer loop: one known address list per node index */
123 for (i=0; i < ipalloc_state->num; i++) {
125 public_ips = &ipalloc_state->known_public_ips[i];
127 for (j=0; j < public_ips->num; j++) {
128 struct public_ip_list *tmp_ip;
130 /* This is returned as part of ip_list */
131 tmp_ip = talloc_zero(ipalloc_state, struct public_ip_list);
132 if (tmp_ip == NULL) {
134 (__location__ " out of memory\n"));
135 talloc_free(ip_tree);
139 /* Do not use information about IP addresses hosted
140 * on other nodes, it may not be accurate */
141 if (public_ips->ip[j].pnn == i) {
142 tmp_ip->pnn = public_ips->ip[j].pnn;
146 tmp_ip->addr = public_ips->ip[j].addr;
/* Key is derived from the address, so the same address reported by
 * several nodes maps to the same tree slot.
 * NOTE(review): remaining arguments are not visible in this excerpt. */
149 trbt_insertarray32_callback(ip_tree,
150 IP_KEYLEN, ip_key(&public_ips->ip[j].addr),
/* Flatten the tree into a linked list headed by ip_list.
 * NOTE(review): ip_list has no initialiser at its declaration and the
 * callback reads it; confirm it is set before this call. */
157 trbt_traversearray32(ip_tree, IP_KEYLEN, getips_count_callback, &ip_list);
158 talloc_free(ip_tree);
/* Check whether every node in nodemap is inactive or disabled.
 *
 * Scans nodemap->node[0 .. num-1] looking for a node that has neither
 * NODE_FLAGS_INACTIVE nor NODE_FLAGS_DISABLED set.
 *
 * NOTE(review): the return statements are not visible in this excerpt;
 * presumably false is returned as soon as such a node is found and true
 * otherwise - confirm.
 */
163 static bool all_nodes_are_disabled(struct ctdb_node_map *nodemap)
167 for (i=0;i<nodemap->num;i++) {
168 if (!(nodemap->node[i].flags &
169 (NODE_FLAGS_INACTIVE|NODE_FLAGS_DISABLED))) {
170 /* Found one completely healthy node */
178 /* Set internal flags for IP allocation:
180 * Set NOIPTAKEOVER ip flags from per-node NoIPTakeover tunable
181 * Set NOIPHOST ip flag for each INACTIVE node
182 * if all nodes are disabled:
183 * Set NOIPHOST ip flags from per-node NoIPHostOnAllDisabled tunable
 * otherwise:
185 * Set NOIPHOST ip flags for disabled nodes
 *
 * tval_noiptakeover and tval_noiphostonalldisabled are per-node arrays
 * indexed by the same node index as nodemap->node[]; a non-zero entry
 * means the tunable is set for that node.
 * Flags in ipalloc_state->noiptakeover[] and ->noiphost[] are only ever
 * set to true here, never cleared.
 * NOTE(review): assumes nodemap->num does not exceed the length of the
 * flag arrays and of both tunable arrays - confirm against callers.
187 void ipalloc_set_node_flags(struct ipalloc_state *ipalloc_state,
188 struct ctdb_node_map *nodemap,
189 uint32_t *tval_noiptakeover,
190 uint32_t *tval_noiphostonalldisabled)
194 for (i=0;i<nodemap->num;i++) {
195 /* Can not take IPs on node with NoIPTakeover set */
196 if (tval_noiptakeover[i] != 0) {
197 ipalloc_state->noiptakeover[i] = true;
200 /* Can not host IPs on INACTIVE node */
201 if (nodemap->node[i].flags & NODE_FLAGS_INACTIVE) {
202 ipalloc_state->noiphost[i] = true;
206 if (all_nodes_are_disabled(nodemap)) {
207 /* If all nodes are disabled, can not host IPs on node
208 * with NoIPHostOnAllDisabled set
210 for (i=0;i<nodemap->num;i++) {
211 if (tval_noiphostonalldisabled[i] != 0) {
212 ipalloc_state->noiphost[i] = true;
216 /* If some nodes are not disabled, then can not host
217 * IPs on DISABLED node
219 for (i=0;i<nodemap->num;i++) {
220 if (nodemap->node[i].flags & NODE_FLAGS_DISABLED) {
221 ipalloc_state->noiphost[i] = true;
// Record the known and available public IP lists in ipalloc_state and
// build the merged address list in ->all_ips.
//
// known_ips and available_ips are stored by pointer, not copied.
// Returns true if create_merged_ip_list() produced a non-NULL list and
// false otherwise.
227 bool ipalloc_set_public_ips(struct ipalloc_state *ipalloc_state,
228 struct ctdb_public_ip_list *known_ips,
229 struct ctdb_public_ip_list *available_ips)
231 ipalloc_state->available_public_ips = available_ips;
232 ipalloc_state->known_public_ips = known_ips;
// The merged list is built from known_public_ips, so that field is
// assigned before this call.
234 ipalloc_state->all_ips = create_merged_ip_list(ipalloc_state);
236 return (ipalloc_state->all_ips != NULL);
// Decide whether the cluster can host any public IP addresses.
//
// First pass: for each node index with a non-empty known_public_ips
// list, look for an address whose pnn equals that node index, that is,
// an address the node reports as hosted on itself.
// Second pass: look for any node index with a non-empty
// available_public_ips list.
//
// NOTE(review): the return statements and the update of have_ips are not
// visible in this excerpt - confirm the exact result of each pass.
239 /* This can only return false if there are no available IPs *and*
240 * there are no IP addresses currently allocated. If the latter is
241 * true then the cluster can clearly host IPs... just not necessarily
243 bool ipalloc_can_host_ips(struct ipalloc_state *ipalloc_state)
246 bool have_ips = false;
248 for (i=0; i < ipalloc_state->num; i++) {
249 struct ctdb_public_ip_list *ips =
250 ipalloc_state->known_public_ips;
251 if (ips[i].num != 0) {
254 /* Succeed if an address is hosted on node i */
255 for (j=0; j < ips[i].num; j++) {
256 if (ips[i].ip[j].pnn == i) {
267 /* At this point there are known addresses but none are
268 * hosted. Need to check if cluster can now host some
271 for (i=0; i < ipalloc_state->num; i++) {
272 if (ipalloc_state->available_public_ips[i].num != 0) {
280 /* The calculation part of the IP allocation algorithm.
 *
 * Dispatches on ipalloc_state->algorithm to ipalloc_lcp2(),
 * ipalloc_deterministic() or ipalloc_nondeterministic() and keeps the
 * result in ret.
 *
 * Returns ipalloc_state->all_ips if ret is non-zero and NULL otherwise.
 * The returned list is the one stored in the state, not a copy.
 *
 * NOTE(review): some case labels, the break statements and the
 * declaration of ret are not visible in this excerpt - confirm which
 * algorithm value selects ipalloc_lcp2().
 */
281 struct public_ip_list *ipalloc(struct ipalloc_state *ipalloc_state)
285 switch (ipalloc_state->algorithm) {
287 ret = ipalloc_lcp2(ipalloc_state);
289 case IPALLOC_DETERMINISTIC:
290 ret = ipalloc_deterministic(ipalloc_state);
292 case IPALLOC_NONDETERMINISTIC:
293 ret = ipalloc_nondeterministic(ipalloc_state);
297 /* at this point ->pnn is the node which will own each IP
298 or -1 if there is no node that can cover this ip
301 return (ret ? ipalloc_state->all_ips : NULL);