qdevice-net-heuristics.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487
  1. /*
  2. * Copyright (c) 2017-2020 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Jan Friesse (jfriesse@redhat.com)
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of the Red Hat, Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. #include "log.h"
  35. #include "qdevice-net-algorithm.h"
  36. #include "qdevice-net-cast-vote-timer.h"
  37. #include "qdevice-net-heuristics.h"
  38. #include "qdevice-net-send.h"
  39. #include "qdevice-net-votequorum.h"
  40. enum tlv_heuristics
  41. qdevice_net_heuristics_exec_result_to_tlv(enum qdevice_heuristics_exec_result exec_result)
  42. {
  43. enum tlv_heuristics res;
  44. switch (exec_result) {
  45. case QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED: res = TLV_HEURISTICS_UNDEFINED; break;
  46. case QDEVICE_HEURISTICS_EXEC_RESULT_PASS: res = TLV_HEURISTICS_PASS; break;
  47. case QDEVICE_HEURISTICS_EXEC_RESULT_FAIL: res = TLV_HEURISTICS_FAIL; break;
  48. default:
  49. log(LOG_ERR, "qdevice_net_heuristics_exec_result_to_tlv: Unhandled "
  50. "heuristics exec result %s",
  51. qdevice_heuristics_exec_result_to_str(exec_result));
  52. exit(EXIT_FAILURE);
  53. break;
  54. }
  55. return (res);
  56. }
  57. static int
  58. qdevice_net_regular_heuristics_exec_result_callback(uint32_t seq_number,
  59. enum qdevice_heuristics_exec_result exec_result, void *user_data1, void *user_data2)
  60. {
  61. struct qdevice_heuristics_instance *heuristics_instance;
  62. struct qdevice_instance *instance;
  63. struct qdevice_net_instance *net_instance;
  64. int send_msg;
  65. enum tlv_vote vote;
  66. enum tlv_heuristics heuristics;
  67. instance = (struct qdevice_instance *)user_data1;
  68. heuristics_instance = &instance->heuristics_instance;
  69. net_instance = instance->model_data;
  70. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  71. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  72. log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  73. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  74. net_instance->schedule_disconnect = 1;
  75. return (0);
  76. }
  77. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  78. if (exec_result == QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED) {
  79. /*
  80. * Can happen when user disables heuristics during runtime
  81. */
  82. return (0);
  83. }
  84. if (net_instance->latest_heuristics_result != heuristics) {
  85. log(heuristics == TLV_HEURISTICS_PASS ? LOG_NOTICE : LOG_ERR,
  86. "Heuristics result changed from %s to %s",
  87. tlv_heuristics_to_str(net_instance->latest_heuristics_result),
  88. tlv_heuristics_to_str(heuristics));
  89. if (net_instance->state != QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS) {
  90. /*
  91. * Not connected to qnetd
  92. */
  93. send_msg = 0;
  94. } else {
  95. send_msg = 1;
  96. }
  97. vote = TLV_VOTE_NO_CHANGE;
  98. if (qdevice_net_algorithm_heuristics_change(net_instance, &heuristics, &send_msg,
  99. &vote) == -1) {
  100. log(LOG_ERR, "Algorithm returned error. Disconnecting.");
  101. net_instance->disconnect_reason =
  102. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  103. net_instance->schedule_disconnect = 1;
  104. return (0);
  105. } else {
  106. log(LOG_DEBUG, "Algorithm decided to %s message with heuristics result "
  107. "%s and result vote is %s", (send_msg ? "send" : "not send"),
  108. tlv_heuristics_to_str(heuristics), tlv_vote_to_str(vote));
  109. }
  110. if (send_msg) {
  111. if (heuristics == TLV_HEURISTICS_UNDEFINED) {
  112. log(LOG_ERR, "Inconsistent algorithm result. "
  113. "It's not possible to send message with undefined heuristics. "
  114. "Disconnecting.");
  115. net_instance->disconnect_reason =
  116. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  117. net_instance->schedule_disconnect = 1;
  118. return (0);
  119. }
  120. if (!net_instance->server_supports_heuristics) {
  121. log(LOG_ERR, "Server doesn't support heuristics. "
  122. "Disconnecting.");
  123. net_instance->disconnect_reason =
  124. QDEVICE_NET_DISCONNECT_REASON_SERVER_DOESNT_SUPPORT_REQUIRED_OPT;
  125. net_instance->schedule_disconnect = 1;
  126. return (0);
  127. }
  128. if (qdevice_net_send_heuristics_change(net_instance, heuristics) != 0) {
  129. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  130. net_instance->schedule_disconnect = 1;
  131. return (0);
  132. }
  133. }
  134. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  135. log(LOG_CRIT, "qdevice_net_heuristics_exec_result_callback "
  136. "Can't update cast vote timer");
  137. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  138. net_instance->schedule_disconnect = 1;
  139. return (0);
  140. }
  141. }
  142. net_instance->latest_regular_heuristics_result = heuristics;
  143. net_instance->latest_heuristics_result = heuristics;
  144. if (qdevice_net_heuristics_schedule_timer(net_instance) != 0) {
  145. return (0);
  146. }
  147. return (0);
  148. }
  149. static int
  150. qdevice_net_connect_heuristics_exec_result_callback(uint32_t seq_number,
  151. enum qdevice_heuristics_exec_result exec_result, void *user_data1, void *user_data2)
  152. {
  153. struct qdevice_heuristics_instance *heuristics_instance;
  154. struct qdevice_instance *instance;
  155. struct qdevice_net_instance *net_instance;
  156. enum tlv_vote vote;
  157. enum tlv_heuristics heuristics;
  158. int send_config_node_list;
  159. int send_membership_node_list;
  160. int send_quorum_node_list;
  161. struct tlv_ring_id tlv_rid;
  162. enum tlv_quorate quorate;
  163. instance = (struct qdevice_instance *)user_data1;
  164. heuristics_instance = &instance->heuristics_instance;
  165. net_instance = instance->model_data;
  166. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  167. qdevice_net_connect_heuristics_exec_result_callback, 0) != 0) {
  168. log(LOG_ERR, "Can't deactivate net connect heuristics exec callback notifier");
  169. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  170. net_instance->schedule_disconnect = 1;
  171. return (0);
  172. }
  173. if (net_instance->state != QDEVICE_NET_INSTANCE_STATE_WAITING_INIT_REPLY) {
  174. /*
  175. * Not connected to qnetd -> heuristics will be called again on new connect
  176. */
  177. log(LOG_DEBUG, "Received unexpected net connect heuristics in state %u",
  178. net_instance->state);
  179. return (0);
  180. }
  181. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  182. send_config_node_list = 1;
  183. send_membership_node_list = 1;
  184. send_quorum_node_list = 1;
  185. vote = TLV_VOTE_WAIT_FOR_REPLY;
  186. if (qdevice_net_algorithm_connected(net_instance, &heuristics, &send_config_node_list,
  187. &send_membership_node_list, &send_quorum_node_list, &vote) != 0) {
  188. log(LOG_DEBUG, "Algorithm returned error. Disconnecting.");
  189. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_ALGO_CONNECTED_ERR;
  190. return (0);
  191. } else {
  192. log(LOG_DEBUG, "Algorithm decided to %s config node list, %s membership "
  193. "node list, %s quorum node list, heuristics is %s and result vote is %s",
  194. (send_config_node_list ? "send" : "not send"),
  195. (send_membership_node_list ? "send" : "not send"),
  196. (send_quorum_node_list ? "send" : "not send"),
  197. tlv_heuristics_to_str(heuristics),
  198. tlv_vote_to_str(vote));
  199. }
  200. /*
  201. * Inform qnetd about connection options
  202. */
  203. if (net_instance->server_supports_keep_active_partition_tie_breaker) {
  204. if (qdevice_net_send_set_option(net_instance, 0, 0,
  205. net_instance->server_supports_keep_active_partition_tie_breaker,
  206. net_instance->keep_active_partition_tie_breaker) != 0) {
  207. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  208. return (0);
  209. }
  210. }
  211. /*
  212. * Now we can finally really send node list, votequorum node list and update timer
  213. */
  214. if (send_config_node_list) {
  215. if (qdevice_net_send_config_node_list(net_instance,
  216. &instance->config_node_list,
  217. instance->config_node_list_version_set,
  218. instance->config_node_list_version, 1) != 0) {
  219. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  220. return (0);
  221. }
  222. }
  223. if (send_membership_node_list) {
  224. qdevice_net_votequorum_ring_id_to_tlv(&tlv_rid,
  225. &instance->vq_node_list_ring_id);
  226. if (qdevice_net_send_membership_node_list(net_instance, &tlv_rid,
  227. instance->vq_node_list_entries,
  228. instance->vq_node_list,
  229. heuristics) != 0) {
  230. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  231. return (0);
  232. }
  233. }
  234. if (send_quorum_node_list) {
  235. quorate = (instance->vq_quorum_quorate ?
  236. TLV_QUORATE_QUORATE : TLV_QUORATE_INQUORATE);
  237. if (qdevice_net_send_quorum_node_list(net_instance,
  238. quorate,
  239. instance->vq_quorum_node_list_entries,
  240. instance->vq_quorum_node_list) != 0) {
  241. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  242. return (0);
  243. }
  244. }
  245. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  246. log(LOG_CRIT, "qdevice_net_connect_heuristics_exec_result_callback fatal error. "
  247. " Can't update cast vote timer vote");
  248. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  249. }
  250. net_instance->state = QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS;
  251. net_instance->connected_since_time = time(NULL);
  252. net_instance->latest_connect_heuristics_result = heuristics;
  253. net_instance->latest_heuristics_result = heuristics;
  254. return (0);
  255. }
  256. static int
  257. qdevice_net_heuristics_timer_callback(void *data1, void *data2)
  258. {
  259. struct qdevice_net_instance *net_instance;
  260. struct qdevice_heuristics_instance *heuristics_instance;
  261. net_instance = (struct qdevice_net_instance *)data1;
  262. heuristics_instance = &net_instance->qdevice_instance_ptr->heuristics_instance;
  263. if (qdevice_heuristics_waiting_for_result(heuristics_instance)) {
  264. log(LOG_DEBUG, "Not executing regular heuristics because other heuristics is already running.");
  265. return (1);
  266. }
  267. net_instance->regular_heuristics_timer = NULL;
  268. log(LOG_DEBUG, "Executing regular heuristics.");
  269. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  270. qdevice_net_regular_heuristics_exec_result_callback, 1) != 0) {
  271. log(LOG_ERR, "Can't activate net regular heuristics exec callback notifier");
  272. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  273. net_instance->schedule_disconnect = 1;
  274. return (0);
  275. }
  276. if (qdevice_heuristics_exec(heuristics_instance,
  277. net_instance->qdevice_instance_ptr->sync_in_progress) != 0) {
  278. log(LOG_ERR, "Can't execute regular heuristics.");
  279. net_instance->schedule_disconnect = 1;
  280. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  281. return (0);
  282. }
  283. /*
  284. * Do not schedule this callback again. It's going to be scheduled in the
  285. * qdevice_net_heuristics_exec_result_callback
  286. */
  287. return (0);
  288. }
  289. int
  290. qdevice_net_heuristics_stop_timer(struct qdevice_net_instance *net_instance)
  291. {
  292. struct qdevice_instance *instance;
  293. struct qdevice_heuristics_instance *heuristics_instance;
  294. instance = net_instance->qdevice_instance_ptr;
  295. heuristics_instance = &instance->heuristics_instance;
  296. if (net_instance->regular_heuristics_timer != NULL) {
  297. log(LOG_DEBUG, "Regular heuristics timer stopped");
  298. timer_list_entry_delete(pr_poll_loop_get_timer_list(&instance->main_poll_loop),
  299. net_instance->regular_heuristics_timer);
  300. net_instance->regular_heuristics_timer = NULL;
  301. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  302. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  303. log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  304. net_instance->disconnect_reason =
  305. QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  306. net_instance->schedule_disconnect = 1;
  307. return (-1);
  308. }
  309. }
  310. return (0);
  311. }
  312. int
  313. qdevice_net_heuristics_schedule_timer(struct qdevice_net_instance *net_instance)
  314. {
  315. uint32_t interval;
  316. struct qdevice_instance *instance;
  317. struct qdevice_heuristics_instance *heuristics_instance;
  318. instance = net_instance->qdevice_instance_ptr;
  319. heuristics_instance = &instance->heuristics_instance;
  320. if (heuristics_instance->mode != QDEVICE_HEURISTICS_MODE_ENABLED) {
  321. log(LOG_DEBUG, "Not scheduling heuristics timer because mode is not enabled");
  322. if (qdevice_net_heuristics_stop_timer(net_instance) != 0) {
  323. return (-1);
  324. }
  325. return (0);
  326. }
  327. if (net_instance->regular_heuristics_timer != NULL) {
  328. log(LOG_DEBUG, "Not scheduling heuristics timer because it is already scheduled");
  329. return (0);
  330. }
  331. interval = heuristics_instance->interval;
  332. log(LOG_DEBUG, "Scheduling next regular heuristics in %"PRIu32"ms", interval);
  333. net_instance->regular_heuristics_timer = timer_list_add(
  334. pr_poll_loop_get_timer_list(&instance->main_poll_loop),
  335. interval,
  336. qdevice_net_heuristics_timer_callback,
  337. (void *)net_instance, NULL);
  338. if (net_instance->regular_heuristics_timer == NULL) {
  339. log(LOG_ERR, "Can't schedule regular heuristics.");
  340. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_HEURISTICS_TIMER;
  341. net_instance->schedule_disconnect = 1;
  342. return (-1);
  343. }
  344. return (0);
  345. }
  346. int
  347. qdevice_net_heuristics_init(struct qdevice_net_instance *net_instance)
  348. {
  349. if (qdevice_heuristics_result_notifier_list_add(
  350. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  351. qdevice_net_regular_heuristics_exec_result_callback,
  352. net_instance->qdevice_instance_ptr, NULL) == NULL) {
  353. log(LOG_ERR, "Can't add net regular heuristics exec callback into notifier");
  354. return (-1);
  355. }
  356. if (qdevice_heuristics_result_notifier_list_add(
  357. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  358. qdevice_net_connect_heuristics_exec_result_callback,
  359. net_instance->qdevice_instance_ptr, NULL) == NULL) {
  360. log(LOG_ERR, "Can't add net connect heuristics exec callback into notifier");
  361. return (-1);
  362. }
  363. return (0);
  364. }
  365. int
  366. qdevice_net_heuristics_exec_after_connect(struct qdevice_net_instance *net_instance)
  367. {
  368. struct qdevice_instance *instance;
  369. struct qdevice_heuristics_instance *heuristics_instance;
  370. instance = net_instance->qdevice_instance_ptr;
  371. heuristics_instance = &instance->heuristics_instance;
  372. log(LOG_DEBUG, "Executing after-connect heuristics.");
  373. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  374. qdevice_net_connect_heuristics_exec_result_callback, 1) != 0) {
  375. log(LOG_ERR, "Can't activate net connect heuristics exec callback notifier");
  376. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  377. net_instance->schedule_disconnect = 1;
  378. return (-1);
  379. }
  380. if (qdevice_heuristics_exec(heuristics_instance,
  381. instance->sync_in_progress) != 0) {
  382. log(LOG_ERR, "Can't execute connect heuristics.");
  383. net_instance->schedule_disconnect = 1;
  384. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  385. return (-1);
  386. }
  387. return (0);
  388. }