qdevice-net-heuristics.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463
  1. /*
  2. * Copyright (c) 2017-2020 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Jan Friesse (jfriesse@redhat.com)
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of the Red Hat, Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. #include "log.h"
  35. #include "qdevice-net-algorithm.h"
  36. #include "qdevice-net-cast-vote-timer.h"
  37. #include "qdevice-net-heuristics.h"
  38. #include "qdevice-net-send.h"
  39. #include "qdevice-net-votequorum.h"
  40. enum tlv_heuristics
  41. qdevice_net_heuristics_exec_result_to_tlv(enum qdevice_heuristics_exec_result exec_result)
  42. {
  43. enum tlv_heuristics res;
  44. switch (exec_result) {
  45. case QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED: res = TLV_HEURISTICS_UNDEFINED; break;
  46. case QDEVICE_HEURISTICS_EXEC_RESULT_PASS: res = TLV_HEURISTICS_PASS; break;
  47. case QDEVICE_HEURISTICS_EXEC_RESULT_FAIL: res = TLV_HEURISTICS_FAIL; break;
  48. default:
  49. log(LOG_ERR, "qdevice_net_heuristics_exec_result_to_tlv: Unhandled "
  50. "heuristics exec result %s",
  51. qdevice_heuristics_exec_result_to_str(exec_result));
  52. exit(EXIT_FAILURE);
  53. break;
  54. }
  55. return (res);
  56. }
  57. static int
  58. qdevice_net_regular_heuristics_exec_result_callback(void *heuristics_instance_ptr,
  59. uint32_t seq_number, enum qdevice_heuristics_exec_result exec_result)
  60. {
  61. struct qdevice_heuristics_instance *heuristics_instance;
  62. struct qdevice_instance *instance;
  63. struct qdevice_net_instance *net_instance;
  64. int send_msg;
  65. enum tlv_vote vote;
  66. enum tlv_heuristics heuristics;
  67. heuristics_instance = (struct qdevice_heuristics_instance *)heuristics_instance_ptr;
  68. instance = heuristics_instance->qdevice_instance_ptr;
  69. net_instance = instance->model_data;
  70. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  71. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  72. log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  73. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  74. net_instance->schedule_disconnect = 1;
  75. return (0);
  76. }
  77. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  78. if (exec_result == QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED) {
  79. /*
  80. * Can happen when user disables heuristics during runtime
  81. */
  82. return (0);
  83. }
  84. if (net_instance->latest_heuristics_result != heuristics) {
  85. log(heuristics == TLV_HEURISTICS_PASS ? LOG_NOTICE : LOG_ERR,
  86. "Heuristics result changed from %s to %s",
  87. tlv_heuristics_to_str(net_instance->latest_heuristics_result),
  88. tlv_heuristics_to_str(heuristics));
  89. if (net_instance->state != QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS) {
  90. /*
  91. * Not connected to qnetd
  92. */
  93. send_msg = 0;
  94. } else {
  95. send_msg = 1;
  96. }
  97. vote = TLV_VOTE_NO_CHANGE;
  98. if (qdevice_net_algorithm_heuristics_change(net_instance, &heuristics, &send_msg,
  99. &vote) == -1) {
  100. log(LOG_ERR, "Algorithm returned error. Disconnecting.");
  101. net_instance->disconnect_reason =
  102. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  103. net_instance->schedule_disconnect = 1;
  104. return (0);
  105. } else {
  106. log(LOG_DEBUG, "Algorithm decided to %s message with heuristics result "
  107. "%s and result vote is %s", (send_msg ? "send" : "not send"),
  108. tlv_heuristics_to_str(heuristics), tlv_vote_to_str(vote));
  109. }
  110. if (send_msg) {
  111. if (heuristics == TLV_HEURISTICS_UNDEFINED) {
  112. log(LOG_ERR, "Inconsistent algorithm result. "
  113. "It's not possible to send message with undefined heuristics. "
  114. "Disconnecting.");
  115. net_instance->disconnect_reason =
  116. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  117. net_instance->schedule_disconnect = 1;
  118. return (0);
  119. }
  120. if (!net_instance->server_supports_heuristics) {
  121. log(LOG_ERR, "Server doesn't support heuristics. "
  122. "Disconnecting.");
  123. net_instance->disconnect_reason =
  124. QDEVICE_NET_DISCONNECT_REASON_SERVER_DOESNT_SUPPORT_REQUIRED_OPT;
  125. net_instance->schedule_disconnect = 1;
  126. return (0);
  127. }
  128. if (qdevice_net_send_heuristics_change(net_instance, heuristics) != 0) {
  129. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  130. net_instance->schedule_disconnect = 1;
  131. return (0);
  132. }
  133. }
  134. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  135. log(LOG_CRIT, "qdevice_net_heuristics_exec_result_callback "
  136. "Can't update cast vote timer");
  137. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  138. net_instance->schedule_disconnect = 1;
  139. return (0);
  140. }
  141. }
  142. net_instance->latest_regular_heuristics_result = heuristics;
  143. net_instance->latest_heuristics_result = heuristics;
  144. if (qdevice_net_heuristics_schedule_timer(net_instance) != 0) {
  145. return (0);
  146. }
  147. return (0);
  148. }
  149. static int
  150. qdevice_net_connect_heuristics_exec_result_callback(void *heuristics_instance_ptr,
  151. uint32_t seq_number, enum qdevice_heuristics_exec_result exec_result)
  152. {
  153. struct qdevice_heuristics_instance *heuristics_instance;
  154. struct qdevice_instance *instance;
  155. struct qdevice_net_instance *net_instance;
  156. enum tlv_vote vote;
  157. enum tlv_heuristics heuristics;
  158. int send_config_node_list;
  159. int send_membership_node_list;
  160. int send_quorum_node_list;
  161. struct tlv_ring_id tlv_rid;
  162. enum tlv_quorate quorate;
  163. heuristics_instance = (struct qdevice_heuristics_instance *)heuristics_instance_ptr;
  164. instance = heuristics_instance->qdevice_instance_ptr;
  165. net_instance = instance->model_data;
  166. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  167. qdevice_net_connect_heuristics_exec_result_callback, 0) != 0) {
  168. log(LOG_ERR, "Can't deactivate net connect heuristics exec callback notifier");
  169. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  170. net_instance->schedule_disconnect = 1;
  171. return (0);
  172. }
  173. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  174. send_config_node_list = 1;
  175. send_membership_node_list = 1;
  176. send_quorum_node_list = 1;
  177. vote = TLV_VOTE_WAIT_FOR_REPLY;
  178. if (qdevice_net_algorithm_connected(net_instance, &heuristics, &send_config_node_list,
  179. &send_membership_node_list, &send_quorum_node_list, &vote) != 0) {
  180. log(LOG_DEBUG, "Algorithm returned error. Disconnecting.");
  181. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_ALGO_CONNECTED_ERR;
  182. return (0);
  183. } else {
  184. log(LOG_DEBUG, "Algorithm decided to %s config node list, %s membership "
  185. "node list, %s quorum node list, heuristics is %s and result vote is %s",
  186. (send_config_node_list ? "send" : "not send"),
  187. (send_membership_node_list ? "send" : "not send"),
  188. (send_quorum_node_list ? "send" : "not send"),
  189. tlv_heuristics_to_str(heuristics),
  190. tlv_vote_to_str(vote));
  191. }
  192. /*
  193. * Now we can finally really send node list, votequorum node list and update timer
  194. */
  195. if (send_config_node_list) {
  196. if (qdevice_net_send_config_node_list(net_instance,
  197. &instance->config_node_list,
  198. instance->config_node_list_version_set,
  199. instance->config_node_list_version, 1) != 0) {
  200. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  201. return (0);
  202. }
  203. }
  204. if (send_membership_node_list) {
  205. qdevice_net_votequorum_ring_id_to_tlv(&tlv_rid,
  206. &instance->vq_node_list_ring_id);
  207. if (qdevice_net_send_membership_node_list(net_instance, &tlv_rid,
  208. instance->vq_node_list_entries,
  209. instance->vq_node_list,
  210. heuristics) != 0) {
  211. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  212. return (0);
  213. }
  214. }
  215. if (send_quorum_node_list) {
  216. quorate = (instance->vq_quorum_quorate ?
  217. TLV_QUORATE_QUORATE : TLV_QUORATE_INQUORATE);
  218. if (qdevice_net_send_quorum_node_list(net_instance,
  219. quorate,
  220. instance->vq_quorum_node_list_entries,
  221. instance->vq_quorum_node_list) != 0) {
  222. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  223. return (0);
  224. }
  225. }
  226. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  227. log(LOG_CRIT, "qdevice_net_msg_received_set_option_reply fatal error. "
  228. " Can't update cast vote timer vote");
  229. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  230. }
  231. net_instance->state = QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS;
  232. net_instance->connected_since_time = time(NULL);
  233. net_instance->latest_connect_heuristics_result = heuristics;
  234. net_instance->latest_heuristics_result = heuristics;
  235. return (0);
  236. }
  237. static int
  238. qdevice_net_heuristics_timer_callback(void *data1, void *data2)
  239. {
  240. struct qdevice_net_instance *net_instance;
  241. struct qdevice_heuristics_instance *heuristics_instance;
  242. net_instance = (struct qdevice_net_instance *)data1;
  243. heuristics_instance = &net_instance->qdevice_instance_ptr->heuristics_instance;
  244. if (qdevice_heuristics_waiting_for_result(heuristics_instance)) {
  245. log(LOG_DEBUG, "Not executing regular heuristics because other heuristics is already running.");
  246. return (1);
  247. }
  248. net_instance->regular_heuristics_timer = NULL;
  249. log(LOG_DEBUG, "Executing regular heuristics.");
  250. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  251. qdevice_net_regular_heuristics_exec_result_callback, 1) != 0) {
  252. log(LOG_ERR, "Can't activate net regular heuristics exec callback notifier");
  253. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  254. net_instance->schedule_disconnect = 1;
  255. return (0);
  256. }
  257. if (qdevice_heuristics_exec(heuristics_instance,
  258. net_instance->qdevice_instance_ptr->sync_in_progress) != 0) {
  259. log(LOG_ERR, "Can't execute regular heuristics.");
  260. net_instance->schedule_disconnect = 1;
  261. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  262. return (0);
  263. }
  264. /*
  265. * Do not schedule this callback again. It's going to be scheduled in the
  266. * qdevice_net_heuristics_exec_result_callback
  267. */
  268. return (0);
  269. }
  270. int
  271. qdevice_net_heuristics_stop_timer(struct qdevice_net_instance *net_instance)
  272. {
  273. struct qdevice_instance *instance;
  274. struct qdevice_heuristics_instance *heuristics_instance;
  275. instance = net_instance->qdevice_instance_ptr;
  276. heuristics_instance = &instance->heuristics_instance;
  277. if (net_instance->regular_heuristics_timer != NULL) {
  278. log(LOG_DEBUG, "Regular heuristics timer stopped");
  279. timer_list_delete(&net_instance->main_timer_list, net_instance->regular_heuristics_timer);
  280. net_instance->regular_heuristics_timer = NULL;
  281. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  282. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  283. log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  284. net_instance->disconnect_reason =
  285. QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  286. net_instance->schedule_disconnect = 1;
  287. return (-1);
  288. }
  289. }
  290. return (0);
  291. }
  292. int
  293. qdevice_net_heuristics_schedule_timer(struct qdevice_net_instance *net_instance)
  294. {
  295. uint32_t interval;
  296. struct qdevice_instance *instance;
  297. struct qdevice_heuristics_instance *heuristics_instance;
  298. instance = net_instance->qdevice_instance_ptr;
  299. heuristics_instance = &instance->heuristics_instance;
  300. if (heuristics_instance->mode != QDEVICE_HEURISTICS_MODE_ENABLED) {
  301. log(LOG_DEBUG, "Not scheduling heuristics timer because mode is not enabled");
  302. if (qdevice_net_heuristics_stop_timer(net_instance) != 0) {
  303. return (-1);
  304. }
  305. return (0);
  306. }
  307. if (net_instance->regular_heuristics_timer != NULL) {
  308. log(LOG_DEBUG, "Not scheduling heuristics timer because it is already scheduled");
  309. return (0);
  310. }
  311. interval = heuristics_instance->interval;
  312. log(LOG_DEBUG, "Scheduling next regular heuristics in %"PRIu32"ms", interval);
  313. net_instance->regular_heuristics_timer = timer_list_add(&net_instance->main_timer_list,
  314. interval,
  315. qdevice_net_heuristics_timer_callback,
  316. (void *)net_instance, NULL);
  317. if (net_instance->regular_heuristics_timer == NULL) {
  318. log(LOG_ERR, "Can't schedule regular heuristics.");
  319. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_HEURISTICS_TIMER;
  320. net_instance->schedule_disconnect = 1;
  321. return (-1);
  322. }
  323. return (0);
  324. }
  325. int
  326. qdevice_net_heuristics_init(struct qdevice_net_instance *net_instance)
  327. {
  328. if (qdevice_heuristics_result_notifier_list_add(
  329. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  330. qdevice_net_regular_heuristics_exec_result_callback) == NULL) {
  331. log(LOG_ERR, "Can't add net regular heuristics exec callback into notifier");
  332. return (-1);
  333. }
  334. if (qdevice_heuristics_result_notifier_list_add(
  335. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  336. qdevice_net_connect_heuristics_exec_result_callback) == NULL) {
  337. log(LOG_ERR, "Can't add net connect heuristics exec callback into notifier");
  338. return (-1);
  339. }
  340. return (0);
  341. }
  342. int
  343. qdevice_net_heuristics_exec_after_connect(struct qdevice_net_instance *net_instance)
  344. {
  345. struct qdevice_instance *instance;
  346. struct qdevice_heuristics_instance *heuristics_instance;
  347. instance = net_instance->qdevice_instance_ptr;
  348. heuristics_instance = &instance->heuristics_instance;
  349. log(LOG_DEBUG, "Executing after-connect heuristics.");
  350. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  351. qdevice_net_connect_heuristics_exec_result_callback, 1) != 0) {
  352. log(LOG_ERR, "Can't activate net connect heuristics exec callback notifier");
  353. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  354. net_instance->schedule_disconnect = 1;
  355. return (-1);
  356. }
  357. if (qdevice_heuristics_exec(heuristics_instance,
  358. instance->sync_in_progress) != 0) {
  359. log(LOG_ERR, "Can't execute connect heuristics.");
  360. net_instance->schedule_disconnect = 1;
  361. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  362. return (-1);
  363. }
  364. return (0);
  365. }