qdevice-net-heuristics.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469
  1. /*
  2. * Copyright (c) 2017-2020 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Jan Friesse (jfriesse@redhat.com)
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of the Red Hat, Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. #include "log.h"
  35. #include "qdevice-net-algorithm.h"
  36. #include "qdevice-net-cast-vote-timer.h"
  37. #include "qdevice-net-heuristics.h"
  38. #include "qdevice-net-send.h"
  39. #include "qdevice-net-votequorum.h"
  40. enum tlv_heuristics
  41. qdevice_net_heuristics_exec_result_to_tlv(enum qdevice_heuristics_exec_result exec_result)
  42. {
  43. enum tlv_heuristics res;
  44. switch (exec_result) {
  45. case QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED: res = TLV_HEURISTICS_UNDEFINED; break;
  46. case QDEVICE_HEURISTICS_EXEC_RESULT_PASS: res = TLV_HEURISTICS_PASS; break;
  47. case QDEVICE_HEURISTICS_EXEC_RESULT_FAIL: res = TLV_HEURISTICS_FAIL; break;
  48. default:
  49. log(LOG_ERR, "qdevice_net_heuristics_exec_result_to_tlv: Unhandled "
  50. "heuristics exec result %s",
  51. qdevice_heuristics_exec_result_to_str(exec_result));
  52. exit(EXIT_FAILURE);
  53. break;
  54. }
  55. return (res);
  56. }
  57. static int
  58. qdevice_net_regular_heuristics_exec_result_callback(void *heuristics_instance_ptr,
  59. uint32_t seq_number, enum qdevice_heuristics_exec_result exec_result)
  60. {
  61. struct qdevice_heuristics_instance *heuristics_instance;
  62. struct qdevice_instance *instance;
  63. struct qdevice_net_instance *net_instance;
  64. int send_msg;
  65. enum tlv_vote vote;
  66. enum tlv_heuristics heuristics;
  67. heuristics_instance = (struct qdevice_heuristics_instance *)heuristics_instance_ptr;
  68. instance = heuristics_instance->qdevice_instance_ptr;
  69. net_instance = instance->model_data;
  70. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  71. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  72. log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  73. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  74. net_instance->schedule_disconnect = 1;
  75. return (0);
  76. }
  77. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  78. if (exec_result == QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED) {
  79. /*
  80. * Can happen when user disables heuristics during runtime
  81. */
  82. return (0);
  83. }
  84. if (net_instance->latest_heuristics_result != heuristics) {
  85. log(heuristics == TLV_HEURISTICS_PASS ? LOG_NOTICE : LOG_ERR,
  86. "Heuristics result changed from %s to %s",
  87. tlv_heuristics_to_str(net_instance->latest_heuristics_result),
  88. tlv_heuristics_to_str(heuristics));
  89. if (net_instance->state != QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS) {
  90. /*
  91. * Not connected to qnetd
  92. */
  93. send_msg = 0;
  94. } else {
  95. send_msg = 1;
  96. }
  97. vote = TLV_VOTE_NO_CHANGE;
  98. if (qdevice_net_algorithm_heuristics_change(net_instance, &heuristics, &send_msg,
  99. &vote) == -1) {
  100. log(LOG_ERR, "Algorithm returned error. Disconnecting.");
  101. net_instance->disconnect_reason =
  102. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  103. net_instance->schedule_disconnect = 1;
  104. return (0);
  105. } else {
  106. log(LOG_DEBUG, "Algorithm decided to %s message with heuristics result "
  107. "%s and result vote is %s", (send_msg ? "send" : "not send"),
  108. tlv_heuristics_to_str(heuristics), tlv_vote_to_str(vote));
  109. }
  110. if (send_msg) {
  111. if (heuristics == TLV_HEURISTICS_UNDEFINED) {
  112. log(LOG_ERR, "Inconsistent algorithm result. "
  113. "It's not possible to send message with undefined heuristics. "
  114. "Disconnecting.");
  115. net_instance->disconnect_reason =
  116. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  117. net_instance->schedule_disconnect = 1;
  118. return (0);
  119. }
  120. if (!net_instance->server_supports_heuristics) {
  121. log(LOG_ERR, "Server doesn't support heuristics. "
  122. "Disconnecting.");
  123. net_instance->disconnect_reason =
  124. QDEVICE_NET_DISCONNECT_REASON_SERVER_DOESNT_SUPPORT_REQUIRED_OPT;
  125. net_instance->schedule_disconnect = 1;
  126. return (0);
  127. }
  128. if (qdevice_net_send_heuristics_change(net_instance, heuristics) != 0) {
  129. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  130. net_instance->schedule_disconnect = 1;
  131. return (0);
  132. }
  133. }
  134. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  135. log(LOG_CRIT, "qdevice_net_heuristics_exec_result_callback "
  136. "Can't update cast vote timer");
  137. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  138. net_instance->schedule_disconnect = 1;
  139. return (0);
  140. }
  141. }
  142. net_instance->latest_regular_heuristics_result = heuristics;
  143. net_instance->latest_heuristics_result = heuristics;
  144. if (qdevice_net_heuristics_schedule_timer(net_instance) != 0) {
  145. return (0);
  146. }
  147. return (0);
  148. }
  149. static int
  150. qdevice_net_connect_heuristics_exec_result_callback(void *heuristics_instance_ptr,
  151. uint32_t seq_number, enum qdevice_heuristics_exec_result exec_result)
  152. {
  153. struct qdevice_heuristics_instance *heuristics_instance;
  154. struct qdevice_instance *instance;
  155. struct qdevice_net_instance *net_instance;
  156. enum tlv_vote vote;
  157. enum tlv_heuristics heuristics;
  158. int send_config_node_list;
  159. int send_membership_node_list;
  160. int send_quorum_node_list;
  161. struct tlv_ring_id tlv_rid;
  162. enum tlv_quorate quorate;
  163. heuristics_instance = (struct qdevice_heuristics_instance *)heuristics_instance_ptr;
  164. instance = heuristics_instance->qdevice_instance_ptr;
  165. net_instance = instance->model_data;
  166. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  167. qdevice_net_connect_heuristics_exec_result_callback, 0) != 0) {
  168. log(LOG_ERR, "Can't deactivate net connect heuristics exec callback notifier");
  169. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  170. net_instance->schedule_disconnect = 1;
  171. return (0);
  172. }
  173. if (net_instance->state != QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS) {
  174. /*
  175. * Not connected to qnetd -> heuristics will be called again on new connect
  176. */
  177. return (0);
  178. }
  179. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  180. send_config_node_list = 1;
  181. send_membership_node_list = 1;
  182. send_quorum_node_list = 1;
  183. vote = TLV_VOTE_WAIT_FOR_REPLY;
  184. if (qdevice_net_algorithm_connected(net_instance, &heuristics, &send_config_node_list,
  185. &send_membership_node_list, &send_quorum_node_list, &vote) != 0) {
  186. log(LOG_DEBUG, "Algorithm returned error. Disconnecting.");
  187. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_ALGO_CONNECTED_ERR;
  188. return (0);
  189. } else {
  190. log(LOG_DEBUG, "Algorithm decided to %s config node list, %s membership "
  191. "node list, %s quorum node list, heuristics is %s and result vote is %s",
  192. (send_config_node_list ? "send" : "not send"),
  193. (send_membership_node_list ? "send" : "not send"),
  194. (send_quorum_node_list ? "send" : "not send"),
  195. tlv_heuristics_to_str(heuristics),
  196. tlv_vote_to_str(vote));
  197. }
  198. /*
  199. * Now we can finally really send node list, votequorum node list and update timer
  200. */
  201. if (send_config_node_list) {
  202. if (qdevice_net_send_config_node_list(net_instance,
  203. &instance->config_node_list,
  204. instance->config_node_list_version_set,
  205. instance->config_node_list_version, 1) != 0) {
  206. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  207. return (0);
  208. }
  209. }
  210. if (send_membership_node_list) {
  211. qdevice_net_votequorum_ring_id_to_tlv(&tlv_rid,
  212. &instance->vq_node_list_ring_id);
  213. if (qdevice_net_send_membership_node_list(net_instance, &tlv_rid,
  214. instance->vq_node_list_entries,
  215. instance->vq_node_list,
  216. heuristics) != 0) {
  217. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  218. return (0);
  219. }
  220. }
  221. if (send_quorum_node_list) {
  222. quorate = (instance->vq_quorum_quorate ?
  223. TLV_QUORATE_QUORATE : TLV_QUORATE_INQUORATE);
  224. if (qdevice_net_send_quorum_node_list(net_instance,
  225. quorate,
  226. instance->vq_quorum_node_list_entries,
  227. instance->vq_quorum_node_list) != 0) {
  228. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  229. return (0);
  230. }
  231. }
  232. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  233. log(LOG_CRIT, "qdevice_net_msg_received_set_option_reply fatal error. "
  234. " Can't update cast vote timer vote");
  235. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  236. }
  237. net_instance->state = QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS;
  238. net_instance->connected_since_time = time(NULL);
  239. net_instance->latest_connect_heuristics_result = heuristics;
  240. net_instance->latest_heuristics_result = heuristics;
  241. return (0);
  242. }
  243. static int
  244. qdevice_net_heuristics_timer_callback(void *data1, void *data2)
  245. {
  246. struct qdevice_net_instance *net_instance;
  247. struct qdevice_heuristics_instance *heuristics_instance;
  248. net_instance = (struct qdevice_net_instance *)data1;
  249. heuristics_instance = &net_instance->qdevice_instance_ptr->heuristics_instance;
  250. if (qdevice_heuristics_waiting_for_result(heuristics_instance)) {
  251. log(LOG_DEBUG, "Not executing regular heuristics because other heuristics is already running.");
  252. return (1);
  253. }
  254. net_instance->regular_heuristics_timer = NULL;
  255. log(LOG_DEBUG, "Executing regular heuristics.");
  256. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  257. qdevice_net_regular_heuristics_exec_result_callback, 1) != 0) {
  258. log(LOG_ERR, "Can't activate net regular heuristics exec callback notifier");
  259. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  260. net_instance->schedule_disconnect = 1;
  261. return (0);
  262. }
  263. if (qdevice_heuristics_exec(heuristics_instance,
  264. net_instance->qdevice_instance_ptr->sync_in_progress) != 0) {
  265. log(LOG_ERR, "Can't execute regular heuristics.");
  266. net_instance->schedule_disconnect = 1;
  267. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  268. return (0);
  269. }
  270. /*
  271. * Do not schedule this callback again. It's going to be scheduled in the
  272. * qdevice_net_heuristics_exec_result_callback
  273. */
  274. return (0);
  275. }
  276. int
  277. qdevice_net_heuristics_stop_timer(struct qdevice_net_instance *net_instance)
  278. {
  279. struct qdevice_instance *instance;
  280. struct qdevice_heuristics_instance *heuristics_instance;
  281. instance = net_instance->qdevice_instance_ptr;
  282. heuristics_instance = &instance->heuristics_instance;
  283. if (net_instance->regular_heuristics_timer != NULL) {
  284. log(LOG_DEBUG, "Regular heuristics timer stopped");
  285. timer_list_delete(&net_instance->main_timer_list, net_instance->regular_heuristics_timer);
  286. net_instance->regular_heuristics_timer = NULL;
  287. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  288. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  289. log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  290. net_instance->disconnect_reason =
  291. QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  292. net_instance->schedule_disconnect = 1;
  293. return (-1);
  294. }
  295. }
  296. return (0);
  297. }
  298. int
  299. qdevice_net_heuristics_schedule_timer(struct qdevice_net_instance *net_instance)
  300. {
  301. uint32_t interval;
  302. struct qdevice_instance *instance;
  303. struct qdevice_heuristics_instance *heuristics_instance;
  304. instance = net_instance->qdevice_instance_ptr;
  305. heuristics_instance = &instance->heuristics_instance;
  306. if (heuristics_instance->mode != QDEVICE_HEURISTICS_MODE_ENABLED) {
  307. log(LOG_DEBUG, "Not scheduling heuristics timer because mode is not enabled");
  308. if (qdevice_net_heuristics_stop_timer(net_instance) != 0) {
  309. return (-1);
  310. }
  311. return (0);
  312. }
  313. if (net_instance->regular_heuristics_timer != NULL) {
  314. log(LOG_DEBUG, "Not scheduling heuristics timer because it is already scheduled");
  315. return (0);
  316. }
  317. interval = heuristics_instance->interval;
  318. log(LOG_DEBUG, "Scheduling next regular heuristics in %"PRIu32"ms", interval);
  319. net_instance->regular_heuristics_timer = timer_list_add(&net_instance->main_timer_list,
  320. interval,
  321. qdevice_net_heuristics_timer_callback,
  322. (void *)net_instance, NULL);
  323. if (net_instance->regular_heuristics_timer == NULL) {
  324. log(LOG_ERR, "Can't schedule regular heuristics.");
  325. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_HEURISTICS_TIMER;
  326. net_instance->schedule_disconnect = 1;
  327. return (-1);
  328. }
  329. return (0);
  330. }
  331. int
  332. qdevice_net_heuristics_init(struct qdevice_net_instance *net_instance)
  333. {
  334. if (qdevice_heuristics_result_notifier_list_add(
  335. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  336. qdevice_net_regular_heuristics_exec_result_callback) == NULL) {
  337. log(LOG_ERR, "Can't add net regular heuristics exec callback into notifier");
  338. return (-1);
  339. }
  340. if (qdevice_heuristics_result_notifier_list_add(
  341. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  342. qdevice_net_connect_heuristics_exec_result_callback) == NULL) {
  343. log(LOG_ERR, "Can't add net connect heuristics exec callback into notifier");
  344. return (-1);
  345. }
  346. return (0);
  347. }
  348. int
  349. qdevice_net_heuristics_exec_after_connect(struct qdevice_net_instance *net_instance)
  350. {
  351. struct qdevice_instance *instance;
  352. struct qdevice_heuristics_instance *heuristics_instance;
  353. instance = net_instance->qdevice_instance_ptr;
  354. heuristics_instance = &instance->heuristics_instance;
  355. log(LOG_DEBUG, "Executing after-connect heuristics.");
  356. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  357. qdevice_net_connect_heuristics_exec_result_callback, 1) != 0) {
  358. log(LOG_ERR, "Can't activate net connect heuristics exec callback notifier");
  359. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  360. net_instance->schedule_disconnect = 1;
  361. return (-1);
  362. }
  363. if (qdevice_heuristics_exec(heuristics_instance,
  364. instance->sync_in_progress) != 0) {
  365. log(LOG_ERR, "Can't execute connect heuristics.");
  366. net_instance->schedule_disconnect = 1;
  367. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  368. return (-1);
  369. }
  370. return (0);
  371. }