qdevice-net-heuristics.c 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462
  1. /*
  2. * Copyright (c) 2017 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Jan Friesse (jfriesse@redhat.com)
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of the Red Hat, Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. #include "qdevice-log.h"
  35. #include "qdevice-net-algorithm.h"
  36. #include "qdevice-net-cast-vote-timer.h"
  37. #include "qdevice-net-heuristics.h"
  38. #include "qdevice-net-send.h"
  39. #include "qdevice-net-votequorum.h"
  40. enum tlv_heuristics
  41. qdevice_net_heuristics_exec_result_to_tlv(enum qdevice_heuristics_exec_result exec_result)
  42. {
  43. enum tlv_heuristics res;
  44. switch (exec_result) {
  45. case QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED: res = TLV_HEURISTICS_UNDEFINED; break;
  46. case QDEVICE_HEURISTICS_EXEC_RESULT_PASS: res = TLV_HEURISTICS_PASS; break;
  47. case QDEVICE_HEURISTICS_EXEC_RESULT_FAIL: res = TLV_HEURISTICS_FAIL; break;
  48. default:
  49. qdevice_log(LOG_ERR, "qdevice_net_heuristics_exec_result_to_tlv: Unhandled "
  50. "heuristics exec result %s",
  51. qdevice_heuristics_exec_result_to_str(exec_result));
  52. exit(1);
  53. break;
  54. }
  55. return (res);
  56. }
  57. static int
  58. qdevice_net_regular_heuristics_exec_result_callback(void *heuristics_instance_ptr,
  59. uint32_t seq_number, enum qdevice_heuristics_exec_result exec_result)
  60. {
  61. struct qdevice_heuristics_instance *heuristics_instance;
  62. struct qdevice_instance *instance;
  63. struct qdevice_net_instance *net_instance;
  64. int send_msg;
  65. enum tlv_vote vote;
  66. enum tlv_heuristics heuristics;
  67. heuristics_instance = (struct qdevice_heuristics_instance *)heuristics_instance_ptr;
  68. instance = heuristics_instance->qdevice_instance_ptr;
  69. net_instance = instance->model_data;
  70. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  71. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  72. qdevice_log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  73. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  74. net_instance->schedule_disconnect = 1;
  75. return (0);
  76. }
  77. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  78. if (exec_result == QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED) {
  79. /*
  80. * Can happen when user disables heuristics during runtime
  81. */
  82. return (0);
  83. }
  84. if (net_instance->latest_heuristics_result != heuristics) {
  85. qdevice_log(LOG_ERR, "Heuristics result changed from %s to %s",
  86. tlv_heuristics_to_str(net_instance->latest_heuristics_result),
  87. tlv_heuristics_to_str(heuristics));
  88. if (net_instance->state != QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS) {
  89. /*
  90. * Not connected to qnetd
  91. */
  92. send_msg = 0;
  93. } else {
  94. send_msg = 1;
  95. }
  96. vote = TLV_VOTE_NO_CHANGE;
  97. if (qdevice_net_algorithm_heuristics_change(net_instance, &heuristics, &send_msg,
  98. &vote) == -1) {
  99. qdevice_log(LOG_ERR, "Algorithm returned error. Disconnecting.");
  100. net_instance->disconnect_reason =
  101. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  102. net_instance->schedule_disconnect = 1;
  103. return (0);
  104. } else {
  105. qdevice_log(LOG_DEBUG, "Algorithm decided to %s message with heuristics result "
  106. "%s and result vote is %s", (send_msg ? "send" : "not send"),
  107. tlv_heuristics_to_str(heuristics), tlv_vote_to_str(vote));
  108. }
  109. if (send_msg) {
  110. if (heuristics == TLV_HEURISTICS_UNDEFINED) {
  111. qdevice_log(LOG_ERR, "Inconsistent algorithm result. "
  112. "It's not possible to send message with undefined heuristics. "
  113. "Disconnecting.");
  114. net_instance->disconnect_reason =
  115. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  116. net_instance->schedule_disconnect = 1;
  117. return (0);
  118. }
  119. if (!net_instance->server_supports_heuristics) {
  120. qdevice_log(LOG_ERR, "Server doesn't support heuristics. "
  121. "Disconnecting.");
  122. net_instance->disconnect_reason =
  123. QDEVICE_NET_DISCONNECT_REASON_SERVER_DOESNT_SUPPORT_REQUIRED_OPT;
  124. net_instance->schedule_disconnect = 1;
  125. return (0);
  126. }
  127. if (qdevice_net_send_heuristics_change(net_instance, heuristics) != 0) {
  128. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  129. net_instance->schedule_disconnect = 1;
  130. return (0);
  131. }
  132. }
  133. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  134. qdevice_log(LOG_CRIT, "qdevice_net_heuristics_exec_result_callback "
  135. "Can't update cast vote timer");
  136. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  137. net_instance->schedule_disconnect = 1;
  138. return (0);
  139. }
  140. }
  141. net_instance->latest_regular_heuristics_result = heuristics;
  142. net_instance->latest_heuristics_result = heuristics;
  143. if (qdevice_net_heuristics_schedule_timer(net_instance) != 0) {
  144. return (0);
  145. }
  146. return (0);
  147. }
  148. static int
  149. qdevice_net_connect_heuristics_exec_result_callback(void *heuristics_instance_ptr,
  150. uint32_t seq_number, enum qdevice_heuristics_exec_result exec_result)
  151. {
  152. struct qdevice_heuristics_instance *heuristics_instance;
  153. struct qdevice_instance *instance;
  154. struct qdevice_net_instance *net_instance;
  155. enum tlv_vote vote;
  156. enum tlv_heuristics heuristics;
  157. int send_config_node_list;
  158. int send_membership_node_list;
  159. int send_quorum_node_list;
  160. struct tlv_ring_id tlv_rid;
  161. enum tlv_quorate quorate;
  162. heuristics_instance = (struct qdevice_heuristics_instance *)heuristics_instance_ptr;
  163. instance = heuristics_instance->qdevice_instance_ptr;
  164. net_instance = instance->model_data;
  165. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  166. qdevice_net_connect_heuristics_exec_result_callback, 0) != 0) {
  167. qdevice_log(LOG_ERR, "Can't deactivate net connect heuristics exec callback notifier");
  168. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  169. net_instance->schedule_disconnect = 1;
  170. return (0);
  171. }
  172. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  173. send_config_node_list = 1;
  174. send_membership_node_list = 1;
  175. send_quorum_node_list = 1;
  176. vote = TLV_VOTE_WAIT_FOR_REPLY;
  177. if (qdevice_net_algorithm_connected(net_instance, &heuristics, &send_config_node_list,
  178. &send_membership_node_list, &send_quorum_node_list, &vote) != 0) {
  179. qdevice_log(LOG_DEBUG, "Algorithm returned error. Disconnecting.");
  180. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_ALGO_CONNECTED_ERR;
  181. return (0);
  182. } else {
  183. qdevice_log(LOG_DEBUG, "Algorithm decided to %s config node list, %s membership "
  184. "node list, %s quorum node list, heuristics is %s and result vote is %s",
  185. (send_config_node_list ? "send" : "not send"),
  186. (send_membership_node_list ? "send" : "not send"),
  187. (send_quorum_node_list ? "send" : "not send"),
  188. tlv_heuristics_to_str(heuristics),
  189. tlv_vote_to_str(vote));
  190. }
  191. /*
  192. * Now we can finally really send node list, votequorum node list and update timer
  193. */
  194. if (send_config_node_list) {
  195. if (qdevice_net_send_config_node_list(net_instance,
  196. &instance->config_node_list,
  197. instance->config_node_list_version_set,
  198. instance->config_node_list_version, 1) != 0) {
  199. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  200. return (0);
  201. }
  202. }
  203. if (send_membership_node_list) {
  204. qdevice_net_votequorum_ring_id_to_tlv(&tlv_rid,
  205. &instance->vq_node_list_ring_id);
  206. if (qdevice_net_send_membership_node_list(net_instance, &tlv_rid,
  207. instance->vq_node_list_entries,
  208. instance->vq_node_list,
  209. heuristics) != 0) {
  210. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  211. return (0);
  212. }
  213. }
  214. if (send_quorum_node_list) {
  215. quorate = (instance->vq_quorum_quorate ?
  216. TLV_QUORATE_QUORATE : TLV_QUORATE_INQUORATE);
  217. if (qdevice_net_send_quorum_node_list(net_instance,
  218. quorate,
  219. instance->vq_quorum_node_list_entries,
  220. instance->vq_quorum_node_list) != 0) {
  221. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  222. return (0);
  223. }
  224. }
  225. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  226. qdevice_log(LOG_CRIT, "qdevice_net_msg_received_set_option_reply fatal error. "
  227. " Can't update cast vote timer vote");
  228. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  229. }
  230. net_instance->state = QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS;
  231. net_instance->connected_since_time = time(NULL);
  232. net_instance->latest_connect_heuristics_result = heuristics;
  233. net_instance->latest_heuristics_result = heuristics;
  234. return (0);
  235. }
  236. static int
  237. qdevice_net_heuristics_timer_callback(void *data1, void *data2)
  238. {
  239. struct qdevice_net_instance *net_instance;
  240. struct qdevice_heuristics_instance *heuristics_instance;
  241. net_instance = (struct qdevice_net_instance *)data1;
  242. heuristics_instance = &net_instance->qdevice_instance_ptr->heuristics_instance;
  243. if (qdevice_heuristics_waiting_for_result(heuristics_instance)) {
  244. qdevice_log(LOG_DEBUG, "Not executing regular heuristics because other heuristics is already running.");
  245. return (1);
  246. }
  247. net_instance->regular_heuristics_timer = NULL;
  248. qdevice_log(LOG_DEBUG, "Executing regular heuristics.");
  249. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  250. qdevice_net_regular_heuristics_exec_result_callback, 1) != 0) {
  251. qdevice_log(LOG_ERR, "Can't activate net regular heuristics exec callback notifier");
  252. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  253. net_instance->schedule_disconnect = 1;
  254. return (0);
  255. }
  256. if (qdevice_heuristics_exec(heuristics_instance,
  257. net_instance->qdevice_instance_ptr->sync_in_progress) != 0) {
  258. qdevice_log(LOG_ERR, "Can't execute regular heuristics.");
  259. net_instance->schedule_disconnect = 1;
  260. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  261. return (0);
  262. }
  263. /*
  264. * Do not schedule this callback again. It's going to be scheduled in the
  265. * qdevice_net_heuristics_exec_result_callback
  266. */
  267. return (0);
  268. }
  269. int
  270. qdevice_net_heuristics_stop_timer(struct qdevice_net_instance *net_instance)
  271. {
  272. struct qdevice_instance *instance;
  273. struct qdevice_heuristics_instance *heuristics_instance;
  274. instance = net_instance->qdevice_instance_ptr;
  275. heuristics_instance = &instance->heuristics_instance;
  276. if (net_instance->regular_heuristics_timer != NULL) {
  277. qdevice_log(LOG_DEBUG, "Regular heuristics timer stopped");
  278. timer_list_delete(&net_instance->main_timer_list, net_instance->regular_heuristics_timer);
  279. net_instance->regular_heuristics_timer = NULL;
  280. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  281. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  282. qdevice_log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  283. net_instance->disconnect_reason =
  284. QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  285. net_instance->schedule_disconnect = 1;
  286. return (-1);
  287. }
  288. }
  289. return (0);
  290. }
  291. int
  292. qdevice_net_heuristics_schedule_timer(struct qdevice_net_instance *net_instance)
  293. {
  294. uint32_t interval;
  295. struct qdevice_instance *instance;
  296. struct qdevice_heuristics_instance *heuristics_instance;
  297. instance = net_instance->qdevice_instance_ptr;
  298. heuristics_instance = &instance->heuristics_instance;
  299. if (heuristics_instance->mode != QDEVICE_HEURISTICS_MODE_ENABLED) {
  300. qdevice_log(LOG_DEBUG, "Not scheduling heuristics timer because mode is not enabled");
  301. if (qdevice_net_heuristics_stop_timer(net_instance) != 0) {
  302. return (-1);
  303. }
  304. return (0);
  305. }
  306. if (net_instance->regular_heuristics_timer != NULL) {
  307. qdevice_log(LOG_DEBUG, "Not scheduling heuristics timer because it is already scheduled");
  308. return (0);
  309. }
  310. interval = heuristics_instance->interval;
  311. qdevice_log(LOG_DEBUG, "Scheduling next regular heuristics in %"PRIu32"ms", interval);
  312. net_instance->regular_heuristics_timer = timer_list_add(&net_instance->main_timer_list,
  313. interval,
  314. qdevice_net_heuristics_timer_callback,
  315. (void *)net_instance, NULL);
  316. if (net_instance->regular_heuristics_timer == NULL) {
  317. qdevice_log(LOG_ERR, "Can't schedule regular heuristics.");
  318. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_HEURISTICS_TIMER;
  319. net_instance->schedule_disconnect = 1;
  320. return (-1);
  321. }
  322. return (0);
  323. }
  324. int
  325. qdevice_net_heuristics_init(struct qdevice_net_instance *net_instance)
  326. {
  327. if (qdevice_heuristics_result_notifier_list_add(
  328. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  329. qdevice_net_regular_heuristics_exec_result_callback) == NULL) {
  330. qdevice_log(LOG_ERR, "Can't add net regular heuristics exec callback into notifier");
  331. return (-1);
  332. }
  333. if (qdevice_heuristics_result_notifier_list_add(
  334. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  335. qdevice_net_connect_heuristics_exec_result_callback) == NULL) {
  336. qdevice_log(LOG_ERR, "Can't add net connect heuristics exec callback into notifier");
  337. return (-1);
  338. }
  339. return (0);
  340. }
  341. int
  342. qdevice_net_heuristics_exec_after_connect(struct qdevice_net_instance *net_instance)
  343. {
  344. struct qdevice_instance *instance;
  345. struct qdevice_heuristics_instance *heuristics_instance;
  346. instance = net_instance->qdevice_instance_ptr;
  347. heuristics_instance = &instance->heuristics_instance;
  348. qdevice_log(LOG_DEBUG, "Executing after-connect heuristics.");
  349. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  350. qdevice_net_connect_heuristics_exec_result_callback, 1) != 0) {
  351. qdevice_log(LOG_ERR, "Can't activate net connect heuristics exec callback notifier");
  352. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  353. net_instance->schedule_disconnect = 1;
  354. return (-1);
  355. }
  356. if (qdevice_heuristics_exec(heuristics_instance,
  357. instance->sync_in_progress) != 0) {
  358. qdevice_log(LOG_ERR, "Can't execute connect heuristics.");
  359. net_instance->schedule_disconnect = 1;
  360. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  361. return (-1);
  362. }
  363. return (0);
  364. }