qdevice-net-heuristics.c 16 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471
  1. /*
  2. * Copyright (c) 2017-2019 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Jan Friesse (jfriesse@redhat.com)
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of the Red Hat, Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. #include "log.h"
  35. #include "qdevice-net-algorithm.h"
  36. #include "qdevice-net-cast-vote-timer.h"
  37. #include "qdevice-net-heuristics.h"
  38. #include "qdevice-net-send.h"
  39. #include "qdevice-net-votequorum.h"
  40. enum tlv_heuristics
  41. qdevice_net_heuristics_exec_result_to_tlv(enum qdevice_heuristics_exec_result exec_result)
  42. {
  43. enum tlv_heuristics res;
  44. switch (exec_result) {
  45. case QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED: res = TLV_HEURISTICS_UNDEFINED; break;
  46. case QDEVICE_HEURISTICS_EXEC_RESULT_PASS: res = TLV_HEURISTICS_PASS; break;
  47. case QDEVICE_HEURISTICS_EXEC_RESULT_FAIL: res = TLV_HEURISTICS_FAIL; break;
  48. default:
  49. log(LOG_ERR, "qdevice_net_heuristics_exec_result_to_tlv: Unhandled "
  50. "heuristics exec result %s",
  51. qdevice_heuristics_exec_result_to_str(exec_result));
  52. exit(1);
  53. break;
  54. }
  55. return (res);
  56. }
  57. static int
  58. qdevice_net_regular_heuristics_exec_result_callback(void *heuristics_instance_ptr,
  59. uint32_t seq_number, enum qdevice_heuristics_exec_result exec_result)
  60. {
  61. struct qdevice_heuristics_instance *heuristics_instance;
  62. struct qdevice_instance *instance;
  63. struct qdevice_net_instance *net_instance;
  64. int send_msg;
  65. enum tlv_vote vote;
  66. enum tlv_heuristics heuristics;
  67. heuristics_instance = (struct qdevice_heuristics_instance *)heuristics_instance_ptr;
  68. instance = heuristics_instance->qdevice_instance_ptr;
  69. net_instance = instance->model_data;
  70. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  71. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  72. log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  73. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  74. net_instance->schedule_disconnect = 1;
  75. return (0);
  76. }
  77. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  78. if (exec_result == QDEVICE_HEURISTICS_EXEC_RESULT_DISABLED) {
  79. /*
  80. * Can happen when user disables heuristics during runtime
  81. */
  82. return (0);
  83. }
  84. if (net_instance->latest_heuristics_result != heuristics) {
  85. log(heuristics == TLV_HEURISTICS_PASS ? LOG_NOTICE : LOG_ERR,
  86. "Heuristics result changed from %s to %s",
  87. tlv_heuristics_to_str(net_instance->latest_heuristics_result),
  88. tlv_heuristics_to_str(heuristics));
  89. if (net_instance->state != QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS) {
  90. /*
  91. * Not connected to qnetd
  92. */
  93. send_msg = 0;
  94. } else {
  95. send_msg = 1;
  96. }
  97. vote = TLV_VOTE_NO_CHANGE;
  98. if (qdevice_net_algorithm_heuristics_change(net_instance, &heuristics, &send_msg,
  99. &vote) == -1) {
  100. log(LOG_ERR, "Algorithm returned error. Disconnecting.");
  101. net_instance->disconnect_reason =
  102. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  103. net_instance->schedule_disconnect = 1;
  104. return (0);
  105. } else {
  106. log(LOG_DEBUG, "Algorithm decided to %s message with heuristics result "
  107. "%s and result vote is %s", (send_msg ? "send" : "not send"),
  108. tlv_heuristics_to_str(heuristics), tlv_vote_to_str(vote));
  109. }
  110. if (send_msg) {
  111. if (heuristics == TLV_HEURISTICS_UNDEFINED) {
  112. log(LOG_ERR, "Inconsistent algorithm result. "
  113. "It's not possible to send message with undefined heuristics. "
  114. "Disconnecting.");
  115. net_instance->disconnect_reason =
  116. QDEVICE_NET_DISCONNECT_REASON_ALGO_HEURISTICS_CHANGE_ERR;
  117. net_instance->schedule_disconnect = 1;
  118. return (0);
  119. }
  120. if (!net_instance->server_supports_heuristics) {
  121. log(LOG_ERR, "Server doesn't support heuristics. "
  122. "Disconnecting.");
  123. net_instance->disconnect_reason =
  124. QDEVICE_NET_DISCONNECT_REASON_SERVER_DOESNT_SUPPORT_REQUIRED_OPT;
  125. net_instance->schedule_disconnect = 1;
  126. return (0);
  127. }
  128. if (qdevice_net_send_heuristics_change(net_instance, heuristics) != 0) {
  129. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  130. net_instance->schedule_disconnect = 1;
  131. return (0);
  132. }
  133. }
  134. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  135. log(LOG_CRIT, "qdevice_net_heuristics_exec_result_callback "
  136. "Can't update cast vote timer");
  137. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  138. net_instance->schedule_disconnect = 1;
  139. return (0);
  140. }
  141. }
  142. net_instance->latest_regular_heuristics_result = heuristics;
  143. net_instance->latest_heuristics_result = heuristics;
  144. if (qdevice_net_heuristics_schedule_timer(net_instance) != 0) {
  145. return (0);
  146. }
  147. return (0);
  148. }
  149. static int
  150. qdevice_net_connect_heuristics_exec_result_callback(void *heuristics_instance_ptr,
  151. uint32_t seq_number, enum qdevice_heuristics_exec_result exec_result)
  152. {
  153. struct qdevice_heuristics_instance *heuristics_instance;
  154. struct qdevice_instance *instance;
  155. struct qdevice_net_instance *net_instance;
  156. enum tlv_vote vote;
  157. enum tlv_heuristics heuristics;
  158. int send_config_node_list;
  159. int send_membership_node_list;
  160. int send_quorum_node_list;
  161. struct tlv_ring_id tlv_rid;
  162. enum tlv_quorate quorate;
  163. heuristics_instance = (struct qdevice_heuristics_instance *)heuristics_instance_ptr;
  164. instance = heuristics_instance->qdevice_instance_ptr;
  165. net_instance = instance->model_data;
  166. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  167. qdevice_net_connect_heuristics_exec_result_callback, 0) != 0) {
  168. log(LOG_ERR, "Can't deactivate net connect heuristics exec callback notifier");
  169. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  170. net_instance->schedule_disconnect = 1;
  171. return (0);
  172. }
  173. if (net_instance->state != QDEVICE_NET_INSTANCE_STATE_WAITING_INIT_REPLY) {
  174. /*
  175. * Not connected to qnetd -> heuristics will be called again on new connect
  176. */
  177. log(LOG_DEBUG, "Received unexpected net connect heuristics in state %u",
  178. net_instance->state);
  179. return (0);
  180. }
  181. heuristics = qdevice_net_heuristics_exec_result_to_tlv(exec_result);
  182. send_config_node_list = 1;
  183. send_membership_node_list = 1;
  184. send_quorum_node_list = 1;
  185. vote = TLV_VOTE_WAIT_FOR_REPLY;
  186. if (qdevice_net_algorithm_connected(net_instance, &heuristics, &send_config_node_list,
  187. &send_membership_node_list, &send_quorum_node_list, &vote) != 0) {
  188. log(LOG_DEBUG, "Algorithm returned error. Disconnecting.");
  189. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_ALGO_CONNECTED_ERR;
  190. return (0);
  191. } else {
  192. log(LOG_DEBUG, "Algorithm decided to %s config node list, %s membership "
  193. "node list, %s quorum node list, heuristics is %s and result vote is %s",
  194. (send_config_node_list ? "send" : "not send"),
  195. (send_membership_node_list ? "send" : "not send"),
  196. (send_quorum_node_list ? "send" : "not send"),
  197. tlv_heuristics_to_str(heuristics),
  198. tlv_vote_to_str(vote));
  199. }
  200. /*
  201. * Now we can finally really send node list, votequorum node list and update timer
  202. */
  203. if (send_config_node_list) {
  204. if (qdevice_net_send_config_node_list(net_instance,
  205. &instance->config_node_list,
  206. instance->config_node_list_version_set,
  207. instance->config_node_list_version, 1) != 0) {
  208. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  209. return (0);
  210. }
  211. }
  212. if (send_membership_node_list) {
  213. qdevice_net_votequorum_ring_id_to_tlv(&tlv_rid,
  214. &instance->vq_node_list_ring_id);
  215. if (qdevice_net_send_membership_node_list(net_instance, &tlv_rid,
  216. instance->vq_node_list_entries,
  217. instance->vq_node_list,
  218. heuristics) != 0) {
  219. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  220. return (0);
  221. }
  222. }
  223. if (send_quorum_node_list) {
  224. quorate = (instance->vq_quorum_quorate ?
  225. TLV_QUORATE_QUORATE : TLV_QUORATE_INQUORATE);
  226. if (qdevice_net_send_quorum_node_list(net_instance,
  227. quorate,
  228. instance->vq_quorum_node_list_entries,
  229. instance->vq_quorum_node_list) != 0) {
  230. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ALLOCATE_MSG_BUFFER;
  231. return (0);
  232. }
  233. }
  234. if (qdevice_net_cast_vote_timer_update(net_instance, vote) != 0) {
  235. log(LOG_CRIT, "qdevice_net_msg_received_set_option_reply fatal error. "
  236. " Can't update cast vote timer vote");
  237. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_VOTING_TIMER;
  238. }
  239. net_instance->state = QDEVICE_NET_INSTANCE_STATE_WAITING_VOTEQUORUM_CMAP_EVENTS;
  240. net_instance->connected_since_time = time(NULL);
  241. net_instance->latest_connect_heuristics_result = heuristics;
  242. net_instance->latest_heuristics_result = heuristics;
  243. return (0);
  244. }
  245. static int
  246. qdevice_net_heuristics_timer_callback(void *data1, void *data2)
  247. {
  248. struct qdevice_net_instance *net_instance;
  249. struct qdevice_heuristics_instance *heuristics_instance;
  250. net_instance = (struct qdevice_net_instance *)data1;
  251. heuristics_instance = &net_instance->qdevice_instance_ptr->heuristics_instance;
  252. if (qdevice_heuristics_waiting_for_result(heuristics_instance)) {
  253. log(LOG_DEBUG, "Not executing regular heuristics because other heuristics is already running.");
  254. return (1);
  255. }
  256. net_instance->regular_heuristics_timer = NULL;
  257. log(LOG_DEBUG, "Executing regular heuristics.");
  258. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  259. qdevice_net_regular_heuristics_exec_result_callback, 1) != 0) {
  260. log(LOG_ERR, "Can't activate net regular heuristics exec callback notifier");
  261. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  262. net_instance->schedule_disconnect = 1;
  263. return (0);
  264. }
  265. if (qdevice_heuristics_exec(heuristics_instance,
  266. net_instance->qdevice_instance_ptr->sync_in_progress) != 0) {
  267. log(LOG_ERR, "Can't execute regular heuristics.");
  268. net_instance->schedule_disconnect = 1;
  269. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  270. return (0);
  271. }
  272. /*
  273. * Do not schedule this callback again. It's going to be scheduled in the
  274. * qdevice_net_heuristics_exec_result_callback
  275. */
  276. return (0);
  277. }
  278. int
  279. qdevice_net_heuristics_stop_timer(struct qdevice_net_instance *net_instance)
  280. {
  281. struct qdevice_instance *instance;
  282. struct qdevice_heuristics_instance *heuristics_instance;
  283. instance = net_instance->qdevice_instance_ptr;
  284. heuristics_instance = &instance->heuristics_instance;
  285. if (net_instance->regular_heuristics_timer != NULL) {
  286. log(LOG_DEBUG, "Regular heuristics timer stopped");
  287. timer_list_delete(&net_instance->main_timer_list, net_instance->regular_heuristics_timer);
  288. net_instance->regular_heuristics_timer = NULL;
  289. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  290. qdevice_net_regular_heuristics_exec_result_callback, 0) != 0) {
  291. log(LOG_ERR, "Can't deactivate net regular heuristics exec callback notifier");
  292. net_instance->disconnect_reason =
  293. QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  294. net_instance->schedule_disconnect = 1;
  295. return (-1);
  296. }
  297. }
  298. return (0);
  299. }
  300. int
  301. qdevice_net_heuristics_schedule_timer(struct qdevice_net_instance *net_instance)
  302. {
  303. uint32_t interval;
  304. struct qdevice_instance *instance;
  305. struct qdevice_heuristics_instance *heuristics_instance;
  306. instance = net_instance->qdevice_instance_ptr;
  307. heuristics_instance = &instance->heuristics_instance;
  308. if (heuristics_instance->mode != QDEVICE_HEURISTICS_MODE_ENABLED) {
  309. log(LOG_DEBUG, "Not scheduling heuristics timer because mode is not enabled");
  310. if (qdevice_net_heuristics_stop_timer(net_instance) != 0) {
  311. return (-1);
  312. }
  313. return (0);
  314. }
  315. if (net_instance->regular_heuristics_timer != NULL) {
  316. log(LOG_DEBUG, "Not scheduling heuristics timer because it is already scheduled");
  317. return (0);
  318. }
  319. interval = heuristics_instance->interval;
  320. log(LOG_DEBUG, "Scheduling next regular heuristics in %"PRIu32"ms", interval);
  321. net_instance->regular_heuristics_timer = timer_list_add(&net_instance->main_timer_list,
  322. interval,
  323. qdevice_net_heuristics_timer_callback,
  324. (void *)net_instance, NULL);
  325. if (net_instance->regular_heuristics_timer == NULL) {
  326. log(LOG_ERR, "Can't schedule regular heuristics.");
  327. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_SCHEDULE_HEURISTICS_TIMER;
  328. net_instance->schedule_disconnect = 1;
  329. return (-1);
  330. }
  331. return (0);
  332. }
  333. int
  334. qdevice_net_heuristics_init(struct qdevice_net_instance *net_instance)
  335. {
  336. if (qdevice_heuristics_result_notifier_list_add(
  337. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  338. qdevice_net_regular_heuristics_exec_result_callback) == NULL) {
  339. log(LOG_ERR, "Can't add net regular heuristics exec callback into notifier");
  340. return (-1);
  341. }
  342. if (qdevice_heuristics_result_notifier_list_add(
  343. &net_instance->qdevice_instance_ptr->heuristics_instance.exec_result_notifier_list,
  344. qdevice_net_connect_heuristics_exec_result_callback) == NULL) {
  345. log(LOG_ERR, "Can't add net connect heuristics exec callback into notifier");
  346. return (-1);
  347. }
  348. return (0);
  349. }
  350. int
  351. qdevice_net_heuristics_exec_after_connect(struct qdevice_net_instance *net_instance)
  352. {
  353. struct qdevice_instance *instance;
  354. struct qdevice_heuristics_instance *heuristics_instance;
  355. instance = net_instance->qdevice_instance_ptr;
  356. heuristics_instance = &instance->heuristics_instance;
  357. log(LOG_DEBUG, "Executing after-connect heuristics.");
  358. if (qdevice_heuristics_result_notifier_list_set_active(&heuristics_instance->exec_result_notifier_list,
  359. qdevice_net_connect_heuristics_exec_result_callback, 1) != 0) {
  360. log(LOG_ERR, "Can't activate net connect heuristics exec callback notifier");
  361. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_ACTIVATE_HEURISTICS_RESULT_NOTIFIER;
  362. net_instance->schedule_disconnect = 1;
  363. return (-1);
  364. }
  365. if (qdevice_heuristics_exec(heuristics_instance,
  366. instance->sync_in_progress) != 0) {
  367. log(LOG_ERR, "Can't execute connect heuristics.");
  368. net_instance->schedule_disconnect = 1;
  369. net_instance->disconnect_reason = QDEVICE_NET_DISCONNECT_REASON_CANT_START_HEURISTICS;
  370. return (-1);
  371. }
  372. return (0);
  373. }