sam.h 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247
  1. /*
  2. * Copyright (c) 2009-2011 Red Hat, Inc.
  3. *
  4. * All rights reserved.
  5. *
  6. * Author: Jan Friesse (jfriesse@redhat.com)
  7. *
  8. * This software licensed under BSD license, the text of which follows:
  9. *
  10. * Redistribution and use in source and binary forms, with or without
  11. * modification, are permitted provided that the following conditions are met:
  12. *
  13. * - Redistributions of source code must retain the above copyright notice,
  14. * this list of conditions and the following disclaimer.
  15. * - Redistributions in binary form must reproduce the above copyright notice,
  16. * this list of conditions and the following disclaimer in the documentation
  17. * and/or other materials provided with the distribution.
  18. * - Neither the name of the Red Hat, Inc. nor the names of its
  19. * contributors may be used to endorse or promote products derived from this
  20. * software without specific prior written permission.
  21. *
  22. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  23. * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  24. * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  25. * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  26. * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  27. * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  28. * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  29. * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  30. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  31. * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  32. * THE POSSIBILITY OF SUCH DAMAGE.
  33. */
  34. #ifndef COROSYNC_SAM_H_DEFINED
  35. #define COROSYNC_SAM_H_DEFINED
  36. #include <corosync/corotypes.h>
  37. #ifdef __cplusplus
  38. extern "C" {
  39. #endif
  /**
   * Recovery policy handed to sam_initialize().
   *
   * QUIT and RESTART select the recovery action. QUORUM and CMAP are flag
   * bits; the QUORUM_QUIT and QUORUM_RESTART values are the QUORUM flag
   * OR-ed with one of the two actions.
   */
  typedef enum {
      SAM_RECOVERY_POLICY_QUIT           = 0x01, /**< just stop the application */
      SAM_RECOVERY_POLICY_RESTART        = 0x02, /**< kill the application and start a new instance */
      SAM_RECOVERY_POLICY_QUORUM         = 0x08, /**< flag bit, combined with an action below */
      SAM_RECOVERY_POLICY_QUORUM_QUIT    = (SAM_RECOVERY_POLICY_QUORUM | SAM_RECOVERY_POLICY_QUIT),
      SAM_RECOVERY_POLICY_QUORUM_RESTART = (SAM_RECOVERY_POLICY_QUORUM | SAM_RECOVERY_POLICY_RESTART),
      SAM_RECOVERY_POLICY_CMAP           = 0x10, /**< flag bit required by sam_mark_failed() */
      /* Same value as SAM_RECOVERY_POLICY_CMAP.
       * NOTE(review): presumably kept as a compatibility alias - confirm. */
      SAM_RECOVERY_POLICY_CONFDB         = SAM_RECOVERY_POLICY_CMAP
  } sam_recovery_policy_t;
  /**
   * Healthcheck callback type used for event driven checking.
   *
   * A callback registered through sam_hc_callback_register() must return 0
   * when the healthcheck is correct and a value different from 0 when
   * something went wrong.
   */
  typedef int (*sam_hc_callback_t) (void);
  53. /**
  54. * Create a new SAM connection.
  55. *
  56. * This function must be called before any other.
  57. * It is recommended to call it as one of first in application.
  58. *
  59. * @param time_interval Time interval in miliseconds of healthcheck. After this time, application
  60. * will be killed and recovery policy will be taken. This can be zero, which means,
  61. * that there is no time limit (only fall of application is checked and only then
  62. * recovery action is taken)
  63. * @param recovery_policy One of SAM_RECOVERY_POLICY_RESTART, which means, that after
  64. * timeout application will be killed and new instance will be started.
  65. * SAM_RECOVERY_POLICY_QUIT will just stop application
  66. *
  67. * @retval CS_OK in case no problem appeared
  68. * @retval CS_ERR_BAD_HANDLE in case user is trying to initialize initialized instance
  69. * @retval CS_ERR_INVALID_PARAM in case recovery_policy had bad value
  70. */
  71. cs_error_t sam_initialize (
  72. int time_interval,
  73. sam_recovery_policy_t recovery_policy);
  74. /**
  75. * Close the SAM handle.
  76. *
  77. * This function should be called as late as possible.
  78. * (in reality, if you plan just quit, and checking is stopped, there is no need
  79. * to call it). Function will stop healtchecking and put library to state, where
  80. * no new start is possible.
  81. *
  82. * @retval CS_OK in case no problem appeared
  83. * @retval CS_ERR_BAD_HANDLE library was not initialized by #sam_initialize
  84. */
  85. cs_error_t sam_finalize (void);
  86. /**
  87. * Start healthchecking.
  88. *
  89. * From this time, you should call every time_interval
  90. * sam_hc_send, otherwise, recovery action will be taken.
  91. *
  92. * @retval CS_OK in case no problem appeared
  93. * @retval CS_ERR_BAD_HANDLE component was not registered by #sam_register
  94. */
  95. cs_error_t sam_start (void);
  96. /**
  97. * Stop healthchecking.
  98. *
  99. * Oposite of #sam_start. You can call sam_start and sam_stop how many
  100. * times you want.
  101. *
  102. * @retval CS_OK in case no problem appeared
  103. * @retval CS_ERR_BAD_HANDLE healthchecking is not in running state (no sam_start
  104. * was called)
  105. */
  106. cs_error_t sam_stop (void);
  107. /**
  108. * Set warning signal to be send.
  109. *
  110. * Default signal is SIGTERM. You can use SIGKILL to emulate NOT sending
  111. * warning signal and just send SIGKILL.
  112. *
  113. * @retval CS_OK in case no problem appeared
  114. * @retval CS_ERR_BAD_HANDLE library was not initialized by #sam_initialize or
  115. * is finalized
  116. */
  117. cs_error_t sam_warn_signal_set (int warn_signal);
  118. /**
  119. * Register application.
  120. *
  121. * This is one of most crucial function. In case, your
  122. * application will be restarted, you will always return to point after calling
  123. * this function. This function can be called only once, and SAM must be initialized
  124. * by sam_initialize. You can choose any place in your application, where to call
  125. * this function.
  126. *
  127. * @param instance_id NULL or pointer to int memory, where current instance
  128. * of application will be returned. It's always safe to suppose, that first instance
  129. * (this means, no recovery action was taken yet) will be always 1 and instance_id
  130. * will be raising up to MAX_INT (after this, it will fall to 0).
  131. *
  132. * @retval CS_OK in case no problem appeared
  133. * @retval CS_ERR_BAD_HANDLE in case, you call this function twice, or before sam_init
  134. * @retval CS_ERR_LIBRARY internal library call failed. This can be one of pipe or fork
  135. * creation. You can get more information from errno
  136. */
  137. cs_error_t sam_register (
  138. unsigned int *instance_id);
  139. /**
  140. * Send healthcheck confirmation.
  141. *
  142. * This should be called after #sam_start
  143. *
  144. * @retval CS_OK in case no problem appeared
  145. * @retval CS_ERR_BAD_HANDLE healthchecking is not in running state (no sam_start was
  146. * called, or called after sam_stop/sam_finalize)
  147. */
  148. cs_error_t sam_hc_send (void);
  149. /**
  150. * Register healtcheck callback.
  151. *
  152. * After you will call this function, and set
  153. * cb to something else then NULL, SAM is automatically switched from
  154. * application driven healtchecking to event driven healtchecking. In other
  155. * words, is not longer needed to call sam_hc_send, but your callback function
  156. * must return 0 in case of healtchecking is correct, or value different then
  157. * 0, in case something happend. After next hc iteration, warning signal and
  158. * after that kill signal is sent back to your application.
  159. *
  160. * @param cb Pointer to healtcheck function, or NULL to switch back to application driven hc
  161. *
  162. * @retval CS_OK in case no problem appeared
  163. * @retval CS_ERR_BAD_HANDLE in case, you call this function before sam_init or after sam_start
  164. * @retval CS_ERR_LIBRARY internal library call failed. This can be one of pipe or pthread
  165. * creation.
  166. */
  167. cs_error_t sam_hc_callback_register (sam_hc_callback_t cb);
  168. /**
  169. * Return size of stored data.
  170. *
  171. * @param size Pointer to variable, where stored data size is returned. If
  172. * nothing or NULL is stored, then 0 is returned.
  173. *
  174. * @retval CS_OK in case no problem appeared
  175. * @retval CS_ERR_BAD_HANDLE in case you call this function before sam_init or after
  176. * sam_finalize
  177. * @retval CS_ERR_INVALID_PARAM if size parameter is NULL
  178. */
  179. cs_error_t sam_data_getsize (size_t *size);
  180. /**
  181. * Return stored data.
  182. *
  183. * @param data Pointer to place, where to store data
  184. * @param size Allocated size of data
  185. *
  186. * @retval CS_OK if no problem appeared
  187. * @retval CS_ERR_BAD_HANDLE if you call this function before sam_init or after sam_finalize
  188. * @retval CS_ERR_INVALID_PARAM if data is NULL or size is less then currently saved user data length
  189. */
  190. cs_error_t sam_data_restore (
  191. void *data,
  192. size_t size);
  193. /**
  194. * Store user data.
  195. *
  196. * Such stored data survives restart of child.
  197. *
  198. * @param data Data to store. You can use NULL to delete data
  199. * @param size Size of data to store.
  200. *
  201. * @retval CS_OK in case no problem appeared
  202. * @retval CS_ERR_BAD_HANDLE if you call this function before sam_init or
  203. * after sam_finalize
  204. * @retval CS_ERR_NO_MEMORY if data is too large and malloc/realloc was not
  205. * sucesfull
  206. * @retval CS_ERR_LIBRARY if some internal error appeared (communication with parent
  207. * process)
  208. */
  209. cs_error_t sam_data_store (
  210. const void *data,
  211. size_t size);
  212. /**
  213. * Marks child as failed.
  214. *
  215. * This can be called only with SAM_RECOVERY_POLICY_CMAP flag set and
  216. * makes sense only for SAM_RECOVERY_POLICY_RESTART. This will kill child without sending warn
  217. * signal. Cmap state key will be set to failed.
  218. *
  219. * @retval CS_OK in case no problem appeared
  220. * @retval CS_ERR_BAD_HANDLE library was not initialized or was already finalized
  221. * @retval CS_ERR_INVALID_PARAM recovery policy doesn't has SAM_RECOVERY_POLICY_CMAP flag set
  222. * @retval CS_ERR_LIBRARY if some internal error appeared (communication with parent
  223. * process)
  224. */
  225. cs_error_t sam_mark_failed (void);
  226. #ifdef __cplusplus
  227. }
  228. #endif
  229. #endif /* COROSYNC_SAM_H_DEFINED */