  /* sam.h */
  /*
   * Copyright (c) 2009-2010 Red Hat, Inc.
   *
   * All rights reserved.
   *
   * Author: Jan Friesse (jfriesse@redhat.com)
   *
   * This software licensed under BSD license, the text of which follows:
   *
   * Redistribution and use in source and binary forms, with or without
   * modification, are permitted provided that the following conditions are met:
   *
   * - Redistributions of source code must retain the above copyright notice,
   * this list of conditions and the following disclaimer.
   * - Redistributions in binary form must reproduce the above copyright notice,
   * this list of conditions and the following disclaimer in the documentation
   * and/or other materials provided with the distribution.
   * - Neither the name of the Red Hat, Inc. nor the names of its
   * contributors may be used to endorse or promote products derived from this
   * software without specific prior written permission.
   *
   * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
   * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
   * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
   * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
   * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
   * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
   * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
   * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
   * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
   * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
   * THE POSSIBILITY OF SUCH DAMAGE.
   */
  #ifndef COROSYNC_SAM_H_DEFINED
  #define COROSYNC_SAM_H_DEFINED

  #include <stddef.h> /* size_t, used by the sam_data_* prototypes */

  #include <corosync/corotypes.h>

  #ifdef __cplusplus
  extern "C" {
  #endif
  /**
   * Recovery policy passed to #sam_initialize.
   *
   * SAM_RECOVERY_POLICY_QUIT and SAM_RECOVERY_POLICY_RESTART are the base
   * policies. SAM_RECOVERY_POLICY_QUORUM and SAM_RECOVERY_POLICY_CONFDB are
   * separate bits that are OR-ed with a base policy; the two
   * SAM_RECOVERY_POLICY_QUORUM_* enumerators are the predefined combinations.
   *
   * The last enumerator deliberately has no trailing comma, so that the header
   * is also accepted by strict C90 and C++03 compilers.
   */
  typedef enum {
      /** Just stop the application. */
      SAM_RECOVERY_POLICY_QUIT = 1,
      /** Kill the application and start a new instance. */
      SAM_RECOVERY_POLICY_RESTART = 2,
      /** Flag bit, combined with QUIT or RESTART in the two values below. */
      SAM_RECOVERY_POLICY_QUORUM = 0x08,
      SAM_RECOVERY_POLICY_QUORUM_QUIT = SAM_RECOVERY_POLICY_QUORUM | SAM_RECOVERY_POLICY_QUIT,
      SAM_RECOVERY_POLICY_QUORUM_RESTART = SAM_RECOVERY_POLICY_QUORUM | SAM_RECOVERY_POLICY_RESTART,
      /** Flag bit; must be set in the policy for #sam_mark_failed to be usable. */
      SAM_RECOVERY_POLICY_CONFDB = 0x10
  } sam_recovery_policy_t;
  /**
   * Callback definition for event driven healthchecking.
   *
   * The callback takes no arguments. It must return 0 when the healthcheck is
   * correct, or a value different from 0 when something went wrong.
   */
  typedef int (*sam_hc_callback_t)(void);
  52. /**
  53. * Create a new SAM connection.
  54. *
  55. * This function must be called before any other.
  56. * It is recommended to call it as one of first in application.
  57. *
  58. * @param time_interval Time interval in miliseconds of healthcheck. After this time, application
  59. * will be killed and recovery policy will be taken. This can be zero, which means,
  60. * that there is no time limit (only fall of application is checked and only then
  61. * recovery action is taken)
  62. * @param recovery_policy One of SAM_RECOVERY_POLICY_RESTART, which means, that after
  63. * timeout application will be killed and new instance will be started.
  64. * SAM_RECOVERY_POLICY_QUIT will just stop application
  65. *
  66. * @retval CS_OK in case no problem appeared
  67. * @retval CS_ERR_BAD_HANDLE in case user is trying to initialize initialized instance
  68. * @retval CS_ERR_INVALID_PARAM in case recovery_policy had bad value
  69. */
  70. cs_error_t sam_initialize (
  71. int time_interval,
  72. sam_recovery_policy_t recovery_policy);
  73. /**
  74. * Close the SAM handle.
  75. *
  76. * This function should be called as late as possible.
  77. * (in reality, if you plan just quit, and checking is stopped, there is no need
  78. * to call it). Function will stop healtchecking and put library to state, where
  79. * no new start is possible.
  80. *
  81. * @retval CS_OK in case no problem appeared
  82. * @retval CS_ERR_BAD_HANDLE library was not initialized by #sam_initialize
  83. */
  84. cs_error_t sam_finalize (void);
  85. /**
  86. * Start healthchecking.
  87. *
  88. * From this time, you should call every time_interval
  89. * sam_hc_send, otherwise, recovery action will be taken.
  90. *
  91. * @retval CS_OK in case no problem appeared
  92. * @retval CS_ERR_BAD_HANDLE component was not registered by #sam_register
  93. */
  94. cs_error_t sam_start (void);
  95. /**
  96. * Stop healthchecking.
  97. *
  98. * Oposite of #sam_start. You can call sam_start and sam_stop how many
  99. * times you want.
  100. *
  101. * @retval CS_OK in case no problem appeared
  102. * @retval CS_ERR_BAD_HANDLE healthchecking is not in running state (no sam_start
  103. * was called)
  104. */
  105. cs_error_t sam_stop (void);
  106. /**
  107. * Set warning signal to be send.
  108. *
  109. * Default signal is SIGTERM. You can use SIGKILL to emulate NOT sending
  110. * warning signal and just send SIGKILL.
  111. *
  112. * @retval CS_OK in case no problem appeared
  113. * @retval CS_ERR_BAD_HANDLE library was not initialized by #sam_initialize or
  114. * is finalized
  115. */
  116. cs_error_t sam_warn_signal_set (int warn_signal);
  117. /**
  118. * Register application.
  119. *
  120. * This is one of most crucial function. In case, your
  121. * application will be restarted, you will always return to point after calling
  122. * this function. This function can be called only once, and SAM must be initialized
  123. * by sam_initialize. You can choose any place in your application, where to call
  124. * this function.
  125. *
  126. * @param instance_id NULL or pointer to int memory, where current instance
  127. * of application will be returned. It's always safe to suppose, that first instance
  128. * (this means, no recovery action was taken yet) will be always 1 and instance_id
  129. * will be raising up to MAX_INT (after this, it will fall to 0).
  130. *
  131. * @retval CS_OK in case no problem appeared
  132. * @retval CS_ERR_BAD_HANDLE in case, you call this function twice, or before sam_init
  133. * @retval CS_ERR_LIBRARY internal library call failed. This can be one of pipe or fork
  134. * creation. You can get more information from errno
  135. */
  136. cs_error_t sam_register (
  137. unsigned int *instance_id);
  138. /**
  139. * Send healthcheck confirmation.
  140. *
  141. * This should be called after #sam_start
  142. *
  143. * @retval CS_OK in case no problem appeared
  144. * @retval CS_ERR_BAD_HANDLE healthchecking is not in running state (no sam_start was
  145. * called, or called after sam_stop/sam_finalize)
  146. */
  147. cs_error_t sam_hc_send (void);
  148. /**
  149. * Register healtcheck callback.
  150. *
  151. * After you will call this function, and set
  152. * cb to something else then NULL, SAM is automatically switched from
  153. * application driven healtchecking to event driven healtchecking. In other
  154. * words, is not longer needed to call sam_hc_send, but your callback function
  155. * must return 0 in case of healtchecking is correct, or value different then
  156. * 0, in case something happend. After next hc iteration, warning signal and
  157. * after that kill signal is sent back to your application.
  158. *
  159. * @param cb Pointer to healtcheck function, or NULL to switch back to application driven hc
  160. *
  161. * @retval CS_OK in case no problem appeared
  162. * @retval CS_ERR_BAD_HANDLE in case, you call this function before sam_init or after sam_start
  163. * @retval CS_ERR_LIBRARY internal library call failed. This can be one of pipe or pthread
  164. * creation.
  165. */
  166. cs_error_t sam_hc_callback_register (sam_hc_callback_t cb);
  167. /**
  168. * Return size of stored data.
  169. *
  170. * @param size Pointer to variable, where stored data size is returned. If
  171. * nothing or NULL is stored, then 0 is returned.
  172. *
  173. * @retval CS_OK in case no problem appeared
  174. * @retval CS_ERR_BAD_HANDLE in case you call this function before sam_init or after
  175. * sam_finalize
  176. * @retval CS_ERR_INVALID_PARAM if size parameter is NULL
  177. */
  178. cs_error_t sam_data_getsize (size_t *size);
  179. /**
  180. * Return stored data.
  181. *
  182. * @param data Pointer to place, where to store data
  183. * @param size Allocated size of data
  184. *
  185. * @retval CS_OK if no problem appeared
  186. * @retval CS_ERR_BAD_HANDLE if you call this function before sam_init or after sam_finalize
  187. * @retval CS_ERR_INVALID_PARAM if data is NULL or size is less then currently saved user data length
  188. */
  189. cs_error_t sam_data_restore (
  190. void *data,
  191. size_t size);
  192. /**
  193. * Store user data.
  194. *
  195. * Such stored data survives restart of child.
  196. *
  197. * @param data Data to store. You can use NULL to delete data
  198. * @param size Size of data to store.
  199. *
  200. * @retval CS_OK in case no problem appeared
  201. * @retval CS_ERR_BAD_HANDLE if you call this function before sam_init or
  202. * after sam_finalize
  203. * @retval CS_ERR_NO_MEMORY if data is too large and malloc/realloc was not
  204. * sucesfull
  205. * @retval CS_ERR_LIBRARY if some internal error appeared (communication with parent
  206. * process)
  207. */
  208. cs_error_t sam_data_store (
  209. const void *data,
  210. size_t size);
  211. /**
  212. * Marks child as failed.
  213. *
  214. * This can be called only with SAM_RECOVERY_POLICY_CONFDB flag set and
  215. * makes sense only for SAM_RECOVERY_POLICY_RESTART. This will kill child without sending warn
  216. * signal. Confdb state key will be set to failed.
  217. *
  218. * @retval CS_OK in case no problem appeared
  219. * @retval CS_ERR_BAD_HANDLE library was not initialized or was already finalized
  220. * @retval CS_ERR_INVALID_PARAM recovery policy doesn't has SAM_RECOVERY_POLICY_CONFDB flag set
  221. * @retval CS_ERR_LIBRARY if some internal error appeared (communication with parent
  222. * process)
  223. */
  224. cs_error_t sam_mark_failed (void);
  225. #ifdef __cplusplus
  226. }
  227. #endif
  228. #endif /* COROSYNC_SAM_H_DEFINED */