corolab.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324
  1. #!/usr/bin/python
  2. '''CTS: Cluster Testing System: Lab environment module
  3. '''
  4. __copyright__='''
  5. Copyright (c) 2010 Red Hat, Inc.
  6. '''
  7. # All rights reserved.
  8. #
  9. # Author: Angus Salkeld <asalkeld@redhat.com>
  10. #
  11. # This software licensed under BSD license, the text of which follows:
  12. #
  13. # Redistribution and use in source and binary forms, with or without
  14. # modification, are permitted provided that the following conditions are met:
  15. #
  16. # - Redistributions of source code must retain the above copyright notice,
  17. # this list of conditions and the following disclaimer.
  18. # - Redistributions in binary form must reproduce the above copyright notice,
  19. # this list of conditions and the following disclaimer in the documentation
  20. # and/or other materials provided with the distribution.
  21. # - Neither the name of the MontaVista Software, Inc. nor the names of its
  22. # contributors may be used to endorse or promote products derived from this
  23. # software without specific prior written permission.
  24. #
  25. # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  26. # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  27. # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  28. # ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  29. # LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  30. # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  31. # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  32. # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  33. # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  34. # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  35. # THE POSSIBILITY OF SUCH DAMAGE.
  36. import sys
  37. from cts.CTSscenarios import *
  38. from corotests import CoroTestList
  39. from corosync import *
  40. sys.path.append("/usr/share/pacemaker/tests/cts") # So that things work from the source directory
  41. try:
  42. from CTSlab import *
  43. except ImportError:
  44. sys.stderr.write("abort: couldn't find CTSLab in [%s]\n" %
  45. ' '.join(sys.path))
  46. sys.stderr.write("(check your install and PYTHONPATH)\n")
  47. sys.exit(-1)
  48. tests = None
  49. cm = None
  50. old_handler = None
  51. DefaultFacility = "daemon"
  52. def usage(arg):
  53. print "Illegal argument " + arg
  54. print "usage: " + sys.argv[0] +" [options] number-of-iterations"
  55. print "\nCommon options: "
  56. print "\t [--at-boot (1|0)], does the cluster software start at boot time"
  57. print "\t [--nodes 'node list'], list of cluster nodes separated by whitespace"
  58. print "\t [--limit-nodes max], only use the first 'max' cluster nodes supplied with --nodes"
  59. print "\t [--logfile path], where should the test software look for logs from cluster nodes"
  60. print "\t [--rrp-bindaddr addr], extra interface used for rrp, provide the bindaddr"
  61. print "\t [--outputfile path], optional location for the test software to write logs to"
  62. print "\t [--syslog-facility name], which syslog facility should the test software log to"
  63. print "\t [--choose testcase-name], run only the named test"
  64. print "\t [--list-tests], list the valid tests"
  65. print "\t [--benchmark], add the timing information"
  66. print "\t "
  67. print "Additional (less common) options: "
  68. print "\t [--trunc (truncate logfile before starting)]"
  69. print "\t [--xmit-loss lost-rate(0.0-1.0)]"
  70. print "\t [--recv-loss lost-rate(0.0-1.0)]"
  71. print "\t [--standby (1 | 0 | yes | no)]"
  72. print "\t [--fencing (1 | 0 | yes | no)]"
  73. print "\t [--once], run all valid tests once"
  74. print "\t [--no-loop-tests], dont run looping/time-based tests"
  75. print "\t [--no-unsafe-tests], dont run tests that are unsafe for use with ocfs2/drbd"
  76. print "\t [--valgrind-tests], include tests using valgrind"
  77. print "\t [--experimental-tests], include experimental tests"
  78. print "\t [--oprofile 'node list'], list of cluster nodes to run oprofile on]"
  79. print "\t [--qarsh] Use the QARSH backdoor to access nodes instead of SSH"
  80. print "\t [--seed random_seed]"
  81. print "\t [--set option=value]"
  82. sys.exit(1)
  83. class CoroLabEnvironment(CtsLab):
  84. def __init__(self):
  85. CtsLab.__init__(self)
  86. # Get a random seed for the random number generator.
  87. self["DoStonith"] = 0
  88. self["DoStandby"] = 0
  89. self["DoFencing"] = 0
  90. self["XmitLoss"] = "0.0"
  91. self["RecvLoss"] = "0.0"
  92. self["IPBase"] = "127.0.0.10"
  93. self["ClobberCIB"] = 0
  94. self["CIBfilename"] = None
  95. self["CIBResource"] = 0
  96. self["DoBSC"] = 0
  97. self["use_logd"] = 0
  98. self["oprofile"] = []
  99. self["RrpBindAddr"] = None
  100. self["warn-inactive"] = 0
  101. self["ListTests"] = 0
  102. self["benchmark"] = 0
  103. self["logrestartcmd"] = "systemctl restart rsyslog.service 2>&1 > /dev/null"
  104. self["syslogd"] ="rsyslog"
  105. self["Schema"] = "corosync 2.0"
  106. self["Stack"] = "corosync (needle)"
  107. self['CMclass'] = corosync_needle
  108. self["stonith-type"] = "external/ssh"
  109. self["stonith-params"] = "hostlist=all,livedangerously=yes"
  110. self["at-boot"] = 0 # Does the cluster software start automatically when the node boot
  111. self["logger"] = ([StdErrLog(self)])
  112. self["loop-minutes"] = 60
  113. self["valgrind-prefix"] = None
  114. self["valgrind-procs"] = "corosync"
  115. self["valgrind-opts"] = """--leak-check=full --show-reachable=yes --trace-children=no --num-callers=25 --gen-suppressions=all --suppressions="""+CTSvars.CTS_home+"""/cts.supp"""
  116. self["experimental-tests"] = 0
  117. self["valgrind-tests"] = 0
  118. self["unsafe-tests"] = 0
  119. self["loop-tests"] = 0
  120. self["all-once"] = 0
  121. self["LogWatcher"] = "remote"
  122. self["SyslogFacility"] = DefaultFacility
  123. #
  124. # Main entry into the test system.
  125. #
  126. if __name__ == '__main__':
  127. Environment = CoroLabEnvironment()
  128. NumIter = 0
  129. Version = 1
  130. LimitNodes = 0
  131. TestCase = None
  132. TruncateLog = 0
  133. ListTests = 0
  134. HaveSeed = 0
  135. node_list = ''
  136. #
  137. # The values of the rest of the parameters are now properly derived from
  138. # the configuration files.
  139. #
  140. # Set the signal handler
  141. signal.signal(15, sig_handler)
  142. signal.signal(10, sig_handler)
  143. # Process arguments...
  144. skipthis=None
  145. args=sys.argv[1:]
  146. for i in range(0, len(args)):
  147. if skipthis:
  148. skipthis=None
  149. continue
  150. elif args[i] == "-l" or args[i] == "--limit-nodes":
  151. skipthis=1
  152. LimitNodes = int(args[i+1])
  153. elif args[i] == "-L" or args[i] == "--logfile":
  154. skipthis=1
  155. Environment["LogFileName"] = args[i+1]
  156. elif args[i] == "--outputfile":
  157. skipthis=1
  158. Environment["OutputFile"] = args[i+1]
  159. elif args[i] == "--rrp-bindaddr":
  160. skipthis=1
  161. Environment["RrpBindAddr"] = args[i+1]
  162. elif args[i] == "--oprofile":
  163. skipthis=1
  164. Environment["oprofile"] = args[i+1].split(' ')
  165. elif args[i] == "--trunc":
  166. Environment["TruncateLog"]=1
  167. elif args[i] == "--list-tests":
  168. Environment["ListTests"]=1
  169. elif args[i] == "--benchmark":
  170. Environment["benchmark"]=1
  171. elif args[i] == "--qarsh":
  172. Environment.rsh.enable_qarsh()
  173. elif args[i] == "--fencing":
  174. skipthis=1
  175. if args[i+1] == "1" or args[i+1] == "yes":
  176. Environment["DoFencing"] = 1
  177. elif args[i+1] == "0" or args[i+1] == "no":
  178. Environment["DoFencing"] = 0
  179. else:
  180. usage(args[i+1])
  181. elif args[i] == "--xmit-loss":
  182. try:
  183. float(args[i+1])
  184. except ValueError:
  185. print ("--xmit-loss parameter should be float")
  186. usage(args[i+1])
  187. skipthis=1
  188. Environment["XmitLoss"] = args[i+1]
  189. elif args[i] == "--recv-loss":
  190. try:
  191. float(args[i+1])
  192. except ValueError:
  193. print ("--recv-loss parameter should be float")
  194. usage(args[i+1])
  195. skipthis=1
  196. Environment["RecvLoss"] = args[i+1]
  197. elif args[i] == "--choose":
  198. skipthis=1
  199. TestCase = args[i+1]
  200. elif args[i] == "--nodes":
  201. skipthis=1
  202. node_list = args[i+1].split(' ')
  203. elif args[i] == "--at-boot" or args[i] == "--cluster-starts-at-boot":
  204. skipthis=1
  205. if args[i+1] == "1" or args[i+1] == "yes":
  206. Environment["at-boot"] = 1
  207. elif args[i+1] == "0" or args[i+1] == "no":
  208. Environment["at-boot"] = 0
  209. else:
  210. usage(args[i+1])
  211. elif args[i] == "--set":
  212. skipthis=1
  213. (name, value) = args[i+1].split('=')
  214. Environment[name] = value
  215. else:
  216. try:
  217. NumIter=int(args[i])
  218. except ValueError:
  219. usage(args[i])
  220. if Environment["OutputFile"]:
  221. Environment["logger"].append(FileLog(Environment, Environment["OutputFile"]))
  222. if len(node_list) < 1:
  223. print "No nodes specified!"
  224. sys.exit(1)
  225. if LimitNodes > 0:
  226. if len(node_list) > LimitNodes:
  227. print("Limiting the number of nodes configured=%d (max=%d)"
  228. %(len(node_list), LimitNodes))
  229. while len(node_list) > LimitNodes:
  230. node_list.pop(len(node_list)-1)
  231. Environment["nodes"] = node_list
  232. # Create the Cluster Manager object
  233. cm = Environment['CMclass'](Environment)
  234. Audits = CoroAuditList(cm)
  235. if Environment["ListTests"] == 1 :
  236. Tests = CoroTestList(cm, Audits)
  237. Environment.log("Total %d tests"%len(Tests))
  238. for test in Tests :
  239. Environment.log(str(test.name));
  240. sys.exit(0)
  241. if TruncateLog:
  242. Environment.log("Truncating %s" % LogFile)
  243. lf = open(LogFile, "w");
  244. if lf != None:
  245. lf.truncate(0)
  246. lf.close()
  247. if TestCase != None:
  248. for test in CoroTestList(cm, Audits):
  249. if test.name == TestCase:
  250. Tests.append(test)
  251. if Tests == []:
  252. usage("--choose: No applicable/valid tests chosen")
  253. else:
  254. Tests = CoroTestList(cm, Audits)
  255. # Scenario selection
  256. if Environment["DoBSC"]:
  257. scenario = RandomTests(cm, [ BasicSanityCheck(Environment) ], Audits, Tests)
  258. elif Environment["all-once"] or NumIter == 0:
  259. NumIter = len(Tests)
  260. scenario = AllOnce(
  261. cm, [ InitClusterManager(Environment), TestAgentComponent(Environment), PacketLoss(Environment) ], Audits, Tests)
  262. else:
  263. scenario = RandomTests(
  264. cm, [ InitClusterManager(Environment), TestAgentComponent(Environment), PacketLoss(Environment) ], Audits, Tests)
  265. Environment.log(">>>>>>>>>>>>>>>> BEGINNING " + repr(NumIter) + " TESTS ")
  266. Environment.log("Stack: %s" % Environment["Stack"])
  267. Environment.log("Schema: %s" % Environment["Schema"])
  268. Environment.log("Scenario: %s" % scenario.__doc__)
  269. Environment.log("Random Seed: %s" % Environment["RandSeed"])
  270. Environment.log("System log files: %s" % Environment["LogFileName"])
  271. Environment.dump()
  272. rc = Environment.run(scenario, NumIter)
  273. sys.exit(rc)