corolab.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318
  1. #!/usr/bin/python
  2. '''CTS: Cluster Testing System: Lab environment module
  3. '''
  4. __copyright__='''
  5. Copyright (c) 2010 Red Hat, Inc.
  6. '''
  7. # All rights reserved.
  8. #
  9. # Author: Angus Salkeld <asalkeld@redhat.com>
  10. #
  11. # This software licensed under BSD license, the text of which follows:
  12. #
  13. # Redistribution and use in source and binary forms, with or without
  14. # modification, are permitted provided that the following conditions are met:
  15. #
  16. # - Redistributions of source code must retain the above copyright notice,
  17. # this list of conditions and the following disclaimer.
  18. # - Redistributions in binary form must reproduce the above copyright notice,
  19. # this list of conditions and the following disclaimer in the documentation
  20. # and/or other materials provided with the distribution.
  21. # - Neither the name of the MontaVista Software, Inc. nor the names of its
  22. # contributors may be used to endorse or promote products derived from this
  23. # software without specific prior written permission.
  24. #
  25. # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
  26. # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
  27. # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
  28. # ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
  29. # LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
  30. # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
  31. # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
  32. # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  33. # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
  34. # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
  35. # THE POSSIBILITY OF SUCH DAMAGE.
  36. import sys
  37. from cts.CTSaudits import AuditList
  38. from cts.CTSscenarios import *
  39. from corotests import CoroTestList
  40. from corosync import *
  41. sys.path.append("/usr/share/pacemaker/tests/cts") # So that things work from the source directory
  42. try:
  43. from CTSlab import *
  44. except ImportError:
  45. sys.stderr.write("abort: couldn't find CTSLab in [%s]\n" %
  46. ' '.join(sys.path))
  47. sys.stderr.write("(check your install and PYTHONPATH)\n")
  48. sys.exit(-1)
  49. tests = None
  50. cm = None
  51. old_handler = None
  52. DefaultFacility = "daemon"
  53. def usage(arg):
  54. print "Illegal argument " + arg
  55. print "usage: " + sys.argv[0] +" [options] number-of-iterations"
  56. print "\nCommon options: "
  57. print "\t [--at-boot (1|0)], does the cluster software start at boot time"
  58. print "\t [--nodes 'node list'], list of cluster nodes separated by whitespace"
  59. print "\t [--limit-nodes max], only use the first 'max' cluster nodes supplied with --nodes"
  60. print "\t [--logfile path], where should the test software look for logs from cluster nodes"
  61. print "\t [--outputfile path], optional location for the test software to write logs to"
  62. print "\t [--syslog-facility name], which syslog facility should the test software log to"
  63. print "\t [--choose testcase-name], run only the named test"
  64. print "\t [--list-tests], list the valid tests"
  65. print "\t [--benchmark], add the timing information"
  66. print "\t "
  67. print "Additional (less common) options: "
  68. print "\t [--trunc (truncate logfile before starting)]"
  69. print "\t [--xmit-loss lost-rate(0.0-1.0)]"
  70. print "\t [--recv-loss lost-rate(0.0-1.0)]"
  71. print "\t [--standby (1 | 0 | yes | no)]"
  72. print "\t [--fencing (1 | 0 | yes | no)]"
  73. print "\t [--once], run all valid tests once"
  74. print "\t [--no-loop-tests], dont run looping/time-based tests"
  75. print "\t [--no-unsafe-tests], dont run tests that are unsafe for use with ocfs2/drbd"
  76. print "\t [--valgrind-tests], include tests using valgrind"
  77. print "\t [--experimental-tests], include experimental tests"
  78. print "\t [--oprofile 'node list'], list of cluster nodes to run oprofile on]"
  79. print "\t [--qarsh] Use the QARSH backdoor to access nodes instead of SSH"
  80. print "\t [--seed random_seed]"
  81. print "\t [--set option=value]"
  82. sys.exit(1)
  83. class CoroLabEnvironment(CtsLab):
  84. def __init__(self):
  85. CtsLab.__init__(self)
  86. # Get a random seed for the random number generator.
  87. self["DoStonith"] = 0
  88. self["DoStandby"] = 0
  89. self["DoFencing"] = 0
  90. self["XmitLoss"] = "0.0"
  91. self["RecvLoss"] = "0.0"
  92. self["IPBase"] = "127.0.0.10"
  93. self["ClobberCIB"] = 0
  94. self["CIBfilename"] = None
  95. self["CIBResource"] = 0
  96. self["DoBSC"] = 0
  97. self["use_logd"] = 0
  98. self["oprofile"] = []
  99. self["warn-inactive"] = 0
  100. self["ListTests"] = 0
  101. self["benchmark"] = 0
  102. self["logrestartcmd"] = "/etc/init.d/rsyslog restart 2>&1 > /dev/null"
  103. self["Schema"] = "corosync 1.2"
  104. self["Stack"] = "corosync (flatiron)"
  105. self['CMclass'] = corosync_flatiron
  106. self["stonith-type"] = "external/ssh"
  107. self["stonith-params"] = "hostlist=all,livedangerously=yes"
  108. self["at-boot"] = 0 # Does the cluster software start automatically when the node boot
  109. self["logger"] = ([StdErrLog(self)])
  110. self["loop-minutes"] = 60
  111. self["valgrind-prefix"] = None
  112. self["valgrind-procs"] = "corosync"
  113. self["valgrind-opts"] = """--leak-check=full --show-reachable=yes --trace-children=no --num-callers=25 --gen-suppressions=all --suppressions="""+CTSvars.CTS_home+"""/cts.supp"""
  114. self["experimental-tests"] = 0
  115. self["valgrind-tests"] = 0
  116. self["unsafe-tests"] = 0
  117. self["loop-tests"] = 0
  118. self["all-once"] = 1
  119. self["LogWatcher"] = "remote"
  120. self["SyslogFacility"] = DefaultFacility
  121. #
  122. # Main entry into the test system.
  123. #
  124. if __name__ == '__main__':
  125. Environment = CoroLabEnvironment()
  126. NumIter = 0
  127. Version = 1
  128. LimitNodes = 0
  129. TestCase = None
  130. TruncateLog = 0
  131. ListTests = 0
  132. HaveSeed = 0
  133. node_list = ''
  134. #
  135. # The values of the rest of the parameters are now properly derived from
  136. # the configuration files.
  137. #
  138. # Set the signal handler
  139. signal.signal(15, sig_handler)
  140. signal.signal(10, sig_handler)
  141. # Process arguments...
  142. skipthis=None
  143. args=sys.argv[1:]
  144. for i in range(0, len(args)):
  145. if skipthis:
  146. skipthis=None
  147. continue
  148. elif args[i] == "-l" or args[i] == "--limit-nodes":
  149. skipthis=1
  150. LimitNodes = int(args[i+1])
  151. elif args[i] == "-L" or args[i] == "--logfile":
  152. skipthis=1
  153. Environment["LogFileName"] = args[i+1]
  154. elif args[i] == "--outputfile":
  155. skipthis=1
  156. Environment["OutputFile"] = args[i+1]
  157. elif args[i] == "--oprofile":
  158. skipthis=1
  159. Environment["oprofile"] = args[i+1].split(' ')
  160. elif args[i] == "--trunc":
  161. Environment["TruncateLog"]=1
  162. elif args[i] == "--list-tests":
  163. Environment["ListTests"]=1
  164. elif args[i] == "--benchmark":
  165. Environment["benchmark"]=1
  166. elif args[i] == "--qarsh":
  167. Environment.rsh.enable_qarsh()
  168. elif args[i] == "--fencing":
  169. skipthis=1
  170. if args[i+1] == "1" or args[i+1] == "yes":
  171. Environment["DoFencing"] = 1
  172. elif args[i+1] == "0" or args[i+1] == "no":
  173. Environment["DoFencing"] = 0
  174. else:
  175. usage(args[i+1])
  176. elif args[i] == "--xmit-loss":
  177. try:
  178. float(args[i+1])
  179. except ValueError:
  180. print ("--xmit-loss parameter should be float")
  181. usage(args[i+1])
  182. skipthis=1
  183. Environment["XmitLoss"] = args[i+1]
  184. elif args[i] == "--recv-loss":
  185. try:
  186. float(args[i+1])
  187. except ValueError:
  188. print ("--recv-loss parameter should be float")
  189. usage(args[i+1])
  190. skipthis=1
  191. Environment["RecvLoss"] = args[i+1]
  192. elif args[i] == "--choose":
  193. skipthis=1
  194. TestCase = args[i+1]
  195. elif args[i] == "--nodes":
  196. skipthis=1
  197. node_list = args[i+1].split(' ')
  198. elif args[i] == "--at-boot" or args[i] == "--cluster-starts-at-boot":
  199. skipthis=1
  200. if args[i+1] == "1" or args[i+1] == "yes":
  201. Environment["at-boot"] = 1
  202. elif args[i+1] == "0" or args[i+1] == "no":
  203. Environment["at-boot"] = 0
  204. else:
  205. usage(args[i+1])
  206. elif args[i] == "--set":
  207. skipthis=1
  208. (name, value) = args[i+1].split('=')
  209. Environment[name] = value
  210. else:
  211. try:
  212. NumIter=int(args[i])
  213. except ValueError:
  214. usage(args[i])
  215. if Environment["OutputFile"]:
  216. Environment["logger"].append(FileLog(Environment, Environment["OutputFile"]))
  217. if len(node_list) < 1:
  218. print "No nodes specified!"
  219. sys.exit(1)
  220. if LimitNodes > 0:
  221. if len(node_list) > LimitNodes:
  222. print("Limiting the number of nodes configured=%d (max=%d)"
  223. %(len(node_list), LimitNodes))
  224. while len(node_list) > LimitNodes:
  225. node_list.pop(len(node_list)-1)
  226. Environment["nodes"] = node_list
  227. # Create the Cluster Manager object
  228. cm = Environment['CMclass'](Environment)
  229. Audits = AuditList(cm)
  230. if Environment["ListTests"] == 1 :
  231. Tests = CoroTestList(cm, Audits)
  232. Environment.log("Total %d tests"%len(Tests))
  233. for test in Tests :
  234. Environment.log(str(test.name));
  235. sys.exit(0)
  236. if TruncateLog:
  237. Environment.log("Truncating %s" % LogFile)
  238. lf = open(LogFile, "w");
  239. if lf != None:
  240. lf.truncate(0)
  241. lf.close()
  242. if TestCase != None:
  243. for test in CoroTestList(cm, Audits):
  244. if test.name == TestCase:
  245. Tests.append(test)
  246. if Tests == []:
  247. usage("--choose: No applicable/valid tests chosen")
  248. else:
  249. Tests = CoroTestList(cm, Audits)
  250. # Scenario selection
  251. if Environment["DoBSC"]:
  252. scenario = RandomTests(cm, [ BasicSanityCheck(Environment) ], Audits, Tests)
  253. elif Environment["all-once"] or NumIter == 0:
  254. NumIter = len(Tests)
  255. scenario = AllOnce(
  256. cm, [ InitClusterManager(Environment), TestAgentComponent(Environment), PacketLoss(Environment) ], Audits, Tests)
  257. else:
  258. scenario = RandomTests(
  259. cm, [ InitClusterManager(Environment), TestAgentComponent(Environment), PacketLoss(Environment) ], Audits, Tests)
  260. Environment.log(">>>>>>>>>>>>>>>> BEGINNING " + repr(NumIter) + " TESTS ")
  261. Environment.log("Stack: %s" % Environment["Stack"])
  262. Environment.log("Schema: %s" % Environment["Schema"])
  263. Environment.log("Scenario: %s" % scenario.__doc__)
  264. Environment.log("Random Seed: %s" % Environment["RandSeed"])
  265. Environment.log("System log files: %s" % Environment["LogFileName"])
  266. Environment.dump()
  267. rc = Environment.run(scenario, NumIter)
  268. sys.exit(rc)