bitbake-worker 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447
  1. #!/usr/bin/env python
  2. import os
  3. import sys
  4. import warnings
  5. sys.path.insert(0, os.path.join(os.path.dirname(os.path.dirname(sys.argv[0])), 'lib'))
  6. from bb import fetch2
  7. import logging
  8. import bb
  9. import select
  10. import errno
  11. import signal
  12. from multiprocessing import Lock
  13. # Users shouldn't be running this code directly
  14. if len(sys.argv) != 2 or not sys.argv[1].startswith("decafbad"):
  15. print("bitbake-worker is meant for internal execution by bitbake itself, please don't use it standalone.")
  16. sys.exit(1)
  17. profiling = False
  18. if sys.argv[1].startswith("decafbadbad"):
  19. profiling = True
  20. try:
  21. import cProfile as profile
  22. except:
  23. import profile
  24. # Unbuffer stdout to avoid log truncation in the event
  25. # of an unorderly exit as well as to provide timely
  26. # updates to log files for use with tail
  27. try:
  28. if sys.stdout.name == '<stdout>':
  29. sys.stdout = os.fdopen(sys.stdout.fileno(), 'w', 0)
  30. except:
  31. pass
  32. logger = logging.getLogger("BitBake")
  33. try:
  34. import cPickle as pickle
  35. except ImportError:
  36. import pickle
  37. bb.msg.note(1, bb.msg.domain.Cache, "Importing cPickle failed. Falling back to a very slow implementation.")
  38. worker_pipe = sys.stdout.fileno()
  39. bb.utils.nonblockingfd(worker_pipe)
  40. # Need to guard against multiprocessing being used in child processes
  41. # and multiple processes trying to write to the parent at the same time
  42. worker_pipe_lock = None
  43. handler = bb.event.LogHandler()
  44. logger.addHandler(handler)
  45. if 0:
  46. # Code to write out a log file of all events passing through the worker
  47. logfilename = "/tmp/workerlogfile"
  48. format_str = "%(levelname)s: %(message)s"
  49. conlogformat = bb.msg.BBLogFormatter(format_str)
  50. consolelog = logging.FileHandler(logfilename)
  51. bb.msg.addDefaultlogFilter(consolelog)
  52. consolelog.setFormatter(conlogformat)
  53. logger.addHandler(consolelog)
  54. worker_queue = ""
  55. def worker_fire(event, d):
  56. data = "<event>" + pickle.dumps(event) + "</event>"
  57. worker_fire_prepickled(data)
  58. def worker_fire_prepickled(event):
  59. global worker_queue
  60. worker_queue = worker_queue + event
  61. worker_flush()
  62. def worker_flush():
  63. global worker_queue, worker_pipe
  64. if not worker_queue:
  65. return
  66. try:
  67. written = os.write(worker_pipe, worker_queue)
  68. worker_queue = worker_queue[written:]
  69. except (IOError, OSError) as e:
  70. if e.errno != errno.EAGAIN and e.errno != errno.EPIPE:
  71. raise
  72. def worker_child_fire(event, d):
  73. global worker_pipe
  74. global worker_pipe_lock
  75. data = "<event>" + pickle.dumps(event) + "</event>"
  76. try:
  77. worker_pipe_lock.acquire()
  78. worker_pipe.write(data)
  79. worker_pipe_lock.release()
  80. except IOError:
  81. sigterm_handler(None, None)
  82. raise
  83. bb.event.worker_fire = worker_fire
  84. lf = None
  85. #lf = open("/tmp/workercommandlog", "w+")
  86. def workerlog_write(msg):
  87. if lf:
  88. lf.write(msg)
  89. lf.flush()
  90. def sigterm_handler(signum, frame):
  91. signal.signal(signal.SIGTERM, signal.SIG_DFL)
  92. os.killpg(0, signal.SIGTERM)
  93. sys.exit()
  94. def fork_off_task(cfg, data, workerdata, fn, task, taskname, appends, taskdepdata, quieterrors=False):
  95. # We need to setup the environment BEFORE the fork, since
  96. # a fork() or exec*() activates PSEUDO...
  97. envbackup = {}
  98. fakeenv = {}
  99. umask = None
  100. taskdep = workerdata["taskdeps"][fn]
  101. if 'umask' in taskdep and taskname in taskdep['umask']:
  102. # umask might come in as a number or text string..
  103. try:
  104. umask = int(taskdep['umask'][taskname],8)
  105. except TypeError:
  106. umask = taskdep['umask'][taskname]
  107. # We can't use the fakeroot environment in a dry run as it possibly hasn't been built
  108. if 'fakeroot' in taskdep and taskname in taskdep['fakeroot'] and not cfg.dry_run:
  109. envvars = (workerdata["fakerootenv"][fn] or "").split()
  110. for key, value in (var.split('=') for var in envvars):
  111. envbackup[key] = os.environ.get(key)
  112. os.environ[key] = value
  113. fakeenv[key] = value
  114. fakedirs = (workerdata["fakerootdirs"][fn] or "").split()
  115. for p in fakedirs:
  116. bb.utils.mkdirhier(p)
  117. logger.debug(2, 'Running %s:%s under fakeroot, fakedirs: %s' %
  118. (fn, taskname, ', '.join(fakedirs)))
  119. else:
  120. envvars = (workerdata["fakerootnoenv"][fn] or "").split()
  121. for key, value in (var.split('=') for var in envvars):
  122. envbackup[key] = os.environ.get(key)
  123. os.environ[key] = value
  124. fakeenv[key] = value
  125. sys.stdout.flush()
  126. sys.stderr.flush()
  127. try:
  128. pipein, pipeout = os.pipe()
  129. pipein = os.fdopen(pipein, 'rb', 4096)
  130. pipeout = os.fdopen(pipeout, 'wb', 0)
  131. pid = os.fork()
  132. except OSError as e:
  133. bb.msg.fatal("RunQueue", "fork failed: %d (%s)" % (e.errno, e.strerror))
  134. if pid == 0:
  135. def child():
  136. global worker_pipe
  137. global worker_pipe_lock
  138. pipein.close()
  139. signal.signal(signal.SIGTERM, sigterm_handler)
  140. # Let SIGHUP exit as SIGTERM
  141. signal.signal(signal.SIGHUP, sigterm_handler)
  142. bb.utils.signal_on_parent_exit("SIGTERM")
  143. # Save out the PID so that the event can include it the
  144. # events
  145. bb.event.worker_pid = os.getpid()
  146. bb.event.worker_fire = worker_child_fire
  147. worker_pipe = pipeout
  148. worker_pipe_lock = Lock()
  149. # Make the child the process group leader and ensure no
  150. # child process will be controlled by the current terminal
  151. # This ensures signals sent to the controlling terminal like Ctrl+C
  152. # don't stop the child processes.
  153. os.setsid()
  154. # No stdin
  155. newsi = os.open(os.devnull, os.O_RDWR)
  156. os.dup2(newsi, sys.stdin.fileno())
  157. if umask:
  158. os.umask(umask)
  159. data.setVar("BB_WORKERCONTEXT", "1")
  160. data.setVar("BB_TASKDEPDATA", taskdepdata)
  161. data.setVar("BUILDNAME", workerdata["buildname"])
  162. data.setVar("DATE", workerdata["date"])
  163. data.setVar("TIME", workerdata["time"])
  164. bb.parse.siggen.set_taskdata(workerdata["sigdata"])
  165. ret = 0
  166. try:
  167. the_data = bb.cache.Cache.loadDataFull(fn, appends, data)
  168. the_data.setVar('BB_TASKHASH', workerdata["runq_hash"][task])
  169. bb.utils.set_process_name("%s:%s" % (the_data.getVar("PN", True), taskname.replace("do_", "")))
  170. # exported_vars() returns a generator which *cannot* be passed to os.environ.update()
  171. # successfully. We also need to unset anything from the environment which shouldn't be there
  172. exports = bb.data.exported_vars(the_data)
  173. bb.utils.empty_environment()
  174. for e, v in exports:
  175. os.environ[e] = v
  176. for e in fakeenv:
  177. os.environ[e] = fakeenv[e]
  178. the_data.setVar(e, fakeenv[e])
  179. the_data.setVarFlag(e, 'export', "1")
  180. if quieterrors:
  181. the_data.setVarFlag(taskname, "quieterrors", "1")
  182. except Exception as exc:
  183. if not quieterrors:
  184. logger.critical(str(exc))
  185. os._exit(1)
  186. try:
  187. if cfg.dry_run:
  188. return 0
  189. return bb.build.exec_task(fn, taskname, the_data, cfg.profile)
  190. except:
  191. os._exit(1)
  192. if not profiling:
  193. os._exit(child())
  194. else:
  195. profname = "profile-%s.log" % (fn.replace("/", "-") + "-" + taskname)
  196. prof = profile.Profile()
  197. try:
  198. ret = profile.Profile.runcall(prof, child)
  199. finally:
  200. prof.dump_stats(profname)
  201. bb.utils.process_profilelog(profname)
  202. os._exit(ret)
  203. else:
  204. for key, value in envbackup.iteritems():
  205. if value is None:
  206. del os.environ[key]
  207. else:
  208. os.environ[key] = value
  209. return pid, pipein, pipeout
  210. class runQueueWorkerPipe():
  211. """
  212. Abstraction for a pipe between a worker thread and the worker server
  213. """
  214. def __init__(self, pipein, pipeout):
  215. self.input = pipein
  216. if pipeout:
  217. pipeout.close()
  218. bb.utils.nonblockingfd(self.input)
  219. self.queue = ""
  220. def read(self):
  221. start = len(self.queue)
  222. try:
  223. self.queue = self.queue + self.input.read(102400)
  224. except (OSError, IOError) as e:
  225. if e.errno != errno.EAGAIN:
  226. raise
  227. end = len(self.queue)
  228. index = self.queue.find("</event>")
  229. while index != -1:
  230. worker_fire_prepickled(self.queue[:index+8])
  231. self.queue = self.queue[index+8:]
  232. index = self.queue.find("</event>")
  233. return (end > start)
  234. def close(self):
  235. while self.read():
  236. continue
  237. if len(self.queue) > 0:
  238. print("Warning, worker child left partial message: %s" % self.queue)
  239. self.input.close()
  240. normalexit = False
  241. class BitbakeWorker(object):
  242. def __init__(self, din):
  243. self.input = din
  244. bb.utils.nonblockingfd(self.input)
  245. self.queue = ""
  246. self.cookercfg = None
  247. self.databuilder = None
  248. self.data = None
  249. self.build_pids = {}
  250. self.build_pipes = {}
  251. signal.signal(signal.SIGTERM, self.sigterm_exception)
  252. # Let SIGHUP exit as SIGTERM
  253. signal.signal(signal.SIGHUP, self.sigterm_exception)
  254. if "beef" in sys.argv[1]:
  255. bb.utils.set_process_name("Worker (Fakeroot)")
  256. else:
  257. bb.utils.set_process_name("Worker")
  258. def sigterm_exception(self, signum, stackframe):
  259. if signum == signal.SIGTERM:
  260. bb.warn("Worker received SIGTERM, shutting down...")
  261. elif signum == signal.SIGHUP:
  262. bb.warn("Worker received SIGHUP, shutting down...")
  263. self.handle_finishnow(None)
  264. signal.signal(signal.SIGTERM, signal.SIG_DFL)
  265. os.kill(os.getpid(), signal.SIGTERM)
  266. def serve(self):
  267. while True:
  268. (ready, _, _) = select.select([self.input] + [i.input for i in self.build_pipes.values()], [] , [], 1)
  269. if self.input in ready:
  270. try:
  271. r = self.input.read()
  272. if len(r) == 0:
  273. # EOF on pipe, server must have terminated
  274. self.sigterm_exception(signal.SIGTERM, None)
  275. self.queue = self.queue + r
  276. except (OSError, IOError):
  277. pass
  278. if len(self.queue):
  279. self.handle_item("cookerconfig", self.handle_cookercfg)
  280. self.handle_item("workerdata", self.handle_workerdata)
  281. self.handle_item("runtask", self.handle_runtask)
  282. self.handle_item("finishnow", self.handle_finishnow)
  283. self.handle_item("ping", self.handle_ping)
  284. self.handle_item("quit", self.handle_quit)
  285. for pipe in self.build_pipes:
  286. self.build_pipes[pipe].read()
  287. if len(self.build_pids):
  288. self.process_waitpid()
  289. worker_flush()
  290. def handle_item(self, item, func):
  291. if self.queue.startswith("<" + item + ">"):
  292. index = self.queue.find("</" + item + ">")
  293. while index != -1:
  294. func(self.queue[(len(item) + 2):index])
  295. self.queue = self.queue[(index + len(item) + 3):]
  296. index = self.queue.find("</" + item + ">")
  297. def handle_cookercfg(self, data):
  298. self.cookercfg = pickle.loads(data)
  299. self.databuilder = bb.cookerdata.CookerDataBuilder(self.cookercfg, worker=True)
  300. self.databuilder.parseBaseConfiguration()
  301. self.data = self.databuilder.data
  302. def handle_workerdata(self, data):
  303. self.workerdata = pickle.loads(data)
  304. bb.msg.loggerDefaultDebugLevel = self.workerdata["logdefaultdebug"]
  305. bb.msg.loggerDefaultVerbose = self.workerdata["logdefaultverbose"]
  306. bb.msg.loggerVerboseLogs = self.workerdata["logdefaultverboselogs"]
  307. bb.msg.loggerDefaultDomains = self.workerdata["logdefaultdomain"]
  308. self.data.setVar("PRSERV_HOST", self.workerdata["prhost"])
  309. def handle_ping(self, _):
  310. workerlog_write("Handling ping\n")
  311. logger.warn("Pong from bitbake-worker!")
  312. def handle_quit(self, data):
  313. workerlog_write("Handling quit\n")
  314. global normalexit
  315. normalexit = True
  316. sys.exit(0)
  317. def handle_runtask(self, data):
  318. fn, task, taskname, quieterrors, appends, taskdepdata = pickle.loads(data)
  319. workerlog_write("Handling runtask %s %s %s\n" % (task, fn, taskname))
  320. pid, pipein, pipeout = fork_off_task(self.cookercfg, self.data, self.workerdata, fn, task, taskname, appends, taskdepdata, quieterrors)
  321. self.build_pids[pid] = task
  322. self.build_pipes[pid] = runQueueWorkerPipe(pipein, pipeout)
  323. def process_waitpid(self):
  324. """
  325. Return none is there are no processes awaiting result collection, otherwise
  326. collect the process exit codes and close the information pipe.
  327. """
  328. try:
  329. pid, status = os.waitpid(-1, os.WNOHANG)
  330. if pid == 0 or os.WIFSTOPPED(status):
  331. return None
  332. except OSError:
  333. return None
  334. workerlog_write("Exit code of %s for pid %s\n" % (status, pid))
  335. if os.WIFEXITED(status):
  336. status = os.WEXITSTATUS(status)
  337. elif os.WIFSIGNALED(status):
  338. # Per shell conventions for $?, when a process exits due to
  339. # a signal, we return an exit code of 128 + SIGNUM
  340. status = 128 + os.WTERMSIG(status)
  341. task = self.build_pids[pid]
  342. del self.build_pids[pid]
  343. self.build_pipes[pid].close()
  344. del self.build_pipes[pid]
  345. worker_fire_prepickled("<exitcode>" + pickle.dumps((task, status)) + "</exitcode>")
  346. def handle_finishnow(self, _):
  347. if self.build_pids:
  348. logger.info("Sending SIGTERM to remaining %s tasks", len(self.build_pids))
  349. for k, v in self.build_pids.iteritems():
  350. try:
  351. os.kill(-k, signal.SIGTERM)
  352. os.waitpid(-1, 0)
  353. except:
  354. pass
  355. for pipe in self.build_pipes:
  356. self.build_pipes[pipe].read()
  357. try:
  358. worker = BitbakeWorker(sys.stdin)
  359. if not profiling:
  360. worker.serve()
  361. else:
  362. profname = "profile-worker.log"
  363. prof = profile.Profile()
  364. try:
  365. profile.Profile.runcall(prof, worker.serve)
  366. finally:
  367. prof.dump_stats(profname)
  368. bb.utils.process_profilelog(profname)
  369. except BaseException as e:
  370. if not normalexit:
  371. import traceback
  372. sys.stderr.write(traceback.format_exc())
  373. sys.stderr.write(str(e))
  374. while len(worker_queue):
  375. worker_flush()
  376. workerlog_write("exitting")
  377. sys.exit(0)