bitbake-worker 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448
  1. #!/usr/bin/env python
  2. import os
  3. import sys
  4. import warnings
  5. sys.path.insert(0, os.path.join(os.path.dirname(os.path.dirname(sys.argv[0])), 'lib'))
  6. from bb import fetch2
  7. import logging
  8. import bb
  9. import select
  10. import errno
  11. import signal
  12. from multiprocessing import Lock
  13. # Users shouldn't be running this code directly
  14. if len(sys.argv) != 2 or not sys.argv[1].startswith("decafbad"):
  15. print("bitbake-worker is meant for internal execution by bitbake itself, please don't use it standalone.")
  16. sys.exit(1)
  17. profiling = False
  18. if sys.argv[1].startswith("decafbadbad"):
  19. profiling = True
  20. try:
  21. import cProfile as profile
  22. except:
  23. import profile
  24. # Unbuffer stdout to avoid log truncation in the event
  25. # of an unorderly exit as well as to provide timely
  26. # updates to log files for use with tail
  27. try:
  28. if sys.stdout.name == '<stdout>':
  29. sys.stdout = os.fdopen(sys.stdout.fileno(), 'w', 0)
  30. except:
  31. pass
  32. logger = logging.getLogger("BitBake")
  33. try:
  34. import cPickle as pickle
  35. except ImportError:
  36. import pickle
  37. bb.msg.note(1, bb.msg.domain.Cache, "Importing cPickle failed. Falling back to a very slow implementation.")
  38. worker_pipe = sys.stdout.fileno()
  39. bb.utils.nonblockingfd(worker_pipe)
  40. # Need to guard against multiprocessing being used in child processes
  41. # and multiple processes trying to write to the parent at the same time
  42. worker_pipe_lock = None
  43. handler = bb.event.LogHandler()
  44. logger.addHandler(handler)
  45. if 0:
  46. # Code to write out a log file of all events passing through the worker
  47. logfilename = "/tmp/workerlogfile"
  48. format_str = "%(levelname)s: %(message)s"
  49. conlogformat = bb.msg.BBLogFormatter(format_str)
  50. consolelog = logging.FileHandler(logfilename)
  51. bb.msg.addDefaultlogFilter(consolelog)
  52. consolelog.setFormatter(conlogformat)
  53. logger.addHandler(consolelog)
  54. worker_queue = ""
  55. def worker_fire(event, d):
  56. data = "<event>" + pickle.dumps(event) + "</event>"
  57. worker_fire_prepickled(data)
  58. def worker_fire_prepickled(event):
  59. global worker_queue
  60. worker_queue = worker_queue + event
  61. worker_flush()
  62. def worker_flush():
  63. global worker_queue, worker_pipe
  64. if not worker_queue:
  65. return
  66. try:
  67. written = os.write(worker_pipe, worker_queue)
  68. worker_queue = worker_queue[written:]
  69. except (IOError, OSError) as e:
  70. if e.errno != errno.EAGAIN and e.errno != errno.EPIPE:
  71. raise
  72. def worker_child_fire(event, d):
  73. global worker_pipe
  74. global worker_pipe_lock
  75. data = "<event>" + pickle.dumps(event) + "</event>"
  76. try:
  77. worker_pipe_lock.acquire()
  78. worker_pipe.write(data)
  79. worker_pipe_lock.release()
  80. except IOError:
  81. sigterm_handler(None, None)
  82. raise
  83. bb.event.worker_fire = worker_fire
  84. lf = None
  85. #lf = open("/tmp/workercommandlog", "w+")
  86. def workerlog_write(msg):
  87. if lf:
  88. lf.write(msg)
  89. lf.flush()
  90. def sigterm_handler(signum, frame):
  91. signal.signal(signal.SIGTERM, signal.SIG_DFL)
  92. os.killpg(0, signal.SIGTERM)
  93. sys.exit()
  94. def fork_off_task(cfg, data, workerdata, fn, task, taskname, appends, taskdepdata, quieterrors=False):
  95. # We need to setup the environment BEFORE the fork, since
  96. # a fork() or exec*() activates PSEUDO...
  97. envbackup = {}
  98. fakeenv = {}
  99. umask = None
  100. taskdep = workerdata["taskdeps"][fn]
  101. if 'umask' in taskdep and taskname in taskdep['umask']:
  102. # umask might come in as a number or text string..
  103. try:
  104. umask = int(taskdep['umask'][taskname],8)
  105. except TypeError:
  106. umask = taskdep['umask'][taskname]
  107. # We can't use the fakeroot environment in a dry run as it possibly hasn't been built
  108. if 'fakeroot' in taskdep and taskname in taskdep['fakeroot'] and not cfg.dry_run:
  109. envvars = (workerdata["fakerootenv"][fn] or "").split()
  110. for key, value in (var.split('=') for var in envvars):
  111. envbackup[key] = os.environ.get(key)
  112. os.environ[key] = value
  113. fakeenv[key] = value
  114. fakedirs = (workerdata["fakerootdirs"][fn] or "").split()
  115. for p in fakedirs:
  116. bb.utils.mkdirhier(p)
  117. logger.debug(2, 'Running %s:%s under fakeroot, fakedirs: %s' %
  118. (fn, taskname, ', '.join(fakedirs)))
  119. else:
  120. envvars = (workerdata["fakerootnoenv"][fn] or "").split()
  121. for key, value in (var.split('=') for var in envvars):
  122. envbackup[key] = os.environ.get(key)
  123. os.environ[key] = value
  124. fakeenv[key] = value
  125. sys.stdout.flush()
  126. sys.stderr.flush()
  127. try:
  128. pipein, pipeout = os.pipe()
  129. pipein = os.fdopen(pipein, 'rb', 4096)
  130. pipeout = os.fdopen(pipeout, 'wb', 0)
  131. pid = os.fork()
  132. except OSError as e:
  133. logger.critical("fork failed: %d (%s)" % (e.errno, e.strerror))
  134. sys.exit(1)
  135. if pid == 0:
  136. def child():
  137. global worker_pipe
  138. global worker_pipe_lock
  139. pipein.close()
  140. signal.signal(signal.SIGTERM, sigterm_handler)
  141. # Let SIGHUP exit as SIGTERM
  142. signal.signal(signal.SIGHUP, sigterm_handler)
  143. bb.utils.signal_on_parent_exit("SIGTERM")
  144. # Save out the PID so that the event can include it the
  145. # events
  146. bb.event.worker_pid = os.getpid()
  147. bb.event.worker_fire = worker_child_fire
  148. worker_pipe = pipeout
  149. worker_pipe_lock = Lock()
  150. # Make the child the process group leader and ensure no
  151. # child process will be controlled by the current terminal
  152. # This ensures signals sent to the controlling terminal like Ctrl+C
  153. # don't stop the child processes.
  154. os.setsid()
  155. # No stdin
  156. newsi = os.open(os.devnull, os.O_RDWR)
  157. os.dup2(newsi, sys.stdin.fileno())
  158. if umask:
  159. os.umask(umask)
  160. data.setVar("BB_WORKERCONTEXT", "1")
  161. data.setVar("BB_TASKDEPDATA", taskdepdata)
  162. data.setVar("BUILDNAME", workerdata["buildname"])
  163. data.setVar("DATE", workerdata["date"])
  164. data.setVar("TIME", workerdata["time"])
  165. bb.parse.siggen.set_taskdata(workerdata["sigdata"])
  166. ret = 0
  167. try:
  168. the_data = bb.cache.Cache.loadDataFull(fn, appends, data)
  169. the_data.setVar('BB_TASKHASH', workerdata["runq_hash"][task])
  170. bb.utils.set_process_name("%s:%s" % (the_data.getVar("PN", True), taskname.replace("do_", "")))
  171. # exported_vars() returns a generator which *cannot* be passed to os.environ.update()
  172. # successfully. We also need to unset anything from the environment which shouldn't be there
  173. exports = bb.data.exported_vars(the_data)
  174. bb.utils.empty_environment()
  175. for e, v in exports:
  176. os.environ[e] = v
  177. for e in fakeenv:
  178. os.environ[e] = fakeenv[e]
  179. the_data.setVar(e, fakeenv[e])
  180. the_data.setVarFlag(e, 'export', "1")
  181. if quieterrors:
  182. the_data.setVarFlag(taskname, "quieterrors", "1")
  183. except Exception as exc:
  184. if not quieterrors:
  185. logger.critical(str(exc))
  186. os._exit(1)
  187. try:
  188. if cfg.dry_run:
  189. return 0
  190. return bb.build.exec_task(fn, taskname, the_data, cfg.profile)
  191. except:
  192. os._exit(1)
  193. if not profiling:
  194. os._exit(child())
  195. else:
  196. profname = "profile-%s.log" % (fn.replace("/", "-") + "-" + taskname)
  197. prof = profile.Profile()
  198. try:
  199. ret = profile.Profile.runcall(prof, child)
  200. finally:
  201. prof.dump_stats(profname)
  202. bb.utils.process_profilelog(profname)
  203. os._exit(ret)
  204. else:
  205. for key, value in envbackup.iteritems():
  206. if value is None:
  207. del os.environ[key]
  208. else:
  209. os.environ[key] = value
  210. return pid, pipein, pipeout
  211. class runQueueWorkerPipe():
  212. """
  213. Abstraction for a pipe between a worker thread and the worker server
  214. """
  215. def __init__(self, pipein, pipeout):
  216. self.input = pipein
  217. if pipeout:
  218. pipeout.close()
  219. bb.utils.nonblockingfd(self.input)
  220. self.queue = ""
  221. def read(self):
  222. start = len(self.queue)
  223. try:
  224. self.queue = self.queue + self.input.read(102400)
  225. except (OSError, IOError) as e:
  226. if e.errno != errno.EAGAIN:
  227. raise
  228. end = len(self.queue)
  229. index = self.queue.find("</event>")
  230. while index != -1:
  231. worker_fire_prepickled(self.queue[:index+8])
  232. self.queue = self.queue[index+8:]
  233. index = self.queue.find("</event>")
  234. return (end > start)
  235. def close(self):
  236. while self.read():
  237. continue
  238. if len(self.queue) > 0:
  239. print("Warning, worker child left partial message: %s" % self.queue)
  240. self.input.close()
  241. normalexit = False
  242. class BitbakeWorker(object):
  243. def __init__(self, din):
  244. self.input = din
  245. bb.utils.nonblockingfd(self.input)
  246. self.queue = ""
  247. self.cookercfg = None
  248. self.databuilder = None
  249. self.data = None
  250. self.build_pids = {}
  251. self.build_pipes = {}
  252. signal.signal(signal.SIGTERM, self.sigterm_exception)
  253. # Let SIGHUP exit as SIGTERM
  254. signal.signal(signal.SIGHUP, self.sigterm_exception)
  255. if "beef" in sys.argv[1]:
  256. bb.utils.set_process_name("Worker (Fakeroot)")
  257. else:
  258. bb.utils.set_process_name("Worker")
  259. def sigterm_exception(self, signum, stackframe):
  260. if signum == signal.SIGTERM:
  261. bb.warn("Worker received SIGTERM, shutting down...")
  262. elif signum == signal.SIGHUP:
  263. bb.warn("Worker received SIGHUP, shutting down...")
  264. self.handle_finishnow(None)
  265. signal.signal(signal.SIGTERM, signal.SIG_DFL)
  266. os.kill(os.getpid(), signal.SIGTERM)
  267. def serve(self):
  268. while True:
  269. (ready, _, _) = select.select([self.input] + [i.input for i in self.build_pipes.values()], [] , [], 1)
  270. if self.input in ready:
  271. try:
  272. r = self.input.read()
  273. if len(r) == 0:
  274. # EOF on pipe, server must have terminated
  275. self.sigterm_exception(signal.SIGTERM, None)
  276. self.queue = self.queue + r
  277. except (OSError, IOError):
  278. pass
  279. if len(self.queue):
  280. self.handle_item("cookerconfig", self.handle_cookercfg)
  281. self.handle_item("workerdata", self.handle_workerdata)
  282. self.handle_item("runtask", self.handle_runtask)
  283. self.handle_item("finishnow", self.handle_finishnow)
  284. self.handle_item("ping", self.handle_ping)
  285. self.handle_item("quit", self.handle_quit)
  286. for pipe in self.build_pipes:
  287. self.build_pipes[pipe].read()
  288. if len(self.build_pids):
  289. self.process_waitpid()
  290. worker_flush()
  291. def handle_item(self, item, func):
  292. if self.queue.startswith("<" + item + ">"):
  293. index = self.queue.find("</" + item + ">")
  294. while index != -1:
  295. func(self.queue[(len(item) + 2):index])
  296. self.queue = self.queue[(index + len(item) + 3):]
  297. index = self.queue.find("</" + item + ">")
  298. def handle_cookercfg(self, data):
  299. self.cookercfg = pickle.loads(data)
  300. self.databuilder = bb.cookerdata.CookerDataBuilder(self.cookercfg, worker=True)
  301. self.databuilder.parseBaseConfiguration()
  302. self.data = self.databuilder.data
  303. def handle_workerdata(self, data):
  304. self.workerdata = pickle.loads(data)
  305. bb.msg.loggerDefaultDebugLevel = self.workerdata["logdefaultdebug"]
  306. bb.msg.loggerDefaultVerbose = self.workerdata["logdefaultverbose"]
  307. bb.msg.loggerVerboseLogs = self.workerdata["logdefaultverboselogs"]
  308. bb.msg.loggerDefaultDomains = self.workerdata["logdefaultdomain"]
  309. self.data.setVar("PRSERV_HOST", self.workerdata["prhost"])
  310. def handle_ping(self, _):
  311. workerlog_write("Handling ping\n")
  312. logger.warning("Pong from bitbake-worker!")
  313. def handle_quit(self, data):
  314. workerlog_write("Handling quit\n")
  315. global normalexit
  316. normalexit = True
  317. sys.exit(0)
  318. def handle_runtask(self, data):
  319. fn, task, taskname, quieterrors, appends, taskdepdata = pickle.loads(data)
  320. workerlog_write("Handling runtask %s %s %s\n" % (task, fn, taskname))
  321. pid, pipein, pipeout = fork_off_task(self.cookercfg, self.data, self.workerdata, fn, task, taskname, appends, taskdepdata, quieterrors)
  322. self.build_pids[pid] = task
  323. self.build_pipes[pid] = runQueueWorkerPipe(pipein, pipeout)
  324. def process_waitpid(self):
  325. """
  326. Return none is there are no processes awaiting result collection, otherwise
  327. collect the process exit codes and close the information pipe.
  328. """
  329. try:
  330. pid, status = os.waitpid(-1, os.WNOHANG)
  331. if pid == 0 or os.WIFSTOPPED(status):
  332. return None
  333. except OSError:
  334. return None
  335. workerlog_write("Exit code of %s for pid %s\n" % (status, pid))
  336. if os.WIFEXITED(status):
  337. status = os.WEXITSTATUS(status)
  338. elif os.WIFSIGNALED(status):
  339. # Per shell conventions for $?, when a process exits due to
  340. # a signal, we return an exit code of 128 + SIGNUM
  341. status = 128 + os.WTERMSIG(status)
  342. task = self.build_pids[pid]
  343. del self.build_pids[pid]
  344. self.build_pipes[pid].close()
  345. del self.build_pipes[pid]
  346. worker_fire_prepickled("<exitcode>" + pickle.dumps((task, status)) + "</exitcode>")
  347. def handle_finishnow(self, _):
  348. if self.build_pids:
  349. logger.info("Sending SIGTERM to remaining %s tasks", len(self.build_pids))
  350. for k, v in self.build_pids.iteritems():
  351. try:
  352. os.kill(-k, signal.SIGTERM)
  353. os.waitpid(-1, 0)
  354. except:
  355. pass
  356. for pipe in self.build_pipes:
  357. self.build_pipes[pipe].read()
  358. try:
  359. worker = BitbakeWorker(sys.stdin)
  360. if not profiling:
  361. worker.serve()
  362. else:
  363. profname = "profile-worker.log"
  364. prof = profile.Profile()
  365. try:
  366. profile.Profile.runcall(prof, worker.serve)
  367. finally:
  368. prof.dump_stats(profname)
  369. bb.utils.process_profilelog(profname)
  370. except BaseException as e:
  371. if not normalexit:
  372. import traceback
  373. sys.stderr.write(traceback.format_exc())
  374. sys.stderr.write(str(e))
  375. while len(worker_queue):
  376. worker_flush()
  377. workerlog_write("exitting")
  378. sys.exit(0)