# # BitBake Process based server. # # Copyright (C) 2010 Bob Foerster # # SPDX-License-Identifier: GPL-2.0-only # """ This module implements a multiprocessing.Process based server for bitbake. """ import bb import bb.event import logging import multiprocessing import threading import array import os import sys import time import select import socket import subprocess import errno import re import datetime import bb.server.xmlrpcserver from bb import daemonize from multiprocessing import queues logger = logging.getLogger('BitBake') class ProcessTimeout(SystemExit): pass class ProcessServer(): profile_filename = "profile.log" profile_processed_filename = "profile.log.processed" def __init__(self, lock, sock, sockname, server_timeout, xmlrpcinterface): self.command_channel = False self.command_channel_reply = False self.quit = False self.heartbeat_seconds = 1 # default, BB_HEARTBEAT_EVENT will be checked once we have a datastore. self.next_heartbeat = time.time() self.event_handle = None self.hadanyui = False self.haveui = False self.maxuiwait = 30 self.xmlrpc = False self._idlefuns = {} self.bitbake_lock = lock self.sock = sock self.sockname = sockname self.server_timeout = server_timeout self.xmlrpcinterface = xmlrpcinterface def register_idle_function(self, function, data): """Register a function to be called while the server is idle""" assert hasattr(function, '__call__') self._idlefuns[function] = data def run(self): if self.xmlrpcinterface[0]: self.xmlrpc = bb.server.xmlrpcserver.BitBakeXMLRPCServer(self.xmlrpcinterface, self.cooker, self) print("Bitbake XMLRPC server address: %s, server port: %s" % (self.xmlrpc.host, self.xmlrpc.port)) heartbeat_event = self.cooker.data.getVar('BB_HEARTBEAT_EVENT') if heartbeat_event: try: self.heartbeat_seconds = float(heartbeat_event) except: bb.warn('Ignoring invalid BB_HEARTBEAT_EVENT=%s, must be a float specifying seconds.' % heartbeat_event) self.timeout = self.server_timeout or self.cooker.data.getVar('BB_SERVER_TIMEOUT') try: if self.timeout: self.timeout = float(self.timeout) except: bb.warn('Ignoring invalid BB_SERVER_TIMEOUT=%s, must be a float specifying seconds.' % self.timeout) try: self.bitbake_lock.seek(0) self.bitbake_lock.truncate() if self.xmlrpc: self.bitbake_lock.write("%s %s:%s\n" % (os.getpid(), self.xmlrpc.host, self.xmlrpc.port)) else: self.bitbake_lock.write("%s\n" % (os.getpid())) self.bitbake_lock.flush() except Exception as e: print("Error writing to lock file: %s" % str(e)) pass if self.cooker.configuration.profile: try: import cProfile as profile except: import profile prof = profile.Profile() ret = profile.Profile.runcall(prof, self.main) prof.dump_stats("profile.log") bb.utils.process_profilelog("profile.log") print("Raw profiling information saved to profile.log and processed statistics to profile.log.processed") else: ret = self.main() return ret def main(self): self.cooker.pre_serve() bb.utils.set_process_name("Cooker") ready = [] newconnections = [] self.controllersock = False fds = [self.sock] if self.xmlrpc: fds.append(self.xmlrpc) print("Entering server connection loop") def disconnect_client(self, fds): print("Disconnecting Client") if self.controllersock: fds.remove(self.controllersock) self.controllersock.close() self.controllersock = False if self.haveui: fds.remove(self.command_channel) bb.event.unregister_UIHhandler(self.event_handle, True) self.command_channel_reply.writer.close() self.event_writer.writer.close() self.command_channel.close() self.command_channel = False del self.event_writer self.lastui = time.time() self.cooker.clientComplete() self.haveui = False ready = select.select(fds,[],[],0)[0] if newconnections: print("Starting new client") conn = newconnections.pop(-1) fds.append(conn) self.controllersock = conn elif self.timeout is None and not ready: print("No timeout, exiting.") self.quit = True self.lastui = time.time() while not self.quit: if self.sock in ready: while select.select([self.sock],[],[],0)[0]: controllersock, address = self.sock.accept() if self.controllersock: print("Queuing %s (%s)" % (str(ready), str(newconnections))) newconnections.append(controllersock) else: print("Accepting %s (%s)" % (str(ready), str(newconnections))) self.controllersock = controllersock fds.append(controllersock) if self.controllersock in ready: try: print("Processing Client") ui_fds = recvfds(self.controllersock, 3) print("Connecting Client") # Where to write events to writer = ConnectionWriter(ui_fds[0]) self.event_handle = bb.event.register_UIHhandler(writer, True) self.event_writer = writer # Where to read commands from reader = ConnectionReader(ui_fds[1]) fds.append(reader) self.command_channel = reader # Where to send command return values to writer = ConnectionWriter(ui_fds[2]) self.command_channel_reply = writer self.haveui = True self.hadanyui = True except (EOFError, OSError): disconnect_client(self, fds) if not self.timeout == -1.0 and not self.haveui and self.timeout and \ (self.lastui + self.timeout) < time.time(): print("Server timeout, exiting.") self.quit = True # If we don't see a UI connection within maxuiwait, its unlikely we're going to see # one. We have had issue with processes hanging indefinitely so timing out UI-less # servers is useful. if not self.hadanyui and not self.xmlrpc and not self.timeout and (self.lastui + self.maxuiwait) < time.time(): print("No UI connection within max timeout, exiting to avoid infinite loop.") self.quit = True if self.command_channel in ready: try: command = self.command_channel.get() except EOFError: # Client connection shutting down ready = [] disconnect_client(self, fds) continue if command[0] == "terminateServer": self.quit = True continue try: print("Running command %s" % command) self.command_channel_reply.send(self.cooker.command.runCommand(command)) except Exception as e: logger.exception('Exception in server main event loop running command %s (%s)' % (command, str(e))) if self.xmlrpc in ready: self.xmlrpc.handle_requests() ready = self.idle_commands(.1, fds) print("Exiting") # Remove the socket file so we don't get any more connections to avoid races try: os.unlink(self.sockname) except: pass self.sock.close() try: self.cooker.shutdown(True) self.cooker.notifier.stop() self.cooker.confignotifier.stop() except: pass self.cooker.post_serve() # Flush logs before we release the lock sys.stdout.flush() sys.stderr.flush() # Finally release the lockfile but warn about other processes holding it open lock = self.bitbake_lock lockfile = lock.name lock.close() lock = None while not lock: with bb.utils.timeout(3): lock = bb.utils.lockfile(lockfile, shared=False, retry=False, block=True) if lock: # We hold the lock so we can remove the file (hide stale pid data) # via unlockfile. bb.utils.unlockfile(lock) return if not lock: # Some systems may not have lsof available procs = None try: procs = subprocess.check_output(["lsof", '-w', lockfile], stderr=subprocess.STDOUT) except OSError as e: if e.errno != errno.ENOENT: raise if procs is None: # Fall back to fuser if lsof is unavailable try: procs = subprocess.check_output(["fuser", '-v', lockfile], stderr=subprocess.STDOUT) except OSError as e: if e.errno != errno.ENOENT: raise msg = "Delaying shutdown due to active processes which appear to be holding bitbake.lock" if procs: msg += ":\n%s" % str(procs) print(msg) def idle_commands(self, delay, fds=None): nextsleep = delay if not fds: fds = [] for function, data in list(self._idlefuns.items()): try: retval = function(self, data, False) if retval is False: del self._idlefuns[function] nextsleep = None elif retval is True: nextsleep = None elif isinstance(retval, float) and nextsleep: if (retval < nextsleep): nextsleep = retval elif nextsleep is None: continue else: fds = fds + retval except SystemExit: raise except Exception as exc: if not isinstance(exc, bb.BBHandledException): logger.exception('Running idle function') del self._idlefuns[function] self.quit = True # Create new heartbeat event? now = time.time() if now >= self.next_heartbeat: # We might have missed heartbeats. Just trigger once in # that case and continue after the usual delay. self.next_heartbeat += self.heartbeat_seconds if self.next_heartbeat <= now: self.next_heartbeat = now + self.heartbeat_seconds heartbeat = bb.event.HeartbeatEvent(now) bb.event.fire(heartbeat, self.cooker.data) if nextsleep and now + nextsleep > self.next_heartbeat: # Shorten timeout so that we we wake up in time for # the heartbeat. nextsleep = self.next_heartbeat - now if nextsleep is not None: if self.xmlrpc: nextsleep = self.xmlrpc.get_timeout(nextsleep) try: return select.select(fds,[],[],nextsleep)[0] except InterruptedError: # Ignore EINTR return [] else: return select.select(fds,[],[],0)[0] class ServerCommunicator(): def __init__(self, connection, recv): self.connection = connection self.recv = recv def runCommand(self, command): self.connection.send(command) if not self.recv.poll(30): logger.info("No reply from server in 30s") if not self.recv.poll(30): raise ProcessTimeout("Timeout while waiting for a reply from the bitbake server (60s)") return self.recv.get() def updateFeatureSet(self, featureset): _, error = self.runCommand(["setFeatures", featureset]) if error: logger.error("Unable to set the cooker to the correct featureset: %s" % error) raise BaseException(error) def getEventHandle(self): handle, error = self.runCommand(["getUIHandlerNum"]) if error: logger.error("Unable to get UI Handler Number: %s" % error) raise BaseException(error) return handle def terminateServer(self): self.connection.send(['terminateServer']) return class BitBakeProcessServerConnection(object): def __init__(self, ui_channel, recv, eq, sock): self.connection = ServerCommunicator(ui_channel, recv) self.events = eq # Save sock so it doesn't get gc'd for the life of our connection self.socket_connection = sock def terminate(self): self.socket_connection.close() self.connection.connection.close() self.connection.recv.close() return class BitBakeServer(object): start_log_format = '--- Starting bitbake server pid %s at %s ---' start_log_datetime_format = '%Y-%m-%d %H:%M:%S.%f' def __init__(self, lock, sockname, configuration, featureset): self.configuration = configuration self.featureset = featureset self.sockname = sockname self.bitbake_lock = lock self.readypipe, self.readypipein = os.pipe() # Create server control socket if os.path.exists(sockname): os.unlink(sockname) # Place the log in the builddirectory alongside the lock file logfile = os.path.join(os.path.dirname(self.bitbake_lock.name), "bitbake-cookerdaemon.log") self.sock = socket.socket(socket.AF_UNIX, socket.SOCK_STREAM) # AF_UNIX has path length issues so chdir here to workaround cwd = os.getcwd() try: os.chdir(os.path.dirname(sockname)) self.sock.bind(os.path.basename(sockname)) finally: os.chdir(cwd) self.sock.listen(1) os.set_inheritable(self.sock.fileno(), True) startdatetime = datetime.datetime.now() bb.daemonize.createDaemon(self._startServer, logfile) self.sock.close() self.bitbake_lock.close() os.close(self.readypipein) ready = ConnectionReader(self.readypipe) r = ready.poll(5) if not r: bb.note("Bitbake server didn't start within 5 seconds, waiting for 90") r = ready.poll(90) if r: try: r = ready.get() except EOFError: # Trap the child exitting/closing the pipe and error out r = None if not r or r[0] != "r": ready.close() bb.error("Unable to start bitbake server (%s)" % str(r)) if os.path.exists(logfile): logstart_re = re.compile(self.start_log_format % ('([0-9]+)', '([0-9-]+ [0-9:.]+)')) started = False lines = [] lastlines = [] with open(logfile, "r") as f: for line in f: if started: lines.append(line) else: lastlines.append(line) res = logstart_re.match(line.rstrip()) if res: ldatetime = datetime.datetime.strptime(res.group(2), self.start_log_datetime_format) if ldatetime >= startdatetime: started = True lines.append(line) if len(lastlines) > 60: lastlines = lastlines[-60:] if lines: if len(lines) > 60: bb.error("Last 60 lines of server log for this session (%s):\n%s" % (logfile, "".join(lines[-60:]))) else: bb.error("Server log for this session (%s):\n%s" % (logfile, "".join(lines))) elif lastlines: bb.error("Server didn't start, last 60 loglines (%s):\n%s" % (logfile, "".join(lastlines))) else: bb.error("%s doesn't exist" % logfile) raise SystemExit(1) ready.close() def _startServer(self): print(self.start_log_format % (os.getpid(), datetime.datetime.now().strftime(self.start_log_datetime_format))) sys.stdout.flush() try: server = ProcessServer(self.bitbake_lock, self.sock, self.sockname, self.configuration.server_timeout, self.configuration.xmlrpcinterface) os.close(self.readypipe) writer = ConnectionWriter(self.readypipein) try: self.cooker = bb.cooker.BBCooker(self.configuration, self.featureset, server.register_idle_function) except bb.BBHandledException: return None writer.send("r") writer.close() server.cooker = self.cooker print("Started bitbake server pid %d" % os.getpid()) sys.stdout.flush() server.run() finally: # Flush any ,essages/errors to the logfile before exit sys.stdout.flush() sys.stderr.flush() def connectProcessServer(sockname, featureset): # Connect to socket sock = socket.socket(socket.AF_UNIX, socket.SOCK_STREAM) # AF_UNIX has path length issues so chdir here to workaround cwd = os.getcwd() readfd = writefd = readfd1 = writefd1 = readfd2 = writefd2 = None eq = command_chan_recv = command_chan = None sock.settimeout(10) try: try: os.chdir(os.path.dirname(sockname)) finished = False while not finished: try: sock.connect(os.path.basename(sockname)) finished = True except IOError as e: if e.errno == errno.EWOULDBLOCK: pass raise finally: os.chdir(cwd) # Send an fd for the remote to write events to readfd, writefd = os.pipe() eq = BBUIEventQueue(readfd) # Send an fd for the remote to recieve commands from readfd1, writefd1 = os.pipe() command_chan = ConnectionWriter(writefd1) # Send an fd for the remote to write commands results to readfd2, writefd2 = os.pipe() command_chan_recv = ConnectionReader(readfd2) sendfds(sock, [writefd, readfd1, writefd2]) server_connection = BitBakeProcessServerConnection(command_chan, command_chan_recv, eq, sock) # Close the ends of the pipes we won't use for i in [writefd, readfd1, writefd2]: os.close(i) server_connection.connection.updateFeatureSet(featureset) except (Exception, SystemExit) as e: if command_chan_recv: command_chan_recv.close() if command_chan: command_chan.close() for i in [writefd, readfd1, writefd2]: try: if i: os.close(i) except OSError: pass sock.close() raise return server_connection def sendfds(sock, fds): '''Send an array of fds over an AF_UNIX socket.''' fds = array.array('i', fds) msg = bytes([len(fds) % 256]) sock.sendmsg([msg], [(socket.SOL_SOCKET, socket.SCM_RIGHTS, fds)]) def recvfds(sock, size): '''Receive an array of fds over an AF_UNIX socket.''' a = array.array('i') bytes_size = a.itemsize * size msg, ancdata, flags, addr = sock.recvmsg(1, socket.CMSG_LEN(bytes_size)) if not msg and not ancdata: raise EOFError try: if len(ancdata) != 1: raise RuntimeError('received %d items of ancdata' % len(ancdata)) cmsg_level, cmsg_type, cmsg_data = ancdata[0] if (cmsg_level == socket.SOL_SOCKET and cmsg_type == socket.SCM_RIGHTS): if len(cmsg_data) % a.itemsize != 0: raise ValueError a.frombytes(cmsg_data) assert len(a) % 256 == msg[0] return list(a) except (ValueError, IndexError): pass raise RuntimeError('Invalid data received') class BBUIEventQueue: def __init__(self, readfd): self.eventQueue = [] self.eventQueueLock = threading.Lock() self.eventQueueNotify = threading.Event() self.reader = ConnectionReader(readfd) self.t = threading.Thread() self.t.setDaemon(True) self.t.run = self.startCallbackHandler self.t.start() def getEvent(self): self.eventQueueLock.acquire() if len(self.eventQueue) == 0: self.eventQueueLock.release() return None item = self.eventQueue.pop(0) if len(self.eventQueue) == 0: self.eventQueueNotify.clear() self.eventQueueLock.release() return item def waitEvent(self, delay): self.eventQueueNotify.wait(delay) return self.getEvent() def queue_event(self, event): self.eventQueueLock.acquire() self.eventQueue.append(event) self.eventQueueNotify.set() self.eventQueueLock.release() def send_event(self, event): self.queue_event(pickle.loads(event)) def startCallbackHandler(self): bb.utils.set_process_name("UIEventQueue") while True: try: self.reader.wait() event = self.reader.get() self.queue_event(event) except EOFError: # Easiest way to exit is to close the file descriptor to cause an exit break self.reader.close() class ConnectionReader(object): def __init__(self, fd): self.reader = multiprocessing.connection.Connection(fd, writable=False) self.rlock = multiprocessing.Lock() def wait(self, timeout=None): return multiprocessing.connection.wait([self.reader], timeout) def poll(self, timeout=None): return self.reader.poll(timeout) def get(self): with self.rlock: res = self.reader.recv_bytes() return multiprocessing.reduction.ForkingPickler.loads(res) def fileno(self): return self.reader.fileno() def close(self): return self.reader.close() class ConnectionWriter(object): def __init__(self, fd): self.writer = multiprocessing.connection.Connection(fd, readable=False) self.wlock = multiprocessing.Lock() # Why bb.event needs this I have no idea self.event = self def send(self, obj): obj = multiprocessing.reduction.ForkingPickler.dumps(obj) with self.wlock: self.writer.send_bytes(obj) def fileno(self): return self.writer.fileno() def close(self): return self.writer.close()