관리-도구
편집 파일: web_server.py
import asyncio import inspect import io import logging import os import re import shlex import shutil import string import xml.etree.ElementTree as ET from contextlib import suppress from contextvars import ContextVar from datetime import timedelta from packaging.version import Version from pathlib import Path from subprocess import check_call, DEVNULL from typing import Any, Callable, List, Optional, Set, Tuple, Iterable import psutil from defence360agent.api.integration_conf import IntegrationConfig from defence360agent.application.determine_hosting_panel import ( is_generic_panel_installed, is_plesk_installed, ) from defence360agent.internals.global_scope import g from defence360agent.utils import ( async_lru_cache, atomic_rewrite, check_run, get_system_user_names, OsReleaseInfo, CheckRunError, TimedCache, BACKUP_EXTENSION, ) from defence360agent.utils.common import webserver_gracefull_restart GRACEFUL_RESTART_MIN_PERIOD = int( os.environ.get("IM360_GRACEFUL_RESTART_MIN_PERIOD", 5 * 60) ) # seconds """ how many seconds should pass minimum between web server restarts. """ CPANEL_RESTART_APACHE_SCRIPT = "/usr/local/cpanel/scripts/restartsrv_httpd" # according to LS docs https://www.litespeedtech.com/docs/webserver/admin LITESPEED_PID_FILE_PATH = Path("/tmp/lshttpd/lshttpd.pid") LITESPEED_RESTART_CMD = ("/usr/local/lsws/bin/lswsctrl", "condrestart") LITESPEED_CONF_PATH = "/usr/local/lsws/conf/httpd_config.xml" APACHE2_BIN_PATH = "/usr/sbin/apache2" HTTPD_BIN_PATH = "/usr/sbin/httpd" apache_version_regexp = re.compile(r"Server version:.*(\d+\.\d+\.\d+)") BYTE_SPACES = tuple(x.encode() for x in list(string.whitespace)) APACHE = "apache" logger = logging.getLogger(__name__) class NotRunningError(RuntimeError): """ Error for cases when the web server is expected to be running but it is not. """ class ConfigInvalidError(RuntimeError): """ Error used to indicate that the web server config is having error(s). """ class LiteSpeedConfig: CLIENT_IP_IN_HEADER_TAG = "useIpInProxyHeader" SECURITY_TAG = "security" ACCESS_CONTROL_TAG = "accessControl" ACCESS_CONTROL_ALLOWED_TAG = "allow" ACCESS_CONTROL_DENIED_TAG = "deny" CLIENT_IP_IN_HEADER_DISABLED = 0 CLIENT_IP_IN_HEADER_ENABLED = 1 CLIENT_IP_IN_HEADER_TRUSTED_IP_ONLY = 2 def __init__(self, content): self.config = ET.fromstring(content) def client_ip_in_header(self) -> int: element = self.config.find(self.CLIENT_IP_IN_HEADER_TAG) if element is None or not element.text: return self.CLIENT_IP_IN_HEADER_DISABLED return int(element.text) def set_client_ip_in_header(self, value: int): element = self.config.find(self.CLIENT_IP_IN_HEADER_TAG) if element is None: element = ET.Element(self.CLIENT_IP_IN_HEADER_TAG) self.config.append(element) element.text = str(value) def access_control_allowed_list(self) -> Set[Tuple[str, bool]]: element = self.config.find( "/".join( [ ".", self.SECURITY_TAG, self.ACCESS_CONTROL_TAG, self.ACCESS_CONTROL_ALLOWED_TAG, ] ) ) if element is not None and element.text: return { (item[:-1] if item.endswith("T") else item, item.endswith("T")) for s in element.text.split() for item in s.split(",") if item } return set() def set_access_control_allowed_list(self, allowed): items = [item[0] + "T" if item[1] else item[0] for item in allowed] value = ",".join(items) element = self.config.find( "/".join( [ ".", self.SECURITY_TAG, self.ACCESS_CONTROL_TAG, self.ACCESS_CONTROL_ALLOWED_TAG, ] ) ) if element is None: element = ET.Element(self.ACCESS_CONTROL_ALLOWED_TAG) access_control = self.config.find( "/".join( [ ".", self.SECURITY_TAG, self.ACCESS_CONTROL_TAG, ] ) ) if access_control is None: access_control = ET.Element(self.ACCESS_CONTROL_TAG) security = self.config.find(self.SECURITY_TAG) if security is None: security = ET.Element(self.SECURITY_TAG) self.config.append(security) security.append(access_control) access_control.append(element) element.text = value def tostring(self) -> bytes: buf = io.BytesIO() tree = ET.ElementTree(self.config) tree.write(buf, encoding="utf-8", xml_declaration=True) return buf.getvalue() def _get_litespeed_pid(): """Return LiteSpeed's pid or None if it can't be read.""" with suppress(OSError, ValueError): return int(LITESPEED_PID_FILE_PATH.read_bytes()) def litespeed_running(): """ Litespeed use constant PID file path, so using it to determinate status :return bool """ pid = _get_litespeed_pid() try: return bool(pid and psutil.pid_exists(pid)) except OverflowError: return False def apache_running() -> Optional[str]: """ Finding process with name 'httpd' which belongs to system user. :return str: path to the apache binary if it is running :return None: if apache is not running """ info = _apache_running_process() return info["httpd_bin"] if info else None async def apache_binary_call(*args) -> bytes: httpd_bin = apache_running() if not httpd_bin: raise NotRunningError("Apache is not running") try: if ( OsReleaseInfo.id_like() & OsReleaseInfo.DEBIAN and Path("/etc/apache2/envvars").exists() ): # on Debian OS apache requires some env variables # that are set in /etc/apache2/envvars (see DEF-6844) stdout = await check_run( ". /etc/apache2/envvars && {} {}".format( shlex.quote(httpd_bin), shlex.join(args) ), shell=True, ) else: stdout = await check_run([httpd_bin, *args]) except CheckRunError: logger.warning("Apache doesn't work properly") return b"" return stdout def _apache_running_process(*, exclude_users=frozenset()): """ Finding process with name 'httpd' which belongs to system user. Return process info for the apache binary if it is running. Return None if apache is not running """ # Cpanel works on rpm based os and uses packages # according documentation https://documentation.cpanel.net/display/EA4/Apache # noqa # httpd binary is /usr/sbin/httpd # Plesk/Generic uses pkgs from os # so it has /usr/sbin/httpd on rpm based os and /usr/sbin/apache2 on debian # DirectAdmin uses custombuild # It's httpd binary is /usr/sbib/httpd def is_generic_panel_on_apache(): if is_generic_panel_installed(): return IntegrationConfig.get("web_server", "server_type") == APACHE return False if (OsReleaseInfo.id_like() & OsReleaseInfo.DEBIAN) and ( is_plesk_installed() or is_generic_panel_on_apache() ): httpd_bin = APACHE2_BIN_PATH else: httpd_bin = HTTPD_BIN_PATH sys_users = set(get_system_user_names()) - exclude_users info = _apache_running_process_info(sys_users) if info: assert info["exe"] is not None info["httpd_bin"] = httpd_bin try: httpd_process_exe = info["exe"] if os.path.samefile(httpd_bin, httpd_process_exe): return info except OSError as exc: logger.info("Can't determine apache bin path: %s", exc) return None def _apache_running_process_info(sys_users): """Retry process_iter() on IndexError.""" for _ in range(2): # retry with suppress(IndexError): return next( ( p.info for p in psutil.process_iter( attrs=["name", "username", "exe", "uids", "gids"] ) if ( p.info["exe"] is not None # non ad_value and p.info["exe"].endswith(("/httpd", "/apache2")) and p.info["username"] in sys_users ) ), None, ) def chown(path): """Make web server user/group own *path*.""" info = _apache_running_process(exclude_users={"root"}) if not info: raise NotRunningError( "Can't find running apache process without root owner." ) os.chown(path, info["uids"][0], info["gids"][0]) def find_running_nginx(): """Return path to a running nginx binary or None if not found.""" return next( ( p.info["exe"] for p in psutil.process_iter(attrs=["name", "username", "exe"]) if ( p.info["name"] is not None # non ad_value and p.info["name"].endswith("nginx") and p.info["exe"] is not None # non ad_value and "nginx" in p.info["exe"] and p.info["username"] == "nginx" ) ), None, ) async def check_with_timeout( webserver_running_cb: Callable[[], Any], timeout_sec=10, granularity: int = 10, ): assert granularity > 0 for _ in range(granularity): result = webserver_running_cb() if result: return result await asyncio.sleep(timeout_sec / granularity) else: return result def is_EA4_available(): """ though, available != running :return bool: """ return os.path.isfile("/etc/cpanel/ea4/is_ea4") def _apache_graceful_restart_cmd(apachectl) -> List[str]: """ :return list: command which can be passed to check_call(..., shell=False) 'apache2 -k graceful' will not work for Ubuntu and will produce 'Invalid Mutex directory in argument file:${APACHE_LOCK_DIR}' error. https://serverfault.com/questions/558283/apache2-config-variable-is-not-defined That is why this specialization for Ubuntu graceful restart. """ # noqa restartsrv_httpd = shutil.which(CPANEL_RESTART_APACHE_SCRIPT) if restartsrv_httpd: # use cpanel specific script if found return [restartsrv_httpd] if OsReleaseInfo.id_like() & OsReleaseInfo.DEBIAN: # see DEF-16795 for details return [ "systemctl", "reload", "--job-mode=replace-irreversibly", os.path.basename(apachectl), ] else: return [apachectl, "-k", "graceful"] def _graceful_restart_cmd_from_integration_conf() -> Optional[Iterable[str]]: if IntegrationConfig.exists(): # Fallback on regular restart techniques # in case of missing restart script. try: restart_script = IntegrationConfig.to_dict()["web_server"][ "graceful_restart_script" ] except KeyError: logger.warning( "Integration config is missing graceful_restart_script field" ) else: if not restart_script: logger.warning( "graceful_restart_script option is empty", ) return None cmd = restart_script.split() if os.path.exists(cmd[0]): return cmd logger.warning( "Web server restart script does not exist: %s", restart_script, ) return None def _graceful_restart_cmd() -> Iterable[str]: """Gracefully restart a web server.""" # Do not restart web server in the agent cgroup # (to avoid attaching its processes to it, see DEF-20577) prefix = [] if systemd_run := shutil.which("systemd-run"): prefix += [ systemd_run, "-p", "SendSIGKILL=no", "--slice=graceful_restart", "--", ] cmd = _graceful_restart_cmd_from_integration_conf() if cmd is not None: return prefix + list(cmd) if litespeed_running(): return prefix + list(LITESPEED_RESTART_CMD) if apachectl := apache_running(): return prefix + _apache_graceful_restart_cmd(apachectl) raise RuntimeError("Could not detect a web server") def _configtest_cmd() -> Iterable[str]: if is_generic_panel_installed(): try: cmd = IntegrationConfig.get("web_server", "config_test_script") if cmd: return cmd.split() except KeyError: # if setting is not present, fall back to default detection pass if apache_bin := apache_running(): if OsReleaseInfo.id_like() & OsReleaseInfo.DEBIAN: return ["apachectl", "configtest"] return [apache_bin, "-t"] elif litespeed_running(): return ["lightspeed", "-t"] elif nginx_bin := find_running_nginx(): return [nginx_bin, "-t"] raise RuntimeError("Could not detect a web server") _graceful_restart_caller = ContextVar("graceful_restart_caller") async def safe_update_config(config_path, new_config: str) -> bool: """ Update Web-server config with fallback in case of an error happens. It tries to do all the best but because of graceful_restart() the faulty config might still be applied but in practice it is barely probable (because of premature config check). 1. The new config is checked before to be applied. 2. The new config (if checked valid) is atomically applied. 3. The graceful Web-server restart is scheduled. It may hold the actual restart for some time, but it is a required workaround of a litespeed issue. 4. If the Web-server failed to restart the config is reverted. Return value: True if no errors (at least up to the server restart), False if There was an error and config was reverted. Note: It is possible that the config may be reverted even when return value is True. It is because the graceful_restart may delay the actual restart and config may be reverted on that (delayed) stage. """ config_backup_path = os.fspath(config_path) + BACKUP_EXTENSION def remove_backup(): with suppress(FileNotFoundError): os.unlink(config_backup_path) make_backup = os.path.exists(config_path) if not atomic_rewrite(config_path, new_config, backup=make_backup): # nothing has changed => no need to restart return True def revert(): try: os.rename(config_backup_path, config_path) except FileNotFoundError: # truncate file if backup does not exist open(config_path, "w").close() try: await configtest(raise_exception=True) except ConfigInvalidError as e: logger.error("Web server config is invalid: %s", e) revert() else: restart_cmd = _graceful_restart_cmd() loop = asyncio.get_running_loop() def restart_callback(task): def log_config_error(fut): if not fut.cancelled() and fut.exception() is not None: logger.critical( "The reverted config seems to be invalid", exc_info=fut.exception(), ) def log_uncaught_exception(fut): if not fut.cancelled() and fut.exception() is not None: logger.critical( "uncaught exception", exc_info=fut.exception() ) if not task.cancelled() and task.exception() is not None: logger.error( "Web server failed to start... Revert changes back. (%s)", task.exception(), ) revert() task = loop.create_task(configtest(raise_exception=True)) task.add_done_callback(log_config_error) # the least we can do is to try to restart task = loop.create_task(_graceful_restart(restart_cmd)) task.add_done_callback(log_uncaught_exception) else: remove_backup() graceful_restart = webserver_gracefull_restart.coalesce_calls( GRACEFUL_RESTART_MIN_PERIOD, done_callback=restart_callback )(_graceful_restart) caller_frame = inspect.stack()[1] context_token = _graceful_restart_caller.set(caller_frame.function) try: await graceful_restart(restart_cmd) finally: _graceful_restart_caller.reset(context_token) logger.info("Successfully scheduled web server restart") return True return False async def _graceful_restart(restart_cmd=None): """ Gracefully restart a web server. If web server cannot be detected, do nothing. """ _log_graceful_restart_start() try: await check_run(restart_cmd or _graceful_restart_cmd()) except RuntimeError as err: logger.warning("Could not restart a Web server: %s", err) else: logger.info("Successfully restarted web server") @webserver_gracefull_restart.coalesce_calls(GRACEFUL_RESTART_MIN_PERIOD) async def _graceful_restart_coalesced(restart_cmd=None): task = _graceful_restart(restart_cmd) g.web_server_restart_task = task try: return await task finally: g.pop("web_server_restart_task") async def graceful_restart(restart_cmd=None): """ Gracefully restart a web server. If web server cannot be detected, do nothing. """ caller_frame = inspect.stack()[1] context_token = _graceful_restart_caller.set(caller_frame.function) try: result = await _graceful_restart_coalesced(restart_cmd) finally: _graceful_restart_caller.reset(context_token) return result def _log_graceful_restart_start(): caller = _graceful_restart_caller.get("unknown") logger.info("Performing web server graceful restart, from %s", caller) def graceful_restart_sync(): """ Gracefully restart a web server synchronously. If web server cannot be detected, do nothing. """ caller_frame = inspect.stack()[1] context_token = _graceful_restart_caller.set(caller_frame.function) try: _log_graceful_restart_start() finally: _graceful_restart_caller.reset(context_token) try: check_call(_graceful_restart_cmd(), stdout=DEVNULL, stderr=DEVNULL) except RuntimeError as err: logger.warning("Could not restart a Web server: %s", err) else: logger.info("Successfully restarted web server") async def configtest(raise_exception=False): """ Check web server's config file. If web server cannot be detected, do nothing. """ logger.info("Performing web server config test") try: await check_run(_configtest_cmd(), raise_exc=ConfigInvalidError) except RuntimeError as err: logger.warning("Could not run configtest: %s", err) if raise_exception: raise ConfigInvalidError("Failed to check config") from err def _parse_apache_version_output(output): match = apache_version_regexp.search(output) if match is not None: return Version(match.group(1)) else: raise ValueError( "Failed to parse apache version string: {}".format(output) ) def _parse_apache_module_list(output: bytes) -> List[bytes]: """ Parse response of httpd -M :param output: stdout of httpd -M (with spaces before module name) Output example: Loaded Modules: core_module (static) so_module (static) http_module (static) mpm_prefork_module (shared) :return: list with installed modules """ return [ line.strip().split()[0] for line in output.splitlines() if line.startswith(BYTE_SPACES) ] def _parse_includes(dump): includes = [] for line in dump.decode().split("\n"): index = line.find("/") if index > 0: includes.append(line[index:].strip()) return includes async def dump_includes(): try: return _parse_includes( await check_run(["apachectl", "-t", "-D", "DUMP_INCLUDES"]) ) except FileNotFoundError: return [] @async_lru_cache(maxsize=1) async def apache_version(): apache_bin = apache_running() if apache_bin is None: raise NotRunningError("Apache is not running") out = await check_run([apache_bin, "-v"]) version = _parse_apache_version_output(out.decode()) logger.info("Apache %s version detected", version) return version @TimedCache( expiration=timedelta( seconds=int( os.environ.get("IMUNIFY360_APACHE_MODULES_CACHE_TIMEOUT", 600) ) ) ) async def apache_modules(): stdout = await apache_binary_call("-M") return _parse_apache_module_list(stdout)