#!/usr/bin/env python3
# coding: utf-8

import os
import subprocess
import threading
import datetime
import logging
import logging.handlers
import psutil
import time
import argparse
import sys
import shutil
import signal
from collections import defaultdict

import daemon
from daemon import pidfile

BASE_DIR = os.path.dirname(os.path.abspath(__file__))
sys.path.insert(0, BASE_DIR)

logging.basicConfig(
    level=logging.DEBUG, format="%(asctime)s %(message)s",
    datefmt="%Y-%m-%d %H:%M:%S"
)

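# Control script for the JumpServer services: it prepares the database, then
# starts, watches, stops and restarts gunicorn, daphne, the celery workers,
# beat and flower, keeping a pid file in tmp/ and a log file in logs/ for
# each service.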
try:
    from apps.jumpserver import const
    __version__ = const.VERSION
except ImportError as e:
    print("__version__ not found: {}".format(e))
    print("Python is: ")
    logging.info(sys.executable)
    __version__ = 'Unknown'
    sys.exit(1)

try:
    from apps.jumpserver.const import CONFIG
except ImportError as e:
    print("Import error: {}".format(e))
    print("Could not find config file, `cp config_example.yml config.yml`")
    sys.exit(1)

os.environ["PYTHONIOENCODING"] = "UTF-8"
APPS_DIR = os.path.join(BASE_DIR, 'apps')
LOG_DIR = os.path.join(BASE_DIR, 'logs')
TMP_DIR = os.path.join(BASE_DIR, 'tmp')
HTTP_HOST = CONFIG.HTTP_BIND_HOST or '127.0.0.1'
HTTP_PORT = CONFIG.HTTP_LISTEN_PORT or 8080
WS_PORT = CONFIG.WS_LISTEN_PORT or 8082
DEBUG = CONFIG.DEBUG or False
LOG_LEVEL = CONFIG.LOG_LEVEL or 'INFO'

START_TIMEOUT = 40
WORKERS = 4
DAEMON = False
LOG_KEEP_DAYS = 7

EXIT_EVENT = threading.Event()
LOCK = threading.Lock()
files_preserve = []
STOP_TIMEOUT = 10

logger = logging.getLogger()

try:
    os.makedirs(os.path.join(BASE_DIR, "data", "static"))
    os.makedirs(os.path.join(BASE_DIR, "data", "media"))
except OSError:
    pass


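# Helpers used by prepare(): wait until the database answers, check for
# unapplied migrations, apply schema changes and collect static files, and
# expire cached data before the services are started.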
def check_database_connection():
    os.chdir(os.path.join(BASE_DIR, 'apps'))
    for i in range(60):
        logging.info("Check database connection ...")
        code = subprocess.call("python manage.py showmigrations users", shell=True)
        if code == 0:
            logging.info("Database connect success")
            return
        time.sleep(1)
    logging.error("Database connection failed, exit")
    sys.exit(10)


def check_migrations():
    apps_dir = os.path.join(BASE_DIR, 'apps')
    code = subprocess.call(
        r"python manage.py showmigrations | grep '\[.\]' | grep -v '\[X\]'",
        shell=True, cwd=apps_dir
    )

    if code == 1:
        return
    # for i in range(3):
    #     print("!!! Warning: there are SQL migrations that have not been applied")
    #     print("You should run `./PROC upgrade_db` first to apply the schema changes")
    # sys.exit(1)


def expire_caches():
    apps_dir = os.path.join(BASE_DIR, 'apps')
    code = subprocess.call("python manage.py expire_caches", shell=True, cwd=apps_dir)

    if code == 1:
        return


def perform_db_migrate():
    logging.info("Check database structure change ...")
    os.chdir(os.path.join(BASE_DIR, 'apps'))
    logging.info("Migrate model change to database ...")
    subprocess.call('python3 manage.py migrate', shell=True)


def collect_static():
    logging.info("Collect static files")
    os.chdir(os.path.join(BASE_DIR, 'apps'))
    command = 'python3 manage.py collectstatic --no-input -c &> /dev/null '
    subprocess.call(command, shell=True)
    logging.info("Collect static files done")


def prepare():
    check_database_connection()
    check_migrations()
    upgrade_db()
    expire_caches()


def check_pid(pid):
    """ Check for the existence of a unix pid. """
    try:
        os.kill(pid, 0)
    except (OSError, ProcessLookupError):
        return False
    else:
        return True


def get_pid_file_path(s):
    return os.path.join(TMP_DIR, '{}.pid'.format(s))


def get_log_file_path(s):
    return os.path.join(LOG_DIR, '{}.log'.format(s))


def get_pid_from_file(path):
    if os.path.isfile(path):
        with open(path) as f:
            try:
                return int(f.read().strip())
            except ValueError:
                return 0
    return 0


def get_pid(s):
    pid_file = get_pid_file_path(s)
    return get_pid_from_file(pid_file)


def is_running(s, unlink=True):
    pid_file = get_pid_file_path(s)

    if os.path.isfile(pid_file):
        pid = get_pid(s)
        if pid == 0:
            return False
        elif check_pid(pid):
            return True

        # Stale pid file: the recorded process is gone, so clean it up
        if unlink:
            os.unlink(pid_file)
    return False


def parse_service(s):
    web_services = ['gunicorn', 'flower', 'daphne']
    celery_services = [
        "celery_ansible", "celery_default"
    ]
    task_services = celery_services + ['beat']
    all_services = web_services + task_services
    if s == 'all':
        return all_services
    elif s == "web":
        return web_services
    elif s == 'ws':
        return ['daphne']
    elif s == "task":
        return task_services
    elif s == "celery":
        return celery_services
    elif "," in s:
        services = set()
        for i in s.split(','):
            services.update(parse_service(i))
        return services
    else:
        return [s]


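# Each get_start_*_kwargs() helper below returns the subprocess.Popen
# arguments for one component: the command line, the working directory and,
# for the Celery-based services, any required environment variables.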
def get_start_gunicorn_kwargs():
    print("\n- Start Gunicorn WSGI HTTP Server")
    prepare()
    bind = '{}:{}'.format(HTTP_HOST, HTTP_PORT)
    log_format = '%(h)s %(t)s %(L)ss "%(r)s" %(s)s %(b)s '

    cmd = [
        'gunicorn', 'jumpserver.wsgi',
        '-b', bind,
        '-k', 'gthread',
        '--threads', '10',
        '-w', str(WORKERS),
        '--max-requests', '4096',
        '--access-logformat', log_format,
        '--access-logfile', '-'
    ]

    if DEBUG:
        cmd.append('--reload')
    return {'cmd': cmd, 'cwd': APPS_DIR}


def get_start_daphne_kwargs():
    print("\n- Start Daphne ASGI WS Server")
    cmd = [
        'daphne', 'jumpserver.asgi:application',
        '-b', HTTP_HOST,
        '-p', str(WS_PORT),
    ]
    return {'cmd': cmd, 'cwd': APPS_DIR}


def get_start_celery_ansible_kwargs():
    print("\n- Start Celery as Distributed Task Queue: Ansible")
    return get_start_worker_kwargs('ansible', 10)


def get_start_celery_default_kwargs():
    print("\n- Start Celery as Distributed Task Queue: Celery")
    return get_start_worker_kwargs('celery', 10)


def get_start_worker_kwargs(queue, num):
    # Todo: Must set this environment variable, otherwise no ansible result is returned
    os.environ.setdefault('PYTHONOPTIMIZE', '1')
    os.environ.setdefault('ANSIBLE_FORCE_COLOR', 'True')

    if os.getuid() == 0:
        os.environ.setdefault('C_FORCE_ROOT', '1')
    server_hostname = os.environ.get("SERVER_HOSTNAME")
    if not server_hostname:
        server_hostname = '%h'

    cmd = [
        'celery', 'worker',
        '-P', 'threads',
        '-A', 'ops',
        '-l', 'INFO',
        '-c', str(num),
        '-Q', queue,
        '-n', '{}@{}'.format(queue, server_hostname)
    ]
    return {"cmd": cmd, "cwd": APPS_DIR}


def get_start_flower_kwargs():
    print("\n- Start Flower as Task Monitor")
    if os.getuid() == 0:
        os.environ.setdefault('C_FORCE_ROOT', '1')

    cmd = [
        'celery', 'flower',
        '-A', 'ops',
        '-l', 'INFO',
        '--url_prefix=/core/flower',
        '--auto_refresh=False',
        '--max_tasks=1000',
        '--tasks_columns=uuid,name,args,state,received,started,runtime,worker'
    ]
    return {"cmd": cmd, "cwd": APPS_DIR}


def get_start_beat_kwargs():
    print("\n- Start Beat as Periodic Task Scheduler")
    utils_dir = os.path.join(BASE_DIR, 'utils')
    cmd = [
        sys.executable, 'start_celery_beat.py',
    ]
    return {"cmd": cmd, 'cwd': utils_dir}


processes = {}


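# watch_services() polls every started service once per loop (about every 30
# seconds), restarts a stopped service up to max_retry times before setting
# EXIT_EVENT, rotates the per-service logs into a dated directory at 23:59
# and removes rotated directories older than LOG_KEEP_DAYS days.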
def watch_services():
    max_retry = 3
    services_retry = defaultdict(int)
    stopped_services = {}

    def check_services():
        now = datetime.datetime.now().strftime('%Y-%m-%d %H:%M:%S')
        for s, p in processes.items():
            print("{} Check service status: {} -> ".format(now, s), end='')
            try:
                # Without wait() the exited child process may never be reaped
                p.wait(timeout=1)
            except subprocess.TimeoutExpired:
                pass
            ok = is_running(s)
            if not ok:
                stopped_services[s] = ''
                print("stopped with code: {}({})".format(p.returncode, p.pid))
            else:
                print("running at {}".format(p.pid))
                stopped_services.pop(s, None)
                services_retry.pop(s, None)

    def retry_start_stopped_services():
        for s in stopped_services:
            if services_retry[s] > max_retry:
                logging.info("Service start failed, exit: {}".format(s))
                EXIT_EVENT.set()
                break

            p = start_service(s)
            logging.info("> Find {} stopped, retry {}, {}".format(
                s, services_retry[s] + 1, p.pid)
            )
            processes[s] = p
            services_retry[s] += 1

    def rotate_log_if_need():
        now = datetime.datetime.now()
        tm = now.strftime('%H:%M')
        if tm != '23:59':
            return
        suffix = now.strftime('%Y-%m-%d')
        services = list(processes.keys())
        services.append('jms')

        for s in services:
            log_path = get_log_file_path(s)
            log_dir = os.path.dirname(log_path)
            filename = os.path.basename(log_path)
            pre_log_dir = os.path.join(log_dir, suffix)
            if not os.path.exists(pre_log_dir):
                os.mkdir(pre_log_dir)

            pre_log_path = os.path.join(pre_log_dir, filename)
            if os.path.isfile(log_path) and not os.path.isfile(pre_log_path):
                logging.info("Rotate log file: {} => {}".format(log_path, pre_log_path))
                shutil.copy(log_path, pre_log_path)
                with open(log_path, 'w') as f:
                    pass
        some_days_ago = now - datetime.timedelta(days=LOG_KEEP_DAYS)
        days_ago_dir = os.path.join(LOG_DIR, some_days_ago.strftime('%Y-%m-%d'))
        if os.path.exists(days_ago_dir):
            logger.info("Remove old log: {}".format(days_ago_dir))
            shutil.rmtree(days_ago_dir, ignore_errors=True)

    while not EXIT_EVENT.is_set():
        try:
            with LOCK:
                check_services()
            retry_start_stopped_services()
            rotate_log_if_need()
            time.sleep(30)
        except KeyboardInterrupt:
            print("Stopping services ...")
            time.sleep(1)
            break
    clean_up()


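# start_service() looks up the matching get_start_*_kwargs() builder, removes
# any stale pid file, appends the child's stdout/stderr to logs/<service>.log,
# launches the process and records its pid in tmp/<service>.pid.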
def start_service(s):
    services_kwargs = {
        "gunicorn": get_start_gunicorn_kwargs,
        "celery_ansible": get_start_celery_ansible_kwargs,
        "celery_default": get_start_celery_default_kwargs,
        "beat": get_start_beat_kwargs,
        "flower": get_start_flower_kwargs,
        "daphne": get_start_daphne_kwargs,
    }

    kwargs = services_kwargs.get(s)()
    pid_file = get_pid_file_path(s)

    if os.path.isfile(pid_file):
        os.unlink(pid_file)
    cmd = kwargs.pop('cmd')

    log_file_path = get_log_file_path(s)
    log_file_f = open(log_file_path, 'a')
    files_preserve.append(log_file_f)
    kwargs['stderr'] = log_file_f
    kwargs['stdout'] = log_file_f
    p = subprocess.Popen(cmd, **kwargs)
    with open(pid_file, 'w') as f:
        f.write(str(p.pid))
    return p


def start_services_and_watch(s):
    logging.info(time.ctime())
    logging.info('JumpServer version {}, more see https://www.jumpserver.org'.format(
        __version__)
    )

    services_set = parse_service(s)
    for i in services_set:
        if is_running(i):
            show_service_status(i)
            continue
        p = start_service(i)
        time.sleep(2)
        processes[i] = p

    if not DAEMON:
        watch_services()
    else:
        show_service_status(s)
        context = get_daemon_context()
        with context:
            watch_services()


def get_daemon_context():
    daemon_pid_file = get_pid_file_path('jms')
    daemon_log_f = open(get_log_file_path('jms'), 'a')
    files_preserve.append(daemon_log_f)
    context = daemon.DaemonContext(
        pidfile=pidfile.TimeoutPIDLockFile(daemon_pid_file),
        signal_map={
            signal.SIGTERM: lambda x, y: clean_up(),
            signal.SIGHUP: 'terminate',
        },
        stdout=daemon_log_f,
        stderr=daemon_log_f,
        files_preserve=files_preserve,
        detach_process=True,
    )
    return context


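# stop_service() resolves the requested alias, sends the given signal (SIGTERM
# by default, SIGKILL with --force) to each running service and waits up to
# STOP_TIMEOUT seconds for it to exit; stopping "all" also terminates the
# daemonized watcher via its jms pid file.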
def stop_service(srv, sig=15):
    services_set = parse_service(srv)
    for s in services_set:
        if not is_running(s):
            show_service_status(s)
            continue
        print("Stop service: {}".format(s), end='')
        pid = get_pid(s)
        os.kill(pid, sig)
        with LOCK:
            process = processes.pop(s, None)
        if process is None:
            try:
                process = psutil.Process(pid)
            except psutil.Error:
                pass
        if process is None:
            print("\033[31m No process found\033[0m")
            continue
        try:
            process.wait(1)
        except Exception:
            pass
        for i in range(STOP_TIMEOUT):
            if i == STOP_TIMEOUT - 1:
                print("\033[31m Error\033[0m")
            if not is_running(s):
                print("\033[32m Ok\033[0m")
                break
            else:
                time.sleep(1)
                continue

    if srv == "all":
        stop_daemon_service()


def stop_daemon_service():
    pid = get_pid('jms')
    if pid and check_pid(pid):
        os.kill(pid, 15)


def stop_multi_services(services):
    for s in services:
        stop_service(s, sig=9)


def stop_service_force(s):
    stop_service(s, sig=9)


def clean_up():
    if not EXIT_EVENT.is_set():
        EXIT_EVENT.set()
    processes_dump = {k: v for k, v in processes.items()}
    for s1, p1 in processes_dump.items():
        stop_service(s1)
        p1.wait()


def show_service_status(s):
    services_set = parse_service(s)
    for ns in services_set:
        if is_running(ns):
            pid = get_pid(ns)
            print("{} is running: {}".format(ns, pid))
        else:
            print("{} is stopped".format(ns))


def upgrade_db():
    collect_static()
    perform_db_migrate()


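# Command line entry point: parses an action (start/stop/restart/status/
# upgrade_db) and an optional service alias; -d runs the watcher as a daemon,
# -w overrides the gunicorn worker count and -f sends SIGKILL instead of
# SIGTERM when stopping.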
if __name__ == '__main__':
    parser = argparse.ArgumentParser(
        description="""
        JumpServer service control tool;

        Example: \r\n

        %(prog)s start all -d;
        """
    )
    parser.add_argument(
        'action', type=str,
        choices=("start", "stop", "restart", "status", "upgrade_db"),
        help="Action to run"
    )
    parser.add_argument(
        "service", type=str, default="all", nargs="?",
        choices=("all", "web", "task", "gunicorn", "celery", "beat", "celery,beat", "flower", "ws"),
        help="The service to start",
    )
    parser.add_argument('-d', '--daemon', nargs="?", const=1)
    parser.add_argument('-w', '--worker', type=int, nargs="?", const=4)
    parser.add_argument('-f', '--force', nargs="?", const=1)
    args = parser.parse_args()
    if args.daemon:
        DAEMON = True

    if args.worker:
        WORKERS = args.worker

    action = args.action
    srv = args.service

    if action == "start":
        start_services_and_watch(srv)
        os._exit(0)
    elif action == "stop":
        print("Stop service")
        if args.force:
            stop_service_force(srv)
        else:
            stop_service(srv)
    elif action == "restart":
        DAEMON = True
        stop_service(srv)
        time.sleep(5)
        start_services_and_watch(srv)
    elif action == "upgrade_db":
        upgrade_db()
    else:
        show_service_status(srv)