emqx 33 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039
  1. #!/usr/bin/env bash
  2. # -*- tab-width:4;indent-tabs-mode:nil -*-
  3. # ex: ts=4 sw=4 et
  4. set -euo pipefail
  5. DEBUG="${DEBUG:-0}"
  6. [ "$DEBUG" -eq 1 ] && set -x
  7. RUNNER_ROOT_DIR="$(cd "$(dirname "$(readlink "$0" || echo "$0")")"/..; pwd -P)"
  8. # shellcheck disable=SC1090,SC1091
  9. . "$RUNNER_ROOT_DIR"/releases/emqx_vars
  10. # defined in emqx_vars
  11. export RUNNER_ROOT_DIR
  12. export EMQX_ETC_DIR
  13. export REL_VSN
  14. export SCHEMA_MOD
  15. RUNNER_SCRIPT="$RUNNER_BIN_DIR/$REL_NAME"
  16. CODE_LOADING_MODE="${CODE_LOADING_MODE:-embedded}"
  17. REL_DIR="$RUNNER_ROOT_DIR/releases/$REL_VSN"
  18. WHOAMI=$(whoami)
  19. # Make sure log directory exists
  20. mkdir -p "$RUNNER_LOG_DIR"
  21. # hocon try to read environment variables starting with "EMQX_"
  22. export HOCON_ENV_OVERRIDE_PREFIX='EMQX_'
  23. export ERTS_DIR="$RUNNER_ROOT_DIR/erts-$ERTS_VSN"
  24. export BINDIR="$ERTS_DIR/bin"
  25. export EMU="beam"
  26. export PROGNAME="erl"
  27. export ERTS_LIB_DIR="$RUNNER_ROOT_DIR/lib"
  28. DYNLIBS_DIR="$RUNNER_ROOT_DIR/dynlibs"
  29. # Echo to stderr on errors
  30. echoerr() {
  31. echo -e "$*" 1>&2;
  32. }
  33. die() {
  34. set +x
  35. echoerr "ERROR: $1"
  36. errno=${2:-1}
  37. exit "$errno"
  38. }
  39. assert_node_alive() {
  40. if ! relx_nodetool "ping" > /dev/null; then
  41. die "node_is_not_running!" 1
  42. fi
  43. }
  44. usage() {
  45. local command="$1"
  46. case "$command" in
  47. start)
  48. echo "Start EMQX service in daemon mode"
  49. ;;
  50. stop)
  51. echo "Stop the running EMQX program"
  52. ;;
  53. console)
  54. echo "Boot up EMQX service in an interactive Erlang or Elixir shell"
  55. echo "This command needs a tty"
  56. ;;
  57. console_clean)
  58. echo "This command does NOT boot up the EMQX service"
  59. echo "It only starts an interactive Erlang or Elixir console with all the"
  60. echo "EMQX code available"
  61. ;;
  62. foreground)
  63. echo "Start EMQX in foreground mode without an interactive shell"
  64. ;;
  65. pid)
  66. echo "Print out EMQX process identifier"
  67. ;;
  68. ping)
  69. echo "Check if the EMQX node is up and running"
  70. echo "This command exit with 0 silently if node is running"
  71. ;;
  72. escript)
  73. echo "Execute a escript using the Erlang runtime from EMQX package installation"
  74. echo "For example $REL_NAME escript /path/to/my/escript my_arg1 my_arg2"
  75. ;;
  76. attach)
  77. echo "This command is applicable when EMQX is started in daemon mode."
  78. echo "It attaches the current shell to EMQX's control console"
  79. echo "through a named pipe."
  80. echo "WARNING: try to use the safer alternative, remote_console command."
  81. ;;
  82. remote_console)
  83. echo "Start an interactive shell running an Erlang or Elixir node which "
  84. echo "hidden-connects to the running EMQX node".
  85. echo "This command is mostly used for troubleshooting."
  86. ;;
  87. ertspath)
  88. echo "Print path to Erlang runtime bin dir"
  89. ;;
  90. rpc)
  91. echo "Usge $REL_NAME rpc MODULE FUNCTION [ARGS, ...]"
  92. echo "Connect to the EMQX node and make an Erlang RPC"
  93. echo "This command blocks for at most 60 seconds."
  94. echo "It exits with non-zero code in case of any RPC failure"
  95. echo "including connection error and runtime exception"
  96. ;;
  97. rpcterms)
  98. echo "Usge $REL_NAME rpcterms MODULE FUNCTION [ARGS, ...]"
  99. echo "Connect to the EMQX node and make an Erlang RPC"
  100. echo "The result of the RPC call is pretty-printed as an "
  101. echo "Erlang term"
  102. ;;
  103. root_dir)
  104. echo "Print EMQX installation root dir"
  105. ;;
  106. eval)
  107. echo "Evaluate an Erlang or Elixir expression in the EMQX node"
  108. ;;
  109. eval-erl)
  110. echo "Evaluate an Erlang expression in the EMQX node, even on Elixir node"
  111. ;;
  112. versions)
  113. echo "List installed EMQX versions and their status"
  114. ;;
  115. unpack)
  116. echo "Usage: $REL_NAME unpack [VERSION]"
  117. echo "Unpacks a release package VERSION, it assumes that this"
  118. echo "release package tarball has already been deployed at one"
  119. echo "of the following locations:"
  120. echo " releases/<relname>-<version>.tar.gz"
  121. ;;
  122. install)
  123. echo "Usage: $REL_NAME install [VERSION]"
  124. echo "Installs a release package VERSION, it assumes that this"
  125. echo "release package tarball has already been deployed at one"
  126. echo "of the following locations:"
  127. echo " releases/<relname>-<version>.tar.gz"
  128. echo ""
  129. echo " --no-permanent Install release package VERSION but"
  130. echo " don't make it permanent"
  131. ;;
  132. uninstall)
  133. echo "Usage: $REL_NAME uninstall [VERSION]"
  134. echo "Uninstalls a release VERSION, it will only accept"
  135. echo "versions that are not currently in use"
  136. ;;
  137. upgrade)
  138. echo "Usage: $REL_NAME upgrade [VERSION]"
  139. echo "Upgrades the currently running release to VERSION, it assumes"
  140. echo "that a release package tarball has already been deployed at one"
  141. echo "of the following locations:"
  142. echo " releases/<relname>-<version>.tar.gz"
  143. echo ""
  144. echo " --no-permanent Install release package VERSION but"
  145. echo " don't make it permanent"
  146. ;;
  147. downgrade)
  148. echo "Usage: $REL_NAME downgrade [VERSION]"
  149. echo "Downgrades the currently running release to VERSION, it assumes"
  150. echo "that a release package tarball has already been deployed at one"
  151. echo "of the following locations:"
  152. echo " releases/<relname>-<version>.tar.gz"
  153. echo ""
  154. echo " --no-permanent Install release package VERSION but"
  155. echo " don't make it permanent"
  156. ;;
  157. *)
  158. echo "Usage: $REL_NAME COMMAND [help]"
  159. echo ''
  160. echo "Commonly used COMMANDs:"
  161. echo " start: Start EMQX in daemon mode"
  162. echo " console: Start EMQX in an interactive Erlang or Elixir shell"
  163. echo " foreground: Start EMQX in foreground mode without an interactive shell"
  164. echo " stop: Stop the running EMQX node"
  165. echo " ctl: Administration commands, execute '$REL_NAME ctl help' for more details"
  166. echo ''
  167. echo "More:"
  168. echo " Shell attach: remote_console | attach"
  169. echo " Up/Down-grade: upgrade | downgrade | install | uninstall"
  170. echo " Install info: ertspath | root_dir"
  171. echo " Runtime info: pid | ping | versions"
  172. echo " Advanced: console_clean | escript | rpc | rpcterms | eval | eval-erl"
  173. echo ''
  174. echo "Execute '$REL_NAME COMMAND help' for more information"
  175. ;;
  176. esac
  177. }
  178. COMMAND="${1:-}"
  179. if [ -z "$COMMAND" ]; then
  180. usage 'help'
  181. exit 1
  182. elif [ "$COMMAND" = 'help' ]; then
  183. usage 'help'
  184. exit 0
  185. fi
  186. if [ "${2:-}" = 'help' ]; then
  187. ## 'ctl' command has its own usage info
  188. if [ "$COMMAND" != 'ctl' ]; then
  189. usage "$COMMAND"
  190. exit 0
  191. fi
  192. fi
  193. ## IS_BOOT_COMMAND is set for later to inspect node name and cookie from hocon config (or env variable)
  194. case "${COMMAND}" in
  195. start|console|console_clean|foreground)
  196. IS_BOOT_COMMAND='yes'
  197. ;;
  198. ertspath)
  199. echo "$ERTS_DIR"
  200. exit 0
  201. ;;
  202. root_dir)
  203. echo "$RUNNER_ROOT_DIR"
  204. exit 0
  205. ;;
  206. *)
  207. IS_BOOT_COMMAND='no'
  208. ;;
  209. esac
  210. ## backward compatible
  211. if [ -d "$ERTS_DIR/lib" ]; then
  212. export LD_LIBRARY_PATH="$ERTS_DIR/lib:$LD_LIBRARY_PATH"
  213. fi
  214. # Simple way to check the correct user and fail early
  215. check_user() {
  216. # Validate that the user running the script is the owner of the
  217. # RUN_DIR.
  218. if [ "$RUNNER_USER" ] && [ "x$WHOAMI" != "x$RUNNER_USER" ]; then
  219. if [ "x$WHOAMI" != "xroot" ]; then
  220. echo "You need to be root or use sudo to run this command"
  221. exit 1
  222. fi
  223. CMD="DEBUG=$DEBUG \"$RUNNER_SCRIPT\" "
  224. for ARG in "$@"; do
  225. CMD="${CMD} \"$ARG\""
  226. done
  227. # This will drop privileges into the runner user
  228. # It exec's in a new shell and the current shell will exit
  229. exec su - "$RUNNER_USER" -c "$CMD"
  230. fi
  231. }
  232. # Make sure the user running this script is the owner and/or su to that user
  233. check_user "$@"
  234. ES=$?
  235. if [ "$ES" -ne 0 ]; then
  236. exit $ES
  237. fi
  238. COMPATIBILITY_CHECK='
  239. io:format("BEAM_OK~n", []),
  240. try
  241. [_|_] = L = crypto:info_lib(),
  242. io:format("CRYPTO_OK ~0p~n", [L])
  243. catch
  244. _ : _ ->
  245. %% so logger has the chance to log something
  246. timer:sleep(100),
  247. halt(1)
  248. end,
  249. try
  250. mnesia_hook:module_info(),
  251. io:format("MNESIA_OK~n", [])
  252. catch
  253. _ : _ ->
  254. io:format("WARNING: Mnesia app has no post-coommit hook support~n", []),
  255. halt(2)
  256. end,
  257. halt(0).
  258. '
  259. compatiblity_info() {
  260. # RELEASE_LIB is used by Elixir
  261. "$BINDIR/$PROGNAME" \
  262. -noshell \
  263. -boot_var RELEASE_LIB "$ERTS_LIB_DIR/lib" \
  264. -boot "$REL_DIR/start_clean" \
  265. -eval "$COMPATIBILITY_CHECK"
  266. }
  267. # Collect Erlang/OTP runtime sanity and compatibility in one go
  268. if [ "$IS_BOOT_COMMAND" = 'yes' ]; then
  269. # Read BUILD_INFO early as the next commands may mess up the shell
  270. BUILD_INFO="$(cat "${REL_DIR}/BUILD_INFO")"
  271. COMPATIBILITY_INFO="$(compatiblity_info 2>/dev/null || true)"
  272. if ! (echo -e "$COMPATIBILITY_INFO" | grep -q 'CRYPTO_OK'); then
  273. ## failed to start, might be due to missing libs, try to be portable
  274. export LD_LIBRARY_PATH="${LD_LIBRARY_PATH:-$DYNLIBS_DIR}"
  275. if [ "$LD_LIBRARY_PATH" != "$DYNLIBS_DIR" ]; then
  276. export LD_LIBRARY_PATH="$DYNLIBS_DIR:$LD_LIBRARY_PATH"
  277. fi
  278. ## Turn off debug, because COMPATIBILITY_INFO needs to capture stderr
  279. set +x
  280. COMPATIBILITY_INFO="$(compatiblity_info 2>&1 || true)"
  281. if ! (echo -e "$COMPATIBILITY_INFO" | grep -q 'BEAM_OK'); then
  282. ## not able to start beam.smp
  283. set +x
  284. echoerr "$COMPATIBILITY_INFO"
  285. echoerr "Please ensure it is running on the correct platform:"
  286. echoerr "$BUILD_INFO"
  287. echoerr "Version=$REL_VSN"
  288. echoerr "Required dependencies: openssl-1.1.1 (libcrypto), libncurses and libatomic1"
  289. exit 1
  290. elif ! (echo -e "$COMPATIBILITY_INFO" | grep -q 'CRYPTO_OK'); then
  291. ## not able to start crypto app
  292. set +x
  293. echoerr "$COMPATIBILITY_INFO"
  294. exit 2
  295. fi
  296. echoerr "Using libs from '${DYNLIBS_DIR}' due to missing from the OS."
  297. fi
  298. [ "$DEBUG" -eq 1 ] && set -x
  299. fi
  300. # Warn the user if ulimit -n is less than 1024
  301. ULIMIT_F=$(ulimit -n)
  302. if [ "$ULIMIT_F" -lt 1024 ]; then
  303. echo "!!!!"
  304. echo "!!!! WARNING: ulimit -n is ${ULIMIT_F}; 1024 is the recommended minimum."
  305. echo "!!!!"
  306. fi
  307. SED_REPLACE="sed -i "
  308. case $(sed --help 2>&1) in
  309. *GNU*) SED_REPLACE="sed -i ";;
  310. *BusyBox*) SED_REPLACE="sed -i ";;
  311. *) SED_REPLACE="sed -i '' ";;
  312. esac
  313. # Get node pid
  314. relx_get_pid() {
  315. if output="$(relx_nodetool rpcterms os getpid)"
  316. then
  317. # shellcheck disable=SC2001 # Escaped quote taken as closing quote in editor
  318. echo "$output" | sed -e 's/"//g'
  319. return 0
  320. else
  321. echo "$output"
  322. return 1
  323. fi
  324. }
  325. # Connect to a remote node
  326. remsh() {
  327. # Generate a unique id used to allow multiple remsh to the same node
  328. # transparently
  329. id="remsh$(relx_gen_id)-${NAME}"
  330. # Get the node's ticktime so that we use the same thing.
  331. TICKTIME="$(relx_nodetool rpcterms net_kernel get_net_ticktime)"
  332. # shellcheck disable=SC2086
  333. # Setup remote shell command to control node
  334. if [ "$IS_ELIXIR" = no ] || [ "${EMQX_CONSOLE_FLAVOR:-}" = 'erl' ] ; then
  335. set -- "$BINDIR/erl" "$NAME_TYPE" "$id" \
  336. -remsh "$NAME" -boot "$REL_DIR/start_clean" \
  337. -boot_var ERTS_LIB_DIR "$ERTS_LIB_DIR" \
  338. -boot_var RELEASE_LIB "$ERTS_LIB_DIR" \
  339. -setcookie "$COOKIE" \
  340. -hidden \
  341. -kernel net_ticktime "$TICKTIME" \
  342. $EPMD_ARGS
  343. else
  344. set -- "$REL_DIR/iex" \
  345. --remsh "$NAME" \
  346. --boot-var RELEASE_LIB "$ERTS_LIB_DIR" \
  347. --cookie "$COOKIE" \
  348. --hidden \
  349. --erl "-kernel net_ticktime $TICKTIME" \
  350. --erl "$EPMD_ARGS" \
  351. --erl "$NAME_TYPE $id" \
  352. --boot "$REL_DIR/start_clean"
  353. fi
  354. exec "$@"
  355. }
  356. # Generate a random id
  357. relx_gen_id() {
  358. od -t x -N 4 /dev/urandom | head -n1 | awk '{print $2}'
  359. }
  360. call_nodetool() {
  361. "$ERTS_DIR/bin/escript" "$RUNNER_ROOT_DIR/bin/nodetool" "$@"
  362. }
  363. # Control a node
  364. relx_nodetool() {
  365. command="$1"; shift
  366. ERL_FLAGS="${ERL_FLAGS:-} $EPMD_ARGS" \
  367. call_nodetool "$NAME_TYPE" "$NAME" \
  368. -setcookie "$COOKIE" "$command" "$@"
  369. }
  370. call_hocon() {
  371. call_nodetool hocon "$@" \
  372. || die "call_hocon_failed: $*" $?
  373. }
  374. ## Resolve boot configs in a batch
  375. ## This is because starting the Erlang beam with all modules loaded
  376. ## and parsing HOCON config + environment variables is a non-trivial task
  377. CONF_KEYS=( 'node.data_dir' 'node.name' 'node.cookie' 'node.db_backend' 'cluster.proto_dist' )
  378. if [ "$IS_ENTERPRISE" = 'yes' ]; then
  379. CONF_KEYS+=( 'license.file' 'license.key' )
  380. fi
  381. if [ "$IS_BOOT_COMMAND" = 'yes' ]; then
  382. if [ "${EMQX_BOOT_CONFIGS:-}" = '' ]; then
  383. EMQX_BOOT_CONFIGS="$(call_hocon -s "$SCHEMA_MOD" -c "$EMQX_ETC_DIR"/emqx.conf multi_get "${CONF_KEYS[@]}")"
  384. ## export here so the 'console' command recursively called from
  385. ## 'start' command does not have to parse the configs again
  386. export EMQX_BOOT_CONFIGS
  387. fi
  388. else
  389. # For non-boot commands, we try to get data_dir and ssl_dist_optfile from 'ps -ef' output
  390. # shellcheck disable=SC2009
  391. PS_LINE="$(ps -ef | grep "\-[r]oot $RUNNER_ROOT_DIR" || true)"
  392. if [ "$(echo -e "$PS_LINE" | wc -l)" -eq 1 ]; then
  393. ## only one emqx node is running
  394. ## strip 'emqx_data_dir ' and ' --' because the dir in between may contain spaces
  395. DATA_DIR="$(echo -e "$PS_LINE" | grep -oE "\-emqx_data_dir.*" | sed -E 's#.+emqx_data_dir[[:blank:]]##g' | sed -E 's#[[:blank:]]--$##g' || true)"
  396. if [ "$DATA_DIR" = '' ]; then
  397. ## this should not happen unless -emqx_data_dir is not set
  398. die "node_is_not_running!" 1
  399. fi
  400. # get ssl_dist_optfile option
  401. SSL_DIST_OPTFILE="$(echo -e "$PS_LINE" | grep -oE '+ssl_dist_optfile\s.+\s' | awk '{print $2}' || true)"
  402. if [ -z "$SSL_DIST_OPTFILE" ]; then
  403. EMQX_BOOT_CONFIGS="node.data_dir=${DATA_DIR}\ncluster.proto_dist=inet_tcp"
  404. else
  405. EMQX_BOOT_CONFIGS="node.data_dir=${DATA_DIR}\ncluster.proto_dist=inet_tls"
  406. fi
  407. else
  408. ## None or more than one node is running, resolve from boot config
  409. EMQX_BOOT_CONFIGS="$(call_hocon -s "$SCHEMA_MOD" -c "$EMQX_ETC_DIR"/emqx.conf multi_get "${CONF_KEYS[@]}")"
  410. fi
  411. fi
  412. get_boot_config() {
  413. path_to_value="$1"
  414. echo -e "$EMQX_BOOT_CONFIGS" | grep "$path_to_value=" | sed -e "s/$path_to_value=//g" | tr -d \"
  415. }
  416. EPMD_ARGS="-start_epmd false -epmd_module ekka_epmd -proto_dist ekka"
  417. PROTO_DIST="$(get_boot_config 'cluster.proto_dist' || true)"
  418. # this environment variable is required by ekka_dist module
  419. # because proto_dist is overriden to ekka, and there is a lack of ekka_tls module
  420. export EKKA_PROTO_DIST_MOD="${PROTO_DIST:-inet_tcp}"
  421. if [ "$EKKA_PROTO_DIST_MOD" = 'inet_tls' ]; then
  422. if [ "$IS_BOOT_COMMAND" = 'yes' ]; then
  423. SSL_DIST_OPTFILE=${EMQX_SSL_DIST_OPTFILE:-"$EMQX_ETC_DIR/ssl_dist.conf"}
  424. case "$SSL_DIST_OPTFILE" in
  425. *\ *)
  426. # there is unfortunately no way to support space for this option because we'd need to grep
  427. # from 'ps -ef' result to get this option for non-boot commands (nodtool) to run
  428. set +x
  429. echoerr "Got space in: $SSL_DIST_OPTFILE"
  430. echoerr "No space is allowed for Erlang distribution over SSL option file path."
  431. echoerr "Configure it from environment varialbe EMQX_SSL_DIST_OPTFILE."
  432. echoerr "Or make sure emqx root path '$RUNNER_ROOT_DIR' has no space"
  433. exit 1
  434. ;;
  435. *)
  436. true
  437. ;;
  438. esac
  439. fi
  440. EPMD_ARGS="${EPMD_ARGS} -ssl_dist_optfile $SSL_DIST_OPTFILE"
  441. fi
  442. DATA_DIR="$(get_boot_config 'node.data_dir')"
  443. # ensure no trailing /
  444. DATA_DIR="${DATA_DIR%/}"
  445. if [[ $DATA_DIR != /* ]]; then
  446. # relative path
  447. DATA_DIR="${RUNNER_ROOT_DIR}/${DATA_DIR}"
  448. fi
  449. CONFIGS_DIR="$DATA_DIR/configs"
  450. mkdir -p "$CONFIGS_DIR"
  451. check_license() {
  452. if [ "$IS_ENTERPRISE" == "no" ]; then
  453. return 0
  454. fi
  455. file_license="${EMQX_LICENSE__FILE:-$(get_boot_config 'license.file')}"
  456. if [[ -n "$file_license" && ("$file_license" != "undefined") ]]; then
  457. call_nodetool check_license_file "$file_license"
  458. else
  459. key_license="${EMQX_LICENSE__KEY:-$(get_boot_config 'license.key')}"
  460. if [[ -n "$key_license" && ("$key_license" != "undefined") ]]; then
  461. call_nodetool check_license_key "$key_license"
  462. else
  463. set +x
  464. echoerr "License not found."
  465. echoerr "Please specify one via EMQX_LICENSE__KEY or EMQX_LICENSE__FILE variables"
  466. echoerr "or via license.key|file in emqx_enterprise.conf."
  467. return 1
  468. fi
  469. fi
  470. }
  471. # Run an escript in the node's environment
  472. relx_escript() {
  473. shift; scriptpath="$1"; shift
  474. "$ERTS_DIR/bin/escript" "$RUNNER_ROOT_DIR/$scriptpath" "$@"
  475. }
  476. # Output a start command for the last argument of run_erl
  477. relx_start_command() {
  478. printf "exec \"%s\" \"%s\"" "$RUNNER_SCRIPT" \
  479. "$START_OPTION"
  480. }
  481. # Function to generate app.config and vm.args
  482. # sets two environment variables CONF_FILE and ARGS_FILE
  483. generate_config() {
  484. local name_type="$1"
  485. local node_name="$2"
  486. ## Delete the *.siz files first or it can't start after
  487. ## changing the config 'log.rotation.size'
  488. rm -rf "${RUNNER_LOG_DIR}"/*.siz
  489. ## timestamp for each generation
  490. local NOW_TIME
  491. NOW_TIME="$(date +'%Y.%m.%d.%H.%M.%S')"
  492. ## this command populates two files: app.<time>.config and vm.<time>.args
  493. ## NOTE: the generate command merges environment variables to the base config (emqx.conf),
  494. ## but does not include the cluster-override.conf and local-override.conf
  495. ## meaning, certain overrides will not be mapped to app.<time>.config file
  496. call_hocon -v -t "$NOW_TIME" -s "$SCHEMA_MOD" -c "$EMQX_ETC_DIR"/emqx.conf -d "$DATA_DIR"/configs generate
  497. ## filenames are per-hocon convention
  498. CONF_FILE="$CONFIGS_DIR/app.$NOW_TIME.config"
  499. ARGS_FILE="$CONFIGS_DIR/vm.$NOW_TIME.args"
  500. ## Merge hocon generated *.args into the vm.args
  501. TMP_ARG_FILE="$CONFIGS_DIR/vm.args.tmp"
  502. cp "$EMQX_ETC_DIR/vm.args" "$TMP_ARG_FILE"
  503. echo "" >> "$TMP_ARG_FILE"
  504. echo "-pa \"${REL_DIR}/consolidated\"" >> "$TMP_ARG_FILE"
  505. ## read lines from generated vm.<time>.args file
  506. ## drop comment lines, and empty lines using sed
  507. ## pipe the lines to a while loop
  508. sed '/^#/d' "$ARGS_FILE" | sed '/^$/d' | while IFS='' read -r ARG_LINE || [ -n "$ARG_LINE" ]; do
  509. ## in the loop, split the 'key[:space:]value' pair
  510. ARG_KEY=$(echo "$ARG_LINE" | awk '{$NF="";print}')
  511. ARG_VALUE=$(echo "$ARG_LINE" | awk '{print $NF}')
  512. ## use the key to look up in vm.args file for the value
  513. TMP_ARG_VALUE=$(grep "^$ARG_KEY" "$TMP_ARG_FILE" || true | awk '{print $NF}')
  514. ## compare generated (to override) value to original (to be overridden) value
  515. if [ "$ARG_VALUE" != "$TMP_ARG_VALUE" ] ; then
  516. ## if they are different
  517. if [ -n "$TMP_ARG_VALUE" ]; then
  518. ## if the old value is present, replace it with generated value
  519. sh -c "$SED_REPLACE 's|^$ARG_KEY.*$|$ARG_LINE|' \"$TMP_ARG_FILE\""
  520. else
  521. ## otherwise append generated value to the end
  522. echo "$ARG_LINE" >> "$TMP_ARG_FILE"
  523. fi
  524. fi
  525. done
  526. echo "$name_type $node_name" >> "$TMP_ARG_FILE"
  527. echo "-mnesia dir '\"$DATA_DIR/mnesia/$NAME\"'" >> "$TMP_ARG_FILE"
  528. ## rename the generated vm.<time>.args file
  529. mv -f "$TMP_ARG_FILE" "$ARGS_FILE"
  530. }
  531. # check if a PID is down
  532. is_down() {
  533. PID="$1"
  534. if ps -p "$PID" >/dev/null; then
  535. # still around
  536. # shellcheck disable=SC2009 # this grep pattern is not a part of the progra names
  537. if ps -p "$PID" | grep -q 'defunct'; then
  538. # zombie state, print parent pid
  539. parent="$(ps -o ppid= -p "$PID" | tr -d ' ')"
  540. echo "WARN: $PID is marked <defunct>, parent:"
  541. ps -p "$parent"
  542. return 0
  543. fi
  544. return 1
  545. fi
  546. # it's gone
  547. return 0
  548. }
  549. wait_for() {
  550. local WAIT_TIME
  551. local CMD
  552. WAIT_TIME="$1"
  553. shift
  554. CMD="$*"
  555. while true; do
  556. if $CMD >/dev/null 2>&1; then
  557. return 0
  558. fi
  559. if [ "$WAIT_TIME" -le 0 ]; then
  560. return 1
  561. fi
  562. WAIT_TIME=$((WAIT_TIME - 1))
  563. sleep 1
  564. done
  565. }
  566. wait_until_return_val() {
  567. local RESULT
  568. local WAIT_TIME
  569. local CMD
  570. RESULT="$1"
  571. WAIT_TIME="$2"
  572. shift 2
  573. CMD="$*"
  574. while true; do
  575. if [ "$($CMD 2>/dev/null)" = "$RESULT" ]; then
  576. return 0
  577. fi
  578. if [ "$WAIT_TIME" -le 0 ]; then
  579. return 1
  580. fi
  581. WAIT_TIME=$((WAIT_TIME - 1))
  582. sleep 1
  583. done
  584. }
  585. latest_vm_args() {
  586. local hint_var_name="$1"
  587. local vm_args_file
  588. vm_args_file="$(find "$CONFIGS_DIR" -type f -name "vm.*.args" | sort | tail -1)"
  589. if [ -f "$vm_args_file" ]; then
  590. echo "$vm_args_file"
  591. else
  592. set +x
  593. echoerr "Node not initialized?"
  594. echoerr "Generated config file vm.*.args is not found for command '$COMMAND'"
  595. echoerr "in config dir: $CONFIGS_DIR"
  596. echoerr "In case the file has been deleted while the node is running,"
  597. echoerr "set environment variable '$hint_var_name' to continue"
  598. exit 1
  599. fi
  600. }
  601. # backward compabible with 4.x
  602. tr_log_to_env() {
  603. local log_to=${EMQX_LOG__TO:-undefined}
  604. # unset because it's unknown to 5.0
  605. unset EMQX_LOG__TO
  606. case "${log_to}" in
  607. console)
  608. export EMQX_LOG__CONSOLE_HANDLER__ENABLE='true'
  609. export EMQX_LOG__FILE_HANDLERS__DEFAULT__ENABLE='false'
  610. ;;
  611. file)
  612. export EMQX_LOG__CONSOLE_HANDLER__ENABLE='false'
  613. export EMQX_LOG__FILE_HANDLERS__DEFAULT__ENABLE='true'
  614. ;;
  615. both)
  616. export EMQX_LOG__CONSOLE_HANDLER__ENABLE='true'
  617. export EMQX_LOG__FILE_HANDLERS__DEFAULT__ENABLE='true'
  618. ;;
  619. default)
  620. # want to use config file defaults, do nothing
  621. ;;
  622. undefined)
  623. # value not set, do nothing
  624. ;;
  625. *)
  626. echoerr "Unknown environment value for EMQX_LOG__TO=${log_to} discarded"
  627. ;;
  628. esac
  629. }
  630. maybe_log_to_console() {
  631. if [ "${EMQX_LOG__TO:-}" = 'default' ]; then
  632. # want to use config file defaults, do nothing
  633. unset EMQX_LOG__TO
  634. else
  635. tr_log_to_env
  636. # ensure defaults
  637. export EMQX_LOG__CONSOLE_HANDLER__ENABLE="${EMQX_LOG__CONSOLE_HANDLER__ENABLE:-true}"
  638. export EMQX_LOG__FILE_HANDLERS__DEFAULT__ENABLE="${EMQX_LOG__FILE_HANDLERS__DEFAULT__ENABLE:-false}"
  639. fi
  640. }
  641. if [ -n "${EMQX_NODE_NAME:-}" ]; then
  642. export EMQX_NODE__NAME="${EMQX_NODE_NAME}"
  643. unset EMQX_NODE_NAME
  644. fi
  645. ## Possible ways to configure emqx node name:
  646. ## 1. configure node.name in emqx.conf
  647. ## 2. override with environment variable EMQX_NODE__NAME
  648. ## Node name is either short-name (without '@'), e.g. 'emqx'
  649. ## or long name (with '@') e.g. 'emqx@example.net' or 'emqx@127.0.0.1'
  650. NAME="${EMQX_NODE__NAME:-}"
  651. if [ -z "$NAME" ]; then
  652. if [ "$IS_BOOT_COMMAND" = 'yes' ]; then
  653. # for boot commands, inspect emqx.conf for node name
  654. NAME="$(get_boot_config 'node.name')"
  655. else
  656. vm_args_file="$(latest_vm_args 'EMQX_NODE__NAME')"
  657. NAME="$(grep -E '^-s?name' "${vm_args_file}" | awk '{print $2}')"
  658. fi
  659. fi
  660. # force to use 'emqx' short name
  661. [ -z "$NAME" ] && NAME='emqx'
  662. case "$NAME" in
  663. *@*)
  664. NAME_TYPE='-name'
  665. ;;
  666. *)
  667. NAME_TYPE='-sname'
  668. esac
  669. SHORT_NAME="$(echo "$NAME" | awk -F'@' '{print $1}')"
  670. if ! (echo "$SHORT_NAME" | grep -q '^[0-9A-Za-z_\-]\+$'); then
  671. echo "Invalid node name, should be of format '^[0-9A-Za-z_-]+$'."
  672. exit 1
  673. fi
  674. # This also changes the program name from 'beam.smp' to node name
  675. # e.g. the 'ps' command output
  676. export ESCRIPT_NAME="$SHORT_NAME"
  677. PIPE_DIR="${PIPE_DIR:-/$DATA_DIR/${WHOAMI}_erl_pipes/$NAME/}"
  678. ## make EMQX_NODE_COOKIE right
  679. if [ -n "${EMQX_NODE_COOKIE:-}" ]; then
  680. export EMQX_NODE__COOKIE="${EMQX_NODE_COOKIE}"
  681. unset EMQX_NODE_COOKIE
  682. fi
  683. COOKIE="${EMQX_NODE__COOKIE:-}"
  684. if [ -z "$COOKIE" ]; then
  685. if [ "$IS_BOOT_COMMAND" = 'yes' ]; then
  686. COOKIE="$(get_boot_config 'node.cookie')"
  687. else
  688. vm_args_file="$(latest_vm_args 'EMQX_NODE__COOKIE')"
  689. COOKIE="$(grep -E '^-setcookie' "${vm_args_file}" | awk '{print $2}')"
  690. fi
  691. fi
  692. if [ -z "$COOKIE" ]; then
  693. die "Please set node.cookie in $EMQX_ETC_DIR/emqx.conf or override from environment variable EMQX_NODE__COOKIE"
  694. fi
  695. ## check if OTP version has mnesia_hook feature; if not, fallback to
  696. ## using Mnesia DB backend.
  697. if [[ "$IS_BOOT_COMMAND" == 'yes' && "$(get_boot_config 'node.db_backend')" == "rlog" ]]; then
  698. if ! (echo -e "$COMPATIBILITY_INFO" | grep -q 'MNESIA_OK'); then
  699. echoerr "DB Backend is RLOG, but an incompatible OTP version has been detected. Falling back to using Mnesia DB backend."
  700. export EMQX_NODE__DB_BACKEND=mnesia
  701. export EMQX_NODE__DB_ROLE=core
  702. fi
  703. fi
  704. cd "$RUNNER_ROOT_DIR"
  705. case "${COMMAND}" in
  706. start)
  707. # Make sure a node IS not running
  708. if relx_nodetool "ping" >/dev/null 2>&1; then
  709. die "node_is_already_running!"
  710. fi
  711. # this flag passes down to console mode
  712. # so we know it's intended to be run in daemon mode
  713. export _EMQX_START_DAEMON_MODE=1
  714. case "$COMMAND" in
  715. start)
  716. shift
  717. START_OPTION="console"
  718. HEART_OPTION="start"
  719. ;;
  720. esac
  721. RUN_PARAM="$*"
  722. # Set arguments for the heart command
  723. set -- "$RUNNER_SCRIPT" "$HEART_OPTION"
  724. [ "$RUN_PARAM" ] && set -- "$@" "$RUN_PARAM"
  725. # Export the HEART_COMMAND
  726. HEART_COMMAND="$RUNNER_SCRIPT $COMMAND"
  727. export HEART_COMMAND
  728. ## See: http://erlang.org/doc/man/run_erl.html
  729. # Export the RUN_ERL_LOG_GENERATIONS
  730. export RUN_ERL_LOG_GENERATIONS=${RUN_ERL_LOG_GENERATIONS:-"5"}
  731. # Export the RUN_ERL_LOG_MAXSIZE
  732. export RUN_ERL_LOG_MAXSIZE=${RUN_ERL_LOG_MAXSIZE:-"10485760"}
  733. mkdir -p "$PIPE_DIR"
  734. "$BINDIR/run_erl" -daemon "$PIPE_DIR" "$RUNNER_LOG_DIR" \
  735. "$(relx_start_command)"
  736. WAIT_TIME=${EMQX_WAIT_FOR_START:-120}
  737. if wait_until_return_val "true" "$WAIT_TIME" 'relx_nodetool' \
  738. 'eval' 'emqx:is_running()'; then
  739. echo "$EMQX_DESCRIPTION $REL_VSN is started successfully!"
  740. exit 0
  741. else
  742. echo "$EMQX_DESCRIPTION $REL_VSN failed to start in ${WAIT_TIME} seconds."
  743. echo "Please find more information in erlang.log.N"
  744. echo "Or run 'env DEBUG=1 $0 console' to have logs printed to console."
  745. exit 1
  746. fi
  747. ;;
  stop)
    # Gracefully stop the running node and wait for its OS process to vanish.
    # The pid is captured before the stop request is sent so that it can
    # still be checked (and reported) afterwards.
    PID="$(relx_get_pid)"
    relx_nodetool stop || die "Graceful shutdown failed PID=[$PID]"
    # Wait time in seconds; EMQX_WAIT_FOR_STOP overrides the default of 120.
    WAIT_TIME="${EMQX_WAIT_FOR_STOP:-120}"
    if wait_for "$WAIT_TIME" is_down "$PID"; then
      echo "ok"
      logger -t "${REL_NAME}[${PID}]" "STOP: OK"
    else
      msg="dangling after ${WAIT_TIME} seconds"
      # Record the failure in syslog ...
      logger -t "${REL_NAME}[${PID}]" "STOP: $msg"
      # ... and report it to the user, with command tracing switched off.
      set +x
      echoerr "Stop failed, $msg"
      echo "ERROR: $PID is still around"
      ps -p "$PID"
      exit 1
    fi
    ;;
  pid)
    # Look up the VM's pid via relx_get_pid; exit with status 1 if the
    # lookup fails.
    relx_get_pid || exit 1
    ;;
  ping)
    # Answer "pong" once assert_node_alive has passed.
    assert_node_alive
    echo 'pong'
    ;;
  escript)
    # Run an escript under the node's environment, forwarding every
    # positional argument untouched; any failure becomes exit status 1.
    relx_escript "$@" || exit 1
    ;;
  attach)
    # Replace this shell with to_erl, connected through the pipe directory.
    assert_node_alive
    # Discard the first positional argument (presumably the command word).
    shift
    exec "${BINDIR}/to_erl" "${PIPE_DIR}"
    ;;
  remote_console)
    # Open a remote shell (remsh) once the node is confirmed alive.
    assert_node_alive
    # Discard the first positional argument (presumably the command word).
    shift
    remsh
    ;;
  upgrade | downgrade | install | unpack | uninstall)
    # Release-handling commands. Each one needs a version as the second
    # positional argument and is delegated to install_upgrade.escript.
    [ -n "${2:-}" ] || {
      echo "Missing version argument"
      echo "Usage: $REL_NAME $COMMAND {version}"
      exit 1
    }
    # Drop the command word; what remains (the version, plus any extras)
    # is forwarded to the escript.
    shift
    assert_node_alive
    # EPMD_ARGS are appended to ERL_FLAGS only for the exec'ed escript.
    ERL_FLAGS="${ERL_FLAGS:-} $EPMD_ARGS" \
      exec "$BINDIR/escript" \
      "$RUNNER_ROOT_DIR/bin/install_upgrade.escript" \
      "$COMMAND" \
      "{'$REL_NAME', \"$NAME_TYPE\", '$NAME', '$COOKIE'}" \
      "$@"
    ;;
  versions)
    # Hand the "versions" sub-command to install_upgrade.escript, together
    # with the node description tuple and any remaining arguments.
    assert_node_alive
    # Discard the first positional argument (presumably the command word).
    shift
    # EPMD_ARGS are appended to ERL_FLAGS only for the exec'ed escript.
    ERL_FLAGS="${ERL_FLAGS:-} $EPMD_ARGS" \
      exec "$BINDIR/escript" \
      "$RUNNER_ROOT_DIR/bin/install_upgrade.escript" \
      "versions" \
      "{'$REL_NAME', \"$NAME_TYPE\", '$NAME', '$COOKIE'}" \
      "$@"
    ;;
  console | console_clean | foreground)
    # Boot the VM in this very process, by exec'ing either erlexec or iex.
    #
    # Boot script selection: normally the .boot file is named after the
    # release ($REL_NAME), with "start" as the fallback; for debugging,
    # console_clean boots start_clean instead.
    if [ "$COMMAND" = console_clean ]; then
      BOOTFILE="$REL_DIR/start_clean"
    elif [ -f "$REL_DIR/$REL_NAME.boot" ]; then
      BOOTFILE="$REL_DIR/$REL_NAME"
    else
      BOOTFILE="$REL_DIR/start"
    fi

    # Only the foreground command gets extra emulator flags.
    if [ "$COMMAND" = foreground ]; then
      FOREGROUNDOPTIONS="-noshell -noinput +Bd"
    else
      FOREGROUNDOPTIONS=''
    fi

    # Logging setup has to happen before generate_config.
    case "${_EMQX_START_DAEMON_MODE:-}" in
      1)
        tr_log_to_env
        ;;
      *)
        maybe_log_to_console
        ;;
    esac

    # Generate app.config and vm.args
    generate_config "$NAME_TYPE" "$NAME"
    check_license

    # Variables required by beam
    export EMU="beam" PROGNAME="${0}"

    # Remember the arguments we were called with: the `set --` calls below
    # overwrite the positional parameters.
    ARGS="$*"

    # Assemble the boot command in the positional parameters. It is built
    # here, ahead of the exec, because the same command is logged first.
    # FOREGROUNDOPTIONS and EPMD_ARGS are left unquoted in the erlexec
    # branch so that they split into separate words.
    # shellcheck disable=SC2086
    if [ "$IS_ELIXIR" != no ] && [ "${EMQX_CONSOLE_FLAVOR:-}" != 'erl' ]; then
      set -- "$REL_DIR/iex" \
        --boot "$BOOTFILE" \
        --boot-var RELEASE_LIB "${ERTS_LIB_DIR}" \
        --erl-config "${CONF_FILE}" \
        --vm-args "${ARGS_FILE}" \
        --erl "$FOREGROUNDOPTIONS" \
        --erl "-mode $CODE_LOADING_MODE" \
        --erl "$EPMD_ARGS" \
        --werl
    else
      # RELEASE_LIB is passed down so that an Erlang node can still be
      # booted from the elixir release (IS_ELIXIR=no).
      set -- "$BINDIR/erlexec" \
        $FOREGROUNDOPTIONS \
        -boot "$BOOTFILE" \
        -boot_var RELEASE_LIB "$ERTS_LIB_DIR" \
        -boot_var ERTS_LIB_DIR "$ERTS_LIB_DIR" \
        -mode "$CODE_LOADING_MODE" \
        -config "$CONF_FILE" \
        -args_file "$ARGS_FILE" \
        $EPMD_ARGS
    fi

    # Log the startup. -emqx_data_dir is part of the boot command so that
    # it shows up in 'ps -ef'.
    logger -t "${REL_NAME}[$$]" "EXEC: $* -- ${1+$ARGS} -emqx_data_dir ${DATA_DIR}"

    # Start the VM, replacing this shell.
    exec "$@" -- ${1+$ARGS} -emqx_data_dir "${DATA_DIR}"
    ;;
  ctl)
    # Pass the remaining arguments to emqx_ctl:run_command through the
    # nodetool "rpc_infinity" call.
    assert_node_alive
    # Discard the first positional argument (presumably the command word).
    shift
    relx_nodetool rpc_infinity emqx_ctl run_command "$@"
    ;;
  rpc)
    # Forward the remaining arguments to the nodetool "rpc" call.
    assert_node_alive
    # Discard the first positional argument (presumably the command word).
    shift
    relx_nodetool rpc "$@"
    ;;
  rpcterms)
    # Forward the remaining arguments to the nodetool "rpcterms" call.
    assert_node_alive
    # Discard the first positional argument (presumably the command word).
    shift
    relx_nodetool rpcterms "$@"
    ;;
  eval)
    # Evaluate an expression against the running node. An elixir release
    # uses the bundled elixir launcher with --rpc-eval; any other release
    # uses the nodetool "eval" call.
    assert_node_alive
    # Discard the first positional argument (presumably the command word).
    shift
    case "$IS_ELIXIR" in
      yes)
        # The helper node is hidden and gets a name derived from
        # relx_gen_id and $NAME.
        "$REL_DIR/elixir" \
          --hidden \
          --name "rand-$(relx_gen_id)-$NAME" \
          --cookie "$COOKIE" \
          --boot "$REL_DIR/start_clean" \
          --boot-var RELEASE_LIB "$ERTS_LIB_DIR" \
          --vm-args "$REL_DIR/remote.vm.args" \
          --erl "-start_epmd false -epmd_module ekka_epmd" \
          --rpc-eval "$NAME" "$@"
        ;;
      *)
        relx_nodetool "eval" "$@"
        ;;
    esac
    ;;
  eval-erl)
    # Always evaluate through the nodetool "eval" call, whatever the value
    # of IS_ELIXIR.
    assert_node_alive
    # Discard the first positional argument (presumably the command word).
    shift
    relx_nodetool eval "$@"
    ;;
  *)
    # Any command not matched by an earlier arm: show the usage text for it
    # and exit with status 1.
    usage "${COMMAND}"
    exit 1
    ;;
  928. esac
  929. exit 0