zioinfo-mail/workspace/guardia-itsm/scripts/sm/agent/agent_scouter_sm.sh
DESKTOP-TKLFCPR\ython cfe2901a55 refactor(structure): consolidate all projects under workspace/
- itsm/    -> workspace/guardia-itsm/
- manager/ -> workspace/guardia-manager/
- app/     -> workspace/guardia-messenger/
- manual/  -> workspace/guardia-docs/

workspace/zioinfo-web/ unchanged.
git mv preserves full commit history.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-05-31 23:50:56 +09:00

137 lines
6.5 KiB
Bash

#!/bin/bash
# ============================================================
# GUARDiA SM | agent_scouter_sm.sh
# Target: Scouter APM (Collector / Host-Agent / Java-Agent)
# Parameters (environment variables, defaults shown):
#   SCOUTER_HOME=/opt/scouter
#   SC_COLLECTOR_HOST=localhost   SC_COLLECTOR_PORT=6100
#   SC_WEB_PORT=6180              SC_COLLECTOR_UDP=6100
# NOTE(review): SC_COLLECTOR_UDP is listed above, but this block assigns
# no default for it.
# ============================================================
set -euo pipefail

# Keep any value supplied by the caller; otherwise fall back to the default.
: "${SCOUTER_HOME:=/opt/scouter}"
: "${SC_COLLECTOR_HOST:=localhost}"
: "${SC_COLLECTOR_PORT:=6100}"
: "${SC_WEB_PORT:=6180}"

# Status tags used in every report line.
OK="[OK]"
WARN="[WARN]"
CRIT="[CRIT]"
# Rule printed in each section heading.
SEP="─────────────────────────────────────────"
# Overall exit code; starts at 0 and is raised by the checks below.
RESULT=0

# Report banner: short host name and the check start time.
printf '%s\n' \
  "======================================================" \
  " GUARDiA SM 점검 | Scouter APM | $(hostname -s)" \
  " 점검 시각: $(date '+%Y-%m-%d %H:%M:%S %Z')" \
  "======================================================"
# ── 1. Scouter Collector ──────────────────────────────────

# Report whether a socket is listening on a port.
#   $1 - ss protocol flag letter: t (TCP) or u (UDP)
#   $2 - protocol label printed in the report line
#   $3 - port number
# Reads OK / WARN; writes one report line to stdout.
_collector_port_status() {
  local sockets
  # Capture first, then search the captured text. With pipefail,
  # `ss | grep -q` can fail spuriously: grep exits on the first match and
  # ss may then be killed by SIGPIPE, turning a hit into a WARN.
  sockets=$(ss "-${1}lnp" 2>/dev/null || true)
  if grep -q ":${3} " <<<"$sockets"; then
    echo " ${OK} ${2} 포트 ${3} LISTEN"
  else
    echo " ${WARN} ${2} 포트 ${3} LISTEN 없음"
  fi
}

# Check the Collector process, its resident memory and its TCP/UDP ports.
# Reads:  OK WARN CRIT SEP SC_COLLECTOR_PORT, optional SC_COLLECTOR_UDP
# Writes: COLL_PROC (number of matching processes); RESULT=2 when no
#         Collector process is found.
check_collector() {
  local -a pids=()
  local rss_kb

  echo; echo "[$SEP] 1. Scouter Collector"

  # pgrep patterns are extended regexes, so alternation is a bare `|`
  # (`\|` would match a literal pipe character). `|| true` keeps pgrep's
  # "no match" status from failing the substitution.
  # The previous catch-all `pgrep -f "scouter"` is intentionally gone: it
  # also matched this script's own command line (agent_scouter_sm.sh) and
  # any Scouter agent, so the CRIT branch could not be reached.
  mapfile -t pids < <(
    pgrep -f 'scouter.server|ScouterCollector|scouter-collector' 2>/dev/null || true
  )
  COLL_PROC=${#pids[@]}

  if (( COLL_PROC > 0 )); then
    echo " ${OK} Scouter Collector 실행 중"
    # VmRSS is reported in kB; show whole MB, or N/A when unreadable.
    rss_kb=$(awk '/VmRSS/{print $2}' "/proc/${pids[0]}/status" 2>/dev/null || true)
    if [[ "$rss_kb" =~ ^[0-9]+$ ]]; then
      echo " RSS 메모리: $(( rss_kb / 1024 )) MB"
    else
      echo " RSS 메모리: N/A MB"
    fi
  else
    echo " ${CRIT} Scouter Collector 프로세스 없음"
    RESULT=2
  fi

  # Listening ports. The UDP port follows SC_COLLECTOR_UDP when it is
  # set and otherwise the TCP collector port, as before.
  _collector_port_status t TCP "${SC_COLLECTOR_PORT}"
  _collector_port_status u UDP "${SC_COLLECTOR_UDP:-${SC_COLLECTOR_PORT}}"
}

check_collector
# ── 2. Scouter Web (optional) ────────────────────────────────

# Check the Web API listening port and, when curl is available, the HTTP
# status returned by /scouter/v1/info/server.
# Reads:  OK WARN SEP SC_COLLECTOR_HOST SC_WEB_PORT
# Writes: HTTP_CODE (status code string, or "ERR" when curl fails)
check_scouter_web() {
  local sockets

  echo; echo "[$SEP] 2. Scouter Web API"

  # Search captured output instead of piping into `grep -q`; under
  # pipefail the pipe form can fail when grep exits before ss finishes.
  sockets=$(ss -tlnp 2>/dev/null || true)
  if grep -q ":${SC_WEB_PORT} " <<<"$sockets"; then
    echo " ${OK} Web API 포트 ${SC_WEB_PORT} LISTEN"
  else
    echo " ${WARN} Web API 포트 ${SC_WEB_PORT} LISTEN 없음 (별도 배포 시 무시)"
  fi

  if command -v curl &>/dev/null; then
    # On a failed transfer curl still writes the -w text ("000") before
    # exiting non-zero, so the fallback must replace the value rather than
    # be echoed after it (which produced "000ERR").
    HTTP_CODE=$(curl -sk -o /dev/null -w "%{http_code}" \
      --max-time 5 "http://${SC_COLLECTOR_HOST}:${SC_WEB_PORT}/scouter/v1/info/server" \
      2>/dev/null) || HTTP_CODE="ERR"
    # 2xx and 3xx count as a healthy response.
    if [[ "$HTTP_CODE" == [23]* ]]; then
      echo " ${OK} Web API 응답: ${HTTP_CODE}"
    else
      echo " ${WARN} Web API 응답: ${HTTP_CODE}"
    fi
  fi
}

check_scouter_web
# ── 3. Host Agent ─────────────────────────────────────────

# Report whether a Scouter Host Agent process is running.
# Reads:  OK WARN SEP
# Writes: HOST_PROC (number of matching processes)
check_host_agent() {
  local -a pids=()

  echo; echo "[$SEP] 3. Scouter Host Agent"

  # pgrep uses extended regexes: alternation is `|`, not `\|` (which
  # matches a literal pipe). Counting array entries also avoids the
  # two-line "0\n0" that `pgrep | wc -l || echo 0` produced under pipefail.
  # NOTE(review): confirm these patterns match how the host agent is
  # actually launched in this deployment.
  mapfile -t pids < <(
    pgrep -f 'scouter.agent.host|host-agent' 2>/dev/null || true
  )
  HOST_PROC=${#pids[@]}

  if (( HOST_PROC > 0 )); then
    echo " ${OK} Host Agent 실행 중"
  else
    echo " ${WARN} Host Agent 프로세스 없음"
  fi
}

check_host_agent
# ── 4. Processes with a Java Agent attached ────────────────────────

# Count processes whose command line references the Scouter Java agent
# jar and list up to five of them.
# Reads:  OK WARN SEP
# Writes: JAVA_AGENTS (number of matching processes)
check_java_agents() {
  local -a pids=()
  local pid cmd

  echo; echo "[$SEP] 4. Java Agent 연결 현황"

  # Extended-regex alternation is `|`; `\|` matched a literal pipe, so the
  # old pattern found nothing. Counting array entries keeps the count on a
  # single line even when pgrep reports no match.
  mapfile -t pids < <(
    pgrep -f 'scouter.agent.jar|scouter-agent.jar' 2>/dev/null || true
  )
  JAVA_AGENTS=${#pids[@]}
  echo " Scouter Java Agent 연결 수: ${JAVA_AGENTS}"

  if (( JAVA_AGENTS > 0 )); then
    echo " ${OK} Java Agent 활성"
    # First five only. Slicing the array replaces `... | head -5`, whose
    # early exit could SIGPIPE the loop and abort the script under
    # pipefail with set -e.
    for pid in "${pids[@]:0:5}"; do
      cmd=$(ps -p "$pid" -o comm= 2>/dev/null || echo "unknown")
      echo " PID:${pid} CMD:${cmd}"
    done
  else
    echo " ${WARN} Scouter Java Agent 미연결 (WAS에 agent 미설정)"
  fi
}

check_java_agents
# ── 5. Collector data directory ─────────────────────────

# Print the path and disk usage of the first existing candidate data
# directory under SCOUTER_HOME. Prints only the heading when none exists.
# Reads: SEP SCOUTER_HOME
check_data_usage() {
  local dir used

  echo; echo "[$SEP] 5. 데이터 저장 용량"

  for dir in "${SCOUTER_HOME}/server/database" "${SCOUTER_HOME}/database" \
             "${SCOUTER_HOME}/collector/database"; do
    [[ -d "$dir" ]] || continue
    # du may exit non-zero (e.g. an unreadable sub-directory) while still
    # printing a total. Keep whatever it printed and fall back to N/A only
    # when there is no output; the old `|| echo "N/A"` appended N/A to a
    # valid size under pipefail.
    used=$(du -sh "$dir" 2>/dev/null | awk '{print $1}') || true
    echo " 데이터 경로: ${dir}"
    echo " 사용 용량: ${used:-N/A}"
    break
  done
}

check_data_usage
# ── 6. Collector log ─────────────────────────────────────

# Scan the last 500 lines of the newest *.log file in the first existing
# candidate log directory for ERROR / FATAL / Exception.
# Reads:  SEP SCOUTER_HOME
# Writes: RESULT is raised to 1 when matches are found and it was 0.
check_collector_log() {
  local dir candidate latest err_count

  echo; echo "[$SEP] 6. Collector 로그 오류"

  for dir in "${SCOUTER_HOME}/server/logs" "${SCOUTER_HOME}/logs" \
             "${SCOUTER_HOME}/collector/logs"; do
    [[ -d "$dir" ]] || continue

    # Newest regular *.log file by modification time, without parsing ls.
    latest=""
    for candidate in "$dir"/*.log; do
      [[ -f "$candidate" ]] || continue   # unmatched glob stays literal
      if [[ -z "$latest" || "$candidate" -nt "$latest" ]]; then
        latest=$candidate
      fi
    done

    if [[ -n "$latest" && -r "$latest" ]]; then
      # grep -c prints 0 AND exits 1 on no match; `|| true` swallows the
      # status without appending a second "0" as `|| echo 0` did.
      err_count=$(tail -n 500 "$latest" | grep -cE "ERROR|FATAL|Exception" || true)
      echo " 최근 오류: ${err_count}건 (${latest})"
      if (( err_count > 0 )); then
        # Show the last five ERROR/FATAL lines. When only "Exception"
        # lines matched, this grep finds nothing; `|| true` keeps that
        # from aborting the script under set -e with pipefail.
        tail -n 500 "$latest" | grep -E "ERROR|FATAL" | tail -n 5 | sed 's/^/ /' || true
        if (( RESULT < 1 )); then
          RESULT=1
        fi
      fi
    fi
    break
  done
}

check_collector_log
# ── 7. XLog collection check ─────────────────────────────────────

# Count entries whose name contains today's date (YYYYMMDD) in the first
# existing candidate XLog directory.
# Reads:  OK WARN SEP SCOUTER_HOME
# Writes: TODAY_FILES (number of matching entries); RESULT is raised to 1
#         when nothing matches and it was 0.
# NOTE(review): confirm these candidate paths match the on-disk layout of
# the deployed Scouter server.
check_xlog_files() {
  local dir today
  local -a todays=()

  echo; echo "[$SEP] 7. XLog/Counter 수집 파일"

  for dir in "${SCOUTER_HOME}/server/database/xlog" "${SCOUTER_HOME}/database/xlog"; do
    [[ -d "$dir" ]] || continue

    today=$(date +%Y%m%d)
    # Glob instead of `ls | wc -l`: matching directories are counted as
    # one entry each rather than by their contents. Without nullglob an
    # unmatched pattern stays as one literal word, hence the existence test.
    todays=("$dir"/*"$today"*)
    [[ -e "${todays[0]-}" ]] || todays=()
    TODAY_FILES=${#todays[@]}
    echo " 오늘 XLog 파일 수: ${TODAY_FILES} (${dir})"

    # Plain if/else: the old `A && B && C || D` chain printed OK when the
    # count test itself errored, and printed WARN and OK together when
    # RESULT was already non-zero.
    if (( TODAY_FILES == 0 )); then
      echo " ${WARN} 오늘 XLog 없음 (수집 중단 가능성)"
      if (( RESULT < 1 )); then
        RESULT=1
      fi
    else
      echo " ${OK} XLog 수집 중"
    fi
    break
  done
}

check_xlog_files
# ── Summary ─────────────────────────────────────────────────
# Print the verdict line that corresponds to RESULT (0, 1 or 2; any other
# value prints no verdict), then the completion time, and exit with RESULT.
printf '\n%s\n' "======================================================"
if [[ $RESULT == 0 ]]; then
  echo " 최종 결과: ${OK} Scouter APM 정상"
elif [[ $RESULT == 1 ]]; then
  echo " 최종 결과: ${WARN} 주의 항목 있음"
elif [[ $RESULT == 2 ]]; then
  echo " 최종 결과: ${CRIT} 즉시 조치 필요"
fi
printf '%s\n' \
  " 점검 완료: $(date '+%Y-%m-%d %H:%M:%S')" \
  "======================================================"
exit $RESULT