HACMP 5.5 SP8
HA已经打到SP8补丁,但问题依旧:停止HA后,卷组和IP都已经不在了,但是进程都还在。
请各位大侠帮忙分析一下问题。
Status of the RSCT subsystems used by HACMP:
Subsystem Group PID Status
topsvcs topsvcs 450680 active
grpsvcs grpsvcs 454874 active
grpglsm grpsvcs inoperative
emsvcs emsvcs 434418 active
emaixos emsvcs 479244 active
ctrmc rsct 122976 active
Status of the HACMP subsystems:
Subsystem Group PID Status
clcomdES clcomdES 118968 active
clstrmgrES cluster 487474 active
Status of the optional HACMP subsystems:
Subsystem Group PID Status
clinfoES cluster inoperative
Oct 28 11:15:49 EVENT START: event_error 1 TE_FAIL_NODE
:event_error[+52] [[ high = high ]]
:event_error[+52] version=1.13
:event_error[+53] :event_error[+53] cl_get_path
HA_DIR=es
:event_error[+55] EXIT_STATUS=1
:event_error[+56] RP_NAME=1 TE_FAIL_NODE
:event_error[+59] [ 2 -ne 2 ]
:event_error[+65] set -u
:event_error[+68] RP_NAME=FAIL_NODE
:event_error[+69] RP_NAME=FAIL
:event_error[+72] :event_error[+72] cllsclstr -c
:event_error[+72] grep -v cname
:event_error[+72] cut -d : -f2
CLUSTER=hatest
:event_error[+77] [ -x /usr/lpp/ssp/bin/spget_syspar ]
:event_error[+84] dspmsg scripts.cat 9646 WARNING: Cluster hatest Failed while running event [FAIL], exit status was 1n hatest FAIL 1
:event_error[+84] 1> /dev/console
:event_error[+85] dspmsg scripts.cat 9646 WARNING: Cluster hatest Failed while running event [FAIL], exit status was 1n hatest FAIL 1
WARNING: Cluster hatest Failed while running event [FAIL], exit status was 1
:event_error[+90] [[ nodea = nodea ]]
:event_error[+94] dspmsg scripts.cat 9648 Check hacmp.out on this node for errors.n
Check hacmp.out on this node for errors.
:event_error[+94] [[ FAIL = reconfig_resource* ]]
:event_error[+120] :
:event_error[+121] ps -edf
UID PID PPID C STIME TTY TIME CMD
root 1 0 0 10:55:06 - 0:00 /etc/init
root 77940 1 0 10:55:47 - 0:00 /usr/sbin/syncd 60
radiusd 86098 303252 0 10:56:25 - 0:00 /usr/radius/bin/radiusd
root 98466 1 0 10:55:35 - 0:00 /usr/dt/bin/dtlogin -daemon
root 102512 106680 0 10:56:24 - 0:02 dtgreet
root 106680 98466 0 10:55:35 - 0:00 dtlogin <:0> -daemon
root 118968 139374 0 10:56:57 - 0:02 /usr/es/sbin/cluster/clcomd -d
root 122976 139374 0 10:56:27 - 0:00 /usr/sbin/rsct/bin/rmcd -a IBM.LPCommands -r
root 131214 98466 0 10:55:35 - 0:00 /usr/lpp/X11/bin/X -D /usr/lib/X11//rgb -T -force :0 -auth /var/dt/A:0-Ft7kia
root 135234 1 0 10:55:47 - 0:00 /usr/lib/errdemon
root 139374 1 0 10:55:54 - 0:00 /usr/sbin/srcmstr
root 143522 1 0 10:56:21 - 0:00 /usr/sbin/uprintfd
nobody 151724 241784 0 10:56:08 - 0:00 /usr/sbin/tftpd -n
root 159868 139374 0 10:56:03 - 0:00 /usr/sbin/snmpmibd
root 172154 139374 0 10:56:03 - 0:00 /usr/sbin/portmap
root 180314 1 0 10:55:47 - 0:00 /usr/ccs/bin/shlap64
root 188422 221292 0 10:56:14 - 0:00 bootpd /etc/bootptab
root 192662 139374 0 10:56:04 - 0:00 /usr/sbin/aixmibd
root 209056 139374 0 10:56:03 - 0:00 /usr/sbin/snmpd
root 213096 139374 0 10:56:03 - 0:00 /usr/sbin/syslogd
root 217194 139374 0 10:56:03 - 0:00 sendmail: accepting connections
root 221292 139374 0 10:56:03 - 0:00 /usr/sbin/inetd
daemon 225448 139374 0 10:56:14 - 0:00 /usr/sbin/rpc.statd -d 0 -t 50
root 229488 139374 0 10:56:03 - 0:00 /usr/sbin/hostmibd
root 233688 221292 0 10:56:16 - 0:00 telnetd -a
root 237688 139374 0 10:56:07 - 0:00 /usr/sbin/muxatmd
root 241784 139374 0 10:56:08 - 0:00 /usr/sbin/tftpd -n
root 250032 233688 0 10:56:16 pts/0 0:00 -ksh
root 254098 139374 0 10:56:14 - 0:00 /usr/sbin/rpc.lockd -d 0
root 258218 139374 0 10:56:13 - 0:00 /usr/sbin/rpc.mountd
root 266404 139374 0 10:56:20 - 0:00 /usr/sbin/writesrv
root 270516 139374 0 10:56:13 - 0:00 /usr/sbin/nfsd -gpx 0 -gp on -P /var/adm/nfsv4 3891
root 274622 1 0 10:56:14 - 0:00 /usr/sbin/cron
root 278674 139374 0 10:56:17 - 0:00 /usr/sbin/qdaemon
root 282764 139374 0 10:56:13 - 0:00 /usr/sbin/biod 6
root 286868 1 0 10:56:25 - 0:00 /usr/bin/topasrec -L -s 300 -R 1 -r 6 -o /etc/perf/daily/ -ypersistent=1 -O type=bin -ystart_time=10:56:25,Oct28,2011
root 295062 1 0 10:56:43 - 0:03 /usr/java14/jre/bin/java -Dderby.system.home=/usr/ibm/common/acsi/repos -Xrs -Djava.library.path=/tmp/acsisvc/4b3ed88a:/usr/java14/jre/bin:/usr/java14/jre/bin/classic:/usr/java14/jre/bin:/usr/ibm/common/acsi/lib:/usr/java14/jre/bin/sovvm:/usr/lib: -classpath /tmp/acsisvc/4b3ed88a/sisvboot.jar:/tmp/acsisvc/4b3ed88a/setup.jar:/tmp/acsisvc/4b3ed88a/jlog.jar:/tmp/acsisvc/4b3ed88a/derbynet.jar:/tmp/acsisvc/4b3ed88a/derbytools.jar:/tmp/acsisvc/4b3ed88a/derby.jar:/tmp/acsisvc/4b3ed88a/xercesImpl.jar: com.ibm.ac.si.service.ACSIServiceManager -sipath /usr/ibm/common/acsi -start -jardir /tmp/acsisvc/4b3ed88a -completionfile /tmp/acsisvc/4b3ed88a/oresult -errorfile /tmp/acsisvc/4b3ed88a/eresult
radiusd 303252 139374 0 10:56:24 - 0:00 /usr/radius/bin/radiusd
radiusd 307354 303252 0 10:56:25 - 0:00 /usr/radius/bin/radiusd
root 327848 1 0 10:56:24 - 0:00 /usr/sbin/getty /dev/tty2
root 331940 1 0 10:56:24 lft0 0:00 /usr/sbin/getty /dev/lft0
root 344232 1 0 10:56:24 - 0:00 /usr/sbin/getty /dev/tty1
root 348330 1 0 10:56:24 - 0:00 /usr/lpp/diagnostics/bin/diagd
root 352488 1 0 10:56:51 - 0:00 /usr/sbin/getty /dev/console
root 356588 536670 0 11:15:39 pts/1 0:00 smitty clstop
root 364558 401486 1 11:15:49 - 0:00 ps -edf
root 372942 139374 0 10:56:35 - 0:00 /usr/sbin/rsct/bin/IBM.ServiceRMd
root 385202 487474 0 11:15:49 - 0:00 /usr/es/sbin/cluster/clstrmgr
root 393368 426160 0 11:15:44 pts/1 0:00 /usr/es/sbin/cluster/utilities/clrsh nodea -n /usr/es/sbin/cluster/cspoc/cexec clstop -N -s -g
root 397508 139374 0 10:56:35 - 0:00 /usr/sbin/rsct/bin/vac5/IBM.CSMAgentRMd
root 401486 385202 1 11:15:49 - 0:00 /bin/ksh /usr/es/sbin/cluster/events/event_error 1 TE_FAIL_NODE
root 405654 430294 0 11:15:43 pts/1 0:00 /bin/ksh /usr/es/sbin/cluster/sbin/cl_clstop -cspoc -n nodea -N -s -g
root 409770 544806 0 11:15:45 - 0:00 sleep 5
root 413870 405654 0 11:15:44 pts/1 0:00 /bin/ksh93 /usr/es/sbin/cluster/cspoc/cdsh /tmp/cel405654_s3 nodea clstop -N -s -g
root 417886 544806 0 11:15:45 - 0:00 /bin/ksh /usr/es/sbin/cluster/utilities/clstop -N -s -g
root 422090 503952 0 11:15:44 pts/1 0:00 cat
root 426160 520222 0 11:15:44 pts/1 0:00 /bin/ksh /usr/es/sbin/cluster/utilities/cl_rsh nodea -n /usr/es/sbin/cluster/cspoc/cexec clstop -N -s -g
root 430294 356588 0 11:15:43 pts/1 0:00 /bin/ksh /usr/es/sbin/cluster/cspoc/fix_args nop cl_clstop -N -cspoc-n nodea -s -g
root 434418 139374 0 11:14:16 - 0:00 haemd HACMP 1 hatest SECNOSUPPORT
root 438292 499912 0 11:15:44 pts/1 0:00 tee -a /tmp/cel405654_s3.err
root 442380 139374 0 11:14:24 - 0:00 /usr/sbin/gsclvmd
root 446496 450680 0 11:14:11 - 0:00 /usr/sbin/rsct/bin/hats_nim
root 450680 139374 0 11:14:10 - 0:00 /usr/sbin/rsct/bin/hatsd -n 1 -o deadManSwitch
root 454874 139374 1 11:14:13 - 0:00 hagsd grpsvcs
root 458980 450680 0 11:14:11 - 0:00 /usr/sbin/rsct/bin/hats_nim
root 463094 483450 0 11:15:44 - 0:00 /bin/ksh /usr/es/sbin/cluster/cspoc/cexec clstop -N -s -g
root 475306 417886 0 11:15:45 - 0:00 sleep 5
root 479244 139374 0 11:14:19 - 0:00 harmad -t HACMP -n hatest
root 483450 118968 0 11:15:44 - 0:00 /usr/es/sbin/cluster/clcomd -d
root 487474 139374 3 11:11:23 - 0:00 /usr/es/sbin/cluster/clstrmgr
root 491762 450680 0 11:14:11 - 0:00 /usr/sbin/rsct/bin/hats_diskhb_nim
root 495804 139374 0 11:09:46 - 0:00 /usr/sbin/rsct/bin/IBM.HostRMd
root 499912 413870 0 11:15:44 pts/1 0:00 /bin/ksh93 /usr/es/sbin/cluster/cspoc/cdsh /tmp/cel405654_s3 nodea clstop -N -s -g
root 503952 413870 0 11:15:44 pts/1 0:00 /bin/ksh93 /usr/es/sbin/cluster/cspoc/cdsh /tmp/cel405654_s3 nodea clstop -N -s -g
root 516226 499912 0 11:15:44 pts/1 0:00 cat
root 520222 413870 0 11:15:44 pts/1 0:00 /usr/bin/perl /usr/es/sbin/cluster/cspoc/dsh -w nodea /usr/es/sbin/cluster/cspoc/cexec clstop -N -s -g
root 524530 520222 0 11:15:44 pts/1 0:00 /usr/bin/perl /usr/es/sbin/cluster/cspoc/dsh -w nodea /usr/es/sbin/cluster/cspoc/cexec clstop -N -s -g
root 528392 250032 0 11:15:30 pts/0 0:00 tail -f /var/hacmp/log/hacmp.out
root 532538 221292 0 11:15:34 - 0:00 telnetd -a
root 536670 532538 0 11:15:34 pts/1 0:00 -ksh
root 540896 487474 0 11:14:57 - 0:00 run_rcovcmd
root 544806 463094 0 11:15:44 - 0:00 /bin/ksh /usr/es/sbin/cluster/utilities/clstop -N -s -g
root 549102 499912 0 11:15:44 pts/1 0:00 grep -v : RETURN_CODE=
root 553072 503952 0 11:15:44 pts/1 0:00 tee -a /tmp/cel405654_s3.out
:event_error[+122] :
:event_error[+128] set +u
:event_error[+129] [[ != disable ]]
:event_error[+131] /usr/es/sbin/cluster/utilities/cl_sel
:cl_sel[46] FFDC_DIRECTORY=/tmp/ibmsupt/hacmp
:cl_sel[49] uname -m
:cl_sel[49] UNAME=0055823C4C00
:cl_sel[55] PLATFORM=__AIX__
:cl_sel[55] export PLATFORM
:cl_sel[62] [[ __AIX__ == __AIX__ ]]
:cl_sel[63] tail -1
:cl_sel[63] awk '{ print $3 }'
:cl_sel[63] df -k /tmp
:cl_sel[63] FREE_SPACE=578356
:cl_sel[71] REQUIRED_SPACE=20000
:cl_sel[72] [ 578356 -lt 20000 ]
:cl_sel[82] test -d /tmp/ibmsupt/hacmp
:cl_sel[83] [ 0 -ne 0 ]
:cl_sel[94] date +%Y.%m.%d.%H.%M
:cl_sel[94] TIMESTAMP=2011.10.28.11.15
:cl_sel[95] [[ -z 2011.10.28.11.15 ]]
:cl_sel[105] grep 'value ='
:cl_sel[105] awk -F '"' '{print $2}'
:cl_sel[105] odmget -qname=hacmp.out HACMPlogs
:cl_sel[105] LOG_DIRECTORY=/var/hacmp/log
:cl_sel[107] [[ -z /var/hacmp/log ]]
:cl_sel[117] tar cvf /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.11.15 /var/hacmp/log/hacmp.out /var/hacmp/log/hacmp.out.1 /var/hacmp/log/hacmp.out.2 /var/hacmp/log/hacmp.out.3 /var/hacmp/log/hacmp.out.4 /var/hacmp/log/hacmp.out.5 /var/hacmp/log/hacmp.out.6 /var/hacmp/log/hacmp.out.7
:cl_sel[117] 1> /dev/null 2>& 1
:cl_sel[118] [ 0 -ne 0 ]
:cl_sel[125] compress /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.11.15
:cl_sel[125] 1> /dev/null 2>& 1
:cl_sel[130] wc -l
:cl_sel[130] ls -1 /tmp/ibmsupt/hacmp/eventlogs.2011.10.27.22.39.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.27.22.49.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.27.22.55.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.10.44.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.11.09.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.11.15.Z
:cl_sel[130] 2> /dev/null
:cl_sel[130] FFDC_COUNT=' 6'
:cl_sel[131] [ ' 6' -gt 5 ]
:cl_sel[133] expr 6 - 5
:cl_sel[133] number_to_rm=1
:cl_sel[134] head -1
:cl_sel[134] ls -rt1 /tmp/ibmsupt/hacmp/eventlogs.2011.10.27.22.39.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.27.22.49.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.27.22.55.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.10.44.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.11.09.Z /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.11.15.Z
:cl_sel[134] FFDC_LIST=/tmp/ibmsupt/hacmp/eventlogs.2011.10.27.22.39.Z
:cl_sel[137] rm -f /tmp/ibmsupt/hacmp/eventlogs.2011.10.27.22.39.Z
:cl_sel[141] dspmsg scripts.cat 10059 'FFDC event log collection saved to /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.11.15n' /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.11.15
FFDC event log collection saved to /tmp/ibmsupt/hacmp/eventlogs.2011.10.28.11.15
:cl_sel[143] exit 0
:event_error[+134] exit 0
Oct 28 11:15:51 EVENT COMPLETED: event_error 1 TE_FAIL_NODE 0
收起