Quote:
When oom killer is choosing something to kill, it has a preference for processes which are consuming a lot of memory but which are not long lived. The fact that apache seems to get picked first leads me to suspect that it is consuming too much memory. The situation may be being made worse by the io limiter kicking in and delaying swap operations - a possible cause of your meltdown in the early hours of 4th Oct
Well, it doesn't seem like apache is using too much memory... Amavis uses more.
Maybe some daily cronjob is triggering several processes that use lots of memory (not individually, but collectively)? Is it common for cronjobs to behave like that?
I ask because for two consecutive days, the oom killer was triggered at the time when the daily cronjob was running.
The information you asked for follows.
jp
Code:
# ps -e -o pid,cmd,%mem,rss,trs,sz,vsz
PID CMD %MEM RSS TRS SZ VSZ
1 init [2] 0.1 72 24 318 1272
2 [ksoftirqd/0] 0.0 0 0 0 0
3 [events/0] 0.0 0 0 0 0
4 [khelper] 0.0 0 0 0 0
5 [kthread] 0.0 0 0 0 0
6 [kblockd/0] 0.0 0 0 0 0
17 [pdflush] 0.0 0 0 0 0
18 [pdflush] 0.0 0 0 0 0
20 [aio/0] 0.0 0 0 0 0
19 [kswapd0] 0.0 0 0 0 0
21 [jfsIO] 0.0 0 0 0 0
22 [jfsCommit] 0.0 0 0 0 0
23 [jfsSync] 0.0 0 0 0 0
24 [xfslogd/0] 0.0 0 0 0 0
25 [xfsdatad/0] 0.0 0 0 0 0
26 [xfsbufd] 0.0 0 0 0 0
652 [kjournald] 0.0 0 0 0 0
692 [kjournald] 0.0 0 0 0 0
693 [xfssyncd] 0.0 0 0 0 0
738 dhclient eth0 0.0 0 378 479 1916
1040 /usr/sbin/sshd 0.1 92 264 697 2788
1052 /sbin/syslogd 0.4 264 22 336 1344
1055 /sbin/klogd 0.2 160 17 316 1264
1058 /usr/sbin/named 1.3 800 232 2582 10328
1059 /usr/sbin/named 1.3 804 232 2582 10328
1061 /usr/sbin/named 1.3 804 232 2582 10328
1064 /usr/sbin/named 1.3 804 232 2582 10328
1065 /usr/sbin/named 1.3 804 232 2582 10328
1071 amavisd (master) 1.5 908 659 7101 28404
1075 /usr/sbin/spamd 0.0 0 659 5633 22532
1085 spamd child 0.0 0 659 5633 22532
1086 spamd child 0.0 0 659 5633 22532
1087 spamd child 0.0 0 659 5633 22532
1088 spamd child 0.0 0 659 5633 22532
1089 spamd child 0.0 0 659 5633 22532
1090 /usr/sbin/clamd 5.7 3424 35 7987 31948
1131 /usr/bin/freshcl 0.6 392 27 510 2040
1136 /usr/sbin/courie 0.0 0 8 362 1448
1137 /usr/lib/courier 0.0 48 59 515 2060
1139 /usr/lib/courier 0.0 48 59 515 2060
1140 /usr/lib/courier 0.0 48 59 515 2060
1141 /usr/lib/courier 0.0 48 59 515 2060
1142 /usr/lib/courier 0.0 48 59 515 2060
1143 /usr/lib/courier 0.0 48 59 515 2060
1156 /usr/sbin/inetd 0.0 24 15 327 1308
1167 /bin/sh /usr/bin 0.0 0 473 547 2188
1209 /usr/sbin/mysqld 1.9 1180 3692 16294 65176
1216 /usr/sbin/mysqld 1.9 1180 3692 16294 65176
1217 /usr/sbin/mysqld 1.9 1180 3692 16294 65176
1218 /usr/sbin/mysqld 1.9 1180 3692 16294 65176
1315 /usr/lib/postfix 0.3 188 21 628 2512
1319 qmgr -l -t fifo 0.8 496 34 680 2720
1353 /usr/lib/postgre 0.3 188 1457 2137 8548
1355 postgres: stats 0.0 32 1457 2385 9540
1356 postgres: stats 0.1 84 1457 2148 8592
1371 /usr/sbin/courie 0.0 0 8 358 1432
1372 /usr/lib/courier 0.0 0 1452 749 2996
1375 /usr/lib/courier 0.0 0 1452 749 2996
1377 /usr/lib/courier 0.0 0 1452 749 2996
1379 /usr/lib/courier 0.0 0 1452 749 2996
1381 /usr/lib/courier 0.0 0 1452 749 2996
1383 /usr/lib/courier 0.0 0 1452 749 2996
1391 /usr/bin/python2 0.1 72 418 1357 5428
1392 /usr/bin/python2 1.3 820 418 4596 18384
1401 /usr/sbin/cron 0.2 172 21 414 1656
1408 /sbin/getty 3840 0.0 0 10 314 1256
1454 /usr/sbin/doveco 0.2 156 75 614 2456
1456 dovecot-auth 0.8 500 105 972 3888
1486 /usr/sbin/clamd 5.7 3424 35 7987 31948
2770 SCREEN -S im 1.1 660 243 654 2616
2771 /bin/bash 0.0 0 473 557 2228
2774 centericq 2.5 1540 3858 2425 9700
6509 /usr/sbin/sshd 0.0 0 264 1430 5720
6512 /usr/sbin/sshd 0.0 48 264 1464 5856
6513 -bash 0.2 140 473 555 2220
6911 /usr/sbin/sshd 0.0 0 264 1430 5720
6914 /usr/sbin/sshd 0.1 60 264 1455 5820
6915 -bash 0.2 132 473 554 2216
16807 /usr/sbin/mysqld 1.9 1180 3692 16294 65176
18443 /usr/sbin/apache 0.5 324 218 20530 82120
18444 /usr/sbin/apache 8.6 5116 218 21157 84628
18445 /usr/sbin/apache 1.4 836 218 20564 82256
18447 /usr/sbin/apache 3.6 2164 218 20709 82836
18448 /usr/sbin/apache 9.2 5484 218 21276 85104
18449 /usr/sbin/apache 8.6 5128 218 21121 84484
19673 /usr/sbin/apache 5.2 3128 218 21137 84548
19678 /usr/sbin/apache 9.0 5372 218 21223 84892
19679 /usr/sbin/apache 3.0 1816 218 21311 85244
19680 /usr/sbin/apache 0.9 588 218 20572 82288
19967 /usr/sbin/apache 5.5 3312 218 21230 84920
28516 amavisd (child) 23.9 14216 659 7133 28532
28557 /usr/sbin/sshd 1.3 800 264 1427 5708
28559 /usr/sbin/sshd 1.6 1008 264 1461 5844
28560 -bash 1.4 864 473 556 2224
28952 amavisd (virgin 3.0 1796 659 7101 28404
29752 pickup -l -t fif 1.6 956 6 661 2644
30493 imap-login 2.0 1220 73 622 2488
30564 imap-login 2.0 1220 73 622 2488
30566 imap-login 2.0 1220 73 622 2488
30567 -su 2.1 1248 473 555 2220
30571 ps -e -o pid,cmd 1.0 644 59 514 2056
Code:
# cat /proc/meminfo
MemTotal: 59352 kB
MemFree: 760 kB
Buffers: 348 kB
Cached: 6744 kB
SwapCached: 11184 kB
Active: 45612 kB
Inactive: 2980 kB
HighTotal: 0 kB
HighFree: 0 kB
LowTotal: 59352 kB
LowFree: 760 kB
SwapTotal: 132088 kB
SwapFree: 10052 kB
Dirty: 48 kB
Writeback: 4 kB
Mapped: 42456 kB
Slab: 6896 kB
Committed_AS: 483472 kB
PageTables: 1588 kB
VmallocTotal: 973804 kB
VmallocUsed: 676 kB
VmallocChunk: 973120 kB
Code:
# cat /proc/io_status
io_count=1851754 io_rate=555 io_tokens=398756 token_refill=512 token_max=400000