Dear all Happy new year!
A series of events (recent apt-get upgrade & power failure), has brought one of my servers (software RAID-1 with SiI3112 SATA controller) to the following state: [0] GREP segfaults: helios:/# grep Segmentation fault helios:/# An strace shows the following: execve("/bin/grep", ["grep"], [/* 16 vars */]) = 0 uname({sys="Linux", node="helios", ...}) = 0 brk(0) = 0x805ac7c old_mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x40017000 access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory) open("/etc/ld.so.preload", O_RDONLY) = -1 ENOENT (No such file or directory) open("/etc/ld.so.cache", O_RDONLY) = 3 fstat64(3, {st_mode=S_IFREG|0644, st_size=13447, ...}) = 0 old_mmap(NULL, 13447, PROT_READ, MAP_PRIVATE, 3, 0) = 0x40018000 close(3) = 0 access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory) open("/lib/libc.so.6", O_RDONLY) = 3 read(3, "\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\200^\1"..., 512) = 512 fstat64(3, {st_mode=S_IFREG|0644, st_size=1244080, ...}) = 0 old_mmap(NULL, 1254244, PROT_READ|PROT_EXEC, MAP_PRIVATE, 3, 0) = 0x4001c000 old_mmap(0x40144000, 32768, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED, 3, 0x127000) = 0x40144000 old_mmap(0x4014c000, 9060, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x4014c000 close(3) = 0 munmap(0x40018000, 13447) = 0 --- SIGSEGV (Segmentation fault) @ 0 (0) --- +++ killed by SIGSEGV +++ [1] TAR segfaults too: helios:/# tar -cf boot.tar boot/ Segmentation fault helios:/# Strace shows the following: execve("/bin/tar", ["tar", "-cf", "boot.tar", "boot/"], [/* 15 vars */]) = 0 uname({sys="Linux", node="helios", ...}) = 0 brk(0) = 0x8070d58 old_mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x40017000 access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory) open("/etc/ld.so.preload", O_RDONLY) = -1 ENOENT (No such file or directory) open("/etc/ld.so.cache", O_RDONLY) = 3 fstat64(3, {st_mode=S_IFREG|0644, st_size=13447, ...}) = 0 old_mmap(NULL, 13447, PROT_READ, MAP_PRIVATE, 3, 0) = 0x40018000 close(3) = 0 access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory) open("/lib/librt.so.1", O_RDONLY) = 3 read(3, "[EMAIL PROTECTED]"..., 512) = 512 fstat64(3, {st_mode=S_IFREG|0644, st_size=26884, ...}) = 0 old_mmap(NULL, 69912, PROT_READ|PROT_EXEC, MAP_PRIVATE, 3, 0) = 0x4001c000 old_mmap(0x40022000, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED, 3, 0x6000) = 0x40022000 old_mmap(0x40023000, 41240, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x40023000 close(3) = 0 access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory) open("/lib/libc.so.6", O_RDONLY) = 3 read(3, "\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\200^\1"..., 512) = 512 fstat64(3, {st_mode=S_IFREG|0644, st_size=1244080, ...}) = 0 old_mmap(NULL, 1254244, PROT_READ|PROT_EXEC, MAP_PRIVATE, 3, 0) = 0x4002e000 old_mmap(0x40156000, 32768, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED, 3, 0x127000) = 0x40156000 old_mmap(0x4015e000, 9060, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x4015e000 close(3) = 0 access("/etc/ld.so.nohwcap", F_OK) = -1 ENOENT (No such file or directory) open("/lib/libpthread.so.0", O_RDONLY) = 3 read(3, "\177ELF\1\1\1\0\0\0\0\0\0\0\0\0\3\0\3\0\1\0\0\0\340A\0"..., 512) = 512 fstat64(3, {st_mode=S_IFREG|0644, st_size=81127, ...}) = 0 old_mmap(NULL, 331716, PROT_READ|PROT_EXEC, MAP_PRIVATE, 3, 0) = 0x40161000 old_mmap(0x4016e000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED, 3, 0xc000) = 0x4016e000 old_mmap(0x40170000, 270276, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x40170000 close(3) = 0 old_mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x401b2000 munmap(0x40018000, 13447) = 0 getrlimit(RLIMIT_STACK, {rlim_cur=8192*1024, rlim_max=RLIM_INFINITY}) = 0 setrlimit(RLIMIT_STACK, {rlim_cur=2044*1024, rlim_max=RLIM_INFINITY}) = 0 getpid() = 1478 rt_sigaction(SIGRTMIN, {0x40169030, [], SA_RESTORER, 0x400575e8}, NULL, 8) = 0 rt_sigaction(SIGRT_1, {0x40169080, [], SA_RESTORER, 0x400575e8}, NULL, 8) = 0 rt_sigaction(SIGRT_2, {0x40169150, [], SA_RESTORER, 0x400575e8}, NULL, 8) = 0 rt_sigprocmask(SIG_BLOCK, [RTMIN], NULL, 8) = 0 rt_sigprocmask(SIG_UNBLOCK, [RT_1], NULL, 8) = 0 _sysctl({{CTL_KERN, KERN_VERSION}, 2, 0xbffff804, 30, (nil), 0}) = 0 --- SIGSEGV (Segmentation fault) @ 0 (0) --- +++ killed by SIGSEGV +++ I can't apt-get upgrade anymore (although I see there is a new kernel package out there), since grep is heavily used in the dpkg scripts: helios:/# apt-get upgrade Reading Package Lists... Done Building Dependency Tree... Done The following packages will be upgraded: base-passwd debconf debconf-i18n discover1 kernel-image-2.4.27-1-386 libapache2-mod-php4 libdiscover1 libgcc1 libmysqlclient12 libtiff4 mailx modutils mysql-client mysql-common mysql-server php4 php4-cli php4-common php4-domxml php4-gd php4-mysql phpmyadmin samba-common squid squid-common 25 upgraded, 0 newly installed, 0 to remove and 0 not upgraded. Need to get 0B/24.9MB of archives. After unpacking 1232kB of additional disk space will be used. Do you want to continue? [Y/n] Preconfiguring packages ... /tmp/squid.config.17333: line 72: 1761 Segmentation fault grep -q "^cache_dir[$w]*[^/$w]" /etc/squid/squid.conf /tmp/squid.config.17333: line 72: 1762 Segmentation fault grep -q '^dns_children\|^dns_defnames\|^cache_dns_program' $sq /tmp/squid.config.17333: line 72: 1764 Segmentation fault grep -q '^cache_dir' $sq /tmp/php4-mysql.config.17337: line 30: 1779 Segmentation fault grep -q "^[[:space:]]*extension[[:space:]]*=[[:space:]]*mysql.so" "/etc/php4/$SAPI/php.ini" /tmp/php4-mysql.config.17337: line 30: 1781 Segmentation fault grep -q "^[[:space:]]*extension[[:space:]]*=[[:space:]]*mysql.so" "/etc/php4/$SAPI/php.ini" /tmp/php4-domxml.config.17339: line 30: 1784 Segmentation fault grep -q "^[[:space:]]*extension[[:space:]]*=[[:space:]]*domxml.so" "/etc/php4/$SAPI/php.ini" /tmp/php4-domxml.config.17339: line 30: 1786 Segmentation fault grep -q "^[[:space:]]*extension[[:space:]]*=[[:space:]]*domxml.so" "/etc/php4/$SAPI/php.ini" /tmp/php4-gd.config.173311: line 30: 1789 Segmentation fault grep -q "^[[:space:]]*extension[[:space:]]*=[[:space:]]*gd.so" "/etc/php4/$SAPI/php.ini" /tmp/php4-gd.config.173311: line 30: 1791 Segmentation fault grep -q "^[[:space:]]*extension[[:space:]]*=[[:space:]]*gd.so" "/etc/php4/$SAPI/php.ini" /tmp/samba-common.config.173315: line 41: 1797 Segmentation fault grep -v dhcp.conf $FILE 1798 | grep -qEi '\\$|^[[:space:]]*include[[:space:]]*=' /tmp/samba-common.config.173315: line 154: 1821 Segmentation fault grep -q -i 'wins server' $FILE dpkg-deb: subprocess tar killed by signal (Segmentation fault) dpkg: error processing /var/cache/apt/archives/base-passwd_3.5.9_i386.deb (--unpack): subprocess dpkg-deb --control returned error exit status 2 Errors were encountered while processing: /var/cache/apt/archives/base-passwd_3.5.9_i386.deb E: Sub-process /usr/bin/dpkg returned an error code (1) helios:/# Some information about the machine: helios:~# cat /proc/cpuinfo processor : 0 vendor_id : GenuineIntel cpu family : 6 model : 7 model name : Pentium III (Katmai) stepping : 3 cpu MHz : 400.913 cache size : 512 KB fdiv_bug : no hlt_bug : no f00f_bug : no coma_bug : no fpu : yes fpu_exception : yes cpuid level : 2 wp : yes flags : fpu vme de pse tsc msr pae mce cx8 apic sep mtrr pge mca cmov pat pse36 mmx fxsr sse bogomips : 799.53 helios:~# free -m total used free shared buffers cached Mem: 504 210 293 0 15 147 -/+ buffers/cache: 48 456 Swap: 525 0 525 helios:~# df -h Filesystem Size Used Avail Use% Mounted on /dev/md1 4.6G 404M 4.0G 10% / /dev/md3 71G 2.9G 68G 5% /srv helios:~# cat /proc/mdstat Personalities : [raid1] read_ahead 1024 sectors md2 : active raid1 ide/host2/bus1/target0/lun0/part2[0] ide/host2/bus0/target0/lun0/part2[1] 538112 blocks [2/2] [UU] md3 : active raid1 ide/host2/bus1/target0/lun0/part3[0] ide/host2/bus0/target0/lun0/part3[1] 74613824 blocks [2/2] [UU] md1 : active raid1 ide/host2/bus1/target0/lun0/part1[0] ide/host2/bus0/target0/lun0/part1[1] 4883648 blocks [2/2] [UU] unused devices: <none> helios:~# lsmod Module Size Used by Not tainted nls_cp437 4284 0 (autoclean) sd_mod 10764 0 (autoclean) (unused) scsi_mod 86020 1 (autoclean) [sd_mod] usb-uhci 19504 0 (unused) usbcore 52268 1 [usb-uhci] rivafb 36144 63 fbcon-cfb16 3752 0 [rivafb] fbcon-cfb32 3656 0 [rivafb] fbcon-cfb8 3176 0 [rivafb] cmpci 25164 1 soundcore 3268 2 [cmpci] gameport 1388 0 [cmpci] 8139too 12328 1 mii 1952 0 [8139too] crc32 2848 0 [8139too] agpgart 39108 0 (unused) ide-cd 27040 0 cdrom 26212 0 [ide-cd] rtc 5768 0 (autoclean) ide-detect 288 0 (autoclean) (unused) siimage 6916 1 (autoclean) piix 7784 1 (autoclean) ide-disk 12416 6 (autoclean) ide-core 91800 6 (autoclean) [ide-cd ide-detect siimage piix ide-disk] unix 12720 13 (autoclean) raid1 11216 3 (autoclean) md 54880 6 (autoclean) [raid1] ext3 65388 2 (autoclean) jbd 34628 2 (autoclean) [ext3] helios:~# uname -a Linux helios 2.4.27-1-386 #1 Fri Sep 3 06:24:46 UTC 2004 i686 GNU/Linux What can I do to fix this? -A -- To UNSUBSCRIBE, email to [EMAIL PROTECTED] with a subject of "unsubscribe". Trouble? Contact [EMAIL PROTECTED]