4 * The contents of this file are subject to the terms of the
5 * Common Development and Distribution License (the "License").
6 * You may not use this file except in compliance with the License.
8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9 * or http://www.opensolaris.org/os/licensing.
10 * See the License for the specific language governing permissions
11 * and limitations under the License.
13 * When distributing Covered Code, include this CDDL HEADER in each
14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15 * If applicable, add the following below this CDDL HEADER, with the
16 * fields enclosed by brackets "[]" replaced with your own identifying
17 * information: Portions Copyright [yyyy] [name of copyright owner]
22 * Copyright (c) 1983, 2010, Oracle and/or its affiliates. All rights reserved.
23 * Copyright 2016 Joyent, Inc.
26 * Copyright 2016 Nexenta Systems, Inc. All rights reserved.
43 #include <libnvpair.h>
46 #include <sys/statvfs.h>
47 #include <sys/dumphdr.h>
48 #include <sys/dumpadm.h>
49 #include <sys/compress.h>
50 #include <sys/panic.h>
51 #include <sys/sysmacros.h>
53 #include <sys/resource.h>
54 #include <bzip2/bzlib.h>
55 #include <sys/fm/util.h>
56 #include <fm/libfmevent.h>
57 #include <sys/int_fmtio.h>
60 /* fread/fwrite buffer size */
61 #define FBUFSIZE (1ULL << 20)
63 /* minimum size for output buffering */
64 #define MINCOREBLKSIZE (1ULL << 17)
66 /* create this file if metrics collection is enabled in the kernel */
67 #define METRICSFILE "METRICS.csv"
69 static char progname
[9] = "savecore";
70 static char *savedir
; /* savecore directory */
71 static char *dumpfile
; /* source of raw crash dump */
72 static long bounds
= -1; /* numeric suffix */
73 static long pagesize
; /* dump pagesize */
74 static int dumpfd
= -1; /* dumpfile descriptor */
75 static boolean_t have_dumpfile
= B_TRUE
; /* dumpfile existence */
76 static dumphdr_t corehdr
, dumphdr
; /* initial and terminal dumphdrs */
77 static boolean_t dump_incomplete
; /* dumphdr indicates incomplete */
78 static boolean_t fm_panic
; /* dump is the result of fm_panic */
79 static offset_t endoff
; /* offset of end-of-dump header */
80 static int verbose
; /* chatty mode */
81 static int disregard_valid_flag
; /* disregard valid flag */
82 static int livedump
; /* dump the current running system */
83 static int interactive
; /* user invoked; no syslog */
84 static int csave
; /* save dump compressed */
85 static int filemode
; /* processing file, not dump device */
86 static int percent_done
; /* progress indicator */
87 static int sec_done
; /* progress last report time */
88 static hrtime_t startts
; /* timestamp at start */
89 static volatile uint64_t saved
; /* count of pages written */
90 static volatile uint64_t zpages
; /* count of zero pages not written */
91 static dumpdatahdr_t datahdr
; /* compression info */
92 static long coreblksize
; /* preferred write size (st_blksize) */
93 static int cflag
; /* run as savecore -c */
94 static int mflag
; /* run as savecore -m */
97 * Payload information for the events we raise. These are used
98 * in raise_event to determine what payload to include.
100 #define SC_PAYLOAD_SAVEDIR 0x0001 /* Include savedir in event */
101 #define SC_PAYLOAD_INSTANCE 0x0002 /* Include bounds instance number */
102 #define SC_PAYLOAD_IMAGEUUID 0x0004 /* Include dump OS instance uuid */
103 #define SC_PAYLOAD_CRASHTIME 0x0008 /* Include epoch crashtime */
104 #define SC_PAYLOAD_PANICSTR 0x0010 /* Include panic string */
105 #define SC_PAYLOAD_PANICSTACK 0x0020 /* Include panic stack */
106 #define SC_PAYLOAD_FAILREASON 0x0040 /* Include failure reason */
107 #define SC_PAYLOAD_DUMPCOMPLETE 0x0080 /* Include completeness indicator */
108 #define SC_PAYLOAD_ISCOMPRESSED 0x0100 /* Dump is in vmdump.N form */
109 #define SC_PAYLOAD_DUMPADM_EN 0x0200 /* Is dumpadm enabled or not? */
110 #define SC_PAYLOAD_FM_PANIC 0x0400 /* Panic initiated by FMA */
111 #define SC_PAYLOAD_JUSTCHECKING 0x0800 /* Run with -c flag? */
114 SC_EVENT_DUMP_PENDING
,
115 SC_EVENT_SAVECORE_FAILURE
,
116 SC_EVENT_DUMP_AVAILABLE
122 #define _SC_PAYLOAD_CMN \
123 SC_PAYLOAD_IMAGEUUID | \
124 SC_PAYLOAD_CRASHTIME | \
125 SC_PAYLOAD_PANICSTR | \
126 SC_PAYLOAD_PANICSTACK | \
127 SC_PAYLOAD_DUMPCOMPLETE | \
128 SC_PAYLOAD_FM_PANIC | \
131 static const struct {
132 const char *sce_subclass
;
133 uint32_t sce_payload
;
136 * SC_EVENT_DUMP_PENDING
139 "dump_pending_on_device",
140 _SC_PAYLOAD_CMN
| SC_PAYLOAD_DUMPADM_EN
|
141 SC_PAYLOAD_JUSTCHECKING
145 * SC_EVENT_SAVECORE_FAILURE
149 _SC_PAYLOAD_CMN
| SC_PAYLOAD_INSTANCE
| SC_PAYLOAD_FAILREASON
153 * SC_EVENT_DUMP_AVAILABLE
157 _SC_PAYLOAD_CMN
| SC_PAYLOAD_INSTANCE
| SC_PAYLOAD_ISCOMPRESSED
161 static void raise_event(enum sc_event_type
, char *);
166 (void) fprintf(stderr
,
167 "usage: %s [-Lvd] [-f dumpfile] [dirname]\n", progname
);
171 #define SC_SL_NONE 0x0001 /* no syslog */
172 #define SC_SL_ERR 0x0002 /* syslog if !interactive, LOG_ERR */
173 #define SC_SL_WARN 0x0004 /* syslog if !interactive, LOG_WARNING */
174 #define SC_IF_VERBOSE 0x0008 /* message only if -v */
175 #define SC_IF_ISATTY 0x0010 /* message only if interactive */
176 #define SC_EXIT_OK 0x0020 /* exit(0) */
177 #define SC_EXIT_ERR 0x0040 /* exit(1) */
178 #define SC_EXIT_PEND 0x0080 /* exit(2) */
179 #define SC_EXIT_FM 0x0100 /* exit(3) */
181 #define _SC_ALLEXIT (SC_EXIT_OK | SC_EXIT_ERR | SC_EXIT_PEND | SC_EXIT_FM)
184 logprint(uint32_t flags
, char *message
, ...)
188 int do_always
= ((flags
& (SC_IF_VERBOSE
| SC_IF_ISATTY
)) == 0);
189 int do_ifverb
= (flags
& SC_IF_VERBOSE
) && verbose
;
190 int do_ifisatty
= (flags
& SC_IF_ISATTY
) && interactive
;
192 static int logprint_raised
= 0;
194 if (do_always
|| do_ifverb
|| do_ifisatty
) {
195 va_start(args
, message
);
196 /*LINTED: E_SEC_PRINTF_VAR_FMT*/
197 (void) vsnprintf(buf
, sizeof (buf
), message
, args
);
198 (void) fprintf(stderr
, "%s: %s\n", progname
, buf
);
200 switch (flags
& (SC_SL_NONE
| SC_SL_ERR
| SC_SL_WARN
)) {
202 /*LINTED: E_SEC_PRINTF_VAR_FMT*/
203 syslog(LOG_ERR
, buf
);
207 /*LINTED: E_SEC_PRINTF_VAR_FMT*/
208 syslog(LOG_WARNING
, buf
);
218 switch (flags
& _SC_ALLEXIT
) {
228 * Raise an ireport saying why we are exiting. Do not
229 * raise if run as savecore -m. If something in the
230 * raise_event codepath calls logprint avoid recursion.
232 if (!mflag
&& logprint_raised
++ == 0)
233 raise_event(SC_EVENT_SAVECORE_FAILURE
, buf
);
243 if (!mflag
&& logprint_raised
++ == 0 && have_dumpfile
)
244 raise_event(SC_EVENT_SAVECORE_FAILURE
, buf
);
253 * System call / libc wrappers that exit on error.
256 Open(const char *name
, int oflags
, mode_t mode
)
260 if ((fd
= open(name
, oflags
, mode
)) == -1)
261 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "open(\"%s\"): %s",
262 name
, strerror(errno
));
267 Fread(void *buf
, size_t size
, FILE *f
)
269 if (fread(buf
, size
, 1, f
) != 1)
270 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "fread: %s",
275 Fwrite(void *buf
, size_t size
, FILE *f
)
277 if (fwrite(buf
, size
, 1, f
) != 1)
278 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "fwrite: %s",
283 Fseek(offset_t off
, FILE *f
)
285 if (fseeko(f
, off
, SEEK_SET
) != 0)
286 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "fseeko64: %s",
290 typedef struct stat Stat_t
;
293 Fstat(int fd
, Stat_t
*sb
, const char *fname
)
295 if (fstat(fd
, sb
) != 0)
296 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "fstat(\"%s\"): %s", fname
,
301 Stat(const char *fname
, Stat_t
*sb
)
303 if (stat(fname
, sb
) != 0) {
304 have_dumpfile
= B_FALSE
;
305 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "failed to get status "
306 "of file %s", fname
);
311 Pread(int fd
, void *buf
, size_t size
, offset_t off
)
313 ssize_t sz
= pread(fd
, buf
, size
, off
);
316 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
317 "pread: %s", strerror(errno
));
319 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
320 "pread: size %ld != %ld", sz
, size
);
324 Pwrite(int fd
, void *buf
, size_t size
, off64_t off
)
326 if (pwrite(fd
, buf
, size
, off
) != size
)
327 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "pwrite: %s",
336 if ((buf
= calloc(size
, 1)) == NULL
)
337 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "calloc: %s",
343 read_number_from_file(const char *filename
, long default_value
)
345 long file_value
= -1;
348 if ((fp
= fopen(filename
, "r")) != NULL
) {
349 (void) fscanf(fp
, "%ld", &file_value
);
352 return (file_value
< 0 ? default_value
: file_value
);
359 dumpfd
= Open(dumpfile
, O_RDONLY
, 0644);
361 dumpfd
= Open(dumpfile
, O_RDWR
| O_DSYNC
, 0644);
362 endoff
= llseek(dumpfd
, -DUMP_OFFSET
, SEEK_END
) & -DUMP_OFFSET
;
363 Pread(dumpfd
, &dumphdr
, sizeof (dumphdr
), endoff
);
364 Pread(dumpfd
, &datahdr
, sizeof (datahdr
), endoff
+ sizeof (dumphdr
));
366 pagesize
= dumphdr
.dump_pagesize
;
368 if (dumphdr
.dump_magic
!= DUMP_MAGIC
)
369 logprint(SC_SL_NONE
| SC_EXIT_PEND
, "bad magic number %x",
372 if ((dumphdr
.dump_flags
& DF_VALID
) == 0 && !disregard_valid_flag
)
373 logprint(SC_SL_NONE
| SC_IF_VERBOSE
| SC_EXIT_OK
,
374 "dump already processed");
376 if (dumphdr
.dump_version
!= DUMP_VERSION
)
377 logprint(SC_SL_NONE
| SC_IF_VERBOSE
| SC_EXIT_PEND
,
378 "dump version (%d) != %s version (%d)",
379 dumphdr
.dump_version
, progname
, DUMP_VERSION
);
381 if (dumphdr
.dump_wordsize
!= DUMP_WORDSIZE
)
382 logprint(SC_SL_NONE
| SC_EXIT_PEND
,
383 "dump is from %u-bit kernel - cannot save on %u-bit kernel",
384 dumphdr
.dump_wordsize
, DUMP_WORDSIZE
);
386 if (datahdr
.dump_datahdr_magic
== DUMP_DATAHDR_MAGIC
) {
387 if (datahdr
.dump_datahdr_version
!= DUMP_DATAHDR_VERSION
)
388 logprint(SC_SL_NONE
| SC_IF_VERBOSE
| SC_EXIT_PEND
,
389 "dump data version (%d) != %s data version (%d)",
390 datahdr
.dump_datahdr_version
, progname
,
391 DUMP_DATAHDR_VERSION
);
393 (void) memset(&datahdr
, 0, sizeof (datahdr
));
394 datahdr
.dump_maxcsize
= pagesize
;
398 * Read the initial header, clear the valid bits, and compare headers.
399 * The main header may have been overwritten by swapping if we're
400 * using a swap partition as the dump device, in which case we bail.
402 Pread(dumpfd
, &corehdr
, sizeof (dumphdr_t
), dumphdr
.dump_start
);
404 corehdr
.dump_flags
&= ~DF_VALID
;
405 dumphdr
.dump_flags
&= ~DF_VALID
;
407 if (memcmp(&corehdr
, &dumphdr
, sizeof (dumphdr_t
)) != 0) {
409 * Clear valid bit so we don't complain on every invocation.
412 Pwrite(dumpfd
, &dumphdr
, sizeof (dumphdr
), endoff
);
413 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
414 "initial dump header corrupt");
419 check_space(int csave
)
422 int64_t spacefree
, dumpsize
, minfree
, datasize
;
424 if (statvfs(".", &fsb
) < 0)
425 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "statvfs: %s",
428 dumpsize
= dumphdr
.dump_data
- dumphdr
.dump_start
;
429 datasize
= dumphdr
.dump_npages
* pagesize
;
431 dumpsize
+= datasize
;
433 dumpsize
+= datahdr
.dump_data_csize
;
435 spacefree
= (int64_t)fsb
.f_bavail
* fsb
.f_frsize
;
436 minfree
= 1024LL * read_number_from_file("minfree", 1024);
437 if (spacefree
< minfree
+ dumpsize
) {
438 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
439 "not enough space in %s (%lld MB avail, %lld MB needed)",
440 savedir
, spacefree
>> 20, (minfree
+ dumpsize
) >> 20);
445 build_dump_map(int corefd
, const pfn_t
*pfn_table
)
448 static long misses
= 0;
449 size_t dump_mapsize
= (corehdr
.dump_hashmask
+ 1) * sizeof (dump_map_t
);
451 dump_map_t
*dmp
= Zalloc(dump_mapsize
);
452 char *inbuf
= Zalloc(FBUFSIZE
);
453 FILE *in
= fdopen(dup(dumpfd
), "rb");
455 (void) setvbuf(in
, inbuf
, _IOFBF
, FBUFSIZE
);
456 Fseek(dumphdr
.dump_map
, in
);
458 corehdr
.dump_data
= corehdr
.dump_map
+ roundup(dump_mapsize
, pagesize
);
460 for (i
= 0; i
< corehdr
.dump_nvtop
; i
++) {
462 long last
= corehdr
.dump_npages
- 1;
467 Fread(&vtop
, sizeof (mem_vtop_t
), in
);
468 while (last
>= first
) {
469 middle
= (first
+ last
) / 2;
470 pfn
= pfn_table
[middle
];
471 if (pfn
== vtop
.m_pfn
)
473 if (pfn
< vtop
.m_pfn
)
478 if (pfn
!= vtop
.m_pfn
) {
480 (void) fprintf(stderr
,
481 "pfn %ld not found for as=%p, va=%p\n",
482 vtop
.m_pfn
, (void *)vtop
.m_as
, vtop
.m_va
);
486 dmp
[i
].dm_as
= vtop
.m_as
;
487 dmp
[i
].dm_va
= (uintptr_t)vtop
.m_va
;
488 dmp
[i
].dm_data
= corehdr
.dump_data
+
489 ((uint64_t)middle
<< corehdr
.dump_pageshift
);
491 h
= DUMP_HASH(&corehdr
, dmp
[i
].dm_as
, dmp
[i
].dm_va
);
492 dmp
[i
].dm_next
= dmp
[h
].dm_first
;
493 dmp
[h
].dm_first
= corehdr
.dump_map
+ i
* sizeof (dump_map_t
);
496 Pwrite(corefd
, dmp
, dump_mapsize
, corehdr
.dump_map
);
503 * Copy whole sections of the dump device to the file.
506 Copy(offset_t dumpoff
, len_t nb
, offset_t
*offp
, int fd
, char *buf
,
510 offset_t off
= *offp
;
513 nr
= sz
< nb
? sz
: (size_t)nb
;
514 Pread(dumpfd
, buf
, nr
, dumpoff
);
515 Pwrite(fd
, buf
, nr
, off
);
524 * Copy pages when the dump data header is missing.
525 * This supports older kernels with latest savecore.
528 CopyPages(offset_t
*offp
, int fd
, char *buf
, size_t sz
)
531 FILE *in
= fdopen(dup(dumpfd
), "rb");
532 FILE *out
= fdopen(dup(fd
), "wb");
533 char *cbuf
= Zalloc(pagesize
);
534 char *outbuf
= Zalloc(FBUFSIZE
);
535 pgcnt_t np
= dumphdr
.dump_npages
;
537 (void) setvbuf(out
, outbuf
, _IOFBF
, FBUFSIZE
);
538 (void) setvbuf(in
, buf
, _IOFBF
, sz
);
539 Fseek(dumphdr
.dump_data
, in
);
543 Fread(&csize
, sizeof (uint32_t), in
);
544 Fwrite(&csize
, sizeof (uint32_t), out
);
545 *offp
+= sizeof (uint32_t);
546 if (csize
> pagesize
|| csize
== 0) {
548 "CopyPages: page %lu csize %d (0x%x) pagesize %d",
549 dumphdr
.dump_npages
- np
, csize
, csize
,
553 Fread(cbuf
, csize
, in
);
554 Fwrite(cbuf
, csize
, out
);
565 * Concatenate dump contents into a new file.
566 * Update corehdr with new offsets.
569 copy_crashfile(const char *corefile
)
571 int corefd
= Open(corefile
, O_WRONLY
| O_CREAT
| O_TRUNC
, 0644);
572 size_t bufsz
= FBUFSIZE
;
573 char *inbuf
= Zalloc(bufsz
);
577 logprint(SC_SL_ERR
| SC_IF_VERBOSE
,
578 "Copying %s to %s/%s\n", dumpfile
, savedir
, corefile
);
581 * This dump file is still compressed
583 corehdr
.dump_flags
|= DF_COMPRESSED
| DF_VALID
;
586 * Leave room for corehdr, it is updated and written last
588 corehdr
.dump_start
= 0;
589 coreoff
= sizeof (corehdr
);
592 * Read in the compressed symbol table, copy it to corefile.
594 coreoff
= roundup(coreoff
, pagesize
);
595 corehdr
.dump_ksyms
= coreoff
;
596 Copy(dumphdr
.dump_ksyms
, dumphdr
.dump_ksyms_csize
, &coreoff
, corefd
,
600 * Save the pfn table.
602 coreoff
= roundup(coreoff
, pagesize
);
603 corehdr
.dump_pfn
= coreoff
;
604 Copy(dumphdr
.dump_pfn
, dumphdr
.dump_npages
* sizeof (pfn_t
), &coreoff
,
605 corefd
, inbuf
, bufsz
);
610 coreoff
= roundup(coreoff
, pagesize
);
611 corehdr
.dump_map
= coreoff
;
612 Copy(dumphdr
.dump_map
, dumphdr
.dump_nvtop
* sizeof (mem_vtop_t
),
613 &coreoff
, corefd
, inbuf
, bufsz
);
616 * Save the data pages.
618 coreoff
= roundup(coreoff
, pagesize
);
619 corehdr
.dump_data
= coreoff
;
620 if (datahdr
.dump_data_csize
!= 0)
621 Copy(dumphdr
.dump_data
, datahdr
.dump_data_csize
, &coreoff
,
622 corefd
, inbuf
, bufsz
);
624 CopyPages(&coreoff
, corefd
, inbuf
, bufsz
);
627 * Now write the modified dump header to front and end of the copy.
628 * Make it look like a valid dump device.
630 * From dumphdr.h: Two headers are written out: one at the
631 * beginning of the dump, and the other at the very end of the
632 * dump device. The terminal header is at a known location
633 * (end of device) so we can always find it.
635 * Pad with zeros to each DUMP_OFFSET boundary.
637 (void) memset(inbuf
, 0, DUMP_OFFSET
);
639 nb
= DUMP_OFFSET
- (coreoff
& (DUMP_OFFSET
- 1));
641 Pwrite(corefd
, inbuf
, nb
, coreoff
);
645 Pwrite(corefd
, &corehdr
, sizeof (corehdr
), coreoff
);
646 coreoff
+= sizeof (corehdr
);
648 Pwrite(corefd
, &datahdr
, sizeof (datahdr
), coreoff
);
649 coreoff
+= sizeof (datahdr
);
651 nb
= DUMP_OFFSET
- (coreoff
& (DUMP_OFFSET
- 1));
653 Pwrite(corefd
, inbuf
, nb
, coreoff
);
657 Pwrite(corefd
, &corehdr
, sizeof (corehdr
), corehdr
.dump_start
);
660 * Write out the modified dump header to the dump device.
661 * The dump device has been processed, so DF_VALID is clear.
664 Pwrite(dumpfd
, &dumphdr
, sizeof (dumphdr
), endoff
);
666 (void) close(corefd
);
672 typedef struct blockhdr blockhdr_t
;
673 typedef struct block block_t
;
686 typedef enum streamstate
{
691 typedef struct stream
{
708 static stream_t
*streams
;
709 static stream_t
*endstreams
;
711 const int cs
= sizeof (dumpcsize_t
);
713 typedef struct tinfo
{
718 static int threads_stop
;
719 static int threads_active
;
720 static tinfo_t
*tinfo
;
721 static tinfo_t
*endtinfo
;
723 static pthread_mutex_t lock
= PTHREAD_MUTEX_INITIALIZER
;
724 static pthread_cond_t cvfree
= PTHREAD_COND_INITIALIZER
;
725 static pthread_cond_t cvwork
= PTHREAD_COND_INITIALIZER
;
726 static pthread_cond_t cvbarrier
= PTHREAD_COND_INITIALIZER
;
728 static blockhdr_t freeblocks
;
731 enqt(blockhdr_t
*h
, block_t
*b
)
744 block_t
*b
= h
->head
;
754 static void *runstreams(void *arg
);
757 initstreams(int corefd
, int nstreams
, int maxcsize
)
765 nthreads
= sysconf(_SC_NPROCESSORS_ONLN
);
766 if (nstreams
< nthreads
)
770 nblocks
= nthreads
* 2;
772 tinfo
= Zalloc(nthreads
* sizeof (tinfo_t
));
773 endtinfo
= &tinfo
[nthreads
];
776 streams
= Zalloc(nstreams
* sizeof (stream_t
));
777 endstreams
= &streams
[nstreams
];
779 /* init stream block buffers */
780 for (i
= 0; i
< nblocks
; i
++) {
781 b
= Zalloc(sizeof (block_t
));
782 b
->block
= Zalloc(maxcsize
);
783 enqt(&freeblocks
, b
);
786 /* init worker threads */
787 (void) pthread_mutex_lock(&lock
);
790 for (t
= tinfo
; t
!= endtinfo
; t
++) {
791 t
->corefd
= dup(corefd
);
793 nthreads
= t
- tinfo
;
797 if (pthread_create(&t
->tid
, NULL
, runstreams
, t
) != 0)
798 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "pthread_create: %s",
801 (void) pthread_mutex_unlock(&lock
);
809 (void) pthread_mutex_lock(&lock
);
810 for (s
= streams
; s
!= endstreams
; s
++) {
811 while (s
->bound
|| s
->blocks
.head
!= NULL
)
812 (void) pthread_cond_wait(&cvbarrier
, &lock
);
814 (void) pthread_mutex_unlock(&lock
);
822 if (threads_active
) {
824 (void) pthread_mutex_lock(&lock
);
826 (void) pthread_cond_signal(&cvwork
);
827 (void) pthread_mutex_unlock(&lock
);
828 for (t
= tinfo
; t
!= endtinfo
; t
++)
829 (void) pthread_join(t
->tid
, NULL
);
841 (void) pthread_mutex_lock(&lock
);
842 while ((b
= deqh(&freeblocks
)) == NULL
)
843 (void) pthread_cond_wait(&cvfree
, &lock
);
844 (void) pthread_mutex_unlock(&lock
);
848 /* data page offset from page number */
849 #define BTOP(b) ((b) >> dumphdr.dump_pageshift)
850 #define PTOB(p) ((p) << dumphdr.dump_pageshift)
851 #define DATAOFF(p) (corehdr.dump_data + PTOB(p))
853 /* check for coreblksize boundary */
855 isblkbnd(pgcnt_t pgnum
)
857 return (P2PHASE(DATAOFF(pgnum
), coreblksize
) == 0);
866 /*LINTED:E_BAD_PTR_CAST_ALIGN*/
867 pl
= (uint64_t *)(buf
);
868 for (sz
= 0; sz
< pagesize
; sz
+= sizeof (*pl
))
874 volatile uint_t
*hist
;
876 /* write pages to the core file */
878 putpage(int corefd
, char *buf
, pgcnt_t pgnum
, pgcnt_t np
)
880 atomic_inc_uint(&hist
[np
]);
882 Pwrite(corefd
, buf
, PTOB(np
), DATAOFF(pgnum
));
886 * Process one lzjb block.
887 * No object (stream header or page) will be split over a block boundary.
890 lzjbblock(int corefd
, stream_t
*s
, char *block
, size_t blocksz
)
902 if (s
->blkbuf
== NULL
)
903 s
->blkbuf
= Zalloc(coreblksize
);
904 s
->state
= STREAMSTART
;
906 while (in
< blocksz
) {
909 (void) memcpy(&sh
, block
+ in
, sizeof (sh
));
911 if (strcmp(DUMP_STREAM_MAGIC
, sh
.stream_magic
) != 0)
912 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
913 "LZJB STREAMSTART: bad stream header");
914 if (sh
.stream_npages
> datahdr
.dump_maxrange
)
915 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
916 "LZJB STREAMSTART: bad range: %d > %d",
917 sh
.stream_npages
, datahdr
.dump_maxrange
);
918 s
->pagenum
= sh
.stream_pagenum
;
919 s
->npages
= sh
.stream_npages
;
920 s
->curpage
= s
->pagenum
;
923 s
->state
= STREAMPAGES
;
926 (void) memcpy(&sc
, block
+ in
, cs
);
928 csize
= DUMP_GET_CSIZE(sc
);
929 if (csize
> pagesize
)
930 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
931 "LZJB STREAMPAGES: bad csize=%d", csize
);
933 out
= s
->blkbuf
+ PTOB(s
->nout
);
934 dsize
= decompress(block
+ in
, out
, csize
, pagesize
);
936 if (dsize
!= pagesize
)
937 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
938 "LZJB STREAMPAGES: dsize %d != pagesize %d",
942 atomic_inc_64(&saved
);
945 if (s
->nout
== 0 && iszpage(out
)) {
947 atomic_inc_64(&zpages
);
948 } else if (++s
->nout
>= BTOP(coreblksize
) ||
949 isblkbnd(s
->curpage
+ s
->nout
)) {
952 if (++s
->done
>= s
->npages
) {
953 s
->state
= STREAMSTART
;
957 putpage(corefd
, s
->blkbuf
, s
->curpage
, s
->nout
);
959 s
->curpage
= s
->pagenum
+ s
->done
;
966 /* bzlib library reports errors with this callback */
968 bz_internal_error(int errcode
)
970 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "bz_internal_error: err %s\n",
971 BZ2_bzErrorString(errcode
));
975 * Return one object in the stream.
977 * An object (stream header or page) will likely span an input block
978 * of compression data. Return non-zero when an entire object has been
979 * retrieved from the stream.
982 bz2decompress(stream_t
*s
, void *buf
, size_t size
)
986 if (s
->strm
.avail_out
== 0) {
987 s
->strm
.next_out
= buf
;
988 s
->strm
.avail_out
= size
;
990 while (s
->strm
.avail_in
> 0) {
991 rc
= BZ2_bzDecompress(&s
->strm
);
992 if (rc
== BZ_STREAM_END
) {
993 rc
= BZ2_bzDecompressReset(&s
->strm
);
995 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
996 "BZ2_bzDecompressReset: %s",
997 BZ2_bzErrorString(rc
));
1001 if (s
->strm
.avail_out
== 0)
1004 return (s
->strm
.avail_out
== 0);
1008 * Process one bzip2 block.
1009 * The interface is documented here:
1010 * http://www.bzip.org/1.0.5/bzip2-manual-1.0.5.html
1013 bz2block(int corefd
, stream_t
*s
, char *block
, size_t blocksz
)
1021 rc
= BZ2_bzDecompressInit(&s
->strm
, 0, 0);
1023 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
1024 "BZ2_bzDecompressInit: %s", BZ2_bzErrorString(rc
));
1025 if (s
->blkbuf
== NULL
)
1026 s
->blkbuf
= Zalloc(coreblksize
);
1027 s
->strm
.avail_out
= 0;
1028 s
->state
= STREAMSTART
;
1030 s
->strm
.next_in
= block
;
1031 s
->strm
.avail_in
= blocksz
;
1033 while (s
->strm
.avail_in
> 0) {
1036 if (!bz2decompress(s
, &s
->sh
, sizeof (s
->sh
)))
1038 if (strcmp(DUMP_STREAM_MAGIC
, s
->sh
.stream_magic
) != 0)
1039 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
1040 "BZ2 STREAMSTART: bad stream header");
1041 if (s
->sh
.stream_npages
> datahdr
.dump_maxrange
)
1042 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
1043 "BZ2 STREAMSTART: bad range: %d > %d",
1044 s
->sh
.stream_npages
, datahdr
.dump_maxrange
);
1045 s
->pagenum
= s
->sh
.stream_pagenum
;
1046 s
->npages
= s
->sh
.stream_npages
;
1047 s
->curpage
= s
->pagenum
;
1050 s
->state
= STREAMPAGES
;
1053 out
= s
->blkbuf
+ PTOB(s
->nout
);
1054 if (!bz2decompress(s
, out
, pagesize
))
1057 atomic_inc_64(&saved
);
1060 if (s
->nout
== 0 && iszpage(out
)) {
1062 atomic_inc_64(&zpages
);
1063 } else if (++s
->nout
>= BTOP(coreblksize
) ||
1064 isblkbnd(s
->curpage
+ s
->nout
)) {
1067 if (++s
->done
>= s
->npages
) {
1068 s
->state
= STREAMSTART
;
1072 putpage(corefd
, s
->blkbuf
, s
->curpage
, s
->nout
);
1074 s
->curpage
= s
->pagenum
+ s
->done
;
1081 /* report progress */
1090 percent
= saved
* 100LL / corehdr
.dump_npages
;
1091 sec
= (gethrtime() - startts
) / NANOSEC
;
1092 if (percent
> percent_done
|| sec
> sec_done
) {
1093 (void) printf("\r%2d:%02d %3d%% done", sec
/ 60, sec
% 60,
1095 (void) fflush(stdout
);
1097 percent_done
= percent
;
1103 runstreams(void *arg
)
1110 (void) pthread_mutex_lock(&lock
);
1111 while (!threads_stop
) {
1113 for (s
= streams
; s
!= endstreams
; s
++) {
1114 if (s
->bound
|| s
->blocks
.head
== NULL
)
1118 (void) pthread_cond_signal(&cvwork
);
1119 while (s
->blocks
.head
!= NULL
) {
1120 b
= deqh(&s
->blocks
);
1121 (void) pthread_mutex_unlock(&lock
);
1123 if (datahdr
.dump_clevel
< DUMP_CLEVEL_BZIP2
)
1124 lzjbblock(t
->corefd
, s
, b
->block
,
1127 bz2block(t
->corefd
, s
, b
->block
,
1130 (void) pthread_mutex_lock(&lock
);
1131 enqt(&freeblocks
, b
);
1132 (void) pthread_cond_signal(&cvfree
);
1137 (void) pthread_cond_signal(&cvbarrier
);
1139 if (!bound
&& !threads_stop
)
1140 (void) pthread_cond_wait(&cvwork
, &lock
);
1142 (void) close(t
->corefd
);
1143 (void) pthread_cond_signal(&cvwork
);
1144 (void) pthread_mutex_unlock(&lock
);
1149 * Process compressed pages.
1151 * The old format, now called single-threaded lzjb, is a 32-bit size
1152 * word followed by 'size' bytes of lzjb compression data for one
1153 * page. The new format extends this by storing a 12-bit "tag" in the
1154 * upper bits of the size word. When the size word is pagesize or
1155 * less, it is assumed to be one lzjb page. When the size word is
1156 * greater than pagesize, it is assumed to be a "stream block",
1157 * belonging to up to 4095 streams. In practice, the number of streams
1158 * is set to one less than the number of CPUs running at crash
1159 * time. One CPU processes the crash dump, the remaining CPUs
1160 * separately process groups of data pages.
1162 * savecore creates a thread per stream, but never more threads than
1163 * the number of CPUs running savecore. This is because savecore can
1164 * be processing a crash file from a remote machine, which may have
1167 * When the kernel uses parallel lzjb or parallel bzip2, we expect a
1168 * series of 128KB blocks of compression data. In this case, each
1169 * block has a "tag", in the range 1-4095. Each block is handed off to
1170 * the threads running "runstreams". The dump format is either lzjb
1171 * or bzip2, never a mixture. These threads, in turn, process the
1172 * compression data for groups of pages. Groups of pages are delimited
1173 * by a "stream header", which indicates a starting pfn and number of
1174 * pages. When a stream block has been read, the condition variable
1175 * "cvwork" is signalled, which causes one of the available threads to
1176 * wake up and process the stream.
1178 * In the parallel case there will be stream blocks encoding all data
1179 * pages. The stream of blocks is terminated by a zero size
1180 * word. There can be a few lzjb pages tacked on the end, depending on
1181 * the architecture. The sbarrier function ensures that all stream
1182 * blocks have been processed so that the page number for the few
1183 * single pages at the end can be known.
1186 decompress_pages(int corefd
)
1191 pgcnt_t curpage
= 0;
1194 FILE *tracef
= NULL
;
1197 size_t insz
= FBUFSIZE
;
1198 char *inbuf
= Zalloc(insz
);
1201 int nstreams
= datahdr
.dump_nstreams
;
1202 int maxcsize
= datahdr
.dump_maxcsize
;
1203 int nout
= 0, tag
, doflush
;
1205 dumpf
= fdopen(dup(dumpfd
), "rb");
1207 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "fdopen: %s",
1210 (void) setvbuf(dumpf
, inbuf
, _IOFBF
, insz
);
1211 Fseek(dumphdr
.dump_data
, dumpf
);
1213 /*LINTED: E_CONSTANT_CONDITION*/
1217 * The csize word delimits stream blocks.
1218 * See dumphdr.h for a description.
1220 Fread(&dcsize
, sizeof (dcsize
), dumpf
);
1222 tag
= DUMP_GET_TAG(dcsize
);
1223 csize
= DUMP_GET_CSIZE(dcsize
);
1225 if (tag
!= 0) { /* a stream block */
1228 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
1229 "starting data header is missing");
1232 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
1233 "stream tag %d not in range 1..%d",
1236 if (csize
> maxcsize
)
1237 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
1238 "block size 0x%x > max csize 0x%x",
1241 if (streams
== NULL
)
1242 initstreams(corefd
, nstreams
, maxcsize
);
1243 s
= &streams
[tag
- 1];
1248 Fread(b
->block
, csize
, dumpf
);
1250 (void) pthread_mutex_lock(&lock
);
1251 enqt(&s
->blocks
, b
);
1253 (void) pthread_cond_signal(&cvwork
);
1254 (void) pthread_mutex_unlock(&lock
);
1256 } else if (csize
> 0) { /* one lzjb page */
1258 if (csize
> pagesize
)
1259 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
1260 "csize 0x%x > pagesize 0x%x",
1264 cpage
= Zalloc(pagesize
);
1265 if (dpage
== NULL
) {
1266 dpage
= Zalloc(coreblksize
);
1270 Fread(cpage
, csize
, dumpf
);
1272 out
= dpage
+ PTOB(nout
);
1273 dsize
= decompress(cpage
, out
, csize
, pagesize
);
1275 if (dsize
!= pagesize
)
1276 logprint(SC_SL_ERR
| SC_EXIT_ERR
,
1277 "dsize 0x%x != pagesize 0x%x",
1281 * wait for streams to flush so that 'saved' is correct
1290 atomic_inc_64(&saved
);
1292 if (nout
== 0 && iszpage(dpage
)) {
1294 atomic_inc_64(&zpages
);
1295 } else if (++nout
>= BTOP(coreblksize
) ||
1296 isblkbnd(curpage
+ nout
) ||
1297 saved
>= dumphdr
.dump_npages
) {
1302 putpage(corefd
, dpage
, curpage
, nout
);
1309 * Non-streams lzjb does not use blocks. Stop
1310 * here if all the pages have been decompressed.
1312 if (saved
>= dumphdr
.dump_npages
)
1316 break; /* end of data */
1322 (void) fclose(tracef
);
1323 (void) fclose(dumpf
);
1331 build_corefile(const char *namelist
, const char *corefile
)
1333 size_t pfn_table_size
= dumphdr
.dump_npages
* sizeof (pfn_t
);
1334 size_t ksyms_size
= dumphdr
.dump_ksyms_size
;
1335 size_t ksyms_csize
= dumphdr
.dump_ksyms_csize
;
1337 char *ksyms_base
= Zalloc(ksyms_size
);
1338 char *ksyms_cbase
= Zalloc(ksyms_csize
);
1341 int corefd
= Open(corefile
, O_WRONLY
| O_CREAT
| O_TRUNC
, 0644);
1342 int namefd
= Open(namelist
, O_WRONLY
| O_CREAT
| O_TRUNC
, 0644);
1344 (void) printf("Constructing namelist %s/%s\n", savedir
, namelist
);
1347 * Determine the optimum write size for the core file
1349 Fstat(corefd
, &st
, corefile
);
1352 (void) printf("%s: %ld block size\n", corefile
,
1353 (long)st
.st_blksize
);
1354 coreblksize
= st
.st_blksize
;
1355 if (coreblksize
< MINCOREBLKSIZE
|| !ISP2(coreblksize
))
1356 coreblksize
= MINCOREBLKSIZE
;
1358 hist
= Zalloc((sizeof (uint64_t) * BTOP(coreblksize
)) + 1);
1361 * This dump file is now uncompressed
1363 corehdr
.dump_flags
&= ~DF_COMPRESSED
;
1366 * Read in the compressed symbol table, copy it to corefile,
1367 * decompress it, and write the result to namelist.
1369 corehdr
.dump_ksyms
= pagesize
;
1370 Pread(dumpfd
, ksyms_cbase
, ksyms_csize
, dumphdr
.dump_ksyms
);
1371 Pwrite(corefd
, ksyms_cbase
, ksyms_csize
, corehdr
.dump_ksyms
);
1373 ksyms_dsize
= decompress(ksyms_cbase
, ksyms_base
, ksyms_csize
,
1375 if (ksyms_dsize
!= ksyms_size
)
1376 logprint(SC_SL_WARN
,
1377 "bad data in symbol table, %lu of %lu bytes saved",
1378 ksyms_dsize
, ksyms_size
);
1380 Pwrite(namefd
, ksyms_base
, ksyms_size
, 0);
1381 (void) close(namefd
);
1385 (void) printf("Constructing corefile %s/%s\n", savedir
, corefile
);
1388 * Read in and write out the pfn table.
1390 pfn_table
= Zalloc(pfn_table_size
);
1391 corehdr
.dump_pfn
= corehdr
.dump_ksyms
+ roundup(ksyms_size
, pagesize
);
1392 Pread(dumpfd
, pfn_table
, pfn_table_size
, dumphdr
.dump_pfn
);
1393 Pwrite(corefd
, pfn_table
, pfn_table_size
, corehdr
.dump_pfn
);
1396 * Convert the raw translation data into a hashed dump map.
1398 corehdr
.dump_map
= corehdr
.dump_pfn
+ roundup(pfn_table_size
, pagesize
);
1399 build_dump_map(corefd
, pfn_table
);
1403 * Decompress the pages
1405 decompress_pages(corefd
);
1406 (void) printf(": %ld of %ld pages saved\n", (pgcnt_t
)saved
,
1407 dumphdr
.dump_npages
);
1410 (void) printf("%ld (%ld%%) zero pages were not written\n",
1411 (pgcnt_t
)zpages
, (pgcnt_t
)zpages
* 100 /
1412 dumphdr
.dump_npages
);
1414 if (saved
!= dumphdr
.dump_npages
)
1415 logprint(SC_SL_WARN
, "bad data after page %ld", saved
);
1418 * Write out the modified dump headers.
1420 Pwrite(corefd
, &corehdr
, sizeof (corehdr
), 0);
1422 Pwrite(dumpfd
, &dumphdr
, sizeof (dumphdr
), endoff
);
1424 (void) close(corefd
);
1428 * When the system panics, the kernel saves all undelivered messages (messages
1429 * that never made it out to syslogd(8)) in the dump. At a minimum, the
1430 * panic message itself will always fall into this category. Upon reboot,
1431 * the syslog startup script runs savecore -m to recover these messages.
1433 * To do this, we read the unsent messages from the dump and send them to
1434 * /dev/conslog on priority band 1. This has the effect of prepending them
1435 * to any already-accumulated messages in the console backlog, thus preserving
1436 * temporal ordering across the reboot.
1438 * Note: since savecore -m is used *only* for this purpose, it does *not*
1439 * attempt to save the crash dump. The dump will be saved later, after
1440 * syslogd(8) starts, by the savecore startup script.
1445 offset_t dumpoff
= -(DUMP_OFFSET
+ DUMP_LOGSIZE
);
1449 struct strbuf ctl
, dat
;
1452 logfd
= Open("/dev/conslog", O_WRONLY
, 0644);
1453 dumpfd
= Open(dumpfile
, O_RDWR
| O_DSYNC
, 0644);
1454 dumpoff
= llseek(dumpfd
, dumpoff
, SEEK_END
) & -DUMP_OFFSET
;
1456 ctl
.buf
= (void *)&lc
;
1457 ctl
.len
= sizeof (log_ctl_t
);
1459 dat
.buf
= Zalloc(DUMP_LOGSIZE
);
1464 Pread(dumpfd
, &ld
, sizeof (log_dump_t
), dumpoff
);
1465 dumpoff
+= sizeof (log_dump_t
);
1466 dat
.len
= ld
.ld_msgsize
;
1468 if (ld
.ld_magic
== 0)
1471 if (ld
.ld_magic
!= LOG_MAGIC
)
1472 logprint(SC_SL_ERR
| SC_IF_VERBOSE
| SC_EXIT_ERR
,
1473 "bad magic %x", ld
.ld_magic
);
1475 if (dat
.len
>= DUMP_LOGSIZE
)
1476 logprint(SC_SL_ERR
| SC_IF_VERBOSE
| SC_EXIT_ERR
,
1477 "bad size %d", ld
.ld_msgsize
);
1479 Pread(dumpfd
, ctl
.buf
, ctl
.len
, dumpoff
);
1482 if (ld
.ld_csum
!= checksum32(ctl
.buf
, ctl
.len
))
1483 logprint(SC_SL_ERR
| SC_IF_VERBOSE
| SC_EXIT_OK
,
1484 "bad log_ctl checksum");
1486 lc
.flags
|= SL_LOGONLY
;
1488 Pread(dumpfd
, dat
.buf
, dat
.len
, dumpoff
);
1491 if (ld
.ld_msum
!= checksum32(dat
.buf
, dat
.len
))
1492 logprint(SC_SL_ERR
| SC_IF_VERBOSE
| SC_EXIT_OK
,
1493 "bad message checksum");
1495 if (putpmsg(logfd
, &ctl
, &dat
, 1, MSG_BAND
) == -1)
1496 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "putpmsg: %s",
1499 ld
.ld_magic
= 0; /* clear magic so we never save twice */
1500 Pwrite(dumpfd
, &ld
, sizeof (log_dump_t
), ldoff
);
1506 getbounds(const char *f
)
1509 const char *p
= strrchr(f
, '/');
1511 if (p
== NULL
|| strncmp(p
, "vmdump", 6) != 0)
1512 p
= strstr(f
, "vmdump");
1514 if (p
!= NULL
&& *p
== '/')
1517 (void) sscanf(p
? p
: f
, "vmdump.%ld", &b
);
1523 stack_retrieve(char *stack
)
1526 offset_t dumpoff
= -(DUMP_OFFSET
+ DUMP_LOGSIZE
+
1528 dumpoff
-= DUMP_SUMMARYSIZE
;
1530 dumpfd
= Open(dumpfile
, O_RDWR
| O_DSYNC
, 0644);
1531 dumpoff
= llseek(dumpfd
, dumpoff
, SEEK_END
) & -DUMP_OFFSET
;
1533 Pread(dumpfd
, &sd
, sizeof (summary_dump_t
), dumpoff
);
1534 dumpoff
+= sizeof (summary_dump_t
);
1536 if (sd
.sd_magic
== 0) {
1541 if (sd
.sd_magic
!= SUMMARY_MAGIC
) {
1543 logprint(SC_SL_NONE
| SC_IF_VERBOSE
,
1544 "bad summary magic %x", sd
.sd_magic
);
1547 Pread(dumpfd
, stack
, STACK_BUF_SIZE
, dumpoff
);
1548 if (sd
.sd_ssum
!= checksum32(stack
, STACK_BUF_SIZE
))
1549 logprint(SC_SL_NONE
| SC_IF_VERBOSE
, "bad stack checksum");
1553 raise_event(enum sc_event_type evidx
, char *warn_string
)
1555 uint32_t pl
= sc_event
[evidx
].sce_payload
;
1556 char panic_stack
[STACK_BUF_SIZE
];
1557 nvlist_t
*attr
= NULL
;
1558 char uuidbuf
[36 + 1];
1561 if (nvlist_alloc(&attr
, NV_UNIQUE_NAME
, 0) != 0)
1562 goto publish
; /* try to send payload-free event */
1564 if (pl
& SC_PAYLOAD_SAVEDIR
&& savedir
!= NULL
)
1565 err
|= nvlist_add_string(attr
, "dumpdir", savedir
);
1567 if (pl
& SC_PAYLOAD_INSTANCE
&& bounds
!= -1)
1568 err
|= nvlist_add_int64(attr
, "instance", bounds
);
1570 if (pl
& SC_PAYLOAD_ISCOMPRESSED
) {
1571 err
|= nvlist_add_boolean_value(attr
, "compressed",
1572 csave
? B_TRUE
: B_FALSE
);
1575 if (pl
& SC_PAYLOAD_DUMPADM_EN
) {
1576 char *disabled
= defread("DUMPADM_ENABLE=no");
1578 err
|= nvlist_add_boolean_value(attr
, "savecore-enabled",
1579 disabled
? B_FALSE
: B_TRUE
);
1582 if (pl
& SC_PAYLOAD_IMAGEUUID
) {
1583 (void) strncpy(uuidbuf
, corehdr
.dump_uuid
, 36);
1585 err
|= nvlist_add_string(attr
, "os-instance-uuid", uuidbuf
);
1588 if (pl
& SC_PAYLOAD_CRASHTIME
) {
1589 err
|= nvlist_add_int64(attr
, "crashtime",
1590 (int64_t)corehdr
.dump_crashtime
);
1593 if (pl
& SC_PAYLOAD_PANICSTR
&& corehdr
.dump_panicstring
[0] != '\0') {
1594 err
|= nvlist_add_string(attr
, "panicstr",
1595 corehdr
.dump_panicstring
);
1598 if (pl
& SC_PAYLOAD_PANICSTACK
) {
1599 stack_retrieve(panic_stack
);
1601 if (panic_stack
[0] != '\0') {
1603 * The summary page may not be present if the dump
1604 * was previously recorded compressed.
1606 (void) nvlist_add_string(attr
, "panicstack",
1611 /* add warning string if this is an ireport for dump failure */
1612 if (pl
& SC_PAYLOAD_FAILREASON
&& warn_string
!= NULL
)
1613 (void) nvlist_add_string(attr
, "failure-reason", warn_string
);
1615 if (pl
& SC_PAYLOAD_DUMPCOMPLETE
)
1616 err
|= nvlist_add_boolean_value(attr
, "dump-incomplete",
1617 dump_incomplete
? B_TRUE
: B_FALSE
);
1619 if (pl
& SC_PAYLOAD_FM_PANIC
) {
1620 err
|= nvlist_add_boolean_value(attr
, "fm-panic",
1621 fm_panic
? B_TRUE
: B_FALSE
);
1624 if (pl
& SC_PAYLOAD_JUSTCHECKING
) {
1625 err
|= nvlist_add_boolean_value(attr
, "will-attempt-savecore",
1626 cflag
? B_FALSE
: B_TRUE
);
1630 logprint(SC_SL_WARN
, "Errors while constructing '%s' "
1631 "event payload; will try to publish anyway.");
1633 if (fmev_rspublish_nvl(FMEV_RULESET_ON_SUNOS
,
1634 "panic", sc_event
[evidx
].sce_subclass
, FMEV_HIPRI
,
1635 attr
) != FMEV_SUCCESS
) {
1636 logprint(SC_SL_ERR
, "failed to publish '%s' event: %s",
1637 sc_event
[evidx
].sce_subclass
, fmev_strerror(fmev_errno
));
1645 main(int argc
, char *argv
[])
1650 long filebounds
= -1;
1651 char namelist
[30], corefile
[30], boundstr
[30];
1654 startts
= gethrtime();
1656 (void) getrlimit(RLIMIT_NOFILE
, &rl
);
1657 rl
.rlim_cur
= rl
.rlim_max
;
1658 (void) setrlimit(RLIMIT_NOFILE
, &rl
);
1660 openlog(progname
, LOG_ODELAY
, LOG_AUTH
);
1662 (void) defopen("/etc/dumpadm.conf");
1663 savedir
= defread("DUMPADM_SAVDIR=");
1664 if (savedir
!= NULL
)
1665 savedir
= strdup(savedir
);
1667 while ((c
= getopt(argc
, argv
, "Lvcdmf:")) != EOF
) {
1679 disregard_valid_flag
++;
1686 filebounds
= getbounds(dumpfile
);
1694 * If doing something other than extracting an existing dump (i.e.
1695 * dumpfile has been provided as an option), the user must be root.
1697 if (geteuid() != 0 && dumpfile
== NULL
) {
1698 (void) fprintf(stderr
, "%s: %s %s\n", progname
,
1699 gettext("you must be root to use"), progname
);
1703 interactive
= isatty(STDOUT_FILENO
);
1705 if (cflag
&& livedump
)
1708 if (dumpfile
== NULL
|| livedump
)
1709 dumpfd
= Open("/dev/dump", O_RDONLY
, 0444);
1711 if (dumpfile
== NULL
) {
1712 dumpfile
= Zalloc(MAXPATHLEN
);
1713 if (ioctl(dumpfd
, DIOCGETDEV
, dumpfile
) == -1) {
1714 have_dumpfile
= B_FALSE
;
1715 logprint(SC_SL_NONE
| SC_IF_ISATTY
| SC_EXIT_ERR
,
1716 "no dump device configured");
1721 return (message_save());
1723 if (optind
== argc
- 1)
1724 savedir
= argv
[optind
];
1726 if (savedir
== NULL
|| optind
< argc
- 1)
1729 if (livedump
&& ioctl(dumpfd
, DIOCDUMP
, NULL
) == -1)
1730 logprint(SC_SL_NONE
| SC_EXIT_ERR
,
1731 "dedicated dump device required");
1733 (void) close(dumpfd
);
1736 Stat(dumpfile
, &st
);
1738 filemode
= S_ISREG(st
.st_mode
);
1740 if (!filemode
&& defread("DUMPADM_CSAVE=off") == NULL
)
1746 * We want this message to go to the log file, but not the console.
1747 * There's no good way to do that with the existing syslog facility.
1748 * We could extend it to handle this, but there doesn't seem to be
1749 * a general need for it, so we isolate the complexity here instead.
1751 if (dumphdr
.dump_panicstring
[0] != '\0') {
1752 int logfd
= Open("/dev/conslog", O_WRONLY
, 0644);
1754 struct strbuf ctl
, dat
;
1755 char msg
[DUMP_PANICSIZE
+ 100];
1756 char fmt
[] = "reboot after panic: %s";
1759 STRLOG_MAKE_MSGID(fmt
, msgid
);
1761 /* LINTED: E_SEC_SPRINTF_UNBOUNDED_COPY */
1762 (void) sprintf(msg
, "%s: [ID %u FACILITY_AND_PRIORITY] ",
1764 /* LINTED: E_SEC_PRINTF_VAR_FMT */
1765 (void) sprintf(msg
+ strlen(msg
), fmt
,
1766 dumphdr
.dump_panicstring
);
1768 lc
.pri
= LOG_AUTH
| LOG_ERR
;
1769 lc
.flags
= SL_CONSOLE
| SL_LOGONLY
;
1772 ctl
.buf
= (void *)&lc
;
1773 ctl
.len
= sizeof (log_ctl_t
);
1775 dat
.buf
= (void *)msg
;
1776 dat
.len
= strlen(msg
) + 1;
1778 (void) putmsg(logfd
, &ctl
, &dat
, 0);
1779 (void) close(logfd
);
1782 if ((dumphdr
.dump_flags
& DF_COMPLETE
) == 0) {
1783 logprint(SC_SL_WARN
, "incomplete dump on dump device");
1784 dump_incomplete
= B_TRUE
;
1787 if (dumphdr
.dump_fm_panic
)
1791 * We have a valid dump on a dump device and know as much about
1792 * it as we're going to at this stage. Raise an event for
1793 * logging and so that FMA can open a case for this panic.
1794 * Avoid this step for FMA-initiated panics - FMA will replay
1795 * ereports off the dump device independently of savecore and
1796 * will make a diagnosis, so we don't want to open two cases
1797 * for the same event. Also avoid raising an event for a
1798 * livedump, or when we are inflating a compressed dump.
1800 if (!fm_panic
&& !livedump
&& !filemode
)
1801 raise_event(SC_EVENT_DUMP_PENDING
, NULL
);
1803 logprint(SC_SL_WARN
, "System dump time: %s",
1804 ctime(&dumphdr
.dump_crashtime
));
1807 * Option -c is designed for use from svc-dumpadm where we know
1808 * that dumpadm -n is in effect but run savecore -c just to
1809 * get the above dump_pending_on_device event raised. If it is run
1810 * interactively then just print further panic details.
1813 char *disabled
= defread("DUMPADM_ENABLE=no");
1814 int lvl
= interactive
? SC_SL_WARN
: SC_SL_ERR
;
1815 int ec
= fm_panic
? SC_EXIT_FM
: SC_EXIT_PEND
;
1818 "Panic crashdump pending on dump device%s "
1819 "run savecore(8) manually to extract. "
1821 disabled
? " but dumpadm -n in effect;" : ";",
1823 fm_panic
? "(fault-management initiated)" : "");
1827 if (chdir(savedir
) == -1)
1828 logprint(SC_SL_ERR
| SC_EXIT_ERR
, "chdir(\"%s\"): %s",
1829 savedir
, strerror(errno
));
1834 bounds
= read_number_from_file("bounds", 0);
1836 bounds
= filebounds
;
1839 size_t metrics_size
= datahdr
.dump_metrics
;
1841 (void) sprintf(corefile
, "vmdump.%ld", bounds
);
1843 datahdr
.dump_metrics
= 0;
1846 "Saving compressed system crash dump in %s/%s",
1849 copy_crashfile(corefile
);
1852 * Raise a fault management event that indicates the system
1853 * has panicked. We know a reasonable amount about the
1854 * condition at this time, but the dump is still compressed.
1856 if (!livedump
&& !fm_panic
)
1857 raise_event(SC_EVENT_DUMP_AVAILABLE
, NULL
);
1859 if (metrics_size
> 0) {
1860 int sec
= (gethrtime() - startts
) / 1000 / 1000 / 1000;
1861 FILE *mfile
= fopen(METRICSFILE
, "a");
1862 char *metrics
= Zalloc(metrics_size
+ 1);
1864 Pread(dumpfd
, metrics
, metrics_size
, endoff
+
1865 sizeof (dumphdr
) + sizeof (datahdr
));
1870 if (mfile
== NULL
) {
1871 logprint(SC_SL_WARN
,
1872 "Can't create %s:\n%s",
1873 METRICSFILE
, metrics
);
1875 (void) fprintf(mfile
, "[[[[,,,");
1876 for (i
= 0; i
< argc
; i
++)
1877 (void) fprintf(mfile
, "%s ", argv
[i
]);
1878 (void) fprintf(mfile
, "\n");
1879 (void) fprintf(mfile
, ",,,%s %s %s %s %s\n",
1880 dumphdr
.dump_utsname
.sysname
,
1881 dumphdr
.dump_utsname
.nodename
,
1882 dumphdr
.dump_utsname
.release
,
1883 dumphdr
.dump_utsname
.version
,
1884 dumphdr
.dump_utsname
.machine
);
1885 (void) fprintf(mfile
, ",,,%s dump time %s\n",
1886 dumphdr
.dump_flags
& DF_LIVE
? "Live" :
1887 "Crash", ctime(&dumphdr
.dump_crashtime
));
1888 (void) fprintf(mfile
, ",,,%s/%s\n", savedir
,
1890 (void) fprintf(mfile
, "Metrics:\n%s\n",
1892 (void) fprintf(mfile
, "Copy pages,%ld\n",
1893 dumphdr
. dump_npages
);
1894 (void) fprintf(mfile
, "Copy time,%d\n", sec
);
1895 (void) fprintf(mfile
, "Copy pages/sec,%ld\n",
1896 dumphdr
.dump_npages
/ sec
);
1897 (void) fprintf(mfile
, "]]]]\n");
1898 (void) fclose(mfile
);
1904 "Decompress the crash dump with "
1905 "\n'savecore -vf %s/%s'",
1909 (void) sprintf(namelist
, "unix.%ld", bounds
);
1910 (void) sprintf(corefile
, "vmcore.%ld", bounds
);
1912 if (interactive
&& filebounds
>= 0 && access(corefile
, F_OK
)
1914 logprint(SC_SL_NONE
| SC_EXIT_ERR
,
1915 "%s already exists: remove with "
1916 "'rm -f %s/{unix,vmcore}.%ld'",
1917 corefile
, savedir
, bounds
);
1920 "saving system crash dump in %s/{unix,vmcore}.%ld",
1923 build_corefile(namelist
, corefile
);
1925 if (!livedump
&& !filemode
&& !fm_panic
)
1926 raise_event(SC_EVENT_DUMP_AVAILABLE
, NULL
);
1928 if (access(METRICSFILE
, F_OK
) == 0) {
1929 int sec
= (gethrtime() - startts
) / 1000 / 1000 / 1000;
1930 FILE *mfile
= fopen(METRICSFILE
, "a");
1935 if (mfile
== NULL
) {
1936 logprint(SC_SL_WARN
,
1937 "Can't create %s: %s",
1938 METRICSFILE
, strerror(errno
));
1940 (void) fprintf(mfile
, "[[[[,,,");
1941 for (i
= 0; i
< argc
; i
++)
1942 (void) fprintf(mfile
, "%s ", argv
[i
]);
1943 (void) fprintf(mfile
, "\n");
1944 (void) fprintf(mfile
, ",,,%s/%s\n", savedir
,
1946 (void) fprintf(mfile
, ",,,%s %s %s %s %s\n",
1947 dumphdr
.dump_utsname
.sysname
,
1948 dumphdr
.dump_utsname
.nodename
,
1949 dumphdr
.dump_utsname
.release
,
1950 dumphdr
.dump_utsname
.version
,
1951 dumphdr
.dump_utsname
.machine
);
1952 (void) fprintf(mfile
,
1953 "Uncompress pages,%"PRIu64
"\n", saved
);
1954 (void) fprintf(mfile
, "Uncompress time,%d\n",
1956 (void) fprintf(mfile
, "Uncompress pages/sec,%"
1957 PRIu64
"\n", saved
/ sec
);
1958 (void) fprintf(mfile
, "]]]]\n");
1959 (void) fclose(mfile
);
1964 if (filebounds
< 0) {
1965 (void) sprintf(boundstr
, "%ld\n", bounds
+ 1);
1966 bfd
= Open("bounds", O_WRONLY
| O_CREAT
| O_TRUNC
, 0644);
1967 Pwrite(bfd
, boundstr
, strlen(boundstr
), 0);
1972 int sec
= (gethrtime() - startts
) / 1000 / 1000 / 1000;
1974 (void) printf("%d:%02d dump %s is done\n",
1976 csave
? "copy" : "decompress");
1979 if (verbose
> 1 && hist
!= NULL
) {
1982 for (i
= 1, nw
= 0; i
<= BTOP(coreblksize
); ++i
)
1984 (void) printf("pages count %%\n");
1985 for (i
= 0; i
<= BTOP(coreblksize
); ++i
) {
1988 (void) printf("%3d %5u %6.2f\n",
1989 i
, hist
[i
], 100.0 * hist
[i
] * i
/ nw
);
1993 (void) close(dumpfd
);