Annotation of embedaddon/sqlite3/tool/spaceanal.tcl, revision 1.1
1.1 ! misho 1: # Run this TCL script using "testfixture" in order get a report that shows
! 2: # how much disk space is used by a particular data to actually store data
! 3: # versus how much space is unused.
! 4: #
! 5:
! 6: if {[catch {
! 7: # Get the name of the database to analyze
! 8: #
! 9: proc usage {} {
! 10: set argv0 [file rootname [file tail [info nameofexecutable]]]
! 11: puts stderr "Usage: $argv0 database-name"
! 12: exit 1
! 13: }
! 14: set file_to_analyze {}
! 15: set flags(-pageinfo) 0
! 16: set flags(-stats) 0
! 17: append argv {}
! 18: foreach arg $argv {
! 19: if {[regexp {^-+pageinfo$} $arg]} {
! 20: set flags(-pageinfo) 1
! 21: } elseif {[regexp {^-+stats$} $arg]} {
! 22: set flags(-stats) 1
! 23: } elseif {[regexp {^-} $arg]} {
! 24: puts stderr "Unknown option: $arg"
! 25: usage
! 26: } elseif {$file_to_analyze!=""} {
! 27: usage
! 28: } else {
! 29: set file_to_analyze $arg
! 30: }
! 31: }
! 32: if {$file_to_analyze==""} usage
! 33: if {![file exists $file_to_analyze]} {
! 34: puts stderr "No such file: $file_to_analyze"
! 35: exit 1
! 36: }
! 37: if {![file readable $file_to_analyze]} {
! 38: puts stderr "File is not readable: $file_to_analyze"
! 39: exit 1
! 40: }
! 41: set true_file_size [file size $file_to_analyze]
! 42: if {$true_file_size<512} {
! 43: puts stderr "Empty or malformed database: $file_to_analyze"
! 44: exit 1
! 45: }
! 46:
! 47: # Compute the total file size assuming test_multiplexor is being used.
! 48: # Assume that SQLITE_ENABLE_8_3_NAMES might be enabled
! 49: #
! 50: set extension [file extension $file_to_analyze]
! 51: set pattern $file_to_analyze
! 52: append pattern {[0-9][0-9]}
! 53: foreach f [glob -nocomplain $pattern] {
! 54: incr true_file_size [file size $f]
! 55: set extension {}
! 56: }
! 57: if {[string length $extension]>=2 && [string length $extension]<=4} {
! 58: set pattern [file rootname $file_to_analyze]
! 59: append pattern [string range $extension 0 1]
! 60: append pattern {[0-9][0-9]}
! 61: foreach f [glob -nocomplain $pattern] {
! 62: incr true_file_size [file size $f]
! 63: }
! 64: }
! 65:
! 66: # Open the database
! 67: #
! 68: sqlite3 db $file_to_analyze
! 69: register_dbstat_vtab db
! 70:
! 71: db eval {SELECT count(*) FROM sqlite_master}
! 72: set pageSize [expr {wide([db one {PRAGMA page_size}])}]
! 73:
! 74: if {$flags(-pageinfo)} {
! 75: db eval {CREATE VIRTUAL TABLE temp.stat USING dbstat}
! 76: db eval {SELECT name, path, pageno FROM temp.stat ORDER BY pageno} {
! 77: puts "$pageno $name $path"
! 78: }
! 79: exit 0
! 80: }
! 81: if {$flags(-stats)} {
! 82: db eval {CREATE VIRTUAL TABLE temp.stat USING dbstat}
! 83: puts "BEGIN;"
! 84: puts "CREATE TABLE stats("
! 85: puts " name STRING, /* Name of table or index */"
! 86: puts " path INTEGER, /* Path to page from root */"
! 87: puts " pageno INTEGER, /* Page number */"
! 88: puts " pagetype STRING, /* 'internal', 'leaf' or 'overflow' */"
! 89: puts " ncell INTEGER, /* Cells on page (0 for overflow) */"
! 90: puts " payload INTEGER, /* Bytes of payload on this page */"
! 91: puts " unused INTEGER, /* Bytes of unused space on this page */"
! 92: puts " mx_payload INTEGER, /* Largest payload size of all cells */"
! 93: puts " pgoffset INTEGER, /* Offset of page in file */"
! 94: puts " pgsize INTEGER /* Size of the page */"
! 95: puts ");"
! 96: db eval {SELECT quote(name) || ',' ||
! 97: quote(path) || ',' ||
! 98: quote(pageno) || ',' ||
! 99: quote(pagetype) || ',' ||
! 100: quote(ncell) || ',' ||
! 101: quote(payload) || ',' ||
! 102: quote(unused) || ',' ||
! 103: quote(mx_payload) || ',' ||
! 104: quote(pgoffset) || ',' ||
! 105: quote(pgsize) AS x FROM stat} {
! 106: puts "INSERT INTO stats VALUES($x);"
! 107: }
! 108: puts "COMMIT;"
! 109: exit 0
! 110: }
! 111:
! 112: # In-memory database for collecting statistics. This script loops through
! 113: # the tables and indices in the database being analyzed, adding a row for each
! 114: # to an in-memory database (for which the schema is shown below). It then
! 115: # queries the in-memory db to produce the space-analysis report.
! 116: #
! 117: sqlite3 mem :memory:
! 118: set tabledef {CREATE TABLE space_used(
! 119: name clob, -- Name of a table or index in the database file
! 120: tblname clob, -- Name of associated table
! 121: is_index boolean, -- TRUE if it is an index, false for a table
! 122: nentry int, -- Number of entries in the BTree
! 123: leaf_entries int, -- Number of leaf entries
! 124: payload int, -- Total amount of data stored in this table or index
! 125: ovfl_payload int, -- Total amount of data stored on overflow pages
! 126: ovfl_cnt int, -- Number of entries that use overflow
! 127: mx_payload int, -- Maximum payload size
! 128: int_pages int, -- Number of interior pages used
! 129: leaf_pages int, -- Number of leaf pages used
! 130: ovfl_pages int, -- Number of overflow pages used
! 131: int_unused int, -- Number of unused bytes on interior pages
! 132: leaf_unused int, -- Number of unused bytes on primary pages
! 133: ovfl_unused int, -- Number of unused bytes on overflow pages
! 134: gap_cnt int, -- Number of gaps in the page layout
! 135: compressed_size int -- Total bytes stored on disk
! 136: );}
! 137: mem eval $tabledef
! 138:
! 139: # Create a temporary "dbstat" virtual table.
! 140: #
! 141: db eval {CREATE VIRTUAL TABLE temp.stat USING dbstat}
! 142: db eval {CREATE TEMP TABLE dbstat AS SELECT * FROM temp.stat
! 143: ORDER BY name, path}
! 144: db eval {DROP TABLE temp.stat}
! 145:
! 146: proc isleaf {pagetype is_index} {
! 147: return [expr {$pagetype == "leaf" || ($pagetype == "internal" && $is_index)}]
! 148: }
! 149: proc isoverflow {pagetype is_index} {
! 150: return [expr {$pagetype == "overflow"}]
! 151: }
! 152: proc isinternal {pagetype is_index} {
! 153: return [expr {$pagetype == "internal" && $is_index==0}]
! 154: }
! 155:
! 156: db func isleaf isleaf
! 157: db func isinternal isinternal
! 158: db func isoverflow isoverflow
! 159:
! 160: set isCompressed 0
! 161: set compressOverhead 0
! 162: set sql { SELECT name, tbl_name FROM sqlite_master WHERE rootpage>0 }
! 163: foreach {name tblname} [concat sqlite_master sqlite_master [db eval $sql]] {
! 164:
! 165: set is_index [expr {$name!=$tblname}]
! 166: db eval {
! 167: SELECT
! 168: sum(ncell) AS nentry,
! 169: sum(isleaf(pagetype, $is_index) * ncell) AS leaf_entries,
! 170: sum(payload) AS payload,
! 171: sum(isoverflow(pagetype, $is_index) * payload) AS ovfl_payload,
! 172: sum(path LIKE '%+000000') AS ovfl_cnt,
! 173: max(mx_payload) AS mx_payload,
! 174: sum(isinternal(pagetype, $is_index)) AS int_pages,
! 175: sum(isleaf(pagetype, $is_index)) AS leaf_pages,
! 176: sum(isoverflow(pagetype, $is_index)) AS ovfl_pages,
! 177: sum(isinternal(pagetype, $is_index) * unused) AS int_unused,
! 178: sum(isleaf(pagetype, $is_index) * unused) AS leaf_unused,
! 179: sum(isoverflow(pagetype, $is_index) * unused) AS ovfl_unused,
! 180: sum(pgsize) AS compressed_size
! 181: FROM temp.dbstat WHERE name = $name
! 182: } break
! 183:
! 184: set total_pages [expr {$leaf_pages+$int_pages+$ovfl_pages}]
! 185: set storage [expr {$total_pages*$pageSize}]
! 186: if {!$isCompressed && $storage>$compressed_size} {
! 187: set isCompressed 1
! 188: set compressOverhead 14
! 189: }
! 190:
! 191: # Column 'gap_cnt' is set to the number of non-contiguous entries in the
! 192: # list of pages visited if the b-tree structure is traversed in a top-down
! 193: # fashion (each node visited before its child-tree is passed). Any overflow
! 194: # chains present are traversed from start to finish before any child-tree
! 195: # is.
! 196: #
! 197: set gap_cnt 0
! 198: set pglist [db eval {
! 199: SELECT pageno FROM temp.dbstat WHERE name = $name ORDER BY rowid
! 200: }]
! 201: set prev [lindex $pglist 0]
! 202: foreach pgno [lrange $pglist 1 end] {
! 203: if {$pgno != $prev+1} {incr gap_cnt}
! 204: set prev $pgno
! 205: }
! 206:
! 207: mem eval {
! 208: INSERT INTO space_used VALUES(
! 209: $name,
! 210: $tblname,
! 211: $is_index,
! 212: $nentry,
! 213: $leaf_entries,
! 214: $payload,
! 215: $ovfl_payload,
! 216: $ovfl_cnt,
! 217: $mx_payload,
! 218: $int_pages,
! 219: $leaf_pages,
! 220: $ovfl_pages,
! 221: $int_unused,
! 222: $leaf_unused,
! 223: $ovfl_unused,
! 224: $gap_cnt,
! 225: $compressed_size
! 226: );
! 227: }
! 228: }
! 229:
! 230: proc integerify {real} {
! 231: if {[string is double -strict $real]} {
! 232: return [expr {wide($real)}]
! 233: } else {
! 234: return 0
! 235: }
! 236: }
! 237: mem function int integerify
! 238:
! 239: # Quote a string for use in an SQL query. Examples:
! 240: #
! 241: # [quote {hello world}] == {'hello world'}
! 242: # [quote {hello world's}] == {'hello world''s'}
! 243: #
! 244: proc quote {txt} {
! 245: regsub -all ' $txt '' q
! 246: return '$q'
! 247: }
! 248:
! 249: # Generate a single line of output in the statistics section of the
! 250: # report.
! 251: #
! 252: proc statline {title value {extra {}}} {
! 253: set len [string length $title]
! 254: set dots [string range {......................................} $len end]
! 255: set len [string length $value]
! 256: set sp2 [string range { } $len end]
! 257: if {$extra ne ""} {
! 258: set extra " $extra"
! 259: }
! 260: puts "$title$dots $value$sp2$extra"
! 261: }
! 262:
! 263: # Generate a formatted percentage value for $num/$denom
! 264: #
! 265: proc percent {num denom {of {}}} {
! 266: if {$denom==0.0} {return ""}
! 267: set v [expr {$num*100.0/$denom}]
! 268: set of {}
! 269: if {$v==100.0 || $v<0.001 || ($v>1.0 && $v<99.0)} {
! 270: return [format {%5.1f%% %s} $v $of]
! 271: } elseif {$v<0.1 || $v>99.9} {
! 272: return [format {%7.3f%% %s} $v $of]
! 273: } else {
! 274: return [format {%6.2f%% %s} $v $of]
! 275: }
! 276: }
! 277:
! 278: proc divide {num denom} {
! 279: if {$denom==0} {return 0.0}
! 280: return [format %.2f [expr double($num)/double($denom)]]
! 281: }
! 282:
! 283: # Generate a subreport that covers some subset of the database.
! 284: # the $where clause determines which subset to analyze.
! 285: #
! 286: proc subreport {title where} {
! 287: global pageSize file_pgcnt compressOverhead
! 288:
! 289: # Query the in-memory database for the sum of various statistics
! 290: # for the subset of tables/indices identified by the WHERE clause in
! 291: # $where. Note that even if the WHERE clause matches no rows, the
! 292: # following query returns exactly one row (because it is an aggregate).
! 293: #
! 294: # The results of the query are stored directly by SQLite into local
! 295: # variables (i.e. $nentry, $nleaf etc.).
! 296: #
! 297: mem eval "
! 298: SELECT
! 299: int(sum(nentry)) AS nentry,
! 300: int(sum(leaf_entries)) AS nleaf,
! 301: int(sum(payload)) AS payload,
! 302: int(sum(ovfl_payload)) AS ovfl_payload,
! 303: max(mx_payload) AS mx_payload,
! 304: int(sum(ovfl_cnt)) as ovfl_cnt,
! 305: int(sum(leaf_pages)) AS leaf_pages,
! 306: int(sum(int_pages)) AS int_pages,
! 307: int(sum(ovfl_pages)) AS ovfl_pages,
! 308: int(sum(leaf_unused)) AS leaf_unused,
! 309: int(sum(int_unused)) AS int_unused,
! 310: int(sum(ovfl_unused)) AS ovfl_unused,
! 311: int(sum(gap_cnt)) AS gap_cnt,
! 312: int(sum(compressed_size)) AS compressed_size
! 313: FROM space_used WHERE $where" {} {}
! 314:
! 315: # Output the sub-report title, nicely decorated with * characters.
! 316: #
! 317: puts ""
! 318: set len [string length $title]
! 319: set stars [string repeat * [expr 65-$len]]
! 320: puts "*** $title $stars"
! 321: puts ""
! 322:
! 323: # Calculate statistics and store the results in TCL variables, as follows:
! 324: #
! 325: # total_pages: Database pages consumed.
! 326: # total_pages_percent: Pages consumed as a percentage of the file.
! 327: # storage: Bytes consumed.
! 328: # payload_percent: Payload bytes used as a percentage of $storage.
! 329: # total_unused: Unused bytes on pages.
! 330: # avg_payload: Average payload per btree entry.
! 331: # avg_fanout: Average fanout for internal pages.
! 332: # avg_unused: Average unused bytes per btree entry.
! 333: # ovfl_cnt_percent: Percentage of btree entries that use overflow pages.
! 334: #
! 335: set total_pages [expr {$leaf_pages+$int_pages+$ovfl_pages}]
! 336: set total_pages_percent [percent $total_pages $file_pgcnt]
! 337: set storage [expr {$total_pages*$pageSize}]
! 338: set payload_percent [percent $payload $storage {of storage consumed}]
! 339: set total_unused [expr {$ovfl_unused+$int_unused+$leaf_unused}]
! 340: set avg_payload [divide $payload $nleaf]
! 341: set avg_unused [divide $total_unused $nleaf]
! 342: if {$int_pages>0} {
! 343: # TODO: Is this formula correct?
! 344: set nTab [mem eval "
! 345: SELECT count(*) FROM (
! 346: SELECT DISTINCT tblname FROM space_used WHERE $where AND is_index=0
! 347: )
! 348: "]
! 349: set avg_fanout [mem eval "
! 350: SELECT (sum(leaf_pages+int_pages)-$nTab)/sum(int_pages) FROM space_used
! 351: WHERE $where AND is_index = 0
! 352: "]
! 353: set avg_fanout [format %.2f $avg_fanout]
! 354: }
! 355: set ovfl_cnt_percent [percent $ovfl_cnt $nleaf {of all entries}]
! 356:
! 357: # Print out the sub-report statistics.
! 358: #
! 359: statline {Percentage of total database} $total_pages_percent
! 360: statline {Number of entries} $nleaf
! 361: statline {Bytes of storage consumed} $storage
! 362: if {$compressed_size!=$storage} {
! 363: set compressed_size [expr {$compressed_size+$compressOverhead*$total_pages}]
! 364: set pct [expr {$compressed_size*100.0/$storage}]
! 365: set pct [format {%5.1f%%} $pct]
! 366: statline {Bytes used after compression} $compressed_size $pct
! 367: }
! 368: statline {Bytes of payload} $payload $payload_percent
! 369: statline {Average payload per entry} $avg_payload
! 370: statline {Average unused bytes per entry} $avg_unused
! 371: if {[info exists avg_fanout]} {
! 372: statline {Average fanout} $avg_fanout
! 373: }
! 374: if {$total_pages>1} {
! 375: set fragmentation [percent $gap_cnt [expr {$total_pages-1}] {fragmentation}]
! 376: statline {Fragmentation} $fragmentation
! 377: }
! 378: statline {Maximum payload per entry} $mx_payload
! 379: statline {Entries that use overflow} $ovfl_cnt $ovfl_cnt_percent
! 380: if {$int_pages>0} {
! 381: statline {Index pages used} $int_pages
! 382: }
! 383: statline {Primary pages used} $leaf_pages
! 384: statline {Overflow pages used} $ovfl_pages
! 385: statline {Total pages used} $total_pages
! 386: if {$int_unused>0} {
! 387: set int_unused_percent [
! 388: percent $int_unused [expr {$int_pages*$pageSize}] {of index space}]
! 389: statline "Unused bytes on index pages" $int_unused $int_unused_percent
! 390: }
! 391: statline "Unused bytes on primary pages" $leaf_unused [
! 392: percent $leaf_unused [expr {$leaf_pages*$pageSize}] {of primary space}]
! 393: statline "Unused bytes on overflow pages" $ovfl_unused [
! 394: percent $ovfl_unused [expr {$ovfl_pages*$pageSize}] {of overflow space}]
! 395: statline "Unused bytes on all pages" $total_unused [
! 396: percent $total_unused $storage {of all space}]
! 397: return 1
! 398: }
! 399:
! 400: # Calculate the overhead in pages caused by auto-vacuum.
! 401: #
! 402: # This procedure calculates and returns the number of pages used by the
! 403: # auto-vacuum 'pointer-map'. If the database does not support auto-vacuum,
! 404: # then 0 is returned. The two arguments are the size of the database file in
! 405: # pages and the page size used by the database (in bytes).
! 406: proc autovacuum_overhead {filePages pageSize} {
! 407:
! 408: # Set $autovacuum to non-zero for databases that support auto-vacuum.
! 409: set autovacuum [db one {PRAGMA auto_vacuum}]
! 410:
! 411: # If the database is not an auto-vacuum database or the file consists
! 412: # of one page only then there is no overhead for auto-vacuum. Return zero.
! 413: if {0==$autovacuum || $filePages==1} {
! 414: return 0
! 415: }
! 416:
! 417: # The number of entries on each pointer map page. The layout of the
! 418: # database file is one pointer-map page, followed by $ptrsPerPage other
! 419: # pages, followed by a pointer-map page etc. The first pointer-map page
! 420: # is the second page of the file overall.
! 421: set ptrsPerPage [expr double($pageSize/5)]
! 422:
! 423: # Return the number of pointer map pages in the database.
! 424: return [expr wide(ceil( ($filePages-1.0)/($ptrsPerPage+1.0) ))]
! 425: }
! 426:
! 427:
! 428: # Calculate the summary statistics for the database and store the results
! 429: # in TCL variables. They are output below. Variables are as follows:
! 430: #
! 431: # pageSize: Size of each page in bytes.
! 432: # file_bytes: File size in bytes.
! 433: # file_pgcnt: Number of pages in the file.
! 434: # file_pgcnt2: Number of pages in the file (calculated).
! 435: # av_pgcnt: Pages consumed by the auto-vacuum pointer-map.
! 436: # av_percent: Percentage of the file consumed by auto-vacuum pointer-map.
! 437: # inuse_pgcnt: Data pages in the file.
! 438: # inuse_percent: Percentage of pages used to store data.
! 439: # free_pgcnt: Free pages calculated as (<total pages> - <in-use pages>)
! 440: # free_pgcnt2: Free pages in the file according to the file header.
! 441: # free_percent: Percentage of file consumed by free pages (calculated).
! 442: # free_percent2: Percentage of file consumed by free pages (header).
! 443: # ntable: Number of tables in the db.
! 444: # nindex: Number of indices in the db.
! 445: # nautoindex: Number of indices created automatically.
! 446: # nmanindex: Number of indices created manually.
! 447: # user_payload: Number of bytes of payload in table btrees
! 448: # (not including sqlite_master)
! 449: # user_percent: $user_payload as a percentage of total file size.
! 450:
! 451: ### The following, setting $file_bytes based on the actual size of the file
! 452: ### on disk, causes this tool to choke on zipvfs databases. So set it based
! 453: ### on the return of [PRAGMA page_count] instead.
! 454: if 0 {
! 455: set file_bytes [file size $file_to_analyze]
! 456: set file_pgcnt [expr {$file_bytes/$pageSize}]
! 457: }
! 458: set file_pgcnt [db one {PRAGMA page_count}]
! 459: set file_bytes [expr {$file_pgcnt * $pageSize}]
! 460:
! 461: set av_pgcnt [autovacuum_overhead $file_pgcnt $pageSize]
! 462: set av_percent [percent $av_pgcnt $file_pgcnt]
! 463:
! 464: set sql {SELECT sum(leaf_pages+int_pages+ovfl_pages) FROM space_used}
! 465: set inuse_pgcnt [expr wide([mem eval $sql])]
! 466: set inuse_percent [percent $inuse_pgcnt $file_pgcnt]
! 467:
! 468: set free_pgcnt [expr {$file_pgcnt-$inuse_pgcnt-$av_pgcnt}]
! 469: set free_percent [percent $free_pgcnt $file_pgcnt]
! 470: set free_pgcnt2 [db one {PRAGMA freelist_count}]
! 471: set free_percent2 [percent $free_pgcnt2 $file_pgcnt]
! 472:
! 473: set file_pgcnt2 [expr {$inuse_pgcnt+$free_pgcnt2+$av_pgcnt}]
! 474:
! 475: set ntable [db eval {SELECT count(*)+1 FROM sqlite_master WHERE type='table'}]
! 476: set nindex [db eval {SELECT count(*) FROM sqlite_master WHERE type='index'}]
! 477: set sql {SELECT count(*) FROM sqlite_master WHERE name LIKE 'sqlite_autoindex%'}
! 478: set nautoindex [db eval $sql]
! 479: set nmanindex [expr {$nindex-$nautoindex}]
! 480:
! 481: # set total_payload [mem eval "SELECT sum(payload) FROM space_used"]
! 482: set user_payload [mem one {SELECT int(sum(payload)) FROM space_used
! 483: WHERE NOT is_index AND name NOT LIKE 'sqlite_master'}]
! 484: set user_percent [percent $user_payload $file_bytes]
! 485:
! 486: # Output the summary statistics calculated above.
! 487: #
! 488: puts "/** Disk-Space Utilization Report For $file_to_analyze"
! 489: catch {
! 490: puts "*** As of [clock format [clock seconds] -format {%Y-%b-%d %H:%M:%S}]"
! 491: }
! 492: puts ""
! 493: statline {Page size in bytes} $pageSize
! 494: statline {Pages in the whole file (measured)} $file_pgcnt
! 495: statline {Pages in the whole file (calculated)} $file_pgcnt2
! 496: statline {Pages that store data} $inuse_pgcnt $inuse_percent
! 497: statline {Pages on the freelist (per header)} $free_pgcnt2 $free_percent2
! 498: statline {Pages on the freelist (calculated)} $free_pgcnt $free_percent
! 499: statline {Pages of auto-vacuum overhead} $av_pgcnt $av_percent
! 500: statline {Number of tables in the database} $ntable
! 501: statline {Number of indices} $nindex
! 502: statline {Number of named indices} $nmanindex
! 503: statline {Automatically generated indices} $nautoindex
! 504: if {$isCompressed} {
! 505: statline {Size of uncompressed content in bytes} $file_bytes
! 506: set efficiency [percent $true_file_size $file_bytes]
! 507: statline {Size of compressed file on disk} $true_file_size $efficiency
! 508: } else {
! 509: statline {Size of the file in bytes} $file_bytes
! 510: }
! 511: statline {Bytes of user payload stored} $user_payload $user_percent
! 512:
! 513: # Output table rankings
! 514: #
! 515: puts ""
! 516: puts "*** Page counts for all tables with their indices ********************"
! 517: puts ""
! 518: mem eval {SELECT tblname, count(*) AS cnt,
! 519: int(sum(int_pages+leaf_pages+ovfl_pages)) AS size
! 520: FROM space_used GROUP BY tblname ORDER BY size+0 DESC, tblname} {} {
! 521: statline [string toupper $tblname] $size [percent $size $file_pgcnt]
! 522: }
! 523: if {$isCompressed} {
! 524: puts ""
! 525: puts "*** Bytes of disk space used after compression ***********************"
! 526: puts ""
! 527: set csum 0
! 528: mem eval {SELECT tblname,
! 529: int(sum(compressed_size)) +
! 530: $compressOverhead*sum(int_pages+leaf_pages+ovfl_pages)
! 531: AS csize
! 532: FROM space_used GROUP BY tblname ORDER BY csize+0 DESC, tblname} {} {
! 533: incr csum $csize
! 534: statline [string toupper $tblname] $csize [percent $csize $true_file_size]
! 535: }
! 536: set overhead [expr {$true_file_size - $csum}]
! 537: if {$overhead>0} {
! 538: statline {Header and free space} $overhead [percent $overhead $true_file_size]
! 539: }
! 540: }
! 541:
! 542: # Output subreports
! 543: #
! 544: if {$nindex>0} {
! 545: subreport {All tables and indices} 1
! 546: }
! 547: subreport {All tables} {NOT is_index}
! 548: if {$nindex>0} {
! 549: subreport {All indices} {is_index}
! 550: }
! 551: foreach tbl [mem eval {SELECT name FROM space_used WHERE NOT is_index
! 552: ORDER BY name}] {
! 553: regsub ' $tbl '' qn
! 554: set name [string toupper $tbl]
! 555: set n [mem eval "SELECT count(*) FROM space_used WHERE tblname='$qn'"]
! 556: if {$n>1} {
! 557: subreport "Table $name and all its indices" "tblname='$qn'"
! 558: subreport "Table $name w/o any indices" "name='$qn'"
! 559: subreport "Indices of table $name" "tblname='$qn' AND is_index"
! 560: } else {
! 561: subreport "Table $name" "name='$qn'"
! 562: }
! 563: }
! 564:
! 565: # Output instructions on what the numbers above mean.
! 566: #
! 567: puts {
! 568: *** Definitions ******************************************************
! 569:
! 570: Page size in bytes
! 571:
! 572: The number of bytes in a single page of the database file.
! 573: Usually 1024.
! 574:
! 575: Number of pages in the whole file
! 576: }
! 577: puts " The number of $pageSize-byte pages that go into forming the complete
! 578: database"
! 579: puts {
! 580: Pages that store data
! 581:
! 582: The number of pages that store data, either as primary B*Tree pages or
! 583: as overflow pages. The number at the right is the data pages divided by
! 584: the total number of pages in the file.
! 585:
! 586: Pages on the freelist
! 587:
! 588: The number of pages that are not currently in use but are reserved for
! 589: future use. The percentage at the right is the number of freelist pages
! 590: divided by the total number of pages in the file.
! 591:
! 592: Pages of auto-vacuum overhead
! 593:
! 594: The number of pages that store data used by the database to facilitate
! 595: auto-vacuum. This is zero for databases that do not support auto-vacuum.
! 596:
! 597: Number of tables in the database
! 598:
! 599: The number of tables in the database, including the SQLITE_MASTER table
! 600: used to store schema information.
! 601:
! 602: Number of indices
! 603:
! 604: The total number of indices in the database.
! 605:
! 606: Number of named indices
! 607:
! 608: The number of indices created using an explicit CREATE INDEX statement.
! 609:
! 610: Automatically generated indices
! 611:
! 612: The number of indices used to implement PRIMARY KEY or UNIQUE constraints
! 613: on tables.
! 614:
! 615: Size of the file in bytes
! 616:
! 617: The total amount of disk space used by the entire database files.
! 618:
! 619: Bytes of user payload stored
! 620:
! 621: The total number of bytes of user payload stored in the database. The
! 622: schema information in the SQLITE_MASTER table is not counted when
! 623: computing this number. The percentage at the right shows the payload
! 624: divided by the total file size.
! 625:
! 626: Percentage of total database
! 627:
! 628: The amount of the complete database file that is devoted to storing
! 629: information described by this category.
! 630:
! 631: Number of entries
! 632:
! 633: The total number of B-Tree key/value pairs stored under this category.
! 634:
! 635: Bytes of storage consumed
! 636:
! 637: The total amount of disk space required to store all B-Tree entries
! 638: under this category. The is the total number of pages used times
! 639: the pages size.
! 640:
! 641: Bytes of payload
! 642:
! 643: The amount of payload stored under this category. Payload is the data
! 644: part of table entries and the key part of index entries. The percentage
! 645: at the right is the bytes of payload divided by the bytes of storage
! 646: consumed.
! 647:
! 648: Average payload per entry
! 649:
! 650: The average amount of payload on each entry. This is just the bytes of
! 651: payload divided by the number of entries.
! 652:
! 653: Average unused bytes per entry
! 654:
! 655: The average amount of free space remaining on all pages under this
! 656: category on a per-entry basis. This is the number of unused bytes on
! 657: all pages divided by the number of entries.
! 658:
! 659: Fragmentation
! 660:
! 661: The percentage of pages in the table or index that are not
! 662: consecutive in the disk file. Many filesystems are optimized
! 663: for sequential file access so smaller fragmentation numbers
! 664: sometimes result in faster queries, especially for larger
! 665: database files that do not fit in the disk cache.
! 666:
! 667: Maximum payload per entry
! 668:
! 669: The largest payload size of any entry.
! 670:
! 671: Entries that use overflow
! 672:
! 673: The number of entries that user one or more overflow pages.
! 674:
! 675: Total pages used
! 676:
! 677: This is the number of pages used to hold all information in the current
! 678: category. This is the sum of index, primary, and overflow pages.
! 679:
! 680: Index pages used
! 681:
! 682: This is the number of pages in a table B-tree that hold only key (rowid)
! 683: information and no data.
! 684:
! 685: Primary pages used
! 686:
! 687: This is the number of B-tree pages that hold both key and data.
! 688:
! 689: Overflow pages used
! 690:
! 691: The total number of overflow pages used for this category.
! 692:
! 693: Unused bytes on index pages
! 694:
! 695: The total number of bytes of unused space on all index pages. The
! 696: percentage at the right is the number of unused bytes divided by the
! 697: total number of bytes on index pages.
! 698:
! 699: Unused bytes on primary pages
! 700:
! 701: The total number of bytes of unused space on all primary pages. The
! 702: percentage at the right is the number of unused bytes divided by the
! 703: total number of bytes on primary pages.
! 704:
! 705: Unused bytes on overflow pages
! 706:
! 707: The total number of bytes of unused space on all overflow pages. The
! 708: percentage at the right is the number of unused bytes divided by the
! 709: total number of bytes on overflow pages.
! 710:
! 711: Unused bytes on all pages
! 712:
! 713: The total number of bytes of unused space on all primary and overflow
! 714: pages. The percentage at the right is the number of unused bytes
! 715: divided by the total number of bytes.
! 716: }
! 717:
! 718: # Output a dump of the in-memory database. This can be used for more
! 719: # complex offline analysis.
! 720: #
! 721: puts "**********************************************************************"
! 722: puts "The entire text of this report can be sourced into any SQL database"
! 723: puts "engine for further analysis. All of the text above is an SQL comment."
! 724: puts "The data used to generate this report follows:"
! 725: puts "*/"
! 726: puts "BEGIN;"
! 727: puts $tabledef
! 728: unset -nocomplain x
! 729: mem eval {SELECT * FROM space_used} x {
! 730: puts -nonewline "INSERT INTO space_used VALUES"
! 731: set sep (
! 732: foreach col $x(*) {
! 733: set v $x($col)
! 734: if {$v=="" || ![string is double $v]} {set v [quote $v]}
! 735: puts -nonewline $sep$v
! 736: set sep ,
! 737: }
! 738: puts ");"
! 739: }
! 740: puts "COMMIT;"
! 741:
! 742: } err]} {
! 743: puts "ERROR: $err"
! 744: puts $errorInfo
! 745: exit 1
! 746: }
FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>