third_party/sqlite/sqlite-src-3080704/tool/spaceanal.tcl - Issue 949043002: Add //third_party/sqlite to dirs_to_snapshot, remove net_sql.patch

Unified Diff: third_party/sqlite/sqlite-src-3080704/tool/spaceanal.tcl

Issue 949043002: Add //third_party/sqlite to dirs_to_snapshot, remove net_sql.patch (Closed) Base URL: git@github.com:domokit/mojo.git@master

Patch Set: Created 5 years, 10 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« no previous file with comments | « third_party/sqlite/sqlite-src-3080704/tool/space_used.tcl ('k') | third_party/sqlite/sqlite-src-3080704/tool/speedtest.tcl » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: third_party/sqlite/sqlite-src-3080704/tool/spaceanal.tcl

diff --git a/third_party/sqlite/sqlite-src-3080704/tool/spaceanal.tcl b/third_party/sqlite/sqlite-src-3080704/tool/spaceanal.tcl

new file mode 100644

index 0000000000000000000000000000000000000000..a227b8524359c00b9e75f052c092d5e65ab0575f

--- /dev/null

+++ b/third_party/sqlite/sqlite-src-3080704/tool/spaceanal.tcl

@@ -0,0 +1,781 @@

+# Run this TCL script using "testfixture" in order get a report that shows

+# how much disk space is used by a particular data to actually store data

+# versus how much space is unused.

+if {[catch {

+# Get the name of the database to analyze

+proc usage {} {

+ set argv0 [file rootname [file tail [info nameofexecutable]]]

+ puts stderr "Usage: $argv0 database-name"

+ exit 1

+set file_to_analyze {}

+set flags(-pageinfo) 0

+set flags(-stats) 0

+append argv {}

+foreach arg $argv {

+ if {[regexp {^-+pageinfo$} $arg]} {

+ set flags(-pageinfo) 1

+ } elseif {[regexp {^-+stats$} $arg]} {

+ set flags(-stats) 1

+ } elseif {[regexp {^-} $arg]} {

+ puts stderr "Unknown option: $arg"

+ usage

+ } elseif {$file_to_analyze!=""} {

+ usage

+ } else {

+ set file_to_analyze $arg

+ }

+if {$file_to_analyze==""} usage

+set root_filename $file_to_analyze

+regexp {^file:(//)?([^?]*)} $file_to_analyze all x1 root_filename

+if {![file exists $root_filename]} {

+ puts stderr "No such file: $root_filename"

+ exit 1

+if {![file readable $root_filename]} {

+ puts stderr "File is not readable: $root_filename"

+ exit 1

+set true_file_size [file size $root_filename]

+if {$true_file_size<512} {

+ puts stderr "Empty or malformed database: $root_filename"

+ exit 1

+# Compute the total file size assuming test_multiplexor is being used.

+# Assume that SQLITE_ENABLE_8_3_NAMES might be enabled

+set extension [file extension $root_filename]

+set pattern $root_filename

+append pattern {[0-3][0-9][0-9]}

+foreach f [glob -nocomplain $pattern] {

+ incr true_file_size [file size $f]

+ set extension {}

+if {[string length $extension]>=2 && [string length $extension]<=4} {

+ set pattern [file rootname $root_filename]

+ append pattern {.[0-3][0-9][0-9]}

+ foreach f [glob -nocomplain $pattern] {

+ incr true_file_size [file size $f]

+ }

+# Open the database

+if {[catch {sqlite3 db $file_to_analyze -uri 1} msg]} {

+ puts stderr "error trying to open $file_to_analyze: $msg"

+ exit 1

+register_dbstat_vtab db

+db eval {SELECT count(*) FROM sqlite_master}

+set pageSize [expr {wide([db one {PRAGMA page_size}])}]

+if {$flags(-pageinfo)} {

+ db eval {CREATE VIRTUAL TABLE temp.stat USING dbstat}

+ db eval {SELECT name, path, pageno FROM temp.stat ORDER BY pageno} {

+ puts "$pageno $name $path"

+ }

+ exit 0

+if {$flags(-stats)} {

+ db eval {CREATE VIRTUAL TABLE temp.stat USING dbstat}

+ puts "BEGIN;"

+ puts "CREATE TABLE stats("

+ puts " name STRING, /* Name of table or index */"

+ puts " path INTEGER, /* Path to page from root */"

+ puts " pageno INTEGER, /* Page number */"

+ puts " pagetype STRING, /* 'internal', 'leaf' or 'overflow' */"

+ puts " ncell INTEGER, /* Cells on page (0 for overflow) */"

+ puts " payload INTEGER, /* Bytes of payload on this page */"

+ puts " unused INTEGER, /* Bytes of unused space on this page */"

+ puts " mx_payload INTEGER, /* Largest payload size of all cells */"

+ puts " pgoffset INTEGER, /* Offset of page in file */"

+ puts " pgsize INTEGER /* Size of the page */"

+ puts ");"

+ db eval {SELECT quote(name) || ',' ||

+ quote(path) || ',' ||

+ quote(pageno) || ',' ||

+ quote(pagetype) || ',' ||

+ quote(ncell) || ',' ||

+ quote(payload) || ',' ||

+ quote(unused) || ',' ||

+ quote(mx_payload) || ',' ||

+ quote(pgoffset) || ',' ||

+ quote(pgsize) AS x FROM stat} {

+ puts "INSERT INTO stats VALUES($x);"

+ }

+ puts "COMMIT;"

+ exit 0

+# In-memory database for collecting statistics. This script loops through

+# the tables and indices in the database being analyzed, adding a row for each

+# to an in-memory database (for which the schema is shown below). It then

+# queries the in-memory db to produce the space-analysis report.

+sqlite3 mem :memory:

+set tabledef {CREATE TABLE space_used(

+ name clob, -- Name of a table or index in the database file

+ tblname clob, -- Name of associated table

+ is_index boolean, -- TRUE if it is an index, false for a table

+ nentry int, -- Number of entries in the BTree

+ leaf_entries int, -- Number of leaf entries

+ payload int, -- Total amount of data stored in this table or index

+ ovfl_payload int, -- Total amount of data stored on overflow pages

+ ovfl_cnt int, -- Number of entries that use overflow

+ mx_payload int, -- Maximum payload size

+ int_pages int, -- Number of interior pages used

+ leaf_pages int, -- Number of leaf pages used

+ ovfl_pages int, -- Number of overflow pages used

+ int_unused int, -- Number of unused bytes on interior pages

+ leaf_unused int, -- Number of unused bytes on primary pages

+ ovfl_unused int, -- Number of unused bytes on overflow pages

+ gap_cnt int, -- Number of gaps in the page layout

+ compressed_size int -- Total bytes stored on disk

+);}

+mem eval $tabledef

+# Create a temporary "dbstat" virtual table.

+db eval {CREATE VIRTUAL TABLE temp.stat USING dbstat}

+db eval {CREATE TEMP TABLE dbstat AS SELECT * FROM temp.stat

+ ORDER BY name, path}

+db eval {DROP TABLE temp.stat}

+proc isleaf {pagetype is_index} {

+ return [expr {$pagetype == "leaf" || ($pagetype == "internal" && $is_index)}]

+proc isoverflow {pagetype is_index} {

+ return [expr {$pagetype == "overflow"}]

+proc isinternal {pagetype is_index} {

+ return [expr {$pagetype == "internal" && $is_index==0}]

+db func isleaf isleaf

+db func isinternal isinternal

+db func isoverflow isoverflow

+set isCompressed 0

+set compressOverhead 0

+set sql { SELECT name, tbl_name FROM sqlite_master WHERE rootpage>0 }

+foreach {name tblname} [concat sqlite_master sqlite_master [db eval $sql]] {

+ set is_index [expr {$name!=$tblname}]

+ db eval {

+ SELECT

+ sum(ncell) AS nentry,

+ sum(isleaf(pagetype, $is_index) * ncell) AS leaf_entries,

+ sum(payload) AS payload,

+ sum(isoverflow(pagetype, $is_index) * payload) AS ovfl_payload,

+ sum(path LIKE '%+000000') AS ovfl_cnt,

+ max(mx_payload) AS mx_payload,

+ sum(isinternal(pagetype, $is_index)) AS int_pages,

+ sum(isleaf(pagetype, $is_index)) AS leaf_pages,

+ sum(isoverflow(pagetype, $is_index)) AS ovfl_pages,

+ sum(isinternal(pagetype, $is_index) * unused) AS int_unused,

+ sum(isleaf(pagetype, $is_index) * unused) AS leaf_unused,

+ sum(isoverflow(pagetype, $is_index) * unused) AS ovfl_unused,

+ sum(pgsize) AS compressed_size

+ FROM temp.dbstat WHERE name = $name

+ } break

+ set total_pages [expr {$leaf_pages+$int_pages+$ovfl_pages}]

+ set storage [expr {$total_pages*$pageSize}]

+ if {!$isCompressed && $storage>$compressed_size} {

+ set isCompressed 1

+ set compressOverhead 14

+ }

+ # Column 'gap_cnt' is set to the number of non-contiguous entries in the

+ # list of pages visited if the b-tree structure is traversed in a top-down

+ # fashion (each node visited before its child-tree is passed). Any overflow

+ # chains present are traversed from start to finish before any child-tree

+ # is.

+ #

+ set gap_cnt 0

+ set prev 0

+ db eval {

+ SELECT pageno, pagetype FROM temp.dbstat

+ WHERE name=$name

+ ORDER BY pageno

+ } {

+ if {$prev>0 && $pagetype=="leaf" && $pageno!=$prev+1} {

+ incr gap_cnt

+ }

+ set prev $pageno

+ }

+ mem eval {

+ INSERT INTO space_used VALUES(

+ $name,

+ $tblname,

+ $is_index,

+ $nentry,

+ $leaf_entries,

+ $payload,

+ $ovfl_payload,

+ $ovfl_cnt,

+ $mx_payload,

+ $int_pages,

+ $leaf_pages,

+ $ovfl_pages,

+ $int_unused,

+ $leaf_unused,

+ $ovfl_unused,

+ $gap_cnt,

+ $compressed_size

+ );

+ }

+proc integerify {real} {

+ if {[string is double -strict $real]} {

+ return [expr {wide($real)}]

+ } else {

+ return 0

+ }

+mem function int integerify

+# Quote a string for use in an SQL query. Examples:

+# [quote {hello world}] == {'hello world'}

+# [quote {hello world's}] == {'hello world''s'}

+proc quote {txt} {

+ return [string map {' ''} $txt]

+# Output a title line

+proc titleline {title} {

+ if {$title==""} {

+ puts [string repeat * 79]

+ } else {

+ set len [string length $title]

+ set stars [string repeat * [expr 79-$len-5]]

+ puts "*** $title $stars"

+ }

+# Generate a single line of output in the statistics section of the

+# report.

+proc statline {title value {extra {}}} {

+ set len [string length $title]

+ set dots [string repeat . [expr 50-$len]]

+ set len [string length $value]

+ set sp2 [string range { } $len end]

+ if {$extra ne ""} {

+ set extra " $extra"

+ }

+ puts "$title$dots $value$sp2$extra"

+# Generate a formatted percentage value for $num/$denom

+proc percent {num denom {of {}}} {

+ if {$denom==0.0} {return ""}

+ set v [expr {$num*100.0/$denom}]

+ set of {}

+ if {$v==100.0 || $v<0.001 || ($v>1.0 && $v<99.0)} {

+ return [format {%5.1f%% %s} $v $of]

+ } elseif {$v<0.1 || $v>99.9} {

+ return [format {%7.3f%% %s} $v $of]

+ } else {

+ return [format {%6.2f%% %s} $v $of]

+ }

+proc divide {num denom} {

+ if {$denom==0} {return 0.0}

+ return [format %.2f [expr double($num)/double($denom)]]

+# Generate a subreport that covers some subset of the database.

+# the $where clause determines which subset to analyze.

+proc subreport {title where showFrag} {

+ global pageSize file_pgcnt compressOverhead

+ # Query the in-memory database for the sum of various statistics

+ # for the subset of tables/indices identified by the WHERE clause in

+ # $where. Note that even if the WHERE clause matches no rows, the

+ # following query returns exactly one row (because it is an aggregate).

+ #

+ # The results of the query are stored directly by SQLite into local

+ # variables (i.e. $nentry, $nleaf etc.).

+ #

+ mem eval "

+ SELECT

+ int(sum(nentry)) AS nentry,

+ int(sum(leaf_entries)) AS nleaf,

+ int(sum(payload)) AS payload,

+ int(sum(ovfl_payload)) AS ovfl_payload,

+ max(mx_payload) AS mx_payload,

+ int(sum(ovfl_cnt)) as ovfl_cnt,

+ int(sum(leaf_pages)) AS leaf_pages,

+ int(sum(int_pages)) AS int_pages,

+ int(sum(ovfl_pages)) AS ovfl_pages,

+ int(sum(leaf_unused)) AS leaf_unused,

+ int(sum(int_unused)) AS int_unused,

+ int(sum(ovfl_unused)) AS ovfl_unused,

+ int(sum(gap_cnt)) AS gap_cnt,

+ int(sum(compressed_size)) AS compressed_size

+ FROM space_used WHERE $where" {} {}

+ # Output the sub-report title, nicely decorated with * characters.

+ #

+ puts ""

+ titleline $title

+ puts ""

+ # Calculate statistics and store the results in TCL variables, as follows:

+ #

+ # total_pages: Database pages consumed.

+ # total_pages_percent: Pages consumed as a percentage of the file.

+ # storage: Bytes consumed.

+ # payload_percent: Payload bytes used as a percentage of $storage.

+ # total_unused: Unused bytes on pages.

+ # avg_payload: Average payload per btree entry.

+ # avg_fanout: Average fanout for internal pages.

+ # avg_unused: Average unused bytes per btree entry.

+ # ovfl_cnt_percent: Percentage of btree entries that use overflow pages.

+ #

+ set total_pages [expr {$leaf_pages+$int_pages+$ovfl_pages}]

+ set total_pages_percent [percent $total_pages $file_pgcnt]

+ set storage [expr {$total_pages*$pageSize}]

+ set payload_percent [percent $payload $storage {of storage consumed}]

+ set total_unused [expr {$ovfl_unused+$int_unused+$leaf_unused}]

+ set avg_payload [divide $payload $nleaf]

+ set avg_unused [divide $total_unused $nleaf]

+ if {$int_pages>0} {

+ # TODO: Is this formula correct?

+ set nTab [mem eval "

+ SELECT count(*) FROM (

+ SELECT DISTINCT tblname FROM space_used WHERE $where AND is_index=0

+ )

+ "]

+ set avg_fanout [mem eval "

+ SELECT (sum(leaf_pages+int_pages)-$nTab)/sum(int_pages) FROM space_used

+ WHERE $where AND is_index = 0

+ "]

+ set avg_fanout [format %.2f $avg_fanout]

+ }

+ set ovfl_cnt_percent [percent $ovfl_cnt $nleaf {of all entries}]

+ # Print out the sub-report statistics.

+ #

+ statline {Percentage of total database} $total_pages_percent

+ statline {Number of entries} $nleaf

+ statline {Bytes of storage consumed} $storage

+ if {$compressed_size!=$storage} {

+ set compressed_size [expr {$compressed_size+$compressOverhead*$total_pages}]

+ set pct [expr {$compressed_size*100.0/$storage}]

+ set pct [format {%5.1f%%} $pct]

+ statline {Bytes used after compression} $compressed_size $pct

+ }

+ statline {Bytes of payload} $payload $payload_percent

+ statline {Average payload per entry} $avg_payload

+ statline {Average unused bytes per entry} $avg_unused

+ if {[info exists avg_fanout]} {

+ statline {Average fanout} $avg_fanout

+ }

+ if {$showFrag && $total_pages>1} {

+ set fragmentation [percent $gap_cnt [expr {$total_pages-1}]]

+ statline {Non-sequential pages} $gap_cnt $fragmentation

+ }

+ statline {Maximum payload per entry} $mx_payload

+ statline {Entries that use overflow} $ovfl_cnt $ovfl_cnt_percent

+ if {$int_pages>0} {

+ statline {Index pages used} $int_pages

+ }

+ statline {Primary pages used} $leaf_pages

+ statline {Overflow pages used} $ovfl_pages

+ statline {Total pages used} $total_pages

+ if {$int_unused>0} {

+ set int_unused_percent [

+ percent $int_unused [expr {$int_pages*$pageSize}] {of index space}]

+ statline "Unused bytes on index pages" $int_unused $int_unused_percent

+ }

+ statline "Unused bytes on primary pages" $leaf_unused [

+ percent $leaf_unused [expr {$leaf_pages*$pageSize}] {of primary space}]

+ statline "Unused bytes on overflow pages" $ovfl_unused [

+ percent $ovfl_unused [expr {$ovfl_pages*$pageSize}] {of overflow space}]

+ statline "Unused bytes on all pages" $total_unused [

+ percent $total_unused $storage {of all space}]

+ return 1

+# Calculate the overhead in pages caused by auto-vacuum.

+# This procedure calculates and returns the number of pages used by the

+# auto-vacuum 'pointer-map'. If the database does not support auto-vacuum,

+# then 0 is returned. The two arguments are the size of the database file in

+# pages and the page size used by the database (in bytes).

+proc autovacuum_overhead {filePages pageSize} {

+ # Set $autovacuum to non-zero for databases that support auto-vacuum.

+ set autovacuum [db one {PRAGMA auto_vacuum}]

+ # If the database is not an auto-vacuum database or the file consists

+ # of one page only then there is no overhead for auto-vacuum. Return zero.

+ if {0==$autovacuum || $filePages==1} {

+ return 0

+ }

+ # The number of entries on each pointer map page. The layout of the

+ # database file is one pointer-map page, followed by $ptrsPerPage other

+ # pages, followed by a pointer-map page etc. The first pointer-map page

+ # is the second page of the file overall.

+ set ptrsPerPage [expr double($pageSize/5)]

+ # Return the number of pointer map pages in the database.

+ return [expr wide(ceil( ($filePages-1.0)/($ptrsPerPage+1.0) ))]

+# Calculate the summary statistics for the database and store the results

+# in TCL variables. They are output below. Variables are as follows:

+# pageSize: Size of each page in bytes.

+# file_bytes: File size in bytes.

+# file_pgcnt: Number of pages in the file.

+# file_pgcnt2: Number of pages in the file (calculated).

+# av_pgcnt: Pages consumed by the auto-vacuum pointer-map.

+# av_percent: Percentage of the file consumed by auto-vacuum pointer-map.

+# inuse_pgcnt: Data pages in the file.

+# inuse_percent: Percentage of pages used to store data.

+# free_pgcnt: Free pages calculated as (<total pages> - <in-use pages>)

+# free_pgcnt2: Free pages in the file according to the file header.

+# free_percent: Percentage of file consumed by free pages (calculated).

+# free_percent2: Percentage of file consumed by free pages (header).

+# ntable: Number of tables in the db.

+# nindex: Number of indices in the db.

+# nautoindex: Number of indices created automatically.

+# nmanindex: Number of indices created manually.

+# user_payload: Number of bytes of payload in table btrees

+# (not including sqlite_master)

+# user_percent: $user_payload as a percentage of total file size.

+### The following, setting $file_bytes based on the actual size of the file

+### on disk, causes this tool to choke on zipvfs databases. So set it based

+### on the return of [PRAGMA page_count] instead.

+if 0 {

+ set file_bytes [file size $file_to_analyze]

+ set file_pgcnt [expr {$file_bytes/$pageSize}]

+set file_pgcnt [db one {PRAGMA page_count}]

+set file_bytes [expr {$file_pgcnt * $pageSize}]

+set av_pgcnt [autovacuum_overhead $file_pgcnt $pageSize]

+set av_percent [percent $av_pgcnt $file_pgcnt]

+set sql {SELECT sum(leaf_pages+int_pages+ovfl_pages) FROM space_used}

+set inuse_pgcnt [expr wide([mem eval $sql])]

+set inuse_percent [percent $inuse_pgcnt $file_pgcnt]

+set free_pgcnt [expr {$file_pgcnt-$inuse_pgcnt-$av_pgcnt}]

+set free_percent [percent $free_pgcnt $file_pgcnt]

+set free_pgcnt2 [db one {PRAGMA freelist_count}]

+set free_percent2 [percent $free_pgcnt2 $file_pgcnt]

+set file_pgcnt2 [expr {$inuse_pgcnt+$free_pgcnt2+$av_pgcnt}]

+set ntable [db eval {SELECT count(*)+1 FROM sqlite_master WHERE type='table'}]

+set nindex [db eval {SELECT count(*) FROM sqlite_master WHERE type='index'}]

+set sql {SELECT count(*) FROM sqlite_master WHERE name LIKE 'sqlite_autoindex%'}

+set nautoindex [db eval $sql]

+set nmanindex [expr {$nindex-$nautoindex}]

+# set total_payload [mem eval "SELECT sum(payload) FROM space_used"]

+set user_payload [mem one {SELECT int(sum(payload)) FROM space_used

+ WHERE NOT is_index AND name NOT LIKE 'sqlite_master'}]

+set user_percent [percent $user_payload $file_bytes]

+# Output the summary statistics calculated above.

+puts "/** Disk-Space Utilization Report For $root_filename"

+puts ""

+statline {Page size in bytes} $pageSize

+statline {Pages in the whole file (measured)} $file_pgcnt

+statline {Pages in the whole file (calculated)} $file_pgcnt2

+statline {Pages that store data} $inuse_pgcnt $inuse_percent

+statline {Pages on the freelist (per header)} $free_pgcnt2 $free_percent2

+statline {Pages on the freelist (calculated)} $free_pgcnt $free_percent

+statline {Pages of auto-vacuum overhead} $av_pgcnt $av_percent

+statline {Number of tables in the database} $ntable

+statline {Number of indices} $nindex

+statline {Number of defined indices} $nmanindex

+statline {Number of implied indices} $nautoindex

+if {$isCompressed} {

+ statline {Size of uncompressed content in bytes} $file_bytes

+ set efficiency [percent $true_file_size $file_bytes]

+ statline {Size of compressed file on disk} $true_file_size $efficiency

+} else {

+ statline {Size of the file in bytes} $file_bytes

+statline {Bytes of user payload stored} $user_payload $user_percent

+# Output table rankings

+puts ""

+titleline "Page counts for all tables with their indices"

+puts ""

+mem eval {SELECT tblname, count(*) AS cnt,

+ int(sum(int_pages+leaf_pages+ovfl_pages)) AS size

+ FROM space_used GROUP BY tblname ORDER BY size+0 DESC, tblname} {} {

+ statline [string toupper $tblname] $size [percent $size $file_pgcnt]

+puts ""

+titleline "Page counts for all tables and indices separately"

+puts ""

+mem eval {

+ SELECT

+ upper(name) AS nm,

+ int(int_pages+leaf_pages+ovfl_pages) AS size

+ FROM space_used

+ ORDER BY size+0 DESC, name} {} {

+ statline $nm $size [percent $size $file_pgcnt]

+if {$isCompressed} {

+ puts ""

+ titleline "Bytes of disk space used after compression"

+ puts ""

+ set csum 0

+ mem eval {SELECT tblname,

+ int(sum(compressed_size)) +

+ $compressOverhead*sum(int_pages+leaf_pages+ovfl_pages)

+ AS csize

+ FROM space_used GROUP BY tblname ORDER BY csize+0 DESC, tblname} {} {

+ incr csum $csize

+ statline [string toupper $tblname] $csize [percent $csize $true_file_size]

+ }

+ set overhead [expr {$true_file_size - $csum}]

+ if {$overhead>0} {

+ statline {Header and free space} $overhead [percent $overhead $true_file_size]

+ }

+# Output subreports

+if {$nindex>0} {

+ subreport {All tables and indices} 1 0

+subreport {All tables} {NOT is_index} 0

+if {$nindex>0} {

+ subreport {All indices} {is_index} 0

+foreach tbl [mem eval {SELECT DISTINCT tblname name FROM space_used

+ ORDER BY name}] {

+ set qn [quote $tbl]

+ set name [string toupper $tbl]

+ set n [mem eval {SELECT count(*) FROM space_used WHERE tblname=$tbl}]

+ if {$n>1} {

+ set idxlist [mem eval "SELECT name FROM space_used

+ WHERE tblname='$qn' AND is_index

+ ORDER BY 1"]

+ subreport "Table $name and all its indices" "tblname='$qn'" 0

+ subreport "Table $name w/o any indices" "name='$qn'" 1

+ if {[llength $idxlist]>1} {

+ subreport "Indices of table $name" "tblname='$qn' AND is_index" 0

+ }

+ foreach idx $idxlist {

+ set qidx [quote $idx]

+ subreport "Index [string toupper $idx] of table $name" "name='$qidx'" 1

+ }

+ } else {

+ subreport "Table $name" "name='$qn'" 1

+ }

+# Output instructions on what the numbers above mean.

+puts ""

+titleline Definitions

+puts {

+Page size in bytes

+ The number of bytes in a single page of the database file.

+ Usually 1024.

+Number of pages in the whole file

+puts " The number of $pageSize-byte pages that go into forming the complete

+ database"

+puts {

+Pages that store data

+ The number of pages that store data, either as primary B*Tree pages or

+ as overflow pages. The number at the right is the data pages divided by

+ the total number of pages in the file.

+Pages on the freelist

+ The number of pages that are not currently in use but are reserved for

+ future use. The percentage at the right is the number of freelist pages

+ divided by the total number of pages in the file.

+Pages of auto-vacuum overhead

+ The number of pages that store data used by the database to facilitate

+ auto-vacuum. This is zero for databases that do not support auto-vacuum.

+Number of tables in the database

+ The number of tables in the database, including the SQLITE_MASTER table

+ used to store schema information.

+Number of indices

+ The total number of indices in the database.

+Number of defined indices

+ The number of indices created using an explicit CREATE INDEX statement.

+Number of implied indices

+ The number of indices used to implement PRIMARY KEY or UNIQUE constraints

+ on tables.

+Size of the file in bytes

+ The total amount of disk space used by the entire database files.

+Bytes of user payload stored

+ The total number of bytes of user payload stored in the database. The

+ schema information in the SQLITE_MASTER table is not counted when

+ computing this number. The percentage at the right shows the payload

+ divided by the total file size.

+Percentage of total database

+ The amount of the complete database file that is devoted to storing

+ information described by this category.

+Number of entries

+ The total number of B-Tree key/value pairs stored under this category.

+Bytes of storage consumed

+ The total amount of disk space required to store all B-Tree entries

+ under this category. The is the total number of pages used times

+ the pages size.

+Bytes of payload

+ The amount of payload stored under this category. Payload is the data

+ part of table entries and the key part of index entries. The percentage

+ at the right is the bytes of payload divided by the bytes of storage

+ consumed.

+Average payload per entry

+ The average amount of payload on each entry. This is just the bytes of

+ payload divided by the number of entries.

+Average unused bytes per entry

+ The average amount of free space remaining on all pages under this

+ category on a per-entry basis. This is the number of unused bytes on

+ all pages divided by the number of entries.

+Non-sequential pages

+ The number of pages in the table or index that are out of sequence.

+ Many filesystems are optimized for sequential file access so a small

+ number of non-sequential pages might result in faster queries,

+ especially for larger database files that do not fit in the disk cache.

+ Note that after running VACUUM, the root page of each table or index is

+ at the beginning of the database file and all other pages are in a

+ separate part of the database file, resulting in a single non-

+ sequential page.

+Maximum payload per entry

+ The largest payload size of any entry.

+Entries that use overflow

+ The number of entries that user one or more overflow pages.

+Total pages used

+ This is the number of pages used to hold all information in the current

+ category. This is the sum of index, primary, and overflow pages.

+Index pages used

+ This is the number of pages in a table B-tree that hold only key (rowid)

+ information and no data.

+Primary pages used

+ This is the number of B-tree pages that hold both key and data.

+Overflow pages used

+ The total number of overflow pages used for this category.

+Unused bytes on index pages

+ The total number of bytes of unused space on all index pages. The

+ percentage at the right is the number of unused bytes divided by the

+ total number of bytes on index pages.

+Unused bytes on primary pages

+ The total number of bytes of unused space on all primary pages. The

+ percentage at the right is the number of unused bytes divided by the

+ total number of bytes on primary pages.

+Unused bytes on overflow pages

+ The total number of bytes of unused space on all overflow pages. The

+ percentage at the right is the number of unused bytes divided by the

+ total number of bytes on overflow pages.

+Unused bytes on all pages

+ The total number of bytes of unused space on all primary and overflow

+ pages. The percentage at the right is the number of unused bytes

+ divided by the total number of bytes.

+# Output a dump of the in-memory database. This can be used for more

+# complex offline analysis.

+titleline {}

+puts "The entire text of this report can be sourced into any SQL database"

+puts "engine for further analysis. All of the text above is an SQL comment."

+puts "The data used to generate this report follows:"

+puts "*/"

+puts "BEGIN;"

+puts $tabledef

+unset -nocomplain x

+mem eval {SELECT * FROM space_used} x {

+ puts -nonewline "INSERT INTO space_used VALUES"

+ set sep (

+ foreach col $x(*) {

+ set v $x($col)

+ if {$v=="" || ![string is double $v]} {set v '[quote $v]'}

+ puts -nonewline $sep$v

+ set sep ,

+ }

+ puts ");"

+puts "COMMIT;"

+} err]} {

+ puts "ERROR: $err"

+ puts $errorInfo

+ exit 1