Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(107)

Unified Diff: third_party/sqlite/src/tool/spaceanal.tcl

Issue 6990047: Import SQLite 3.7.6.3. (Closed) Base URL: svn://svn.chromium.org/chrome/trunk/src
Patch Set: Created 9 years, 7 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
« no previous file with comments | « third_party/sqlite/src/tool/showwal.c ('k') | third_party/sqlite/src/tool/split-sqlite3c.tcl » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
Index: third_party/sqlite/src/tool/spaceanal.tcl
diff --git a/third_party/sqlite/src/tool/spaceanal.tcl b/third_party/sqlite/src/tool/spaceanal.tcl
index 3718357cbb27ad7b8d2cc070565779a8f3a0fff0..bf6244e8c994c269b3f7d4cfd356bd7da6548574 100644
--- a/third_party/sqlite/src/tool/spaceanal.tcl
+++ b/third_party/sqlite/src/tool/spaceanal.tcl
@@ -26,14 +26,14 @@ if {[file size $file_to_analyze]<512} {
exit 1
}
-# Maximum distance between pages before we consider it a "gap"
-#
-set MAXGAP 3
-
# Open the database
#
sqlite3 db [lindex $argv 0]
-set DB [btree_open [lindex $argv 0] 1000 0]
+register_dbstat_vtab db
+
+set pageSize [db one {PRAGMA page_size}]
+
+#set DB [btree_open [lindex $argv 0] 1000 0]
# In-memory database for collecting statistics. This script loops through
# the tables and indices in the database being analyzed, adding a row for each
@@ -62,6 +62,87 @@ set tabledef\
);}
mem eval $tabledef
+# Create a temporary "dbstat" virtual table.
+#
+db eval {
+ CREATE VIRTUAL TABLE temp.stat USING dbstat;
+ CREATE TEMP TABLE dbstat AS SELECT * FROM temp.stat ORDER BY name, path;
+ DROP TABLE temp.stat;
+}
+
+proc isleaf {pagetype is_index} {
+ return [expr {$pagetype == "leaf" || ($pagetype == "internal" && $is_index)}]
+}
+proc isoverflow {pagetype is_index} {
+ return [expr {$pagetype == "overflow"}]
+}
+proc isinternal {pagetype is_index} {
+ return [expr {$pagetype == "internal" && $is_index==0}]
+}
+
+db func isleaf isleaf
+db func isinternal isinternal
+db func isoverflow isoverflow
+
+set sql { SELECT name, tbl_name FROM sqlite_master WHERE rootpage>0 }
+foreach {name tblname} [concat sqlite_master sqlite_master [db eval $sql]] {
+
+ set is_index [expr {$name!=$tblname}]
+ db eval {
+ SELECT
+ sum(ncell) AS nentry,
+ sum(isleaf(pagetype, $is_index) * ncell) AS leaf_entries,
+ sum(payload) AS payload,
+ sum(isoverflow(pagetype, $is_index) * payload) AS ovfl_payload,
+ sum(path LIKE '%+000000') AS ovfl_cnt,
+ max(mx_payload) AS mx_payload,
+ sum(isinternal(pagetype, $is_index)) AS int_pages,
+ sum(isleaf(pagetype, $is_index)) AS leaf_pages,
+ sum(isoverflow(pagetype, $is_index)) AS ovfl_pages,
+ sum(isinternal(pagetype, $is_index) * unused) AS int_unused,
+ sum(isleaf(pagetype, $is_index) * unused) AS leaf_unused,
+ sum(isoverflow(pagetype, $is_index) * unused) AS ovfl_unused
+ FROM temp.dbstat WHERE name = $name
+ } break
+
+ # Column 'gap_cnt' is set to the number of non-contiguous entries in the
+ # list of pages visited if the b-tree structure is traversed in a top-down
+ # fashion (each node visited before its child-tree is passed). Any overflow
+ # chains present are traversed from start to finish before any child-tree
+ # is.
+ #
+ set gap_cnt 0
+ set pglist [db eval {
+ SELECT pageno FROM temp.dbstat WHERE name = $name ORDER BY rowid
+ }]
+ set prev [lindex $pglist 0]
+ foreach pgno [lrange $pglist 1 end] {
+ if {$pgno != $prev+1} {incr gap_cnt}
+ set prev $pgno
+ }
+
+ mem eval {
+ INSERT INTO space_used VALUES(
+ $name,
+ $tblname,
+ $is_index,
+ $nentry,
+ $leaf_entries,
+ $payload,
+ $ovfl_payload,
+ $ovfl_cnt,
+ $mx_payload,
+ $int_pages,
+ $leaf_pages,
+ $ovfl_pages,
+ $int_unused,
+ $leaf_unused,
+ $ovfl_unused,
+ $gap_cnt
+ );
+ }
+}
+
proc integerify {real} {
if {[string is double -strict $real]} {
return [expr {int($real)}]
@@ -81,321 +162,6 @@ proc quote {txt} {
return '$q'
}
-# This proc is a wrapper around the btree_cursor_info command. The
-# second argument is an open btree cursor returned by [btree_cursor].
-# The first argument is the name of an array variable that exists in
-# the scope of the caller. If the third argument is non-zero, then
-# info is returned for the page that lies $up entries upwards in the
-# tree-structure. (i.e. $up==1 returns the parent page, $up==2 the
-# grandparent etc.)
-#
-# The following entries in that array are filled in with information retrieved
-# using [btree_cursor_info]:
-#
-# $arrayvar(page_no) = The page number
-# $arrayvar(entry_no) = The entry number
-# $arrayvar(page_entries) = Total number of entries on this page
-# $arrayvar(cell_size) = Cell size (local payload + header)
-# $arrayvar(page_freebytes) = Number of free bytes on this page
-# $arrayvar(page_freeblocks) = Number of free blocks on the page
-# $arrayvar(payload_bytes) = Total payload size (local + overflow)
-# $arrayvar(header_bytes) = Header size in bytes
-# $arrayvar(local_payload_bytes) = Local payload size
-# $arrayvar(parent) = Parent page number
-#
-proc cursor_info {arrayvar csr {up 0}} {
- upvar $arrayvar a
- foreach [list a(page_no) \
- a(entry_no) \
- a(page_entries) \
- a(cell_size) \
- a(page_freebytes) \
- a(page_freeblocks) \
- a(payload_bytes) \
- a(header_bytes) \
- a(local_payload_bytes) \
- a(parent) \
- a(first_ovfl) ] [btree_cursor_info $csr $up] break
-}
-
-# Determine the page-size of the database. This global variable is used
-# throughout the script.
-#
-set pageSize [db eval {PRAGMA page_size}]
-
-# Analyze every table in the database, one at a time.
-#
-# The following query returns the name and root-page of each table in the
-# database, including the sqlite_master table.
-#
-set sql {
- SELECT name, rootpage FROM sqlite_master
- WHERE type='table' AND rootpage>0
- UNION ALL
- SELECT 'sqlite_master', 1
- ORDER BY 1
-}
-set wideZero [expr {10000000000 - 10000000000}]
-foreach {name rootpage} [db eval $sql] {
- puts stderr "Analyzing table $name..."
-
- # Code below traverses the table being analyzed (table name $name), using the
- # btree cursor $cursor. Statistics related to table $name are accumulated in
- # the following variables:
- #
- set total_payload $wideZero ;# Payload space used by all entries
- set total_ovfl $wideZero ;# Payload space on overflow pages
- set unused_int $wideZero ;# Unused space on interior nodes
- set unused_leaf $wideZero ;# Unused space on leaf nodes
- set unused_ovfl $wideZero ;# Unused space on overflow pages
- set cnt_ovfl $wideZero ;# Number of entries that use overflows
- set cnt_leaf_entry $wideZero ;# Number of leaf entries
- set cnt_int_entry $wideZero ;# Number of interor entries
- set mx_payload $wideZero ;# Maximum payload size
- set ovfl_pages $wideZero ;# Number of overflow pages used
- set leaf_pages $wideZero ;# Number of leaf pages
- set int_pages $wideZero ;# Number of interior pages
- set gap_cnt 0 ;# Number of holes in the page sequence
- set prev_pgno 0 ;# Last page number seen
-
- # As the btree is traversed, the array variable $seen($pgno) is set to 1
- # the first time page $pgno is encountered.
- #
- catch {unset seen}
-
- # The following loop runs once for each entry in table $name. The table
- # is traversed using the btree cursor stored in variable $csr
- #
- set csr [btree_cursor $DB $rootpage 0]
- for {btree_first $csr} {![btree_eof $csr]} {btree_next $csr} {
- incr cnt_leaf_entry
-
- # Retrieve information about the entry the btree-cursor points to into
- # the array variable $ci (cursor info).
- #
- cursor_info ci $csr
-
- # Check if the payload of this entry is greater than the current
- # $mx_payload statistic for the table. Also increase the $total_payload
- # statistic.
- #
- if {$ci(payload_bytes)>$mx_payload} {set mx_payload $ci(payload_bytes)}
- incr total_payload $ci(payload_bytes)
-
- # If this entry uses overflow pages, then update the $cnt_ovfl,
- # $total_ovfl, $ovfl_pages and $unused_ovfl statistics.
- #
- set ovfl [expr {$ci(payload_bytes)-$ci(local_payload_bytes)}]
- if {$ovfl} {
- incr cnt_ovfl
- incr total_ovfl $ovfl
- set n [expr {int(ceil($ovfl/($pageSize-4.0)))}]
- incr ovfl_pages $n
- incr unused_ovfl [expr {$n*($pageSize-4) - $ovfl}]
- set pglist [btree_ovfl_info $DB $csr]
- } else {
- set pglist {}
- }
-
- # If this is the first table entry analyzed for the page, then update
- # the page-related statistics $leaf_pages and $unused_leaf. Also, if
- # this page has a parent page that has not been analyzed, retrieve
- # info for the parent and update statistics for it too.
- #
- if {![info exists seen($ci(page_no))]} {
- set seen($ci(page_no)) 1
- incr leaf_pages
- incr unused_leaf $ci(page_freebytes)
- set pglist "$ci(page_no) $pglist"
-
- # Now check if the page has a parent that has not been analyzed. If
- # so, update the $int_pages, $cnt_int_entry and $unused_int statistics
- # accordingly. Then check if the parent page has a parent that has
- # not yet been analyzed etc.
- #
- # set parent $ci(parent_page_no)
- for {set up 1} \
- {$ci(parent)!=0 && ![info exists seen($ci(parent))]} {incr up} \
- {
- # Mark the parent as seen.
- #
- set seen($ci(parent)) 1
-
- # Retrieve info for the parent and update statistics.
- cursor_info ci $csr $up
- incr int_pages
- incr cnt_int_entry $ci(page_entries)
- incr unused_int $ci(page_freebytes)
-
- # parent pages come before their first child
- set pglist "$ci(page_no) $pglist"
- }
- }
-
- # Check the page list for fragmentation
- #
- foreach pg $pglist {
- if {$pg!=$prev_pgno+1 && $prev_pgno>0} {
- incr gap_cnt
- }
- set prev_pgno $pg
- }
- }
- btree_close_cursor $csr
-
- # Handle the special case where a table contains no data. In this case
- # all statistics are zero, except for the number of leaf pages (1) and
- # the unused bytes on leaf pages ($pageSize - 8).
- #
- # An exception to the above is the sqlite_master table. If it is empty
- # then all statistics are zero except for the number of leaf pages (1),
- # and the number of unused bytes on leaf pages ($pageSize - 112).
- #
- if {[llength [array names seen]]==0} {
- set leaf_pages 1
- if {$rootpage==1} {
- set unused_leaf [expr {$pageSize-112}]
- } else {
- set unused_leaf [expr {$pageSize-8}]
- }
- }
-
- # Insert the statistics for the table analyzed into the in-memory database.
- #
- set sql "INSERT INTO space_used VALUES("
- append sql [quote $name]
- append sql ",[quote $name]"
- append sql ",0"
- append sql ",[expr {$cnt_leaf_entry+$cnt_int_entry}]"
- append sql ",$cnt_leaf_entry"
- append sql ",$total_payload"
- append sql ",$total_ovfl"
- append sql ",$cnt_ovfl"
- append sql ",$mx_payload"
- append sql ",$int_pages"
- append sql ",$leaf_pages"
- append sql ",$ovfl_pages"
- append sql ",$unused_int"
- append sql ",$unused_leaf"
- append sql ",$unused_ovfl"
- append sql ",$gap_cnt"
- append sql );
- mem eval $sql
-}
-
-# Analyze every index in the database, one at a time.
-#
-# The query below returns the name, associated table and root-page number
-# for every index in the database.
-#
-set sql {
- SELECT name, tbl_name, rootpage FROM sqlite_master WHERE type='index'
- ORDER BY 2, 1
-}
-foreach {name tbl_name rootpage} [db eval $sql] {
- puts stderr "Analyzing index $name of table $tbl_name..."
-
- # Code below traverses the index being analyzed (index name $name), using the
- # btree cursor $cursor. Statistics related to index $name are accumulated in
- # the following variables:
- #
- set total_payload $wideZero ;# Payload space used by all entries
- set total_ovfl $wideZero ;# Payload space on overflow pages
- set unused_leaf $wideZero ;# Unused space on leaf nodes
- set unused_ovfl $wideZero ;# Unused space on overflow pages
- set cnt_ovfl $wideZero ;# Number of entries that use overflows
- set cnt_leaf_entry $wideZero ;# Number of leaf entries
- set mx_payload $wideZero ;# Maximum payload size
- set ovfl_pages $wideZero ;# Number of overflow pages used
- set leaf_pages $wideZero ;# Number of leaf pages
- set gap_cnt 0 ;# Number of holes in the page sequence
- set prev_pgno 0 ;# Last page number seen
-
- # As the btree is traversed, the array variable $seen($pgno) is set to 1
- # the first time page $pgno is encountered.
- #
- catch {unset seen}
-
- # The following loop runs once for each entry in index $name. The index
- # is traversed using the btree cursor stored in variable $csr
- #
- set csr [btree_cursor $DB $rootpage 0]
- for {btree_first $csr} {![btree_eof $csr]} {btree_next $csr} {
- incr cnt_leaf_entry
-
- # Retrieve information about the entry the btree-cursor points to into
- # the array variable $ci (cursor info).
- #
- cursor_info ci $csr
-
- # Check if the payload of this entry is greater than the current
- # $mx_payload statistic for the table. Also increase the $total_payload
- # statistic.
- #
- set payload [btree_keysize $csr]
- if {$payload>$mx_payload} {set mx_payload $payload}
- incr total_payload $payload
-
- # If this entry uses overflow pages, then update the $cnt_ovfl,
- # $total_ovfl, $ovfl_pages and $unused_ovfl statistics.
- #
- set ovfl [expr {$payload-$ci(local_payload_bytes)}]
- if {$ovfl} {
- incr cnt_ovfl
- incr total_ovfl $ovfl
- set n [expr {int(ceil($ovfl/($pageSize-4.0)))}]
- incr ovfl_pages $n
- incr unused_ovfl [expr {$n*($pageSize-4) - $ovfl}]
- }
-
- # If this is the first table entry analyzed for the page, then update
- # the page-related statistics $leaf_pages and $unused_leaf.
- #
- if {![info exists seen($ci(page_no))]} {
- set seen($ci(page_no)) 1
- incr leaf_pages
- incr unused_leaf $ci(page_freebytes)
- set pg $ci(page_no)
- if {$prev_pgno>0 && $pg!=$prev_pgno+1} {
- incr gap_cnt
- }
- set prev_pgno $ci(page_no)
- }
- }
- btree_close_cursor $csr
-
- # Handle the special case where a index contains no data. In this case
- # all statistics are zero, except for the number of leaf pages (1) and
- # the unused bytes on leaf pages ($pageSize - 8).
- #
- if {[llength [array names seen]]==0} {
- set leaf_pages 1
- set unused_leaf [expr {$pageSize-8}]
- }
-
- # Insert the statistics for the index analyzed into the in-memory database.
- #
- set sql "INSERT INTO space_used VALUES("
- append sql [quote $name]
- append sql ",[quote $tbl_name]"
- append sql ",1"
- append sql ",$cnt_leaf_entry"
- append sql ",$cnt_leaf_entry"
- append sql ",$total_payload"
- append sql ",$total_ovfl"
- append sql ",$cnt_ovfl"
- append sql ",$mx_payload"
- append sql ",0"
- append sql ",$leaf_pages"
- append sql ",$ovfl_pages"
- append sql ",0"
- append sql ",$unused_leaf"
- append sql ",$unused_ovfl"
- append sql ",$gap_cnt"
- append sql );
- mem eval $sql
-}
-
# Generate a single line of output in the statistics section of the
# report.
#
@@ -548,15 +314,12 @@ proc subreport {title where} {
# pages and the page size used by the database (in bytes).
proc autovacuum_overhead {filePages pageSize} {
- # Read the value of meta 4. If non-zero, then the database supports
- # auto-vacuum. It would be possible to use "PRAGMA auto_vacuum" instead,
- # but that would not work if the SQLITE_OMIT_PRAGMA macro was defined
- # when the library was built.
- set meta4 [lindex [btree_get_meta $::DB] 4]
+ # Set $autovacuum to non-zero for databases that support auto-vacuum.
+ set autovacuum [db one {PRAGMA auto_vacuum}]
# If the database is not an auto-vacuum database or the file consists
# of one page only then there is no overhead for auto-vacuum. Return zero.
- if {0==$meta4 || $filePages==1} {
+ if {0==$autovacuum || $filePages==1} {
return 0
}
@@ -606,7 +369,7 @@ set inuse_percent [percent $inuse_pgcnt $file_pgcnt]
set free_pgcnt [expr $file_pgcnt-$inuse_pgcnt-$av_pgcnt]
set free_percent [percent $free_pgcnt $file_pgcnt]
-set free_pgcnt2 [lindex [btree_get_meta $DB] 0]
+set free_pgcnt2 [db one {PRAGMA freelist_count}]
set free_percent2 [percent $free_pgcnt2 $file_pgcnt]
set file_pgcnt2 [expr {$inuse_pgcnt+$free_pgcnt2+$av_pgcnt}]
« no previous file with comments | « third_party/sqlite/src/tool/showwal.c ('k') | third_party/sqlite/src/tool/split-sqlite3c.tcl » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698