Skip to content

Commit

Permalink
sql/stats: add cluster setting to disable generation of stats forecasts
Browse files Browse the repository at this point in the history
Add a new cluster setting `sql.stats.forecasts.enabled` that can be
used to disable generation of statistics forecasts in the stats cache.
Changing this setting will cause the stats cache to gradually evict and
reload all cached statistics as they are requested.

Fixes: #86350

Release justification: Low-risk update to new functionality.

Release note (sql change): Add a new cluster setting
`sql.stats.forecasts.enabled` which controls whether statistics
forecasts are generated by default for all tables. (Note that this is
different from the session setting `optimizer_use_forecasts` which
controls whether statistics forecasts are used when optimizing the
current query. If forecasting is disabled, then even if
`optimizer_use_forecasts` is true for a given query it won't have any
forecasts to use.)
  • Loading branch information
michae2 committed Aug 27, 2022
1 parent 770ff3c commit 896cf3c
Show file tree
Hide file tree
Showing 8 changed files with 146 additions and 18 deletions.
1 change: 1 addition & 0 deletions docs/generated/settings/settings-for-tenants.txt
Original file line number Diff line number Diff line change
Expand Up @@ -264,6 +264,7 @@ sql.stats.automatic_collection.min_stale_rows integer 500 target minimum number
sql.stats.cleanup.recurrence string @hourly cron-tab recurrence for SQL Stats cleanup job
sql.stats.flush.enabled boolean true if set, SQL execution statistics are periodically flushed to disk
sql.stats.flush.interval duration 10m0s the interval at which SQL execution statistics are flushed to disk, this value must be less than or equal to sql.stats.aggregation.interval
sql.stats.forecasts.enabled boolean true when true, enables generation of statistics forecasts by default for all tables
sql.stats.histogram_collection.enabled boolean true histogram collection mode
sql.stats.multi_column_collection.enabled boolean true multi-column statistics collection mode
sql.stats.non_default_columns.min_retention_period duration 24h0m0s minimum retention period for table statistics collected on non-default columns
Expand Down
1 change: 1 addition & 0 deletions docs/generated/settings/settings.html
Original file line number Diff line number Diff line change
Expand Up @@ -198,6 +198,7 @@
<tr><td><code>sql.stats.cleanup.recurrence</code></td><td>string</td><td><code>@hourly</code></td><td>cron-tab recurrence for SQL Stats cleanup job</td></tr>
<tr><td><code>sql.stats.flush.enabled</code></td><td>boolean</td><td><code>true</code></td><td>if set, SQL execution statistics are periodically flushed to disk</td></tr>
<tr><td><code>sql.stats.flush.interval</code></td><td>duration</td><td><code>10m0s</code></td><td>the interval at which SQL execution statistics are flushed to disk, this value must be less than or equal to sql.stats.aggregation.interval</td></tr>
<tr><td><code>sql.stats.forecasts.enabled</code></td><td>boolean</td><td><code>true</code></td><td>when true, enables generation of statistics forecasts by default for all tables</td></tr>
<tr><td><code>sql.stats.histogram_collection.enabled</code></td><td>boolean</td><td><code>true</code></td><td>histogram collection mode</td></tr>
<tr><td><code>sql.stats.multi_column_collection.enabled</code></td><td>boolean</td><td><code>true</code></td><td>multi-column statistics collection mode</td></tr>
<tr><td><code>sql.stats.non_default_columns.min_retention_period</code></td><td>duration</td><td><code>24h0m0s</code></td><td>minimum retention period for table statistics collected on non-default columns</td></tr>
Expand Down
97 changes: 97 additions & 0 deletions pkg/sql/opt/exec/execbuilder/testdata/forecast
Original file line number Diff line number Diff line change
Expand Up @@ -842,3 +842,100 @@ scan x
├── cost: 16.04
├── key: (1)
└── distribution: test

# Test that sql.stats.forecasts.enabled can be used to enable and disable
# generation of forecasts in the stats cache.

statement ok
SET CLUSTER SETTING sql.stats.forecasts.enabled = false

query T
EXPLAIN SELECT * FROM g WHERE a > 8
----
distribution: local
vectorized: true
·
• scan
estimated row count: 0 (<0.01% of the table; stats collected <hidden> ago)
table: g@g_pkey
spans: [/9 - ]

query T
EXPLAIN SELECT * FROM s WHERE b < 3
----
distribution: local
vectorized: true
·
• scan
estimated row count: 3 (100% of the table; stats collected <hidden> ago)
table: s@s_pkey
spans: [ - /2]

query T
EXPLAIN SELECT * FROM c WHERE h > '1988-08-07'
----
distribution: local
vectorized: true
·
• scan
estimated row count: 0 (<0.01% of the table; stats collected <hidden> ago)
table: c@c_pkey
spans: [/'1988-08-07 00:00:00.000001+00:00' - ]

query T
EXPLAIN SELECT * FROM x WHERE a > 16
----
distribution: local
vectorized: true
·
• scan
estimated row count: 0 (<0.01% of the table; stats collected <hidden> ago)
table: x@x_pkey
spans: [/17 - ]

statement ok
RESET CLUSTER SETTING sql.stats.forecasts.enabled

query T
EXPLAIN SELECT * FROM g WHERE a > 8
----
distribution: local
vectorized: true
·
• scan
estimated row count: 3 (22% of the table; stats collected <hidden> ago; using stats forecast)
table: g@g_pkey
spans: [/9 - ]

query T
EXPLAIN SELECT * FROM s WHERE b < 3
----
distribution: local
vectorized: true
·
• scan
estimated row count: 1 (100% of the table; stats collected <hidden> ago; using stats forecast)
table: s@s_pkey
spans: [ - /2]

query T
EXPLAIN SELECT * FROM c WHERE h > '1988-08-07'
----
distribution: local
vectorized: true
·
• scan
estimated row count: 23 (96% of the table; stats collected <hidden> ago; using stats forecast)
table: c@c_pkey
spans: [/'1988-08-07 00:00:00.000001+00:00' - ]

query T
EXPLAIN SELECT * FROM x WHERE a > 16
----
distribution: local
vectorized: true
·
• scan
estimated row count: 2 (50% of the table; stats collected <hidden> ago; using stats forecast)
table: x@x_pkey
spans: [/17 - ]
2 changes: 1 addition & 1 deletion pkg/sql/stats/automatic_stats.go
Original file line number Diff line number Diff line change
Expand Up @@ -678,7 +678,7 @@ func (r *Refresher) maybeRefreshStats(
rowsAffected int64,
asOf time.Duration,
) {
tableStats, err := r.cache.getTableStatsFromCache(ctx, tableID)
tableStats, err := r.cache.getTableStatsFromCache(ctx, tableID, nil /* forecast */)
if err != nil {
log.Errorf(ctx, "failed to get table statistics: %v", err)
return
Expand Down
8 changes: 4 additions & 4 deletions pkg/sql/stats/delete_stats_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -262,15 +262,15 @@ func TestDeleteOldStatsForColumns(t *testing.T) {
}

return testutils.SucceedsSoonError(func() error {
tableStats, err := cache.getTableStatsFromCache(ctx, tableID)
tableStats, err := cache.getTableStatsFromCache(ctx, tableID, nil /* forecast */)
if err != nil {
return err
}

for i := range testData {
stat := &testData[i]
if stat.TableID != tableID {
stats, err := cache.getTableStatsFromCache(ctx, stat.TableID)
stats, err := cache.getTableStatsFromCache(ctx, stat.TableID, nil /* forecast */)
if err != nil {
return err
}
Expand Down Expand Up @@ -556,15 +556,15 @@ func TestDeleteOldStatsForOtherColumns(t *testing.T) {
}

return testutils.SucceedsSoonError(func() error {
tableStats, err := cache.getTableStatsFromCache(ctx, tableID)
tableStats, err := cache.getTableStatsFromCache(ctx, tableID, nil /* forecast */)
if err != nil {
return err
}

for i := range testData {
stat := &testData[i]
if stat.TableID != tableID {
stats, err := cache.getTableStatsFromCache(ctx, stat.TableID)
stats, err := cache.getTableStatsFromCache(ctx, stat.TableID, nil /* forecast */)
if err != nil {
return err
}
Expand Down
10 changes: 10 additions & 0 deletions pkg/sql/stats/forecast.go
Original file line number Diff line number Diff line change
Expand Up @@ -16,6 +16,7 @@ import (
"time"

"github.com/cockroachdb/cockroach/pkg/jobs/jobspb"
"github.com/cockroachdb/cockroach/pkg/settings"
"github.com/cockroachdb/cockroach/pkg/sql/opt/cat"
"github.com/cockroachdb/cockroach/pkg/sql/sem/eval"
"github.com/cockroachdb/cockroach/pkg/sql/types"
Expand All @@ -24,6 +25,15 @@ import (
"github.com/cockroachdb/redact"
)

// UseStatisticsForecasts controls whether statistics forecasts are generated in
// the stats cache.
var UseStatisticsForecasts = settings.RegisterBoolSetting(
settings.TenantWritable,
"sql.stats.forecasts.enabled",
"when true, enables generation of statistics forecasts by default for all tables",
true,
).WithPublic()

// minObservationsForForecast is the minimum number of observed statistics
// required to produce a statistics forecast. Forecasts based on 1 or 2
// observations will always have R² = 1 (perfect goodness of fit) regardless of
Expand Down
41 changes: 30 additions & 11 deletions pkg/sql/stats/stats_cache.go
Original file line number Diff line number Diff line change
Expand Up @@ -102,6 +102,9 @@ type cacheEntry struct {
// timestamp was moved, it will trigger another refresh.
refreshing bool

// forecast is true if stats could contain forecasts.
forecast bool

stats []*TableStatistic

// err is populated if the internal query to retrieve stats hit an error.
Expand Down Expand Up @@ -217,7 +220,8 @@ func (sc *TableStatisticsCache) GetTableStats(
if !statsUsageAllowed(table, sc.Settings) {
return nil, nil
}
return sc.getTableStatsFromCache(ctx, table.GetID())
forecast := forecastAllowed(table, sc.Settings)
return sc.getTableStatsFromCache(ctx, table.GetID(), &forecast)
}

func statsDisallowedSystemTable(tableID descpb.ID) bool {
Expand Down Expand Up @@ -286,19 +290,31 @@ func tableTypeCanHaveStats(table catalog.TableDescriptor) bool {
return true
}

// forecastAllowed returns true if statistics forecasting is allowed for the
// given table.
func forecastAllowed(table catalog.TableDescriptor, clusterSettings *cluster.Settings) bool {
return UseStatisticsForecasts.Get(&clusterSettings.SV)
}

// getTableStatsFromCache is like GetTableStats but assumes that the table ID
// is safe to fetch statistics for: non-system, non-virtual, non-view, etc.
func (sc *TableStatisticsCache) getTableStatsFromCache(
ctx context.Context, tableID descpb.ID,
ctx context.Context, tableID descpb.ID, forecast *bool,
) ([]*TableStatistic, error) {
sc.mu.Lock()
defer sc.mu.Unlock()

if found, e := sc.lookupStatsLocked(ctx, tableID, false /* stealthy */); found {
return e.stats, e.err
if forecast != nil && e.forecast != *forecast {
// Forecasting was recently enabled or disabled on this table. Evict the
// cache entry and build it again.
sc.mu.cache.Del(tableID)
} else {
return e.stats, e.err
}
}

return sc.addCacheEntryLocked(ctx, tableID)
return sc.addCacheEntryLocked(ctx, tableID, forecast != nil && *forecast)
}

// lookupStatsLocked retrieves any existing stats for the given table.
Expand Down Expand Up @@ -351,7 +367,7 @@ func (sc *TableStatisticsCache) lookupStatsLocked(
// - mutex is locked again and the entry is updated.
//
func (sc *TableStatisticsCache) addCacheEntryLocked(
ctx context.Context, tableID descpb.ID,
ctx context.Context, tableID descpb.ID, forecast bool,
) (stats []*TableStatistic, err error) {
// Add a cache entry that other queries can find and wait on until we have the
// stats.
Expand All @@ -367,12 +383,12 @@ func (sc *TableStatisticsCache) addCacheEntryLocked(
defer sc.mu.Lock()

log.VEventf(ctx, 1, "reading statistics for table %d", tableID)
stats, err = sc.getTableStatsFromDB(ctx, tableID)
stats, err = sc.getTableStatsFromDB(ctx, tableID, forecast)
log.VEventf(ctx, 1, "finished reading statistics for table %d", tableID)
}()

e.mustWait = false
e.stats, e.err = stats, err
e.forecast, e.stats, e.err = forecast, stats, err

// Wake up any other callers that are waiting on these stats.
e.waitCond.Broadcast()
Expand Down Expand Up @@ -422,6 +438,7 @@ func (sc *TableStatisticsCache) refreshCacheEntry(
}
e.refreshing = true

forecast := e.forecast
var stats []*TableStatistic
var err error
for {
Expand All @@ -432,7 +449,7 @@ func (sc *TableStatisticsCache) refreshCacheEntry(

log.VEventf(ctx, 1, "refreshing statistics for table %d", tableID)
// TODO(radu): pass the timestamp and use AS OF SYSTEM TIME.
stats, err = sc.getTableStatsFromDB(ctx, tableID)
stats, err = sc.getTableStatsFromDB(ctx, tableID, forecast)
log.VEventf(ctx, 1, "done refreshing statistics for table %d", tableID)
}()
if e.lastRefreshTimestamp.Equal(ts) {
Expand Down Expand Up @@ -678,7 +695,7 @@ func (tabStat *TableStatistic) String() string {
// It ignores any statistics that cannot be decoded (e.g. because a user-defined
// type that doesn't exist) and returns the rest (with no error).
func (sc *TableStatisticsCache) getTableStatsFromDB(
ctx context.Context, tableID descpb.ID,
ctx context.Context, tableID descpb.ID, forecast bool,
) ([]*TableStatistic, error) {
const getTableStatisticsStmt = `
SELECT
Expand Down Expand Up @@ -720,8 +737,10 @@ ORDER BY "createdAt" DESC, "columnIDs" DESC, "statisticID" DESC
return nil, err
}

forecasts := ForecastTableStatistics(ctx, statsList)
statsList = append(forecasts, statsList...)
if forecast {
forecasts := ForecastTableStatistics(ctx, statsList)
statsList = append(forecasts, statsList...)
}

return statsList, nil
}
4 changes: 2 additions & 2 deletions pkg/sql/stats/stats_cache_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -117,7 +117,7 @@ func checkStatsForTable(

// Perform the lookup and refresh, and confirm the
// returned stats match the expected values.
statsList, err := sc.getTableStatsFromCache(ctx, tableID)
statsList, err := sc.getTableStatsFromCache(ctx, tableID, nil /* forecast */)
if err != nil {
t.Fatalf("error retrieving stats: %s", err)
}
Expand Down Expand Up @@ -426,7 +426,7 @@ func TestCacheWait(t *testing.T) {
for n := 0; n < 10; n++ {
wg.Add(1)
go func() {
stats, err := sc.getTableStatsFromCache(ctx, id)
stats, err := sc.getTableStatsFromCache(ctx, id, nil /* forecast */)
if err != nil {
t.Error(err)
} else if !checkStats(stats, expectedStats[id]) {
Expand Down

0 comments on commit 896cf3c

Please sign in to comment.