diff --git a/.github/workflows/docker.yml b/.github/workflows/docker.yml index 58bcb8f1951..63d66d94da6 100644 --- a/.github/workflows/docker.yml +++ b/.github/workflows/docker.yml @@ -6,6 +6,7 @@ on: - master - staging - dev + - phoebe/hotfix/0.11.1/divide-by-zero tags: - 'v*' diff --git a/crates/core/src/db/datastore/locking_tx_datastore/tx.rs b/crates/core/src/db/datastore/locking_tx_datastore/tx.rs index deec7e1e84f..3d1f01f0415 100644 --- a/crates/core/src/db/datastore/locking_tx_datastore/tx.rs +++ b/crates/core/src/db/datastore/locking_tx_datastore/tx.rs @@ -9,6 +9,7 @@ use crate::execution_context::ExecutionContext; use spacetimedb_primitives::{ColList, TableId}; use spacetimedb_sats::AlgebraicValue; use spacetimedb_schema::schema::TableSchema; +use std::num::NonZeroU64; use std::sync::Arc; use std::{ ops::RangeBounds, @@ -68,9 +69,19 @@ impl TxId { /// The Number of Distinct Values (NDV) for a column or list of columns, /// if there's an index available on `cols`. - pub(crate) fn num_distinct_values(&self, table_id: TableId, cols: &ColList) -> Option { - self.committed_state_shared_lock - .get_table(table_id) - .and_then(|t| t.indexes.get(cols).map(|index| index.num_keys() as u64)) + /// + /// Returns `None` if: + /// - No such table as `table_id` exists. + /// - The table `table_id` does not have an index on exactly the `cols`. + /// - The table `table_id` contains zero rows. + // + // This method must never return 0, as it's used as the divisor in quotients. + // Do not change its return type to a bare `u64`. + pub(crate) fn num_distinct_values(&self, table_id: TableId, cols: &ColList) -> Option { + self.committed_state_shared_lock.get_table(table_id).and_then(|t| { + t.indexes + .get(cols) + .and_then(|index| NonZeroU64::new(index.num_keys() as u64)) + }) } } diff --git a/crates/core/src/estimation.rs b/crates/core/src/estimation.rs index 72a6f8c461e..6a94dca8d07 100644 --- a/crates/core/src/estimation.rs +++ b/crates/core/src/estimation.rs @@ -18,6 +18,8 @@ fn row_est(tx: &Tx, src: &SourceExpr, ops: &[Query]) -> u64 { // We assume a uniform distribution of keys, // which implies a selectivity = 1 / NDV, // where NDV stands for Number of Distinct Values. + // We assume that the table exists and has an index on the columns, + // so `index_row_est` will only return 0 if the table is empty. Query::IndexScan(scan) if scan.is_point() => { index_row_est(tx, scan.table.table_id, &scan.columns) } @@ -41,6 +43,8 @@ fn row_est(tx: &Tx, src: &SourceExpr, ops: &[Query]) -> u64 { Query::IndexJoin(join) => { row_est(tx, &join.probe_side.source, &join.probe_side.query) .saturating_mul( + // We assume that the table exists and has an index on the columns, + // so `index_row_est` will only return 0 if the table is empty. index_row_est(tx, src.table_id().unwrap(), &join.index_col.into()) ) } @@ -59,8 +63,15 @@ fn row_est(tx: &Tx, src: &SourceExpr, ops: &[Query]) -> u64 { /// The estimated number of rows that an index probe will return. /// Note this method is not applicable to range scans. +/// +/// Returns 0 in any case that [`Tx::num_distinct_values`] would return `None`: +/// - If there is no such table as `table_id`. +/// - If the table `table_id` does not have an index on exactly the `cols`. +/// - If the table `table_id` contains 0 rows. fn index_row_est(tx: &Tx, table_id: TableId, cols: &ColList) -> u64 { tx.num_distinct_values(table_id, cols) + // `num_distinct_values` returns `Option`, + // so this division can never panic. .map_or(0, |ndv| tx.get_row_count(table_id).unwrap_or(0) / ndv) }