-
Notifications
You must be signed in to change notification settings - Fork 80
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge branch 'main' into refactor/remove-get-test-accessor-and-rename…
…-vars
- Loading branch information
Showing
32 changed files
with
594 additions
and
573 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,35 @@ | ||
Country,Continent,GDP,GDPP | ||
UnitedStates,NorthAmerica,21137,63543 | ||
China,Asia,14342,10261 | ||
Japan,Asia,5081,40293 | ||
Germany,Europe,3846,46329 | ||
India,Asia,2875,2099 | ||
UnitedKingdom,Europe,2825,42330 | ||
France,Europe,2716,41463 | ||
Italy,Europe,2001,33279 | ||
Brazil,SouthAmerica,1839,8718 | ||
Canada,NorthAmerica,1643,43119 | ||
Russia,EuropeAsia,1637,11229 | ||
SouthKorea,Asia,1622,31489 | ||
Australia,Oceania,1382,53799 | ||
Spain,Europe,1316,28152 | ||
Mexico,NorthAmerica,1265,9958 | ||
Indonesia,Asia,1119,4152 | ||
Netherlands,Europe,902,52477 | ||
SaudiArabia,Asia,793,23206 | ||
Turkey,EuropeAsia,761,9005 | ||
Switzerland,Europe,703,81392 | ||
Argentina,SouthAmerica,449,9921 | ||
Sweden,Europe,528,52073 | ||
Nigeria,Africa,448,2190 | ||
Poland,Europe,594,15673 | ||
Thailand,Asia,509,7306 | ||
SouthAfrica,Africa,350,5883 | ||
Philippines,Asia,402,3685 | ||
Colombia,SouthAmerica,323,6458 | ||
Egypt,Africa,302,3012 | ||
Pakistan,Asia,278,1450 | ||
Bangladesh,Asia,302,1855 | ||
Vietnam,Asia,283,2900 | ||
Chile,SouthAmerica,252,13120 | ||
Finland,Europe,268,48888 |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,132 @@ | ||
//! This is a non-interactive example of using Proof of SQL with a countries dataset. | ||
//! To run this, use `cargo run --release --example countries`. | ||
//! | ||
//! NOTE: If this doesn't work because you do not have the appropriate GPU drivers installed, | ||
//! you can run `cargo run --release --example countries --no-default-features --features="arrow cpu-perf"` instead. It will be slower for proof generation. | ||
|
||
use arrow::datatypes::SchemaRef; | ||
use arrow_csv::{infer_schema_from_files, ReaderBuilder}; | ||
use proof_of_sql::{ | ||
base::database::{ | ||
arrow_schema_utility::get_posql_compatible_schema, OwnedTable, OwnedTableTestAccessor, | ||
TestAccessor, | ||
}, | ||
proof_primitive::dory::{ | ||
DynamicDoryCommitment, DynamicDoryEvaluationProof, ProverSetup, PublicParameters, | ||
VerifierSetup, | ||
}, | ||
sql::{parse::QueryExpr, postprocessing::apply_postprocessing_steps, proof::QueryProof}, | ||
}; | ||
use rand::{rngs::StdRng, SeedableRng}; | ||
use std::{fs::File, time::Instant}; | ||
|
||
// Size parameter for the Dory PCS: the public parameters, and from them the prover and
// verifier setups, are generated with this value.
// The `max_nu` should be set such that the maximum table size is less than `2^(2*max_nu-1)`
// (with the value below, that bound is `2^15`).
const DORY_SETUP_MAX_NU: usize = 8;
// Seed for the RNG that generates the public parameters.
// This should be a "nothing-up-my-sleeve" phrase or number.
const DORY_SEED: [u8; 32] = *b"7a1b3c8d2e4f9g6h5i0j7k2l8m3n9o1p";
|
||
/// # Panics | ||
/// Will panic if the query does not parse or the proof fails to verify. | ||
fn prove_and_verify_query( | ||
sql: &str, | ||
accessor: &OwnedTableTestAccessor<DynamicDoryEvaluationProof>, | ||
prover_setup: &ProverSetup, | ||
verifier_setup: &VerifierSetup, | ||
) { | ||
// Parse the query: | ||
println!("Parsing the query: {sql}..."); | ||
let now = Instant::now(); | ||
let query_plan = QueryExpr::<DynamicDoryCommitment>::try_new( | ||
sql.parse().unwrap(), | ||
"countries".parse().unwrap(), | ||
accessor, | ||
) | ||
.unwrap(); | ||
println!("Done in {} ms.", now.elapsed().as_secs_f64() * 1000.); | ||
|
||
// Generate the proof and result: | ||
print!("Generating proof..."); | ||
let now = Instant::now(); | ||
let (proof, provable_result) = QueryProof::<DynamicDoryEvaluationProof>::new( | ||
query_plan.proof_expr(), | ||
accessor, | ||
&prover_setup, | ||
); | ||
println!("Done in {} ms.", now.elapsed().as_secs_f64() * 1000.); | ||
|
||
// Verify the result with the proof: | ||
print!("Verifying proof..."); | ||
let now = Instant::now(); | ||
let result = proof | ||
.verify( | ||
query_plan.proof_expr(), | ||
accessor, | ||
&provable_result, | ||
&verifier_setup, | ||
) | ||
.unwrap(); | ||
let result = apply_postprocessing_steps(result.table, query_plan.postprocessing()); | ||
println!("Verified in {} ms.", now.elapsed().as_secs_f64() * 1000.); | ||
|
||
// Display the result | ||
println!("Query Result:"); | ||
println!("{result:?}"); | ||
} | ||
|
||
fn main() { | ||
let mut rng = StdRng::from_seed(DORY_SEED); | ||
let public_parameters = PublicParameters::rand(DORY_SETUP_MAX_NU, &mut rng); | ||
let prover_setup = ProverSetup::from(&public_parameters); | ||
let verifier_setup = VerifierSetup::from(&public_parameters); | ||
|
||
let filename = "./crates/proof-of-sql/examples/countries/countries_gdp.csv"; | ||
let inferred_schema = | ||
SchemaRef::new(infer_schema_from_files(&[filename.to_string()], b',', None, true).unwrap()); | ||
let posql_compatible_schema = get_posql_compatible_schema(&inferred_schema); | ||
|
||
let countries_batch = ReaderBuilder::new(posql_compatible_schema) | ||
.with_header(true) | ||
.build(File::open(filename).unwrap()) | ||
.unwrap() | ||
.next() | ||
.unwrap() | ||
.unwrap(); | ||
|
||
// Load the table into an "Accessor" so that the prover and verifier can access the data/commitments. | ||
let mut accessor = | ||
OwnedTableTestAccessor::<DynamicDoryEvaluationProof>::new_empty_with_setup(&prover_setup); | ||
accessor.add_table( | ||
"countries.countries".parse().unwrap(), | ||
OwnedTable::try_from(countries_batch).unwrap(), | ||
0, | ||
); | ||
|
||
prove_and_verify_query( | ||
"SELECT COUNT(*) AS total_countries FROM countries", | ||
&accessor, | ||
&prover_setup, | ||
&verifier_setup, | ||
); | ||
|
||
prove_and_verify_query( | ||
"SELECT country FROM countries WHERE continent = 'Asia'", | ||
&accessor, | ||
&prover_setup, | ||
&verifier_setup, | ||
); | ||
|
||
prove_and_verify_query( | ||
"SELECT country FROM countries WHERE gdp > 500 AND gdp < 1500", | ||
&accessor, | ||
&prover_setup, | ||
&verifier_setup, | ||
); | ||
|
||
prove_and_verify_query( | ||
"SELECT SUM(gdp) AS total_market_cap FROM countries WHERE country = 'China' OR country = 'India'", | ||
&accessor, | ||
&prover_setup, | ||
&verifier_setup, | ||
); | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
File renamed without changes.
79 changes: 79 additions & 0 deletions
79
crates/proof-of-sql/src/base/arrow/column_arrow_conversions.rs
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,79 @@ | ||
use crate::base::{ | ||
database::{ColumnField, ColumnType}, | ||
math::decimal::Precision, | ||
}; | ||
use alloc::sync::Arc; | ||
use arrow::datatypes::{DataType, Field, TimeUnit as ArrowTimeUnit}; | ||
use proof_of_sql_parser::posql_time::{PoSQLTimeUnit, PoSQLTimeZone}; | ||
|
||
/// Convert [`ColumnType`] values to some arrow [`DataType`] | ||
impl From<&ColumnType> for DataType { | ||
fn from(column_type: &ColumnType) -> Self { | ||
match column_type { | ||
ColumnType::Boolean => DataType::Boolean, | ||
ColumnType::TinyInt => DataType::Int8, | ||
ColumnType::SmallInt => DataType::Int16, | ||
ColumnType::Int => DataType::Int32, | ||
ColumnType::BigInt => DataType::Int64, | ||
ColumnType::Int128 => DataType::Decimal128(38, 0), | ||
ColumnType::Decimal75(precision, scale) => { | ||
DataType::Decimal256(precision.value(), *scale) | ||
} | ||
ColumnType::VarChar => DataType::Utf8, | ||
ColumnType::Scalar => unimplemented!("Cannot convert Scalar type to arrow type"), | ||
ColumnType::TimestampTZ(timeunit, timezone) => { | ||
let arrow_timezone = Some(Arc::from(timezone.to_string())); | ||
let arrow_timeunit = match timeunit { | ||
PoSQLTimeUnit::Second => ArrowTimeUnit::Second, | ||
PoSQLTimeUnit::Millisecond => ArrowTimeUnit::Millisecond, | ||
PoSQLTimeUnit::Microsecond => ArrowTimeUnit::Microsecond, | ||
PoSQLTimeUnit::Nanosecond => ArrowTimeUnit::Nanosecond, | ||
}; | ||
DataType::Timestamp(arrow_timeunit, arrow_timezone) | ||
} | ||
} | ||
} | ||
} | ||
|
||
/// Convert arrow [`DataType`] values to some [`ColumnType`] | ||
impl TryFrom<DataType> for ColumnType { | ||
type Error = String; | ||
|
||
fn try_from(data_type: DataType) -> Result<Self, Self::Error> { | ||
match data_type { | ||
DataType::Boolean => Ok(ColumnType::Boolean), | ||
DataType::Int8 => Ok(ColumnType::TinyInt), | ||
DataType::Int16 => Ok(ColumnType::SmallInt), | ||
DataType::Int32 => Ok(ColumnType::Int), | ||
DataType::Int64 => Ok(ColumnType::BigInt), | ||
DataType::Decimal128(38, 0) => Ok(ColumnType::Int128), | ||
DataType::Decimal256(precision, scale) if precision <= 75 => { | ||
Ok(ColumnType::Decimal75(Precision::new(precision)?, scale)) | ||
} | ||
DataType::Timestamp(time_unit, timezone_option) => { | ||
let posql_time_unit = match time_unit { | ||
ArrowTimeUnit::Second => PoSQLTimeUnit::Second, | ||
ArrowTimeUnit::Millisecond => PoSQLTimeUnit::Millisecond, | ||
ArrowTimeUnit::Microsecond => PoSQLTimeUnit::Microsecond, | ||
ArrowTimeUnit::Nanosecond => PoSQLTimeUnit::Nanosecond, | ||
}; | ||
Ok(ColumnType::TimestampTZ( | ||
posql_time_unit, | ||
PoSQLTimeZone::try_from(&timezone_option)?, | ||
)) | ||
} | ||
DataType::Utf8 => Ok(ColumnType::VarChar), | ||
_ => Err(format!("Unsupported arrow data type {data_type:?}")), | ||
} | ||
} | ||
} | ||
/// Convert [`ColumnField`] values to arrow Field | ||
impl From<&ColumnField> for Field { | ||
fn from(column_field: &ColumnField) -> Self { | ||
Field::new( | ||
column_field.name().name(), | ||
(&column_field.data_type()).into(), | ||
false, | ||
) | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,26 @@ | ||
//! This module provides conversions and utilities for working with Arrow data structures. | ||
|
||
/// Module for handling conversion from Arrow arrays to columns. | ||
pub mod arrow_array_to_column_conversion; | ||
|
||
/// Module for converting between owned and Arrow data structures. | ||
pub mod owned_and_arrow_conversions; | ||
|
||
#[cfg(test)] | ||
/// Tests for owned and Arrow conversions. | ||
mod owned_and_arrow_conversions_test; | ||
|
||
/// Module for converting record batches. | ||
pub mod record_batch_conversion; | ||
|
||
/// Module for record batch error definitions. | ||
pub mod record_batch_errors; | ||
|
||
/// Utility functions for record batches. | ||
pub mod record_batch_utility; | ||
|
||
/// Module for scalar and i256 conversions. | ||
pub mod scalar_and_i256_conversions; | ||
|
||
/// Module for handling conversions between columns and Arrow arrays. | ||
pub mod column_arrow_conversions; |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
4 changes: 2 additions & 2 deletions
4
...abase/owned_and_arrow_conversions_test.rs → ...arrow/owned_and_arrow_conversions_test.rs
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.