Skip to content

Commit

Permalink
feat: books example
Browse files Browse the repository at this point in the history
  • Loading branch information
henrymai committed Oct 23, 2024
1 parent 6d435e4 commit d13f654
Show file tree
Hide file tree
Showing 4 changed files with 163 additions and 0 deletions.
2 changes: 2 additions & 0 deletions .github/workflows/lint-and-test.yml
Original file line number Diff line number Diff line change
Expand Up @@ -120,6 +120,8 @@ jobs:
run: cargo run --example wood_types
- name: Run dinosaurs example
run: cargo run --example dinosaurs
- name: Run books example
run: cargo run --example books
- name: Run posql_db example (With Blitzar)
run: bash crates/proof-of-sql/examples/posql_db/run_example.sh
- name: Run posql_db example (Without Blitzar)
Expand Down
4 changes: 4 additions & 0 deletions crates/proof-of-sql/Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -107,6 +107,10 @@ required-features = [ "arrow" ]
name = "dinosaurs"
required-features = [ "arrow" ]

[[example]]
name = "books"
required-features = [ "arrow" ]

[[bench]]
name = "posql_benches"
harness = false
Expand Down
21 changes: 21 additions & 0 deletions crates/proof-of-sql/examples/books/books.csv
Original file line number Diff line number Diff line change
@@ -0,0 +1,21 @@
id,title,author,publication_year,genre,rating
1,To Kill a Mockingbird,Harper Lee,1960,Fiction,4.5
2,1984,George Orwell,1949,Science Fiction,4.7
3,Pride and Prejudice,Jane Austen,1813,Romance,4.3
4,The Great Gatsby,F. Scott Fitzgerald,1925,Fiction,4.2
5,The Catcher in the Rye,J.D. Salinger,1951,Fiction,4.0
6,Moby-Dick,Herman Melville,1851,Adventure,4.1
7,The Lord of the Rings,J.R.R. Tolkien,1954,Fantasy,4.9
8,The Hobbit,J.R.R. Tolkien,1937,Fantasy,4.6
9,Brave New World,Aldous Huxley,1932,Science Fiction,4.4
10,The Hunger Games,Suzanne Collins,2008,Young Adult,4.3
11,Harry Potter and the Philosopher's Stone,J.K. Rowling,1997,Fantasy,4.8
12,The Da Vinci Code,Dan Brown,2003,Thriller,3.9
13,The Alchemist,Paulo Coelho,1988,Fiction,4.2
14,The Girl with the Dragon Tattoo,Stieg Larsson,2005,Mystery,4.1
15,The Hitchhiker's Guide to the Galaxy,Douglas Adams,1979,Science Fiction,4.5
16,The Shining,Stephen King,1977,Horror,4.3
17,Catch-22,Joseph Heller,1961,Satire,4.0
18,The Chronicles of Narnia,C.S. Lewis,1950,Fantasy,4.7
19,The Fault in Our Stars,John Green,2012,Young Adult,4.2
20,The Old Man and the Sea,Ernest Hemingway,1952,Fiction,4.1
136 changes: 136 additions & 0 deletions crates/proof-of-sql/examples/books/main.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,136 @@
//! This is a non-interactive example of using Proof of SQL with a books dataset.
//! To run this, use `cargo run --release --example books`.
//!
//! NOTE: If this doesn't work because you do not have the appropriate GPU drivers installed,
//! you can run `cargo run --release --example books --no-default-features --features="arrow cpu-perf"` instead. It will be slower for proof generation.

use arrow::datatypes::SchemaRef;
use arrow_csv::{infer_schema_from_files, ReaderBuilder};
use proof_of_sql::{
base::database::{
arrow_schema_utility::get_posql_compatible_schema, OwnedTable, OwnedTableTestAccessor,
TestAccessor,
},
proof_primitive::dory::{
DynamicDoryCommitment, DynamicDoryEvaluationProof, ProverSetup, PublicParameters,
VerifierSetup,
},
sql::{parse::QueryExpr, postprocessing::apply_postprocessing_steps, proof::QueryProof},
};
use rand::{rngs::StdRng, SeedableRng};
use std::{fs::File, time::Instant};

// We generate the public parameters and the setups used by the prover and verifier for the Dory PCS.
// The `max_nu` should be set such that the maximum table size is less than `2^(2*max_nu-1)`.
// With the value below that bound is `2^(2*8-1) = 2^15 = 32768`.
const DORY_SETUP_MAX_NU: usize = 8;
// This should be a "nothing-up-my-sleeve" phrase or number.
// It is the 32-byte seed for the `StdRng` from which `main` samples the public parameters,
// so the same seed is used on every run.
const DORY_SEED: [u8; 32] = *b"ebab60d58dee4cc69658939b7c2a582d";

/// Parses `sql`, generates a proof for it against `accessor`, verifies that proof and
/// prints the verified result.
///
/// Progress messages and the elapsed wall-clock time (in milliseconds) of the parse,
/// prove and verify steps are written to stdout. The identifier `books` is passed to
/// `QueryExpr::try_new` alongside the query (presumably as the default schema used for
/// unqualified table names; confirm against the `QueryExpr` documentation).
///
/// * `sql` - the SQL text to prove.
/// * `accessor` - table accessor shared by the parser, the prover and the verifier.
/// * `prover_setup` - Dory setup used when generating the proof.
/// * `verifier_setup` - Dory setup used when verifying the proof.
///
/// # Panics
/// Will panic if the query does not parse, the proof fails to verify, or stdout cannot
/// be flushed.
fn prove_and_verify_query(
    sql: &str,
    accessor: &OwnedTableTestAccessor<DynamicDoryEvaluationProof>,
    prover_setup: &ProverSetup,
    verifier_setup: &VerifierSetup,
) {
    // Parse the query:
    println!("Parsing the query: {sql}...");
    let now = Instant::now();
    let query_plan = QueryExpr::<DynamicDoryCommitment>::try_new(
        sql.parse().unwrap(),
        "books".parse().unwrap(),
        accessor,
    )
    .unwrap();
    println!("Done in {} ms.", now.elapsed().as_secs_f64() * 1000.);

    // Generate the proof and result:
    print!("Generating proof...");
    // stdout is line-buffered: without an explicit flush this message would only show up
    // after proof generation has already finished, defeating its purpose.
    std::io::Write::flush(&mut std::io::stdout()).expect("failed to flush stdout");
    let now = Instant::now();
    let (proof, provable_result) = QueryProof::<DynamicDoryEvaluationProof>::new(
        query_plan.proof_expr(),
        accessor,
        &prover_setup,
    );
    println!("Done in {} ms.", now.elapsed().as_secs_f64() * 1000.);

    // Verify the result with the proof:
    print!("Verifying proof...");
    // Same reasoning as above: make the progress message visible before the work starts.
    std::io::Write::flush(&mut std::io::stdout()).expect("failed to flush stdout");
    let now = Instant::now();
    let result = proof
        .verify(
            query_plan.proof_expr(),
            accessor,
            &provable_result,
            &verifier_setup,
        )
        .unwrap();
    // Post-processing is applied before the timer is read, so the reported verification
    // time includes it.
    let result = apply_postprocessing_steps(result.table, query_plan.postprocessing());
    println!("Verified in {} ms.", now.elapsed().as_secs_f64() * 1000.);

    // Display the result
    println!("Query Result:");
    println!("{result:?}");
}

/// Runs the books example end to end: builds the Dory setups from the fixed seed, loads
/// `books.csv` into a `books.books` table, then proves and verifies four sample queries.
///
/// The CSV path is relative, so the example has to be launched from the workspace root.
fn main() {
    // Deterministic Dory setup shared by every query below.
    let mut seeded_rng = StdRng::from_seed(DORY_SEED);
    let public_parameters = PublicParameters::rand(DORY_SETUP_MAX_NU, &mut seeded_rng);
    let prover_setup = ProverSetup::from(&public_parameters);
    let verifier_setup = VerifierSetup::from(&public_parameters);

    // Infer the CSV schema, then map it onto a schema Proof of SQL can work with.
    let csv_path = "./crates/proof-of-sql/examples/books/books.csv";
    let raw_schema = infer_schema_from_files(&[csv_path.to_string()], b',', None, true).unwrap();
    let schema = get_posql_compatible_schema(&SchemaRef::new(raw_schema));

    // Only the first record batch produced by the reader is loaded.
    let csv_file = File::open(csv_path).unwrap();
    let first_batch = ReaderBuilder::new(schema)
        .with_header(true)
        .build(csv_file)
        .unwrap()
        .next()
        .unwrap()
        .unwrap();

    // Load the table into an "Accessor" so that the prover and verifier can access the data/commitments.
    let mut accessor =
        OwnedTableTestAccessor::<DynamicDoryEvaluationProof>::new_empty_with_setup(&prover_setup);
    accessor.add_table(
        "books.books".parse().unwrap(),
        OwnedTable::try_from(first_batch).unwrap(),
        0,
    );

    let queries = [
        // Query 1: Count the total number of books
        "SELECT COUNT(*) AS total_books FROM books",
        // Query 2: Find the top 5 highest-rated books
        "SELECT title, author, rating FROM books ORDER BY rating DESC LIMIT 5",
        // Query 3: Count the number of books in each genre
        "SELECT genre, COUNT(*) AS book_count FROM books GROUP BY genre ORDER BY book_count DESC",
        // Query 4: Find books published after 2000 with a rating higher than 4.5
        "SELECT title, author, publication_year, rating FROM books WHERE publication_year > 2000 AND rating > 4.5",
    ];

    // Prove and verify each query in turn, in the order listed above.
    for sql in queries {
        prove_and_verify_query(sql, &accessor, &prover_setup, &verifier_setup);
    }
}

0 comments on commit d13f654

Please sign in to comment.