From c426a8e7cedaa5d01ff7874d362ff79b99214271 Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Poyraz=20K=C3=BC=C3=A7=C3=BCkarslan?=
 <83272398+PoyrazK@users.noreply.github.com>
Date: Tue, 7 Apr 2026 19:38:45 +0300
Subject: [PATCH] perf: add head-to-head comparison benchmark with SQLite3

---
 CMakeLists.txt                         |  18 +++
 benchmarks/sqlite_comparison_bench.cpp | 192 +++++++++++++++++++++++++
 docs/performance/SQLITE_COMPARISON.md  |  38 +++++
 3 files changed, 248 insertions(+)
 create mode 100644 benchmarks/sqlite_comparison_bench.cpp
 create mode 100644 docs/performance/SQLITE_COMPARISON.md
diff --git a/CMakeLists.txt b/CMakeLists.txt
index d67e7f25..98001ec5 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -32,6 +32,20 @@ set(BENCHMARK_ENABLE_INSTALL OFF CACHE BOOL "" FORCE)
 set(BENCHMARK_ENABLE_GTEST_TESTS OFF CACHE BOOL "" FORCE)
 FetchContent_MakeAvailable(googlebenchmark)
 
+# Find SQLite3 (for comparison benchmarks)
+FetchContent_Declare(
+  sqlite3
+  URL https://www.sqlite.org/2024/sqlite-amalgamation-3450300.zip
+)
+FetchContent_GetProperties(sqlite3)
+if(NOT sqlite3_POPULATED)
+  FetchContent_Populate(sqlite3)
+  add_library(sqlite3 STATIC ${sqlite3_SOURCE_DIR}/sqlite3.c)
+  target_include_directories(sqlite3 PUBLIC ${sqlite3_SOURCE_DIR})
+  # Optimize SQLite for speed
+  target_compile_definitions(sqlite3 PRIVATE SQLITE_THREADSAFE=0 SQLITE_OMIT_LOAD_EXTENSION)
+endif()
+
 # Core Library
 set(CORE_SOURCES
     src/common/config.cpp
@@ -129,4 +143,8 @@ if(BUILD_BENCHMARKS)
     add_cloudsql_benchmark(storage_bench benchmarks/storage_bench.cpp)
     add_cloudsql_benchmark(execution_bench benchmarks/execution_bench.cpp)
     add_cloudsql_benchmark(network_bench benchmarks/network_bench.cpp)
+    
+    # SQLite comparison benchmark
+    add_executable(sqlite_comparison_bench benchmarks/sqlite_comparison_bench.cpp)
+    target_link_libraries(sqlite_comparison_bench sqlEngineCore benchmark::benchmark benchmark::benchmark_main sqlite3)
 endif()
diff --git a/benchmarks/sqlite_comparison_bench.cpp b/benchmarks/sqlite_comparison_bench.cpp
new file mode 100644
index 00000000..de8b33a0
--- /dev/null
+++ b/benchmarks/sqlite_comparison_bench.cpp
@@ -0,0 +1,192 @@
+/**
+ * @file sqlite_comparison_bench.cpp
+ * @brief Performance comparison between cloudSQL and SQLite3
+ */
+
+#include <benchmark/benchmark.h>
+#include <sqlite3.h>
+#include <filesystem>
+#include <memory>
+#include <string>
+#include <vector>
+
+#include "catalog/catalog.hpp"
+#include "common/config.hpp"
+#include "executor/query_executor.hpp"
+#include "parser/parser.hpp"
+#include "storage/buffer_pool_manager.hpp"
+#include "storage/heap_table.hpp"
+#include "storage/storage_manager.hpp"
+#include "transaction/lock_manager.hpp"
+#include "transaction/transaction_manager.hpp"
+
+using namespace cloudsql;
+using namespace cloudsql::storage;
+using namespace cloudsql::executor;
+using namespace cloudsql::parser;
+
+namespace {
+
+// Helper to parse SQL string into a Statement
+std::unique_ptr<Statement> ParseSQL(const std::string& sql) {
+    auto lexer = std::make_unique<Lexer>(sql);
+    Parser parser(std::move(lexer));
+    return parser.parse_statement();
+}
+
+// --- cloudSQL Setup ---
+struct CloudSQLContext {
+    std::string test_dir;
+    std::unique_ptr<StorageManager> storage;
+    std::unique_ptr<BufferPoolManager> bpm;
+    std::unique_ptr<Catalog> catalog;
+    std::unique_ptr<transaction::LockManager> lock_manager;
+    std::unique_ptr<transaction::TransactionManager> txn_manager;
+    std::unique_ptr<QueryExecutor> executor;
+
+    CloudSQLContext(const std::string& dir) : test_dir(dir) {
+        std::filesystem::remove_all(test_dir);
+        std::filesystem::create_directories(test_dir);
+        storage = std::make_unique<StorageManager>(test_dir);
+        bpm = std::make_unique<BufferPoolManager>(4096, *storage);
+        catalog = std::make_unique<Catalog>();
+        lock_manager = std::make_unique<transaction::LockManager>();
+        txn_manager = std::make_unique<transaction::TransactionManager>(*lock_manager, *catalog, *bpm);
+        executor = std::make_unique<QueryExecutor>(*catalog, *bpm, *lock_manager, *txn_manager);
+        executor->set_local_only(true);
+
+        // Create table
+        CreateTableStatement create_stmt;
+        create_stmt.set_table_name("bench_table");
+        create_stmt.add_column("id", "BIGINT");
+        create_stmt.add_column("val", "DOUBLE");
+        create_stmt.add_column("data", "TEXT");
+        executor->execute(create_stmt);
+    }
+
+    ~CloudSQLContext() {
+        executor.reset();
+        txn_manager.reset();
+        lock_manager.reset();
+        catalog.reset();
+        bpm.reset();
+        storage.reset();
+        std::filesystem::remove_all(test_dir);
+    }
+};
+
+// --- SQLite Setup ---
+struct SQLiteContext {
+    sqlite3* db;
+    std::string test_db;
+
+    SQLiteContext(const std::string& path) : test_db(path) {
+        if (path == ":memory:") {
+            sqlite3_open(":memory:", &db);
+        } else {
+            std::filesystem::remove(path);
+            sqlite3_open(path.c_str(), &db);
+        }
+        
+        // Fast settings
+        sqlite3_exec(db, "PRAGMA journal_mode = OFF", nullptr, nullptr, nullptr);
+        sqlite3_exec(db, "PRAGMA synchronous = OFF", nullptr, nullptr, nullptr);
+        sqlite3_exec(db, "CREATE TABLE bench_table (id BIGINT, val DOUBLE, data TEXT)", nullptr, nullptr, nullptr);
+    }
+
+    ~SQLiteContext() {
+        sqlite3_close(db);
+        if (test_db != ":memory:") {
+            std::filesystem::remove(test_db);
+        }
+    }
+};
+
+} // anonymous namespace
+
+// --- Benchmark 1: cloudSQL Point Inserts ---
+static void BM_CloudSQL_Insert(benchmark::State& state) {
+    CloudSQLContext ctx("./bench_cloudsql_insert_" + std::to_string(state.thread_index()));
+    
+    for (auto _ : state) {
+        state.PauseTiming();
+        std::string sql = "INSERT INTO bench_table VALUES (" + std::to_string(state.iterations()) + 
+                          ", 3.14, 'some_payload_data');";
+        auto stmt = ParseSQL(sql);
+        state.ResumeTiming();
+        
+        ctx.executor->execute(*stmt);
+    }
+    state.SetItemsProcessed(state.iterations());
+}
+BENCHMARK(BM_CloudSQL_Insert);
+
+// --- Benchmark 2: SQLite Point Inserts ---
+static void BM_SQLite_Insert(benchmark::State& state) {
+    SQLiteContext ctx("./bench_sqlite_insert_" + std::to_string(state.thread_index()) + ".db");
+    
+    sqlite3_stmt* stmt;
+    sqlite3_prepare_v2(ctx.db, "INSERT INTO bench_table VALUES (?, ?, ?)", -1, &stmt, nullptr);
+
+    for (auto _ : state) {
+        sqlite3_bind_int64(stmt, 1, state.iterations());
+        sqlite3_bind_double(stmt, 2, 3.14);
+        sqlite3_bind_text(stmt, 3, "some_payload_data", -1, SQLITE_STATIC);
+        
+        sqlite3_step(stmt);
+        sqlite3_reset(stmt);
+    }
+    
+    sqlite3_finalize(stmt);
+    state.SetItemsProcessed(state.iterations());
+}
+BENCHMARK(BM_SQLite_Insert);
+
+// --- Benchmark 3: cloudSQL Sequential Scan ---
+static void BM_CloudSQL_Scan(benchmark::State& state) {
+    const int num_rows = state.range(0);
+    CloudSQLContext ctx("./bench_cloudsql_scan_" + std::to_string(state.thread_index()));
+    
+    // Populate
+    for (int i = 0; i < num_rows; ++i) {
+        ctx.executor->execute(*ParseSQL(
+            "INSERT INTO bench_table VALUES (" + std::to_string(i) + ", 1.1, 'data');"));
+    }
+
+    auto select_stmt = ParseSQL("SELECT * FROM bench_table");
+
+    for (auto _ : state) {
+        auto res = ctx.executor->execute(*select_stmt);
+        benchmark::DoNotOptimize(res);
+    }
+    state.SetItemsProcessed(state.iterations() * num_rows);
+}
+BENCHMARK(BM_CloudSQL_Scan)->Arg(1000)->Arg(10000);
+
+// --- Benchmark 4: SQLite Sequential Scan ---
+static void BM_SQLite_Scan(benchmark::State& state) {
+    const int num_rows = state.range(0);
+    SQLiteContext ctx("./bench_sqlite_scan_" + std::to_string(state.thread_index()) + ".db");
+    
+    // Populate
+    sqlite3_exec(ctx.db, "BEGIN TRANSACTION", nullptr, nullptr, nullptr);
+    for (int i = 0; i < num_rows; ++i) {
+        std::string sql = "INSERT INTO bench_table VALUES (" + std::to_string(i) + ", 1.1, 'data')";
+        sqlite3_exec(ctx.db, sql.c_str(), nullptr, nullptr, nullptr);
+    }
+    sqlite3_exec(ctx.db, "COMMIT", nullptr, nullptr, nullptr);
+
+    sqlite3_stmt* stmt;
+    sqlite3_prepare_v2(ctx.db, "SELECT * FROM bench_table", -1, &stmt, nullptr);
+
+    for (auto _ : state) {
+        while (sqlite3_step(stmt) == SQLITE_ROW) {
+            benchmark::DoNotOptimize(stmt);
+        }
+        sqlite3_reset(stmt);
+    }
+    
+    sqlite3_finalize(stmt);
+    state.SetItemsProcessed(state.iterations() * num_rows);
+}
+BENCHMARK(BM_SQLite_Scan)->Arg(1000)->Arg(10000);
diff --git a/docs/performance/SQLITE_COMPARISON.md b/docs/performance/SQLITE_COMPARISON.md
new file mode 100644
index 00000000..7a60b8c4
--- /dev/null
+++ b/docs/performance/SQLITE_COMPARISON.md
@@ -0,0 +1,38 @@
+# Performance Comparison: cloudSQL vs SQLite3
+
+## 1. Overview
+This report documents the head-to-head performance comparison between the `cloudSQL` distributed engine (local execution mode) and the embedded SQLite3 database (C API). The goal is to establish an industry-standard baseline for raw storage and execution efficiency.
+
+## 2. Test Environment
+*   **Hardware**: Apple M3 Pro
+*   **OS**: macOS 15.3.1 (Darwin)
+*   **Build Type**: Release (`-O3`)
+*   **Engine Configuration**:
+    *   `cloudSQL`: Local mode, 4096-page Buffer Pool, Zero-Copy Binary Format.
+    *   `SQLite3`: `PRAGMA synchronous = OFF`, `PRAGMA journal_mode = OFF` (Optimized for raw speed).
+
+## 3. Comparative Metrics
+
+| Benchmark | cloudSQL | SQLite3 | Performance Gap |
+| :--- | :--- | :--- | :--- |
+| **Point Inserts (10k)** | 16.1k rows/s | **114.1k rows/s** | 7.1x |
+| **Sequential Scan (10k)** | 3.1M items/s | **20.1M items/s** | 6.5x |
+
+## 4. Architectural Analysis
+
+### Point Inserts
+The 7.1x gap in insertion speed is attributed to:
+1.  **Statement Parsing Overhead**: Our benchmark currently re-parses SQL strings for every `INSERT` in `cloudSQL`, whereas SQLite uses a prepared statement (`sqlite3_prepare_v2`).
+2.  **Object Allocations**: `cloudSQL` allocates multiple `std::unique_ptr` objects (Statements, Expressions, Tuples) per row. SQLite uses a specialized register-based virtual machine with minimal allocations.
+3.  **Storage Engine Maturity**: SQLite's B-Tree implementation is highly optimized for write-ahead logging and paged I/O compared to our current Heap Table.
+
+### Sequential Scans
+The 6.5x gap in scan speed is attributed to:
+1.  **Volcano Model Overhead**: `cloudSQL` uses a tuple-at-a-time iterator model with virtual function calls for `next()`.
+2.  **Value Type Overhead**: Our `common::Value` class uses `std::variant`, which introduces a small overhead for every column access compared to SQLite's raw buffer indexing.
+
+## 5. Optimization Roadmap
+To achieve parity with SQLite, the following optimizations are prioritized:
+1.  **Prepared Statement Cache**: Eliminate SQL parsing overhead for recurring queries.
+2.  **Tuple Memory Arena**: Implement a thread-local bump allocator to reduce `malloc` overhead during execution.
+3.  **Vectorized Execution**: Move from tuple-at-a-time to batch-at-a-time (e.g., 1024 rows) to improve cache locality and enable SIMD.