devrev
diff --git a/‎meerkat-browser/README.md
Lines changed: 80 additions & 6 deletions b/‎meerkat-browser/README.md
Lines changed: 80 additions & 6 deletions
diff --git a/‎meerkat-core/README.md
Lines changed: 70 additions & 6 deletions b/‎meerkat-core/README.md
Lines changed: 70 additions & 6 deletions
diff --git a/‎meerkat-dbm/README.md
Lines changed: 209 additions & 6 deletions b/‎meerkat-dbm/README.md
Lines changed: 209 additions & 6 deletions
@@ -1,11 +1,85 @@
-# meerkat-browser
+# @devrev/meerkat-browser
 
-This library was generated with [Nx](https://nx.dev).
+`@devrev/meerkat-browser` is a library for converting cube queries into SQL and executing them in a browser environment using [@duckdb/duckdb-wasm](https://github.com/duckdb/duckdb-wasm). It serves as a client-side query engine within the Meerkat ecosystem.
 
-## Building
+This package uses `@devrev/meerkat-core` to generate a DuckDB-compatible AST and `@duckdb/duckdb-wasm` to execute the resulting query against data sources available to the browser.
 
-Run `nx build meerkat-browser` to build the library.
+## Key Features
 
-## Running unit tests
+- **Cube to SQL Execution**: Translates cube queries into SQL and executes them in the browser.
+- **Browser Optimized**: Built to work seamlessly with `@duckdb/duckdb-wasm`.
+- **Client-Side Analytics**: Enables powerful, in-browser data analysis without a server round-trip.
 
-Run `nx test meerkat-browser` to execute the unit tests via [Jest](https://jestjs.io).
+## Installation
+
+```bash
+npm install @devrev/meerkat-browser @devrev/meerkat-core @duckdb/duckdb-wasm
+```
+
+`@duckdb/duckdb-wasm` is a peer dependency and should be configured according to its documentation.
+
+## Usage
+
+Here's an example of how to convert a cube query into SQL and execute it on the client side with duckdb-wasm.
+
+```typescript
+import * as duckdb from '@duckdb/duckdb-wasm';
+import { cubeQueryToSQL } from '@devrev/meerkat-browser';
+import { Query, TableSchema } from '@devrev/meerkat-core';
+
+async function main() {
+  // 1. Initialize DuckDB-WASM
+  const logger = new duckdb.ConsoleLogger();
+  const worker = new Worker(duckdb.getJsDelivrWorker());
+  const bundle = await duckdb.selectBundle(duckdb.getJsDelivrBundles());
+  const db = new duckdb.AsyncDuckDB(logger, worker);
+  await db.open(bundle);
+  const connection = await db.connect();
+
+  // 2. Define your table schemas
+  const tableSchemas: TableSchema[] = [
+    {
+      name: 'users',
+      // The SQL could point to a registered file or another data source
+      sql: 'SELECT * FROM users',
+      columns: [
+        { name: 'id', type: 'INTEGER' },
+        { name: 'name', type: 'VARCHAR' },
+        { name: 'city', type: 'VARCHAR' },
+        { name: 'signed_up_at', type: 'TIMESTAMP' },
+      ],
+    },
+  ];
+
+  // 3. Define your Cube query
+  const query: Query = {
+    measures: ['users.count'],
+    dimensions: ['users.city'],
+    filters: [
+      {
+        member: 'users.city',
+        operator: 'equals',
+        values: ['New York'],
+      },
+    ],
+    limit: 100,
+  };
+
+  // 4. Convert the query to SQL
+  const sqlQuery = await cubeQueryToSQL({
+    connection,
+    query,
+    tableSchemas,
+  });
+
+  // 5. You can now execute the generated SQL query with DuckDB
+  const result = await connection.query(sqlQuery);
+
+  console.log(
+    'Query Results:',
+    result.toArray().map((row) => row.toJSON())
+  );
+}
+
+main();
+```
@@ -1,11 +1,75 @@
-# meerkat-core
+# @devrev/meerkat-core
 
-This library was generated with [Nx](https://nx.dev).
+`@devrev/meerkat-core` is the foundational library for the Meerkat ecosystem, a TypeScript SDK that seamlessly translates Cube-like queries into DuckDB Abstract Syntax Trees (ASTs). It provides the core logic for query transformation and is designed to be environment-agnostic, running in both Node.js and browser environments.
 
-## Building
+This package focuses exclusively on generating a DuckDB-compatible AST from a JSON-based query object. It does not handle query execution, which is the responsibility of environment-specific packages like `@devrev/meerkat-node` and `@devrev/meerkat-browser`.
 
-Run `nx build meerkat-core` to build the library.
+## Key Features
 
-## Running unit tests
+- **Cube-to-AST Transformation**: Converts Cube-style JSON queries into DuckDB-compatible SQL ASTs.
+- **Environment Agnostic**: Runs in both Node.js and browser environments.
+- **Type-Safe**: Provides strong TypeScript definitions for queries, schemas, and filters.
+- **Advanced Filtering and Joins**: Supports complex filters, logical operators, and multi-table joins.
+- **Extensible by Design**: Leverages DuckDB's native JSON serialization, avoiding the limitations of traditional query builders.
 
-Run `nx test meerkat-core` to execute the unit tests via [Jest](https://jestjs.io).
+## Installation
+
+```bash
+npm install @devrev/meerkat-core
+```
+
+## Core Concepts
+
+`meerkat-core` revolves around two main objects:
+
+1.  **`Query`**: A JSON object that defines your analytics request. It specifies measures, dimensions, filters, and ordering.
+2.  **`TableSchema`**: Defines the structure of your data tables, including columns, measures, dimensions, and joins.
+
+The library uses these objects to generate a DuckDB AST. This AST can then be passed to an execution engine.
+
+## Usage
+
+Here's how to transform a Cube-style query into a DuckDB AST:
+
+```typescript
+import { cubeToDuckdbAST, Query, TableSchema } from '@devrev/meerkat-core';
+
+// 1. Define the schema for your table
+const schema: TableSchema = {
+  name: 'users',
+  sql: 'SELECT * FROM users',
+  columns: [
+    { name: 'id', type: 'INTEGER' },
+    { name: 'name', type: 'VARCHAR' },
+    { name: 'city', type: 'VARCHAR' },
+    { name: 'signed_up_at', type: 'TIMESTAMP' },
+  ],
+};
+
+// 2. Define your query
+const query: Query = {
+  measures: ['users.count'],
+  dimensions: ['users.city'],
+  filters: [
+    {
+      member: 'users.city',
+      operator: 'equals',
+      values: ['New York'],
+    },
+  ],
+  limit: 100,
+};
+
+// 3. Generate the DuckDB AST
+const ast = cubeToDuckdbAST(query, schema);
+
+// The `ast` can now be deserialized into a SQL string for execution.
+console.log(JSON.stringify(ast, null, 2));
+```
+
+## Ecosystem
+
+`meerkat-core` is the foundation for:
+
+- **`@devrev/meerkat-node`**: For server-side analytics in Node.js with `@duckdb/node-api`.
+- **`@devrev/meerkat-browser`**: For client-side analytics in the browser with `@duckdb/duckdb-wasm`.
@@ -1,11 +1,214 @@
-# meerkat-dbm
+# @devrev/meerkat-dbm
 
-This library was generated with [Nx](https://nx.dev).
+`@devrev/meerkat-dbm` is a browser-first database management layer built on [duckdb-wasm](https://github.com/duckdb/duckdb-wasm). It orchestrates query execution, manages DuckDB instances, caches files, persists data in browser storage, and optimizes memory usage to enable robust, high-performance data processing in web applications.
 
-## Building
+It's designed to bring the power of analytical SQL to the browser without compromising application stability or user experience. Whether you're building a data-intensive dashboard, an interactive reporting tool, or an offline-first application, Meerkat DBM provides the foundation you need.
 
-Run `nx build meerkat-dbm` to build the library.
+## Architecture
 
-## Running unit tests
+Meerkat DBM is composed of several key components that work together to manage data and execute queries in the browser:
 
-Run `nx test meerkat-dbm` to execute the unit tests via [Jest](https://jestjs.io).
+- **DBM (Database Manager)**: The central orchestrator. It receives queries, manages the execution lifecycle, and coordinates with other components.
+- **FileManager**: Handles all aspects of data storage and retrieval. It can manage data in-memory or persist it to IndexedDB.
+- **InstanceManager**: A user-implemented component responsible for creating, managing, and terminating `duckdb-wasm` instances.
+- **DuckDB Instances**: The underlying `duckdb-wasm` engines where queries are executed, running in the main thread or in iframes for parallelism.
+
+This modular design provides a clear separation of concerns for managing complex data workflows in the browser.
+
+## Why Meerkat DBM?
+
+While `duckdb-wasm` is incredibly powerful, using it directly in a complex web application can be challenging. Meerkat DBM provides a structured, production-ready layer that solves common problems:
+
+- **🧠 Memory Safety**: Prevents Out-Of-Memory (OOM) errors by managing query queues and memory swapping, ensuring your app remains stable even with large datasets.
+- **💾 Persistence**: Offers seamless IndexedDB storage, allowing data to persist across browser sessions.
+- **🗂️ Advanced File Management**: Simplifies handling of various file formats (Parquet, JSON, remote URLs) with intelligent caching and partitioning.
+- **⚡ Parallel Processing**: Unlocks high-performance analytics with an optional iframe-based architecture for parallel query execution, preventing UI freezes.
+
+## Key Features
+
+### 🚀 Database Management
+
+- **Instance Management**: Automated lifecycle management for DuckDB instances.
+- **Connection Pooling**: Efficient management of database connections.
+- **Query Queueing**: Intelligent scheduling of queries for sequential or parallel execution.
+- **Table Locking**: Ensures thread-safe table operations during concurrent access.
+
+### 📂 File Management
+
+- **Multiple Formats**: Native support for Parquet and JSON files.
+- **Bulk Operations**: High-performance APIs for registering and processing files in bulk.
+- **Partitioning**: Support for table partitioning to efficiently manage and query large datasets.
+- **Metadata Handling**: Rich metadata support for tables and files.
+- **Multiple Storage Modes**: Flexible storage options, including in-memory and IndexedDB.
+
+## Installation
+
+```bash
+npm install @devrev/meerkat-dbm @duckdb/duckdb-wasm
+```
+
+## Usage
+
+### 1. Implement the InstanceManager
+
+Meerkat DBM requires you to provide an `InstanceManager`. This decouples the library from a specific `duckdb-wasm` version, giving you full control over its instantiation and configuration.
+
+```typescript
+// src/instance-manager.ts
+import * as duckdb from '@duckdb/duckdb-wasm';
+import { InstanceManagerType } from '@devrev/meerkat-dbm';
+
+// Select the desired DuckDB bundle
+const JSDELIVR_BUNDLES = duckdb.getJsDelivrBundles();
+
+export class InstanceManager implements InstanceManagerType {
+  private db: duckdb.AsyncDuckDB | null = null;
+
+  private async initDB(): Promise<duckdb.AsyncDuckDB> {
+    const bundle = await duckdb.selectBundle(JSDELIVR_BUNDLES);
+
+    const worker_url = URL.createObjectURL(new Blob([`importScripts("${bundle.mainWorker!}");`], { type: 'text/javascript' }));
+
+    const worker = new Worker(worker_url);
+    const logger = { log: (msg: any) => console.log(msg) };
+    const db = new duckdb.AsyncDuckDB(logger, worker);
+
+    await db.instantiate(bundle.mainModule, bundle.pthreadWorker);
+
+    URL.revokeObjectURL(worker_url);
+    return db;
+  }
+
+  async getDB(): Promise<duckdb.AsyncDuckDB> {
+    if (!this.db) {
+      this.db = await this.initDB();
+    }
+    return this.db;
+  }
+
+  async terminateDB(): Promise<void> {
+    if (this.db) {
+      await this.db.terminate();
+      this.db = null;
+    }
+  }
+}
+```
+
+### 2. Example: Sequential Queries with Persistent Storage
+
+This example uses the `DBM` with an `IndexedDBFileManager` for safe, sequential query execution and data persistence across browser sessions.
+
+```typescript
+import { DBM, IndexedDBFileManager } from '@devrev/meerkat-dbm';
+import { InstanceManager } from './instance-manager';
+
+// 1. Create the managers
+const instanceManager = new InstanceManager();
+const fileManager = new IndexedDBFileManager({
+  instanceManager,
+  // This function is called by Meerkat to fetch file data when needed
+  fetchTableFileBuffers: async (tableName) => {
+    // In a real app, you would fetch the data from IndexedDB
+    return [];
+  },
+});
+
+// 2. Create the DBM instance
+const dbm = new DBM({
+  instanceManager,
+  fileManager,
+  onEvent: (event) => console.info('DBM Event:', event),
+  options: {
+    // Automatically shut down the DuckDB instance after 5s of inactivity
+    shutdownInactiveTime: 5000,
+  },
+});
+
+// 3. Register data
+await fileManager.registerJSON({
+  tableName: 'sales',
+  fileName: 'sales.json',
+  json: [
+    { id: 1, product: 'Laptop', amount: 1200 },
+    { id: 2, product: 'Mouse', amount: 25 },
+    { id: 3, product: 'Keyboard', amount: 75 },
+  ],
+});
+
+// 4. Run a query
+const results = await dbm.query('SELECT * FROM sales WHERE amount > 50');
+console.log(results);
+```
+
+### 3. Example: Parallel Queries with IFrame Runners
+
+This setup uses `DBMParallel` and `ParallelIndexedDBFileManager` for maximum performance, executing queries in parallel across multiple iframe-based DuckDB instances.
+
+```typescript
+import { DBMParallel, IFrameRunnerManager, ParallelIndexedDBFileManager } from '@devrev/meerkat-dbm';
+import log from 'loglevel';
+import { InstanceManager } from './instance-manager';
+
+// 1. Create instance and file managers
+const instanceManager = new InstanceManager();
+const fileManager = new ParallelIndexedDBFileManager({
+  instanceManager,
+  fetchTableFileBuffers: async (table) => [],
+  logger: log,
+});
+
+// 2. Set up the iframe runner manager for parallel execution
+const iframeManager = new IFrameRunnerManager({
+  // URL to the runner HTML file that hosts the DuckDB instance
+  runnerURL: 'http://localhost:4204/runner/indexeddb-runner.html',
+  origin: 'http://localhost:4204',
+  totalRunners: 4, // Number of parallel iframes
+  fetchTableFileBuffers: async (table) => [],
+  logger: log,
+});
+
+// 3. Create the parallel DBM instance
+const parallelDBM = new DBMParallel({
+  instanceManager,
+  fileManager,
+  iFrameRunnerManager: iframeManager,
+  logger: log,
+  options: {
+    shutdownInactiveTime: 10000,
+  },
+});
+
+// 4. Register data
+await fileManager.bulkRegisterJSON([
+  {
+    tableName: 'transactions',
+    fileName: 'transactions.json',
+    json: [
+      { id: 1, product_id: 101, amount: 1200 },
+      { id: 2, product_id: 102, amount: 25 },
+    ],
+  },
+  {
+    tableName: 'products',
+    fileName: 'products.json',
+    json: [
+      { id: 101, name: 'Laptop', category: 'Electronics' },
+      { id: 102, name: 'Mouse', category: 'Accessories' },
+    ],
+  },
+]);
+
+// 5. Execute queries in parallel
+const results = await Promise.all([
+  parallelDBM.query('SELECT * FROM transactions WHERE amount > 100'),
+  parallelDBM.query(`
+    SELECT p.category, COUNT(*) as product_count 
+    FROM transactions t 
+    JOIN products p ON t.product_id = p.id 
+    GROUP BY p.category
+  `),
+]);
+
+console.log('Query Results', results);
+```