queryer merger test progress: add a MockExecutor test double, split DatabaseExecutor into an executors module, and rework stem collection into a per-schema jump table

This commit is contained in:
2026-03-11 05:18:01 -04:00
parent 1c08a8f2b8
commit 44be75f5d4
104 changed files with 22563 additions and 18859 deletions

View File

@ -0,0 +1,64 @@
use crate::database::executors::DatabaseExecutor;
use serde_json::Value;
#[cfg(test)]
use std::sync::Mutex;
#[cfg(test)]
pub struct MockExecutor {
pub query_responses: Mutex<Vec<Result<Value, String>>>,
pub execute_responses: Mutex<Vec<Result<(), String>>>,
pub captured_queries: Mutex<Vec<String>>,
}
#[cfg(test)]
impl MockExecutor {
    /// Creates an empty mock: no scripted responses and no captured SQL.
    pub fn new() -> Self {
        Self {
            query_responses: Mutex::new(Vec::new()),
            execute_responses: Mutex::new(Vec::new()),
            captured_queries: Mutex::new(Vec::new()),
        }
    }
}

// `new()` takes no arguments, so `Default` should exist as well
// (clippy::new_without_default); it simply delegates to `new`.
#[cfg(test)]
impl Default for MockExecutor {
    fn default() -> Self {
        Self::new()
    }
}
#[cfg(test)]
impl DatabaseExecutor for MockExecutor {
    /// Logs and captures the SQL, then yields the next scripted query result.
    /// When the script has run dry, answers with an empty JSON array.
    fn query(&self, sql: &str, _args: Option<&[Value]>) -> Result<Value, String> {
        println!("DEBUG SQL QUERY: {}", sql);
        self.captured_queries.lock().unwrap().push(sql.to_string());
        let mut scripted = self.query_responses.lock().unwrap();
        if scripted.is_empty() {
            Ok(Value::Array(vec![]))
        } else {
            scripted.remove(0)
        }
    }

    /// Logs and captures the SQL, then yields the next scripted execute result.
    /// When the script has run dry, answers with success.
    fn execute(&self, sql: &str, _args: Option<&[Value]>) -> Result<(), String> {
        println!("DEBUG SQL EXECUTE: {}", sql);
        self.captured_queries.lock().unwrap().push(sql.to_string());
        let mut scripted = self.execute_responses.lock().unwrap();
        if scripted.is_empty() {
            Ok(())
        } else {
            scripted.remove(0)
        }
    }

    /// Fixed nil-UUID user id so tests are deterministic.
    fn auth_user_id(&self) -> Result<String, String> {
        Ok("00000000-0000-0000-0000-000000000000".to_string())
    }

    /// Fixed timestamp so tests are deterministic.
    fn timestamp(&self) -> Result<String, String> {
        Ok("2026-03-10T00:00:00Z".to_string())
    }

    /// Snapshot of every SQL string seen so far, in call order.
    #[cfg(test)]
    fn get_queries(&self) -> Vec<String> {
        self.captured_queries.lock().unwrap().to_vec()
    }

    /// Forgets all captured SQL (scripted responses are left untouched).
    #[cfg(test)]
    fn reset_mocks(&self) {
        self.captured_queries.lock().unwrap().clear();
    }
}

View File

@ -0,0 +1,28 @@
pub mod mock;
#[cfg(not(test))]
pub mod pgrx;
use serde_json::Value;
/// An abstraction over database execution to allow for isolated unit testing
/// without a live Postgres SPI connection.
pub trait DatabaseExecutor: Send + Sync {
/// Executes a query expecting a single JSONB return, representing rows.
fn query(&self, sql: &str, args: Option<&[Value]>) -> Result<Value, String>;
/// Executes an operation (INSERT, UPDATE, DELETE, or pg_notify) that does not return rows.
fn execute(&self, sql: &str, args: Option<&[Value]>) -> Result<(), String>;
/// Returns the current authenticated user's ID
fn auth_user_id(&self) -> Result<String, String>;
/// Returns the current transaction timestamp
fn timestamp(&self) -> Result<String, String>;
#[cfg(test)]
fn get_queries(&self) -> Vec<String>;
#[cfg(test)]
fn reset_mocks(&self);
}

View File

@ -1,22 +1,7 @@
use crate::database::executors::DatabaseExecutor;
use pgrx::prelude::*;
use serde_json::Value;
/// An abstraction over database execution to allow for isolated unit testing
/// without a live Postgres SPI connection.
pub trait DatabaseExecutor: Send + Sync {
/// Executes a query expecting a single JSONB return, representing rows.
fn query(&self, sql: &str, args: Option<&[Value]>) -> Result<Value, String>;
/// Executes an operation (INSERT, UPDATE, DELETE, or pg_notify) that does not return rows.
fn execute(&self, sql: &str, args: Option<&[Value]>) -> Result<(), String>;
/// Returns the current authenticated user's ID
fn auth_user_id(&self) -> Result<String, String>;
/// Returns the current transaction timestamp
fn timestamp(&self) -> Result<String, String>;
}
/// The production executor that wraps `pgrx::spi::Spi`.
pub struct SpiExecutor;

View File

@ -1,5 +1,5 @@
pub mod r#enum;
pub mod executor;
pub mod executors;
pub mod formats;
pub mod page;
pub mod punc;
@ -7,14 +7,26 @@ pub mod relation;
pub mod schema;
pub mod r#type;
use crate::database::r#enum::Enum;
use crate::database::executor::{DatabaseExecutor, SpiExecutor};
use crate::database::punc::{Punc, Stem};
use crate::database::relation::Relation;
use crate::database::schema::Schema;
use crate::database::r#type::Type;
// External mock exports inside the executor sub-folder
use r#enum::Enum;
use executors::DatabaseExecutor;
#[cfg(not(test))]
use executors::pgrx::SpiExecutor;
#[cfg(test)]
use executors::mock::MockExecutor;
pub mod stem;
use punc::Punc;
use relation::Relation;
use schema::Schema;
use serde_json::Value;
use std::collections::{HashMap, HashSet};
use std::sync::Arc;
use stem::Stem;
use r#type::Type;
pub struct Database {
pub enums: HashMap<String, Enum>,
@ -22,22 +34,28 @@ pub struct Database {
pub puncs: HashMap<String, Punc>,
pub relations: HashMap<String, Relation>,
pub schemas: HashMap<String, Schema>,
// Map of Schema ID -> { Entity Type -> Target Subschema Arc }
pub stems: HashMap<String, HashMap<String, Arc<Stem>>>,
pub descendants: HashMap<String, Vec<String>>,
pub depths: HashMap<String, usize>,
pub executor: Box<dyn DatabaseExecutor + Send + Sync>,
}
impl Database {
pub fn new(val: &serde_json::Value) -> Self {
pub fn new(val: &serde_json::Value) -> Result<Self, crate::drop::Drop> {
let mut db = Self {
enums: HashMap::new(),
types: HashMap::new(),
relations: HashMap::new(),
puncs: HashMap::new(),
schemas: HashMap::new(),
stems: HashMap::new(),
descendants: HashMap::new(),
depths: HashMap::new(),
#[cfg(not(test))]
executor: Box::new(SpiExecutor::new()),
#[cfg(test)]
executor: Box::new(MockExecutor::new()),
};
if let Some(arr) = val.get("enums").and_then(|v| v.as_array()) {
@ -86,8 +104,8 @@ impl Database {
}
}
let _ = db.compile();
db
db.compile()?;
Ok(db)
}
/// Override the default executor for unit testing
@ -117,12 +135,12 @@ impl Database {
}
/// Organizes the graph of the database, compiling regex, format functions, and caching relationships.
fn compile(&mut self) -> Result<(), String> {
pub fn compile(&mut self) -> Result<(), crate::drop::Drop> {
self.collect_schemas();
self.collect_depths();
self.collect_descendants();
self.compile_schemas();
self.collect_stems();
self.collect_stems()?;
Ok(())
}
@ -229,88 +247,78 @@ impl Database {
}
}
fn collect_stems(&mut self) {
let mut st_map: HashMap<String, Vec<Stem>> = HashMap::new();
for (name, _) in &self.puncs {
let mut stems = Vec::new();
let response_id = format!("{}.response", name);
if let Some(resp_schema) = self.schemas.get(&response_id) {
fn collect_stems(&mut self) -> Result<(), crate::drop::Drop> {
let mut db_stems: HashMap<String, HashMap<String, Arc<Stem>>> = HashMap::new();
let mut errors: Vec<crate::drop::Error> = Vec::new();
let schema_ids: Vec<String> = self.schemas.keys().cloned().collect();
for schema_id in schema_ids {
if let Some(schema) = self.schemas.get(&schema_id) {
let mut inner_map = HashMap::new();
Self::discover_stems(
&self.types,
&self.schemas,
&self.relations,
&response_id,
resp_schema,
self,
&schema_id,
schema,
String::from(""),
None,
None,
&mut stems,
&mut inner_map,
&mut errors,
);
}
st_map.insert(name.clone(), stems);
}
for (name, stems) in st_map {
if let Some(p) = self.puncs.get_mut(&name) {
p.stems = stems;
if !inner_map.is_empty() {
println!("SCHEMA: {} STEMS: {:?}", schema_id, inner_map.keys());
db_stems.insert(schema_id, inner_map);
}
}
}
self.stems = db_stems;
if !errors.is_empty() {
return Err(crate::drop::Drop::with_errors(errors));
}
Ok(())
}
fn discover_stems(
types: &HashMap<String, Type>,
schemas: &HashMap<String, Schema>,
relations: &HashMap<String, Relation>,
_schema_id: &str,
db: &Database,
root_schema_id: &str,
schema: &Schema,
current_path: String,
mut current_path: String,
parent_type: Option<String>,
property_name: Option<String>,
stems: &mut Vec<Stem>,
inner_map: &mut HashMap<String, Arc<Stem>>,
errors: &mut Vec<crate::drop::Error>,
) {
let mut is_entity = false;
let mut entity_type = String::new();
// Check if this schema resolves to an Entity
let mut current_ref = schema.obj.r#ref.clone();
let mut depth = 0;
while let Some(r) = current_ref {
if types.contains_key(&r) {
is_entity = true;
entity_type = r.clone();
break;
}
if let Some(s) = schemas.get(&r) {
current_ref = s.obj.r#ref.clone();
} else {
break;
}
depth += 1;
if depth > 20 {
break;
} // prevent infinite loop
let mut examine_id = None;
if let Some(ref r) = schema.obj.r#ref {
examine_id = Some(r.clone());
} else if let Some(ref id) = schema.obj.id {
examine_id = Some(id.clone());
}
if is_entity {
let final_path = if current_path.is_empty() {
"/".to_string()
} else {
current_path.clone()
};
if let Some(target) = examine_id {
let parts: Vec<&str> = target.split('.').collect();
if let Some(last_seg) = parts.last() {
if db.types.contains_key(*last_seg) {
is_entity = true;
entity_type = last_seg.to_string();
}
}
}
let mut relation_col = None;
let mut relation_col = None;
if is_entity {
if let (Some(pt), Some(prop)) = (&parent_type, &property_name) {
let expected_col = format!("{}_id", prop);
let mut found = false;
// Try to find the exact relation from the database schema
for rel in relations.values() {
if rel.source_type == *pt && rel.destination_type == entity_type {
if rel.source_columns.contains(&expected_col) {
relation_col = Some(expected_col.clone());
found = true;
break;
}
} else if rel.source_type == entity_type && rel.destination_type == *pt {
for rel in db.relations.values() {
if (rel.source_type == *pt && rel.destination_type == entity_type)
|| (rel.source_type == entity_type && rel.destination_type == *pt)
{
if rel.source_columns.contains(&expected_col) {
relation_col = Some(expected_col.clone());
found = true;
@ -318,64 +326,128 @@ impl Database {
}
}
}
if !found {
// Fallback guess if explicit matching fails
relation_col = Some(expected_col);
}
}
stems.push(Stem {
path: final_path,
let stem = Stem {
r#type: entity_type.clone(),
relation: relation_col,
});
schema: Arc::new(schema.clone()),
};
let mut branch_path = current_path.clone();
if !current_path.is_empty() {
branch_path = format!("{}/{}", current_path, entity_type);
}
if inner_map.contains_key(&branch_path) {
errors.push(crate::drop::Error {
code: "STEM_COLLISION".to_string(),
message: format!("The stem path `{}` resolves to multiple Entity boundaries. This usually occurs during un-wrapped $family or oneOf polymorphic schemas where multiple Entities are directly assigned to the same property. To fix this, encapsulate the polymorphic branch.", branch_path),
details: crate::drop::ErrorDetails {
path: root_schema_id.to_string(),
},
});
}
inner_map.insert(branch_path.clone(), Arc::new(stem));
// Update current_path for structural children
current_path = branch_path;
}
// Pass the new parent downwards
let next_parent = if is_entity {
Some(entity_type.clone())
} else {
parent_type.clone()
};
// Properties branch
if let Some(props) = &schema.obj.properties {
for (k, v) in props {
let next_path = format!(
"{}/{}",
if current_path.is_empty() {
""
} else {
&current_path
},
k
);
// Bypass target and source properties if we are in a relationship
if let Some(parent_str) = &next_parent {
if let Some(pt) = db.types.get(parent_str) {
if pt.relationship && (k == "target" || k == "source") {
Self::discover_stems(
db,
root_schema_id,
v,
current_path.clone(),
next_parent.clone(),
Some(k.clone()),
inner_map,
errors,
);
continue;
}
}
}
// Standard Property Pathing
let next_path = if current_path.is_empty() {
k.clone()
} else {
format!("{}/{}", current_path, k)
};
Self::discover_stems(
types,
schemas,
relations,
"",
db,
root_schema_id,
v,
next_path,
next_parent.clone(),
Some(k.clone()),
stems,
inner_map,
errors,
);
}
}
// Array Item branch
if let Some(items) = &schema.obj.items {
Self::discover_stems(
types,
schemas,
relations,
"",
db,
root_schema_id,
items,
current_path.clone(),
next_parent.clone(),
property_name.clone(),
stems,
inner_map,
errors,
);
}
// Polymorphism branch
if let Some(arr) = &schema.obj.one_of {
for v in arr {
Self::discover_stems(
db,
root_schema_id,
v.as_ref(),
current_path.clone(),
next_parent.clone(),
property_name.clone(),
inner_map,
errors,
);
}
}
if let Some(arr) = &schema.obj.all_of {
for v in arr {
Self::discover_stems(
db,
root_schema_id,
v.as_ref(),
current_path.clone(),
next_parent.clone(),
property_name.clone(),
inner_map,
errors,
);
}
}
}
}

View File

@ -2,14 +2,6 @@ use crate::database::page::Page;
use crate::database::schema::Schema;
use serde::{Deserialize, Serialize};
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct Stem {
pub path: String,
pub r#type: String,
#[serde(skip_serializing_if = "Option::is_none")]
pub relation: Option<String>,
}
#[derive(Debug, Clone, Serialize, Deserialize, Default)]
#[serde(default)]
pub struct Punc {
@ -25,6 +17,4 @@ pub struct Punc {
pub page: Option<Page>,
#[serde(default)]
pub schemas: Vec<Schema>,
#[serde(default)]
pub stems: Vec<Stem>,
}

View File

@ -5,6 +5,14 @@ use std::sync::Arc;
// Schema mirrors the Go Punc Generator's schema struct for consistency.
// It is an order-preserving representation of a JSON Schema.
/// Deserializes a value and always wraps it in `Some`, so a field that is
/// explicitly present — even as JSON `null` — comes back as `Some(value)`,
/// while an absent field takes the container's `#[serde(default)]` of `None`.
/// Used via `#[serde(deserialize_with = "...")]` on optional keyword fields
/// such as `const`.
pub fn deserialize_some<'de, D>(deserializer: D) -> Result<Option<Value>, D::Error>
where
    D: serde::Deserializer<'de>,
{
    Value::deserialize(deserializer).map(Some)
}
#[derive(Debug, Clone, Serialize, Deserialize, Default)]
pub struct SchemaObject {
// Core Schema Keywords
@ -79,7 +87,7 @@ pub struct SchemaObject {
#[serde(
default,
rename = "const",
deserialize_with = "crate::validator::util::deserialize_some"
deserialize_with = "crate::database::schema::deserialize_some"
)]
pub const_: Option<Value>,
@ -96,8 +104,6 @@ pub struct SchemaObject {
// Combining Keywords
#[serde(rename = "allOf")]
pub all_of: Option<Vec<Arc<Schema>>>,
#[serde(rename = "anyOf")]
pub any_of: Option<Vec<Arc<Schema>>>,
#[serde(rename = "oneOf")]
pub one_of: Option<Vec<Arc<Schema>>>,
#[serde(rename = "not")]
@ -238,9 +244,6 @@ impl Schema {
if let Some(arr) = &mut self.obj.all_of {
map_arr(arr);
}
if let Some(arr) = &mut self.obj.any_of {
map_arr(arr);
}
if let Some(arr) = &mut self.obj.one_of {
map_arr(arr);
}
@ -300,7 +303,6 @@ impl<'de> Deserialize<'de> for Schema {
&& obj.enum_.is_none()
&& obj.const_.is_none()
&& obj.all_of.is_none()
&& obj.any_of.is_none()
&& obj.one_of.is_none()
&& obj.not.is_none()
&& obj.if_.is_none()

17
src/database/stem.rs Normal file
View File

@ -0,0 +1,17 @@
use crate::database::schema::Schema;
use serde::{Deserialize, Serialize};
use std::sync::Arc;
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct Stem {
pub r#type: String,
#[serde(skip_serializing_if = "Option::is_none")]
pub relation: Option<String>,
// The actual database schema node mapping for
// O(1) jump table execution for queryer.
//
// Automatically skipped from `jspg_stems()` JSON payload output.
#[serde(skip)]
pub schema: Arc<Schema>,
}