From a910d24d2e68156c66395bc24c2e3abb55bfece4 Mon Sep 17 00:00:00 2001 From: Duckki Oe Date: Fri, 13 Dec 2024 10:59:55 -0800 Subject: [PATCH] feat(federation): started query plan correctness checker - implemented ResponseShape computation from an operation --- apollo-federation/cli/src/main.rs | 11 +- .../src/query_plan/correctness/mod.rs | 23 + .../query_plan/correctness/response_shape.rs | 913 ++++++++++++++++++ .../correctness/response_shape_test.rs | 518 ++++++++++ apollo-federation/src/query_plan/mod.rs | 1 + 5 files changed, 1462 insertions(+), 4 deletions(-) create mode 100644 apollo-federation/src/query_plan/correctness/mod.rs create mode 100644 apollo-federation/src/query_plan/correctness/response_shape.rs create mode 100644 apollo-federation/src/query_plan/correctness/response_shape_test.rs diff --git a/apollo-federation/cli/src/main.rs b/apollo-federation/cli/src/main.rs index c89afb689cf..58a0873c6f8 100644 --- a/apollo-federation/cli/src/main.rs +++ b/apollo-federation/cli/src/main.rs @@ -248,10 +248,13 @@ fn cmd_plan( let query_doc = ExecutableDocument::parse_and_validate(planner.api_schema().schema(), query, query_path)?; - print!( - "{}", - planner.build_query_plan(&query_doc, None, Default::default())? - ); + let query_plan = planner.build_query_plan(&query_doc, None, Default::default())?; + println!("{query_plan}"); + apollo_federation::query_plan::correctness::check_plan( + planner.api_schema(), + &query_doc, + &query_plan, + )?; Ok(()) } diff --git a/apollo-federation/src/query_plan/correctness/mod.rs b/apollo-federation/src/query_plan/correctness/mod.rs new file mode 100644 index 00000000000..11cdd771edd --- /dev/null +++ b/apollo-federation/src/query_plan/correctness/mod.rs @@ -0,0 +1,23 @@ +pub mod response_shape; +#[cfg(test)] +pub mod response_shape_test; + +use apollo_compiler::validation::Valid; +use apollo_compiler::ExecutableDocument; + +use crate::query_plan::QueryPlan; +use crate::schema::ValidFederationSchema; +use crate::FederationError; + +//================================================================================================== +// check_plan + +pub fn check_plan( + schema: &ValidFederationSchema, + operation_doc: &Valid, + _plan: &QueryPlan, +) -> Result<(), FederationError> { + let rs = response_shape::compute_response_shape(operation_doc, schema)?; + println!("\nResponse shape from operation:\n{rs}"); + Ok(()) +} diff --git a/apollo-federation/src/query_plan/correctness/response_shape.rs b/apollo-federation/src/query_plan/correctness/response_shape.rs new file mode 100644 index 00000000000..caaabac9134 --- /dev/null +++ b/apollo-federation/src/query_plan/correctness/response_shape.rs @@ -0,0 +1,913 @@ +use std::fmt; +use std::sync::Arc; + +use apollo_compiler::ast; +use apollo_compiler::collections::IndexMap; +use apollo_compiler::collections::IndexSet; +use apollo_compiler::executable::Field; +use apollo_compiler::executable::Fragment; +use apollo_compiler::executable::Selection; +use apollo_compiler::executable::SelectionSet; +use apollo_compiler::validation::Valid; +use apollo_compiler::ExecutableDocument; +use apollo_compiler::Name; +use apollo_compiler::Node; + +use crate::bail; +use crate::display_helpers; +use crate::internal_error; +use crate::schema::position::CompositeTypeDefinitionPosition; +use crate::schema::position::InterfaceTypeDefinitionPosition; +use crate::schema::position::ObjectTypeDefinitionPosition; +use crate::schema::ValidFederationSchema; +use crate::utils::FallibleIterator; +use crate::FederationError; + +//================================================================================================== +// Vec utilities + +fn vec_sorted_by(src: &[T], compare: impl Fn(&T, &T) -> std::cmp::Ordering) -> Vec { + let mut sorted = src.to_owned(); + sorted.sort_by(&compare); + sorted +} + +//================================================================================================== +// Type conditions + +fn get_interface_implementers<'a>( + interface: &InterfaceTypeDefinitionPosition, + schema: &'a ValidFederationSchema, +) -> Result<&'a IndexSet, FederationError> { + Ok(&schema + .referencers() + .get_interface_type(&interface.type_name)? + .object_types) +} + +/// Does `x` implies `y`? (`x`'s possible types is a subset of `y`'s possible types) +/// - All type-definition positions are in the API schema. +// Note: Similar to `runtime_types_intersect` (avoids using `possible_runtime_types`) +fn runtime_types_implies( + x: &CompositeTypeDefinitionPosition, + y: &CompositeTypeDefinitionPosition, + schema: &ValidFederationSchema, +) -> Result { + use CompositeTypeDefinitionPosition::*; + match (x, y) { + (Object(x), Object(y)) => Ok(x == y), + (Object(object), Union(union)) => { + // Union members must be object types in GraphQL. + let union_type = union.get(schema.schema())?; + Ok(union_type.members.contains(&object.type_name)) + } + (Union(union), Object(object)) => { + // Is `object` the only member of `union`? + let union_type = union.get(schema.schema())?; + Ok(union_type.members.len() == 1 && union_type.members.contains(&object.type_name)) + } + (Object(object), Interface(interface)) => { + // Interface implementers must be object types in GraphQL. + let interface_implementers = get_interface_implementers(interface, schema)?; + Ok(interface_implementers.contains(object)) + } + (Interface(interface), Object(object)) => { + // Is `object` the only implementer of `interface`? + let interface_implementers = get_interface_implementers(interface, schema)?; + Ok(interface_implementers.len() == 1 && interface_implementers.contains(object)) + } + + (Union(x), Union(y)) if x == y => Ok(true), + (Union(x), Union(y)) => { + let (x, y) = (x.get(schema.schema())?, y.get(schema.schema())?); + Ok(x.members.is_subset(&y.members)) + } + + (Interface(x), Interface(y)) if x == y => Ok(true), + (Interface(x), Interface(y)) => { + let x = get_interface_implementers(x, schema)?; + let y = get_interface_implementers(y, schema)?; + Ok(x.is_subset(y)) + } + + (Union(union), Interface(interface)) => { + let union = union.get(schema.schema())?; + let interface_implementers = get_interface_implementers(interface, schema)?; + Ok(union.members.iter().all(|m| { + let m_ty = ObjectTypeDefinitionPosition::new(m.name.clone()); + interface_implementers.contains(&m_ty) + })) + } + (Interface(interface), Union(union)) => { + let interface_implementers = get_interface_implementers(interface, schema)?; + let union = union.get(schema.schema())?; + Ok(interface_implementers + .iter() + .all(|t| union.members.contains(&t.type_name))) + } + } +} + +/// Constructs a set of object types +/// - Slow: calls `possible_runtime_types` and sorts the result. +fn get_ground_types( + ty: &CompositeTypeDefinitionPosition, + schema: &ValidFederationSchema, +) -> Result, FederationError> { + let mut result = schema.possible_runtime_types(ty.clone())?; + result.sort_by(|a, b| a.type_name.cmp(&b.type_name)); + Ok(result.into_iter().collect()) +} + +/// A sequence of type conditions applied (used for display) +// - The vector must be non-empty. +#[derive(Debug, Clone)] +struct AppliedTypeCondition(Vec); + +impl fmt::Display for AppliedTypeCondition { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + for (i, cond) in self.0.iter().enumerate() { + if i > 0 { + write!(f, " ∧ ")?; + } + write!(f, "{}", cond.type_name())?; + } + Ok(()) + } +} + +impl AppliedTypeCondition { + fn new(ty: CompositeTypeDefinitionPosition) -> Self { + AppliedTypeCondition(vec![ty]) + } + + /// Construct a new type condition with a named type condition added. + fn add_type_name( + &self, + name: Name, + schema: &ValidFederationSchema, + ) -> Result { + let ty: CompositeTypeDefinitionPosition = schema.get_type(name)?.try_into()?; + if self + .0 + .iter() + .fallible_any(|t| runtime_types_implies(t, &ty, schema))? + { + return Ok(self.clone()); + } + // filter out existing conditions that are implied by `ty`. + let mut buf = Vec::new(); + for t in &self.0 { + if !runtime_types_implies(&ty, t, schema)? { + buf.push(t.clone()); + } + } + buf.push(ty); + buf.sort_by(|a, b| a.type_name().cmp(b.type_name())); + Ok(AppliedTypeCondition(buf)) + } +} + +#[derive(Debug, Clone)] +struct NormalizedTypeCondition { + // The set of object types that are used for comparison. + // - The ground_set must be non-empty. + // - The ground_set must be sorted by type name. + ground_set: Vec, + + // Simplified type condition for display. + for_display: AppliedTypeCondition, +} + +impl PartialEq for NormalizedTypeCondition { + fn eq(&self, other: &Self) -> bool { + self.ground_set == other.ground_set + } +} + +impl Eq for NormalizedTypeCondition {} + +impl fmt::Display for NormalizedTypeCondition { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + write!(f, "{}", self.for_display)?; + if self.for_display.0.len() > 1 { + write!(f, " = {{")?; + for (i, ty) in self.ground_set.iter().enumerate() { + if i > 0 { + write!(f, ", ")?; + } + write!(f, "{}", ty.type_name)?; + } + write!(f, "}}")?; + } + Ok(()) + } +} + +impl std::hash::Hash for NormalizedTypeCondition { + fn hash(&self, state: &mut H) { + self.ground_set.hash(state); + } +} + +impl NormalizedTypeCondition { + /// Construct a new type condition with a single named type condition. + fn from_type_name(name: Name, schema: &ValidFederationSchema) -> Result { + let ty: CompositeTypeDefinitionPosition = schema.get_type(name)?.try_into()?; + Ok(NormalizedTypeCondition { + ground_set: get_ground_types(&ty, schema)?, + for_display: AppliedTypeCondition::new(ty), + }) + } + + /// Construct a new type condition with a named type condition added. + fn add_type_name( + &self, + name: Name, + schema: &ValidFederationSchema, + ) -> Result, FederationError> { + let other_ty: CompositeTypeDefinitionPosition = + schema.get_type(name.clone())?.try_into()?; + let other_types = get_ground_types(&other_ty, schema)?; + let ground_set: Vec = self + .ground_set + .iter() + .filter(|t| other_types.contains(t)) + .cloned() + .collect(); + if ground_set.is_empty() { + // Unsatisfiable condition + Ok(None) + } else { + let for_display = if ground_set.len() == self.ground_set.len() { + // unchanged + self.for_display.clone() + } else { + self.for_display.add_type_name(name, schema)? + }; + Ok(Some(NormalizedTypeCondition { + ground_set, + for_display, + })) + } + } +} + +//================================================================================================== +// Logical conditions + +#[derive(Debug, Clone, PartialEq, Eq, Hash)] +enum Literal { + Pos(Name), // positive occurrence of the variable with the given name + Neg(Name), // negated variable with the given name +} + +impl Literal { + fn variable(&self) -> &Name { + match self { + Literal::Pos(name) | Literal::Neg(name) => name, + } + } + + fn polarity(&self) -> bool { + matches!(self, Literal::Pos(_)) + } +} + +// A clause is a conjunction of literals. +// Empty Clause means "true". +// "false" can't be represented. Any cases with false condition must be dropped entirely. +// This vector must be deduplicated. +#[derive(Debug, Clone, Default, Eq)] +struct Clause(Vec); + +impl fmt::Display for Clause { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + if self.0.is_empty() { + write!(f, "true") + } else { + for (i, l) in self.0.iter().enumerate() { + if i > 0 { + write!(f, " ∧ ")?; + } + match l { + Literal::Pos(v) => write!(f, "{}", v)?, + Literal::Neg(v) => write!(f, "¬{}", v)?, + } + } + Ok(()) + } + } +} + +impl Clause { + fn is_always_true(&self) -> bool { + self.0.is_empty() + } + + fn is_unsatisfiable(&self) -> bool { + let mut variables: IndexMap = IndexMap::default(); + for lit in &self.0 { + let var = lit.variable(); + let entry = variables.entry(var.clone()).or_insert(lit.clone()); + if entry.polarity() != lit.polarity() { + return true; // conflict + } + } + false + } + + /// variables: variable name (Name) -> polarity (bool) + fn from_variable_map(variables: &IndexMap) -> Self { + let mut buf: Vec = variables + .iter() + .map(|(name, polarity)| match polarity { + false => Literal::Neg(name.clone()), + true => Literal::Pos(name.clone()), + }) + .collect(); + buf.sort_by(|a, b| a.variable().cmp(b.variable())); + Clause(buf) + } + + fn concatenate(&self, other: &Clause) -> Option { + let mut variables: IndexMap = IndexMap::default(); + // Assume that `self` has no conflicts. + for lit in &self.0 { + variables.insert(lit.variable().clone(), lit.polarity()); + } + for lit in &other.0 { + let var = lit.variable(); + let entry = variables.entry(var.clone()).or_insert(lit.polarity()); + if *entry != lit.polarity() { + return None; // conflict + } + } + Some(Self::from_variable_map(&variables)) + } + + fn add_selection_directives( + &self, + directives: &ast::DirectiveList, + ) -> Result, FederationError> { + let Some(selection_clause) = boolean_clause_from_directives(directives)? else { + // The condition is unsatisfiable within the field itself. + return Ok(None); + }; + Ok(self.concatenate(&selection_clause)) + } + + /// Returns a clause with everything included and a simplified version of the `clause`. + /// - The simplified clause does not include variables that are already in `self`. + fn concatenate_and_simplify(&self, clause: &Clause) -> Option<(Clause, Clause)> { + let mut all_variables: IndexMap = IndexMap::default(); + // Load `self` on `variables`. + // - Assume that `self` has no conflicts. + for lit in &self.0 { + all_variables.insert(lit.variable().clone(), lit.polarity()); + } + + let mut added_variables: IndexMap = IndexMap::default(); + for lit in &clause.0 { + let var = lit.variable(); + match all_variables.entry(var.clone()) { + indexmap::map::Entry::Occupied(entry) => { + if entry.get() != &lit.polarity() { + return None; // conflict + } + } + indexmap::map::Entry::Vacant(entry) => { + entry.insert(lit.polarity()); + added_variables.insert(var.clone(), lit.polarity()); + } + } + } + Some(( + Self::from_variable_map(&all_variables), + Self::from_variable_map(&added_variables), + )) + } +} + +impl PartialEq for Clause { + fn eq(&self, other: &Self) -> bool { + // assume: The underlying vectors are deduplicated. + self.0.len() == other.0.len() && self.0.iter().all(|l| other.0.contains(l)) + } +} + +//================================================================================================== +// Normalization of Field Selection + +/// Extracts the Boolean clause from the directive list. +// Similar to `Conditions::from_directives` in `conditions.rs`. +fn boolean_clause_from_directives( + directives: &ast::DirectiveList, +) -> Result, FederationError> { + let mut variables = IndexMap::default(); // variable name (Name) -> polarity (bool) + if let Some(skip) = directives.get("skip") { + let Some(value) = skip.specified_argument_by_name("if") else { + bail!("missing @skip(if:) argument"); + }; + + match value.as_ref() { + // Constant @skip(if: true) can never match + ast::Value::Boolean(true) => return Ok(None), + // Constant @skip(if: false) always matches + ast::Value::Boolean(_) => {} + ast::Value::Variable(name) => { + variables.insert(name.clone(), false); + } + _ => { + bail!("expected boolean or variable `if` argument, got {value}"); + } + } + } + + if let Some(include) = directives.get("include") { + let Some(value) = include.specified_argument_by_name("if") else { + bail!("missing @include(if:) argument"); + }; + + match value.as_ref() { + // Constant @include(if: false) can never match + ast::Value::Boolean(false) => return Ok(None), + // Constant @include(if: true) always matches + ast::Value::Boolean(true) => {} + // If both @skip(if: $var) and @include(if: $var) exist, the condition can also + // never match + ast::Value::Variable(name) => { + if variables.insert(name.clone(), true) == Some(false) { + // Conflict found + return Ok(None); + } + } + _ => { + bail!("expected boolean or variable `if` argument, got {value}"); + } + } + } + Ok(Some(Clause::from_variable_map(&variables))) +} + +fn normalized_arguments(args: &[Node]) -> Vec> { + vec_sorted_by(args, |a, b| a.name.cmp(&b.name)) +} + +fn remove_conditions_from_directives(directives: &ast::DirectiveList) -> ast::DirectiveList { + directives + .iter() + .filter(|d| d.name != "skip" && d.name != "include") + .cloned() + .collect() +} + +type FieldSelectionKey = Field; + +// Extract the selection key +fn field_selection_key(field: &Field) -> FieldSelectionKey { + Field { + definition: field.definition.clone(), + alias: None, // not used for comparison + name: field.name.clone(), + arguments: normalized_arguments(&field.arguments), + directives: ast::DirectiveList::default(), // not used for comparison + selection_set: SelectionSet::new(field.selection_set.ty.clone()), // not used for comparison + } +} + +//================================================================================================== +// ResponseShape + +/// Simplified field value used for display purposes +fn field_display(field: &Field) -> Field { + Field { + definition: field.definition.clone(), + alias: None, // not used for display + name: field.name.clone(), + arguments: field.arguments.clone(), + directives: remove_conditions_from_directives(&field.directives), + selection_set: SelectionSet::new(field.selection_set.ty.clone()), // not used for display + } +} + +#[derive(Debug, PartialEq, Eq, Clone)] +struct DefinitionVariant { + /// Boolean clause is the secondary key after NormalizedTypeCondition as primary key. + boolean_clause: Clause, + + /// Field selection for definition/display (see `fn field_display`). + /// - This is the first field of the same field selection key in depth-first order as + /// defined by `CollectFields` and `ExecuteField` algorithms in the GraphQL spec. + field_display: Field, + + /// Different variants can have different sets of sub-selections (if any). + sub_selection_response_shape: Option, +} + +#[derive(Debug, PartialEq, Eq, Clone)] +struct PossibleDefinitionsPerTypeCondition { + /// The key for comparison (only used for GraphQL invariant check). + /// - Under each type condition, all variants must have the same selection key. + field_selection_key: FieldSelectionKey, + + /// Under each type condition, there may be multiple variants with different Boolean conditions. + conditional_variants: Vec, + // - Every variant's (Boolean condition, directive key) must be unique. + // - (TBD) Their Boolean conditions must be mutually exclusive. +} + +impl PossibleDefinitionsPerTypeCondition { + fn insert_variant(&mut self, variant: DefinitionVariant) { + for existing in &mut self.conditional_variants { + if existing.boolean_clause == variant.boolean_clause { + // Merge response shapes (MergeSelectionSets from GraphQL spec 6.4.3) + match ( + &mut existing.sub_selection_response_shape, + variant.sub_selection_response_shape, + ) { + (None, None) => {} // nothing to do + (Some(existing_rs), Some(ref variant_rs)) => { + existing_rs.merge_with(variant_rs); + } + (None, Some(_)) | (Some(_), None) => { + unreachable!("mismatched sub-selection options") + } + } + return; + } + } + self.conditional_variants.push(variant); + } +} + +/// All possible definitions that a response key can have. +/// - At the top level, all possibilities are indexed by the type condition. +/// - However, they are not necessarily mutually exclusive. +#[derive(Debug, Default, PartialEq, Eq, Clone)] +struct PossibleDefinitions(IndexMap); + +impl PossibleDefinitions { + fn insert_possible_definition( + &mut self, + type_conditions: NormalizedTypeCondition, + boolean_clause: Clause, // the aggregate boolean condition of the current selection set + field_display: Field, + sub_selection_response_shape: Option, + ) { + let field_selection_key = field_selection_key(&field_display); + let entry = self.0.entry(type_conditions); + let insert_variant = |per_type_cond: &mut PossibleDefinitionsPerTypeCondition| { + let value = DefinitionVariant { + boolean_clause, + field_display, + sub_selection_response_shape, + }; + per_type_cond.insert_variant(value); + }; + match entry { + indexmap::map::Entry::Vacant(e) => { + // New type condition + let empty_per_type_cond = PossibleDefinitionsPerTypeCondition { + field_selection_key, + conditional_variants: vec![], + }; + insert_variant(e.insert(empty_per_type_cond)); + } + indexmap::map::Entry::Occupied(mut e) => { + // GraphQL invariant: per_type_cond.field_selection_key must be the same + // as the given field_selection_key. + assert_eq!(e.get().field_selection_key, field_selection_key); + insert_variant(e.get_mut()); + } + }; + } +} + +#[derive(Debug, PartialEq, Eq, Clone)] +pub struct ResponseShape { + /// The default type condition is only used for display. + default_type_condition: NormalizedTypeCondition, + definitions_per_response_key: IndexMap, +} + +impl ResponseShape { + fn new(default_type_condition: NormalizedTypeCondition) -> Self { + ResponseShape { + default_type_condition, + definitions_per_response_key: IndexMap::default(), + } + } + + fn merge_with(&mut self, other: &Self) { + for (response_key, other_defs) in &other.definitions_per_response_key { + let value = self + .definitions_per_response_key + .entry(response_key.clone()) + .or_default(); + for (type_condition, per_type_cond) in &other_defs.0 { + for variant in &per_type_cond.conditional_variants { + value.insert_possible_definition( + type_condition.clone(), + variant.boolean_clause.clone(), + variant.field_display.clone(), + variant.sub_selection_response_shape.clone(), + ); + } + } + } + } +} + +//================================================================================================== +// ResponseShape display + +impl PossibleDefinitionsPerTypeCondition { + fn has_boolean_conditions(&self) -> bool { + self.conditional_variants.len() > 1 + || self + .conditional_variants + .first() + .is_some_and(|variant| !variant.boolean_clause.is_always_true()) + } +} + +impl PossibleDefinitions { + /// Is conditional on runtime type? + fn has_type_conditions(&self, default_type_condition: &NormalizedTypeCondition) -> bool { + self.0.len() > 1 + || self + .0 + .first() + .is_some_and(|(type_condition, _)| type_condition != default_type_condition) + } + + /// Has multiple possible definitions or has any boolean conditions? + /// Note: This method may miss a type condition. So, check `has_type_conditions` as well. + fn has_multiple_definitions(&self) -> bool { + self.0.len() > 1 + || self + .0 + .first() + .is_some_and(|(_, per_type_cond)| per_type_cond.has_boolean_conditions()) + } +} + +impl ResponseShape { + fn write_indented(&self, state: &mut display_helpers::State<'_, '_>) -> fmt::Result { + state.write("{")?; + state.indent_no_new_line(); + for (response_key, defs) in &self.definitions_per_response_key { + let has_type_cond = defs.has_type_conditions(&self.default_type_condition); + let arrow_sym = if has_type_cond || defs.has_multiple_definitions() { + "-may->" + } else { + "----->" + }; + for (type_condition, per_type_cond) in &defs.0 { + for variant in &per_type_cond.conditional_variants { + let field_display = &variant.field_display; + let type_cond_str = if has_type_cond { + format!(" on {}", type_condition) + } else { + "".to_string() + }; + let boolean_str = if !variant.boolean_clause.is_always_true() { + format!(" if {}", variant.boolean_clause) + } else { + "".to_string() + }; + state.new_line()?; + state.write(format_args!( + "{response_key} {arrow_sym} {field_display}{type_cond_str}{boolean_str}" + ))?; + if let Some(sub_selection_response_shape) = + &variant.sub_selection_response_shape + { + state.write(" ")?; + sub_selection_response_shape.write_indented(state)?; + } + } + } + } + state.dedent()?; + state.write("}") + } +} + +impl fmt::Display for ResponseShape { + fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result { + self.write_indented(&mut display_helpers::State::new(f)) + } +} + +//================================================================================================== +// ResponseShape computation + +struct ResponseShapeContext { + schema: ValidFederationSchema, + fragment_defs: Arc>>, // fragment definitions in the operation + parent_type: Name, // the type of the current selection set + type_condition: NormalizedTypeCondition, // accumulated type condition down from the parent field. + inherited_clause: Clause, // accumulated conditions from the root up to parent field + current_clause: Clause, // accumulated conditions down from the parent field +} + +impl ResponseShapeContext { + fn process_selection( + &self, + response_shape: &mut ResponseShape, + selection: &Selection, + ) -> Result<(), FederationError> { + match selection { + Selection::Field(field) => self.process_field_selection(response_shape, field), + Selection::FragmentSpread(fragment_spread) => { + let fragment_def = self + .fragment_defs + .get(&fragment_spread.fragment_name) + .ok_or_else(|| { + internal_error!("Fragment not found: {}", fragment_spread.fragment_name) + })?; + // Note: `@skip/@include` directives are not allowed on fragment definitions. + // Thus, no need to check their directives for Boolean conditions. + self.process_fragment_selection( + response_shape, + fragment_def.type_condition(), + &fragment_spread.directives, + &fragment_def.selection_set, + ) + } + Selection::InlineFragment(inline_fragment) => { + let fragment_type_condition = inline_fragment + .type_condition + .as_ref() + .unwrap_or(&self.parent_type); + self.process_fragment_selection( + response_shape, + fragment_type_condition, + &inline_fragment.directives, + &inline_fragment.selection_set, + ) + } + } + } + + fn process_field_selection( + &self, + response_shape: &mut ResponseShape, + field: &Node, + ) -> Result<(), FederationError> { + let Some(field_clause) = self + .current_clause + .add_selection_directives(&field.directives)? + else { + // Unsatisfiable local condition under the parent field => skip + return Ok(()); + }; + let Some((inherited_clause, field_clause)) = self + .inherited_clause + .concatenate_and_simplify(&field_clause) + else { + // Unsatisfiable full condition from the root => skip + return Ok(()); + }; + // Process the field's sub-selection + let sub_selection_response_shape: Option = if field.selection_set.is_empty() + { + None + } else { + // internal invariant check + assert_eq!(*field.ty().inner_named_type(), field.selection_set.ty); + + // A brand new context with the new type condition. + // - Still inherits the boolean conditions for simplification purposes. + let parent_type = field.selection_set.ty.clone(); + let type_condition = + NormalizedTypeCondition::from_type_name(parent_type.clone(), &self.schema)?; + let context = ResponseShapeContext { + schema: self.schema.clone(), + fragment_defs: self.fragment_defs.clone(), + parent_type, + type_condition, + inherited_clause, + current_clause: Clause::default(), // empty + }; + Some(context.process_selection_set(&field.selection_set)?) + }; + // Record this selection's definition. + let value = response_shape + .definitions_per_response_key + .entry(field.response_key().clone()) + .or_default(); + value.insert_possible_definition( + self.type_condition.clone(), + field_clause, + field_display(field), + sub_selection_response_shape, + ); + Ok(()) + } + + /// For both inline fragments and fragment spreads + fn process_fragment_selection( + &self, + response_shape: &mut ResponseShape, + fragment_type_condition: &Name, + directives: &ast::DirectiveList, + selection_set: &SelectionSet, + ) -> Result<(), FederationError> { + // internal invariant check + assert_eq!(*fragment_type_condition, selection_set.ty); + + let Some(type_condition) = NormalizedTypeCondition::add_type_name( + &self.type_condition, + fragment_type_condition.clone(), + &self.schema, + )? + else { + // Unsatisfiable type condition => skip + return Ok(()); + }; + let Some(current_clause) = self.current_clause.add_selection_directives(directives)? else { + // Unsatisfiable local condition under the parent field => skip + return Ok(()); + }; + // check if `self.inherited_clause` and `current_clause` are unsatisfiable together. + if self.inherited_clause.concatenate(¤t_clause).is_none() { + // Unsatisfiable full condition from the root => skip + return Ok(()); + } + + // The inner context with a new type condition. + // Note: Non-conditional directives on inline spreads are ignored. + let context = ResponseShapeContext { + schema: self.schema.clone(), + fragment_defs: self.fragment_defs.clone(), + parent_type: fragment_type_condition.clone(), + type_condition, + inherited_clause: self.inherited_clause.clone(), // no change + current_clause, + }; + context.process_selection_set_within(response_shape, selection_set) + } + + /// Using an existing response shape + fn process_selection_set_within( + &self, + response_shape: &mut ResponseShape, + selection_set: &SelectionSet, + ) -> Result<(), FederationError> { + for selection in &selection_set.selections { + self.process_selection(response_shape, selection)?; + } + Ok(()) + } + + /// For a new sub-ResponseShape + /// - This corresponds to the `CollectFields` algorithm in the GraphQL specification. + fn process_selection_set( + &self, + selection_set: &SelectionSet, + ) -> Result { + let type_condition = + NormalizedTypeCondition::from_type_name(selection_set.ty.clone(), &self.schema)?; + let mut response_shape = ResponseShape::new(type_condition); + self.process_selection_set_within(&mut response_shape, selection_set)?; + Ok(response_shape) + } + + fn process_operation( + operation_doc: &Valid, + schema: &ValidFederationSchema, + ) -> Result { + let mut op_iter = operation_doc.operations.iter(); + let Some(first) = op_iter.next() else { + return Err(internal_error!("Operation not found")); + }; + if op_iter.next().is_some() { + return Err(internal_error!("Multiple operations are not supported")); + } + + let fragment_defs = Arc::new(operation_doc.fragments.clone()); + let parent_type = first.selection_set.ty.clone(); + let type_condition = NormalizedTypeCondition::from_type_name(parent_type.clone(), schema)?; + // Start a new root context. + // - Not using `process_selection_set` because there is no parent context. + let context = ResponseShapeContext { + schema: schema.clone(), + fragment_defs, + parent_type, + type_condition, + inherited_clause: Clause::default(), // empty + current_clause: Clause::default(), // empty + }; + context.process_selection_set(&first.selection_set) + } +} + +pub fn compute_response_shape( + operation_doc: &Valid, + schema: &ValidFederationSchema, +) -> Result { + ResponseShapeContext::process_operation(operation_doc, schema) +} diff --git a/apollo-federation/src/query_plan/correctness/response_shape_test.rs b/apollo-federation/src/query_plan/correctness/response_shape_test.rs new file mode 100644 index 00000000000..0a218a916b3 --- /dev/null +++ b/apollo-federation/src/query_plan/correctness/response_shape_test.rs @@ -0,0 +1,518 @@ +use apollo_compiler::schema::Schema; +use apollo_compiler::ExecutableDocument; + +use super::*; + +// The schema used in these tests. +const SCHEMA_STR: &str = r#" + type Query { + test_i: I! + test_j: J! + test_u: U! + test_v: V! + } + + interface I { + id: ID! + data(arg: Int!): String! + } + + interface J { + id: ID! + data(arg: Int!): String! + object(id: ID!): J! + } + + type R implements I & J { + id: ID! + data(arg: Int!): String! + object(id: ID!): J! + r: Int! + } + + type S implements I & J { + id: ID! + data(arg: Int!): String! + object(id: ID!): J! + s: Int! + } + + type T implements I { + id: ID! + data(arg: Int!): String! + t: Int! + } + + type X implements J { + id: ID! + data(arg: Int!): String! + object(id: ID!): J! + x: String! + } + + type Y { + id: ID! + y: String! + } + + type Z implements J { + id: ID! + data(arg: Int!): String! + object(id: ID!): J! + z: String! + } + + union U = R | S | X + union V = R | S | Y + + directive @mod(arg: Int!) on FIELD +"#; + +fn response_shape(op_str: &str) -> response_shape::ResponseShape { + let schema = Schema::parse_and_validate(SCHEMA_STR, "schema.graphql").unwrap(); + let schema = ValidFederationSchema::new(schema).unwrap(); + let op = ExecutableDocument::parse_and_validate(schema.schema(), op_str, "op.graphql").unwrap(); + response_shape::compute_response_shape(&op, &schema).unwrap() +} + +//================================================================================================= +// Basic response key and alias tests + +#[test] +fn test_aliases() { + let op_str = r#" + query { + test_i { + data(arg: 0) + alias1: data(arg: 1) + alias2: data(arg: 1) + } + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_i -----> test_i { + data -----> data(arg: 0) + alias1 -----> data(arg: 1) + alias2 -----> data(arg: 1) + } + } + "###); +} + +//================================================================================================= +// Type condition tests + +#[test] +fn test_type_conditions_over_multiple_different_types() { + let op_str = r#" + query { + test_i { + ... on R { + data(arg: 0) + } + ... on S { + data(arg: 1) + } + } + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_i -----> test_i { + data -may-> data(arg: 0) on R + data -may-> data(arg: 1) on S + } + } + "###); +} + +#[test] +fn test_type_conditions_over_multiple_different_interface_types() { + // These two intersections are distinct type conditions. + // - `U ∧ I` = {R, S} + // - `U ∧ J` = `U` = {R, S, X} + let op_str = r#" + query { + test_u { + ... on I { + data(arg: 0) + } + ... on J { + data(arg: 0) + } + } + } + "#; + // Note: The set {R, S} has no corresponding named type definition in the schema, while + // `U ∧ J` is just the same as `U`. + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_u -----> test_u { + data -may-> data(arg: 0) on I ∧ U = {R, S} + data -may-> data(arg: 0) on U + } + } + "###); +} + +#[test] +fn test_type_conditions_merge_same_object_type() { + // Testing equivalent conditions: `U ∧ R` = `U ∧ I ∧ R` = `U ∧ R ∧ I` = `R` + // Also, that's different from `U ∧ I` = {R, S}. + let op_str = r#" + query { + test_u { + ... on R { + data(arg: 0) + } + ... on I { + ... on R { + data(arg: 0) + } + } + ... on R { + ... on I { + data(arg: 0) + } + } + ... on I { # different condition + data(arg: 0) + } + } + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_u -----> test_u { + data -may-> data(arg: 0) on R + data -may-> data(arg: 0) on I ∧ U = {R, S} + } + } + "###); +} + +#[test] +fn test_type_conditions_merge_equivalent_intersections() { + // Testing equivalent conditions: `U ∧ I ∧ J` = `U ∧ J ∧ I` = `U ∧ I`= {R, S} + // Note: The order of applied type conditions is irrelevant. + let op_str = r#" + query { + test_u { + ... on I { + ... on J { + data(arg: 0) + } + } + ... on J { + ... on I { + data(arg: 0) + } + } + ... on I { + data(arg: 0) + } + } + } + "#; + // Note: They are merged into the same condition `I ∧ U`, since that is minimal. + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_u -----> test_u { + data -may-> data(arg: 0) on I ∧ U = {R, S} + } + } + "###); +} + +#[test] +fn test_type_conditions_merge_different_but_equivalent_intersection_expressions() { + // Testing equivalent conditions: `V ∧ I` = `V ∧ J` = `V ∧ J ∧ I` = {R, S} + // Note: Those conditions have different sets of types. But, they are still equivalent. + let op_str = r#" + query { + test_v { + ... on I { + data(arg: 0) + } + ... on J { + data(arg: 0) + } + ... on J { + ... on I { + data(arg: 0) + } + } + } + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_v -----> test_v { + data -may-> data(arg: 0) on I ∧ V = {R, S} + } + } + "###); +} + +#[test] +fn test_type_conditions_empty_intersection() { + // Testing unsatisfiable conditions: `U ∧ I ∧ T`= ∅ + let op_str = r#" + query { + test_u { + ... on I { + ... on T { + infeasible: data(arg: 0) + } + } + } + } + "#; + // Note: The response shape under `test_u` is empty. + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_u -----> test_u { + } + } + "###); +} + +//================================================================================================= +// Boolean condition tests + +#[test] +fn test_boolean_conditions_constants() { + let op_str = r#" + query { + test_i { + # constant true conditions + merged: data(arg: 0) + merged: data(arg: 0) @include(if: true) + merged: data(arg: 0) @skip(if: false) + + # constant false conditions + infeasible_1: data(arg: 0) @include(if: false) + infeasible_2: data(arg: 0) @skip(if: true) + } + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_i -----> test_i { + merged -----> data(arg: 0) + } + } + "###); +} + +#[test] +fn test_boolean_conditions_different_multiple_conditions() { + let op_str = r#" + query($v0: Boolean!, $v1: Boolean!, $v2: Boolean!) { + test_i @include(if: $v0) { + data(arg: 0) + data(arg: 0) @include(if: $v1) + ... @include(if: $v1) { + data(arg: 0) @include(if: $v2) + } + } + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_i -may-> test_i if v0 { + data -may-> data(arg: 0) + data -may-> data(arg: 0) if v1 + data -may-> data(arg: 0) if v1 ∧ v2 + } + } + "###); +} + +#[test] +fn test_boolean_conditions_unsatisfiable_conditions() { + let op_str = r#" + query($v0: Boolean!, $v1: Boolean!) { + test_i @include(if: $v0) { + # conflict directly within the field directives + infeasible_1: data(arg: 0) @include(if: $v1) @skip(if: $v1) + # conflicting with the parent inline fragment + ... @skip(if: $v1) { + infeasible_2: data(arg: 0) @include(if: $v1) + } + infeasible_3: data(arg: 0) @skip(if: $v0) # conflicting with the parent-selection condition + } + } + "#; + // Note: The response shape under `test_i` is empty. + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_i -may-> test_i if v0 { + } + } + "###); +} + +//================================================================================================= +// Non-conditional directive tests + +#[test] +fn test_non_conditional_directives() { + let op_str = r#" + query { + test_i { + data(arg: 0) @mod(arg: 0) # different only in directives + data(arg: 0) @mod(arg: 1) # different only in directives + data(arg: 0) # no directives + } + } + "#; + // Note: All `data` definitions are merged, but the first selection (in depth-first order) is + // chosen as the representative. + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_i -----> test_i { + data -----> data(arg: 0) @mod(arg: 0) + } + } + "###); +} + +//================================================================================================= +// Fragment spread tests + +#[test] +fn test_fragment_spread() { + let op_str = r#" + query($v0: Boolean!) { + test_i @include(if: $v0) { + merge_1: data(arg: 0) + ...F + } + } + + fragment F on I { + merge_1: data(arg: 0) + from_fragment: data(arg: 0) + infeasible_1: data(arg: 0) @skip(if: $v0) + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_i -may-> test_i if v0 { + merge_1 -----> data(arg: 0) + from_fragment -----> data(arg: 0) + } + } + "###); +} + +//================================================================================================= +// Sub-selection merging tests + +#[test] +fn test_merge_sub_selection_sets() { + let op_str = r#" + query($v0: Boolean!, $v1: Boolean!) { + test_j { + object(id: 0) { + merged_1: data(arg: 0) + ... on R { + merged_2: data(arg: 0) + } + merged_3: data(arg: 0) @include(if: $v0) + } + object(id: 0) { + merged_1: data(arg: 0) + ... on S { + merged_2: data(arg: 1) + } + merged_3: data(arg: 0) @include(if: $v1) + } + object(id: 0) { + merged_3: data(arg: 0) # no condition + } + } + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_j -----> test_j { + object -----> object(id: 0) { + merged_1 -----> data(arg: 0) + merged_2 -may-> data(arg: 0) on R + merged_2 -may-> data(arg: 1) on S + merged_3 -may-> data(arg: 0) if v0 + merged_3 -may-> data(arg: 0) if v1 + merged_3 -may-> data(arg: 0) + } + } + } + "###); +} + +#[test] +fn test_not_merge_sub_selection_sets_under_different_type_conditions() { + let op_str = r#" + query { + test_j { + object(id: 0) { + unmerged: data(arg: 0) + } + # unmerged due to parents with different type conditions + ... on R { + object(id: 0) { + unmerged: data(arg: 0) + } + } + } + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_j -----> test_j { + object -may-> object(id: 0) on J { + unmerged -----> data(arg: 0) + } + object -may-> object(id: 0) on R { + unmerged -----> data(arg: 0) + } + } + } + "###); +} + +#[test] +fn test_merge_sub_selection_sets_with_boolean_conditions() { + let op_str = r#" + query($v0: Boolean!, $v1: Boolean!) { + test_j { + object(id: 0) @include(if: $v0) { + merged: data(arg: 0) + unmerged: data(arg: 0) + } + object(id: 0) @include(if: $v0) { + merged: data(arg: 0) @include(if: $v0) + } + # unmerged due to parents with different Boolean conditions + object(id: 0) @include(if: $v1) { + unmerged: data(arg: 0) + } + } + } + "#; + insta::assert_snapshot!(response_shape(op_str), @r###" + { + test_j -----> test_j { + object -may-> object(id: 0) if v0 { + merged -----> data(arg: 0) + unmerged -----> data(arg: 0) + } + object -may-> object(id: 0) if v1 { + unmerged -----> data(arg: 0) + } + } + } + "###); +} diff --git a/apollo-federation/src/query_plan/mod.rs b/apollo-federation/src/query_plan/mod.rs index 60e0b396a6c..893807dc149 100644 --- a/apollo-federation/src/query_plan/mod.rs +++ b/apollo-federation/src/query_plan/mod.rs @@ -9,6 +9,7 @@ use serde::Serialize; use crate::query_plan::query_planner::QueryPlanningStatistics; pub(crate) mod conditions; +pub mod correctness; pub(crate) mod display; pub(crate) mod fetch_dependency_graph; pub(crate) mod fetch_dependency_graph_processor;