Skip to content
Open
Show file tree
Hide file tree
Changes from 23 commits
Commits
Show all changes
27 commits
Select commit Hold shift + click to select a range
295c431
Add some tests for CRD generation for enums
sbernauer Oct 8, 2025
13db30c
Update assertions to valid CRDs from kube 1.1.0
sbernauer Oct 9, 2025
fb77413
test: Add some un-documented variants to the NormalEnum
NickLarsenNZ Oct 9, 2025
0cb62f1
test: Partial new impl for one_of hoisting
NickLarsenNZ Oct 9, 2025
85eaf36
Finish enum oneOf hoisting
sbernauer Oct 9, 2025
285ab64
adjust and document the hoist_one_of_enum function
NickLarsenNZ Oct 10, 2025
e256f3a
test: Add more basic testing to ensure hoisting is not performed when…
NickLarsenNZ Oct 10, 2025
35034c5
hoist anyOf optional enums
NickLarsenNZ Oct 10, 2025
3850a19
left a todo for empty structural variants in untagged enums
NickLarsenNZ Oct 10, 2025
c2fbe70
test: Add missing enum entries to expected schemas
NickLarsenNZ Oct 10, 2025
8abef36
test: Add empty object handling to existing hoisting function
NickLarsenNZ Oct 10, 2025
8f578c2
fix: Change hoist_any_of_option_enum to cater to nested any_of as wel…
NickLarsenNZ Oct 14, 2025
c23aabc
test: Add test for internal function, and add docs after seeing it's …
NickLarsenNZ Oct 14, 2025
e91665b
feat: Add functions for specific hoisting tasks
NickLarsenNZ Oct 21, 2025
f13a751
chore: Add a crude fix to code that will be removed in a later commit
NickLarsenNZ Oct 21, 2025
730e0db
fix: update changed function name in tests
NickLarsenNZ Oct 21, 2025
7503fcc
chore: Make new hoisting functions pub(crate)
NickLarsenNZ Oct 21, 2025
17e7a28
chore: Move schema.rs to schema/mod.rs
NickLarsenNZ Oct 21, 2025
cc6b20a
feat: Implement new hoisting logic
NickLarsenNZ Oct 21, 2025
8e40d01
fix: Handle property hoisting for tagged enums (oneOf subschemas)
NickLarsenNZ Oct 22, 2025
e311361
lint: commit whitespace differences
NickLarsenNZ Oct 22, 2025
307e828
chore: use assert/assert_eq with message instead of panic
NickLarsenNZ Oct 22, 2025
25e10db
Add integration test for (optional) complex enums
sbernauer Oct 23, 2025
764c418
Add test case for Option<Option<Option<String>>>
sbernauer Oct 23, 2025
d52c2c6
Remove leftover newline
sbernauer Oct 23, 2025
6d156a0
Add (failing) test for enums without descriptions
sbernauer Oct 23, 2025
e3172d5
Improve test comment
sbernauer Oct 23, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
163 changes: 24 additions & 139 deletions kube-core/src/schema.rs → kube-core/src/schema/mod.rs
Original file line number Diff line number Diff line change
Expand Up @@ -2,13 +2,23 @@
//!
//! [`CustomResourceDefinition`]: `k8s_openapi::apiextensions_apiserver::pkg::apis::apiextensions::v1::CustomResourceDefinition`

mod transform_any_of;
mod transform_one_of;
mod transform_properties;

// Used in docs
#[allow(unused_imports)] use schemars::generate::SchemaSettings;

use schemars::{transform::Transform, JsonSchema};
use serde::{Deserialize, Serialize};
use serde_json::Value;
use std::collections::{btree_map::Entry, BTreeMap, BTreeSet};
use std::collections::{BTreeMap, BTreeSet};

use crate::schema::{
transform_any_of::hoist_any_of_subschema_with_a_nullable_variant,
transform_one_of::hoist_one_of_enum_with_unit_variants,
transform_properties::hoist_properties_for_any_of_subschemas,
};

/// schemars [`Visitor`] that rewrites a [`Schema`] to conform to Kubernetes' "structural schema" rules
///
Expand Down Expand Up @@ -246,34 +256,28 @@ enum SingleOrVec<T> {
Vec(Vec<T>),
}

/// Converts a [`schemars::Schema`] into this module's [`Schema`] by
/// round-tripping it through a [`serde_json::Value`].
///
/// Only compiled for tests.
///
/// # Errors
///
/// Returns the [`serde_json::Error`] raised when the JSON form of `incoming`
/// cannot be deserialized into a [`Schema`].
#[cfg(test)]
fn schemars_schema_to_kube_schema(incoming: schemars::Schema) -> Result<Schema, serde_json::Error> {
    let as_json = incoming.to_value();
    serde_json::from_value(as_json)
}

Comment on lines +259 to +263
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is unused. @sbernauer did you want to do something with it?

Else I will remove it:

Suggested change
#[cfg(test)]
fn schemars_schema_to_kube_schema(incoming: schemars::Schema) -> Result<Schema, serde_json::Error> {
serde_json::from_value(incoming.to_value())
}

impl Transform for StructuralSchemaRewriter {
fn transform(&mut self, transform_schema: &mut schemars::Schema) {
// Apply this (self) transform to all subschemas
schemars::transform::transform_subschemas(self, transform_schema);

let mut schema: SchemaObject = match serde_json::from_value(transform_schema.clone().to_value()).ok()
{
// TODO (@NickLarsenNZ): At this point, we are seeing duplicate `title` when printing schema as json.
// This is because `title` is specified under both `extensions` and `other`.
Comment on lines +271 to +272
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I guess I should remove it, but worth sharing the knowledge before I do:

Suggested change
// TODO (@NickLarsenNZ): At this point, we are seeing duplicate `title` when printing schema as json.
// This is because `title` is specified under both `extensions` and `other`.

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I think we actually should leave it here (reworded/adjusted) to explicitly share the knowledge.

Some(schema) => schema,
None => return,
};

if let Some(subschemas) = &mut schema.subschemas {
if let Some(one_of) = subschemas.one_of.as_mut() {
// Tagged enums are serialized using `one_of`
hoist_subschema_properties(one_of, &mut schema.object, &mut schema.instance_type);

// "Plain" enums are serialized using `one_of` if they have doc tags
hoist_subschema_enum_values(one_of, &mut schema.enum_values, &mut schema.instance_type);

if one_of.is_empty() {
subschemas.one_of = None;
}
}

if let Some(any_of) = &mut subschemas.any_of {
// Untagged enums are serialized using `any_of`
hoist_subschema_properties(any_of, &mut schema.object, &mut schema.instance_type);
}
}
// Hoist parts of the schema to make it valid for k8s
hoist_one_of_enum_with_unit_variants(&mut schema);
hoist_any_of_subschema_with_a_nullable_variant(&mut schema);
hoist_properties_for_any_of_subschemas(&mut schema);

// check for maps without with properties (i.e. flattened maps)
// and allow these to persist dynamically
Expand All @@ -297,130 +301,11 @@ impl Transform for StructuralSchemaRewriter {
array.unique_items = None;
}

// Convert back to schemars::Schema
if let Ok(schema) = serde_json::to_value(schema) {
if let Ok(transformed) = serde_json::from_value(schema) {
*transform_schema = transformed;
}
}
}
}

/// Collect the values of every plain-enum subschema into the root schema,
/// because Kubernetes does not allow subschemas to define enum options.
///
/// ("Enum" here means a list of hard-coded values, not a tagged union.)
///
/// Every object subschema that carries `enum` values is removed from
/// `subschemas`; its values are appended to `common_enum_values` and its
/// instance type (when present) is recorded in `instance_type`. All other
/// subschemas are kept untouched.
///
/// # Panics
///
/// Panics if a hoisted subschema declares an instance type that differs from
/// the one already recorded in `instance_type`.
fn hoist_subschema_enum_values(
    subschemas: &mut Vec<Schema>,
    common_enum_values: &mut Option<Vec<serde_json::Value>>,
    instance_type: &mut Option<SingleOrVec<InstanceType>>,
) {
    subschemas.retain(|subschema| {
        // Anything that is not an object schema with `enum` values stays where it is.
        let Schema::Object(SchemaObject {
            instance_type: variant_type,
            enum_values: Some(variant_enum_values),
            ..
        }) = subschema
        else {
            return true;
        };

        if let Some(variant_type) = variant_type {
            match instance_type.as_ref() {
                Some(existing_type) if existing_type != variant_type => {
                    panic!("Enum variant set {variant_enum_values:?} has type {variant_type:?} but was already defined as {instance_type:?}. The instance type must be equal for all subschema variants.")
                }
                // Same type as before: nothing to record.
                Some(_) => {}
                // First typed variant decides the common type.
                None => *instance_type = Some(variant_type.clone()),
            }
        }

        common_enum_values
            .get_or_insert_with(Vec::new)
            .extend_from_slice(variant_enum_values);

        // The values now live on the root schema, so drop the subschema.
        false
    })
}

/// Lift every property definition found in the subschemas up to the root
/// schema, because Kubernetes does not allow subschemas to define properties.
///
/// For each object subschema that has object validation this:
/// - moves the subschema's description onto its property when the subschema
///   declares exactly one property (the description is dropped otherwise),
/// - moves all of its properties into `common_obj` (created on demand),
/// - clears the subschema's `additional_properties`,
/// - merges the subschema's instance type into `instance_type`.
///
/// Subschemas that are not objects with object validation are left untouched.
///
/// # Panics
///
/// Panics if the same property name is declared by several subschemas with
/// non-identical schemas, or if merging the instance types panics.
fn hoist_subschema_properties(
    subschemas: &mut Vec<Schema>,
    common_obj: &mut Option<Box<ObjectValidation>>,
    instance_type: &mut Option<SingleOrVec<InstanceType>>,
) {
    for subschema in subschemas.iter_mut() {
        let Schema::Object(SchemaObject {
            instance_type: subschema_type,
            object: Some(subschema_obj),
            metadata: subschema_metadata,
            ..
        }) = subschema
        else {
            continue;
        };

        let hoisted = common_obj.get_or_insert_with(Box::<ObjectValidation>::default);

        // Move enum variant description from oneOf clause to its corresponding property.
        // The description is taken off the subschema even when there is no single
        // property to attach it to.
        let description = subschema_metadata
            .as_mut()
            .and_then(|metadata| metadata.description.take());
        if let Some(description) = description {
            if let Some(Schema::Object(sole_property)) = only_item(subschema_obj.properties.values_mut())
            {
                sole_property
                    .metadata
                    .get_or_insert_with(Box::<Metadata>::default)
                    .description = Some(description);
            }
        }

        // Move all properties, insisting that duplicates agree exactly.
        for (name, property) in std::mem::take(&mut subschema_obj.properties) {
            match hoisted.properties.entry(name) {
                Entry::Occupied(existing) => {
                    if &property != existing.get() {
                        panic!("Property {:?} has the schema {:?} but was already defined as {:?} in another subschema. The schemas for a property used in multiple subschemas must be identical",
                            existing.key(),
                            &property,
                            existing.get());
                    }
                }
                Entry::Vacant(slot) => {
                    slot.insert(property);
                }
            }
        }

        // Kubernetes doesn't allow variants to set additionalProperties
        subschema_obj.additional_properties = None;

        merge_metadata(instance_type, subschema_type.take());
    }
}

/// Returns the sole item of the iterator, or `None` when the iterator yields
/// no items or more than one.
///
/// At most two items are pulled from the iterator.
fn only_item<I: Iterator>(mut i: I) -> Option<I::Item> {
    let first = i.next()?;
    match i.next() {
        // A second item means the first one was not the only one.
        Some(_) => None,
        None => Some(first),
    }
}

fn merge_metadata(
instance_type: &mut Option<SingleOrVec<InstanceType>>,
variant_type: Option<SingleOrVec<InstanceType>>,
) {
match (instance_type, variant_type) {
(_, None) => {}
(common_type @ None, variant_type) => {
*common_type = variant_type;
}
(Some(common_type), Some(variant_type)) => {
if *common_type != variant_type {
panic!(
"variant defined type {variant_type:?}, conflicting with existing type {common_type:?}"
);
}
}
}
}
164 changes: 164 additions & 0 deletions kube-core/src/schema/transform_any_of.rs
Original file line number Diff line number Diff line change
@@ -0,0 +1,164 @@
use std::ops::DerefMut;

use crate::schema::{Schema, SchemaObject, SubschemaValidation};

/// A two-entry `anyOf` made of a `oneOf` enum subschema and the null marker
/// must collapse into the `oneOf` subschema itself, flagged as `nullable`.
#[cfg(test)]
#[test]
fn optional_tagged_enum_with_unit_variants() {
    // The `oneOf` entries must pass through the hoist unchanged, so both the
    // input and the expectation are built from this single value.
    let unit_variants = serde_json::json!([
        {
            "type": "string",
            "enum": [
                "C",
                "D"
            ]
        },
        {
            "description": "First variant doc-comment",
            "type": "string",
            "enum": [
                "A"
            ]
        },
        {
            "description": "Second variant doc-comment",
            "type": "string",
            "enum": [
                "B"
            ]
        }
    ]);

    let input = serde_json::json!({
        "anyOf": [
            {
                "description": "A very simple enum with empty variants",
                "oneOf": unit_variants.clone()
            },
            {
                "enum": [
                    null
                ],
                "nullable": true
            }
        ]
    });

    let expected = serde_json::json!({
        "description": "A very simple enum with empty variants",
        "nullable": true,
        "oneOf": unit_variants
    });

    let expected_schema: SchemaObject = serde_json::from_value(expected).expect("valid JSON");
    let mut actual_schema: SchemaObject = serde_json::from_value(input).expect("valid JSON");

    hoist_any_of_subschema_with_a_nullable_variant(&mut actual_schema);

    assert_json_diff::assert_json_eq!(actual_schema, expected_schema);
}


/// Replace the schema with the anyOf subschema and set to nullable when the
/// only other subschema is the nullable entry.
///
/// Used for correcting the schema for optional tagged unit enums.
/// The non-null subschema is hoisted, and nullable will be set to true.
///
/// This will return early without modifications unless:
/// - There are exactly 2 `anyOf` subschemas.
/// - Exactly one subschema represents the nullability (ie: it serializes to
///   exactly an enum with a single null entry, and nullable set to true).
///
/// NOTE: This should work regardless of whether other hoisting has been performed or not.
///
/// # Panics
///
/// Once the null entry has been matched, this panics if:
/// - the remaining `anyOf` subschema is a boolean schema instead of an object, or
/// - `oneOf` is set next to the `anyOf`.
///
/// It also panics if an `anyOf` subschema cannot be converted to JSON.
pub(crate) fn hoist_any_of_subschema_with_a_nullable_variant(kube_schema: &mut SchemaObject) {
    // Run some initial checks in case there is nothing to do
    let SchemaObject {
        subschemas: Some(subschemas),
        ..
    } = kube_schema
    else {
        return;
    };

    let SubschemaValidation {
        any_of: Some(any_of),
        one_of,
    } = subschemas.deref_mut()
    else {
        return;
    };

    // Only a two-entry anyOf (the real subschema plus the null marker) qualifies.
    // The slice pattern doubles as the length check.
    let [first, second] = any_of.as_slice() else {
        return;
    };

    // This is the signature for the null variant, indicating the "other"
    // variant is the subschema that needs hoisting
    let null = serde_json::json!({
        "enum": [null],
        "nullable": true
    });

    // Convert both anyOf entries to JSON and build a truth table for null matches
    let entry_is_null = [first, second].map(|entry| {
        serde_json::to_value(entry).expect("schema should be able to convert to JSON") == null
    });

    // Get the `any_of` subschema that isn't the null entry
    let subschema_to_hoist = match entry_is_null {
        [true, false] => second,
        [false, true] => first,
        _ => return,
    };

    // At this point, we can be reasonably sure we need to hoist the non-null
    // anyOf subschema up to the schema level, and unset the anyOf field.
    // From here, anything that looks wrong will panic instead of return.
    // TODO (@NickLarsenNZ): Return errors instead of panicking, leave panicking up to the infallible schemars::Transform

    let Schema::Object(to_hoist) = subschema_to_hoist else {
        panic!("the non-null anyOf subschema is a bool. That is not expected here");
    };

    // There should not be any oneOf's adjacent to the anyOf
    assert!(
        one_of.is_none(),
        "oneOf is set when there is already an anyOf: {one_of:#?}"
    );

    // Replace the schema with the non-null subschema
    *kube_schema = to_hoist.clone();

    // Set the schema to nullable (as we know we matched the null variant earlier)
    // TODO (@NickLarsenNZ): Do we need to insert `nullable` into `other` too?
    // Open review question: schemars reportedly sends the same fields under both
    // `extensions` and `other`, and it is undecided whether setting `nullable` in
    // one place is good enough or whether both are needed for compatibility.
    kube_schema.extensions.insert("nullable".to_owned(), true.into());
}
Loading
Loading