-
Notifications
You must be signed in to change notification settings - Fork 40
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
[sled agent] API to manage datasets explicitly #6144
Changes from all commits
5c2e5b0
1709d80
a80313d
7193d1b
9464cc1
fb23666
29c4eb7
75f006b
24d93a8
178e20e
cf3f35c
11f49fb
b999bf7
fac6456
fdf0644
a042439
9c27213
c562125
c7a5adf
181507c
8e1df07
93134c2
d88d541
95ebbb8
994757e
7156ba0
14a2dc4
aa60254
67c5d7e
927efd1
3e14cc4
40f93ae
077908d
a600494
0a63161
c9f170e
f5bc35a
474ec13
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change | ||
---|---|---|---|---|
|
@@ -10,13 +10,14 @@ use crate::{ | |||
}; | ||||
use oxnet::{IpNet, Ipv4Net, Ipv6Net}; | ||||
use schemars::JsonSchema; | ||||
use serde::{Deserialize, Serialize}; | ||||
use serde::{de, Deserialize, Deserializer, Serialize, Serializer}; | ||||
use std::{ | ||||
collections::{HashMap, HashSet}, | ||||
fmt, | ||||
net::{IpAddr, Ipv4Addr, Ipv6Addr}, | ||||
str::FromStr, | ||||
}; | ||||
use strum::EnumCount; | ||||
use uuid::Uuid; | ||||
|
||||
use super::nexus::HostIdentifier; | ||||
|
@@ -837,13 +838,11 @@ pub struct ResolvedVpcRouteSet { | |||
} | ||||
|
||||
/// Describes the purpose of the dataset. | ||||
#[derive( | ||||
Debug, Serialize, Deserialize, JsonSchema, Clone, Copy, PartialEq, Eq, | ||||
)] | ||||
#[serde(rename_all = "snake_case")] | ||||
#[derive(Debug, Clone, PartialEq, Eq, Ord, PartialOrd, Hash, EnumCount)] | ||||
pub enum DatasetKind { | ||||
Crucible, | ||||
// Durable datasets for zones | ||||
Cockroach, | ||||
Crucible, | ||||
/// Used for single-node clickhouse deployments | ||||
Clickhouse, | ||||
/// Used for replicated clickhouse deployments | ||||
|
@@ -852,24 +851,153 @@ pub enum DatasetKind { | |||
ClickhouseServer, | ||||
ExternalDns, | ||||
InternalDns, | ||||
|
||||
// Zone filesystems | ||||
ZoneRoot, | ||||
Zone { | ||||
name: String, | ||||
}, | ||||
|
||||
// Other datasets | ||||
Debug, | ||||
} | ||||
|
||||
impl Serialize for DatasetKind { | ||||
fn serialize<S>(&self, serializer: S) -> Result<S::Ok, S::Error> | ||||
where | ||||
S: Serializer, | ||||
{ | ||||
serializer.serialize_str(&self.to_string()) | ||||
} | ||||
} | ||||
|
||||
impl<'de> Deserialize<'de> for DatasetKind { | ||||
fn deserialize<D>(deserializer: D) -> Result<Self, D::Error> | ||||
where | ||||
D: Deserializer<'de>, | ||||
{ | ||||
let s = String::deserialize(deserializer)?; | ||||
s.parse().map_err(de::Error::custom) | ||||
} | ||||
} | ||||
|
||||
impl JsonSchema for DatasetKind { | ||||
fn schema_name() -> String { | ||||
"DatasetKind".to_string() | ||||
} | ||||
|
||||
fn json_schema( | ||||
gen: &mut schemars::gen::SchemaGenerator, | ||||
) -> schemars::schema::Schema { | ||||
// The schema is a bit more complicated than this -- it's either one of | ||||
// the fixed values or a string starting with "zone/" -- but this is | ||||
// good enough for now. | ||||
let mut schema = <String>::json_schema(gen).into_object(); | ||||
schema.metadata().description = Some( | ||||
"The kind of dataset. See the `DatasetKind` enum \ | ||||
in omicron-common for possible values." | ||||
.to_owned(), | ||||
); | ||||
schema.into() | ||||
} | ||||
} | ||||
|
||||
impl DatasetKind { | ||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. A chunk of this implementation was moved from History lesson: We used to have types defined that would be usable by Nexus ( This PR merges both concepts, but tweaks some names to avoid changing any schemas that are saved on M.2s. |
||||
pub fn dataset_should_be_encrypted(&self) -> bool { | ||||
match self { | ||||
// We encrypt all datasets except Crucible. | ||||
// | ||||
// Crucible already performs encryption internally, and we | ||||
// avoid double-encryption. | ||||
DatasetKind::Crucible => false, | ||||
_ => true, | ||||
} | ||||
} | ||||
|
||||
/// Returns true if this dataset is delegated to a non-global zone. | ||||
pub fn zoned(&self) -> bool { | ||||
use DatasetKind::*; | ||||
match self { | ||||
Cockroach | Crucible | Clickhouse | ClickhouseKeeper | ||||
| ClickhouseServer | ExternalDns | InternalDns => true, | ||||
ZoneRoot | Zone { .. } | Debug => false, | ||||
} | ||||
} | ||||
|
||||
/// Returns the zone name, if this is a dataset for a zone filesystem. | ||||
/// | ||||
/// Otherwise, returns "None". | ||||
pub fn zone_name(&self) -> Option<&str> { | ||||
if let DatasetKind::Zone { name } = self { | ||||
Some(name) | ||||
} else { | ||||
None | ||||
} | ||||
} | ||||
} | ||||
|
||||
// Be cautious updating this implementation: | ||||
// | ||||
// - It should align with [DatasetKind::FromStr], below | ||||
// - The strings here are used here comprise the dataset name, stored durably | ||||
// on-disk | ||||
impl fmt::Display for DatasetKind { | ||||
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result { | ||||
use DatasetKind::*; | ||||
let s = match self { | ||||
Crucible => "crucible", | ||||
Cockroach => "cockroach", | ||||
Cockroach => "cockroachdb", | ||||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. When is the There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. +1, i would have a slight preference for the There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. +1 as well. For
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. So my mishaps with naming here were intended to keep backwards compatibility between:
To be clear, I think I misinterpreted this in my original PR. I was attempting to merge HOWEVER, upon closer inspection, the Updated in 93134c2 to just use |
||||
Clickhouse => "clickhouse", | ||||
ClickhouseKeeper => "clickhouse_keeper", | ||||
ClickhouseServer => "clickhouse_server", | ||||
ExternalDns => "external_dns", | ||||
InternalDns => "internal_dns", | ||||
ZoneRoot => "zone", | ||||
Zone { name } => { | ||||
write!(f, "zone/{}", name)?; | ||||
return Ok(()); | ||||
} | ||||
smklein marked this conversation as resolved.
Show resolved
Hide resolved
|
||||
Debug => "debug", | ||||
}; | ||||
write!(f, "{}", s) | ||||
} | ||||
} | ||||
|
||||
#[derive(Debug, thiserror::Error)] | ||||
pub enum DatasetKindParseError { | ||||
#[error("Dataset unknown: {0}")] | ||||
UnknownDataset(String), | ||||
} | ||||
|
||||
impl FromStr for DatasetKind { | ||||
type Err = DatasetKindParseError; | ||||
|
||||
fn from_str(s: &str) -> Result<Self, Self::Err> { | ||||
use DatasetKind::*; | ||||
let kind = match s { | ||||
"cockroachdb" => Cockroach, | ||||
"crucible" => Crucible, | ||||
"clickhouse" => Clickhouse, | ||||
"clickhouse_keeper" => ClickhouseKeeper, | ||||
"clickhouse_server" => ClickhouseServer, | ||||
"external_dns" => ExternalDns, | ||||
"internal_dns" => InternalDns, | ||||
"zone" => ZoneRoot, | ||||
"debug" => Debug, | ||||
other => { | ||||
if let Some(name) = other.strip_prefix("zone/") { | ||||
Zone { name: name.to_string() } | ||||
} else { | ||||
return Err(DatasetKindParseError::UnknownDataset( | ||||
s.to_string(), | ||||
)); | ||||
} | ||||
} | ||||
}; | ||||
Ok(kind) | ||||
} | ||||
} | ||||
|
||||
/// Identifiers for a single sled. | ||||
/// | ||||
/// This is intended primarily to be used in timeseries, to identify | ||||
|
@@ -892,6 +1020,7 @@ pub struct SledIdentifiers { | |||
|
||||
#[cfg(test)] | ||||
mod tests { | ||||
use super::*; | ||||
use crate::api::internal::shared::AllowedSourceIps; | ||||
use oxnet::{IpNet, Ipv4Net, Ipv6Net}; | ||||
use std::net::{Ipv4Addr, Ipv6Addr}; | ||||
|
@@ -936,4 +1065,49 @@ mod tests { | |||
serde_json::from_str(r#"{"allow":"any"}"#).unwrap(), | ||||
); | ||||
} | ||||
|
||||
#[test] | ||||
fn test_dataset_kind_serialization() { | ||||
let kinds = [ | ||||
DatasetKind::Cockroach, | ||||
DatasetKind::Crucible, | ||||
DatasetKind::Clickhouse, | ||||
DatasetKind::ClickhouseKeeper, | ||||
DatasetKind::ClickhouseServer, | ||||
DatasetKind::ExternalDns, | ||||
DatasetKind::InternalDns, | ||||
DatasetKind::ZoneRoot, | ||||
DatasetKind::Zone { name: String::from("myzone") }, | ||||
DatasetKind::Debug, | ||||
]; | ||||
|
||||
assert_eq!(kinds.len(), DatasetKind::COUNT); | ||||
|
||||
for kind in &kinds { | ||||
// To string, from string | ||||
let as_str = kind.to_string(); | ||||
let from_str = | ||||
DatasetKind::from_str(&as_str).unwrap_or_else(|_| { | ||||
panic!("Failed to convert {kind} to and from string") | ||||
}); | ||||
assert_eq!( | ||||
*kind, from_str, | ||||
"{kind} failed to convert to/from a string" | ||||
); | ||||
|
||||
// Serialize, deserialize | ||||
let ser = serde_json::to_string(&kind) | ||||
.unwrap_or_else(|_| panic!("Failed to serialize {kind}")); | ||||
let de: DatasetKind = serde_json::from_str(&ser) | ||||
.unwrap_or_else(|_| panic!("Failed to deserialize {kind}")); | ||||
assert_eq!(*kind, de, "{kind} failed serialization"); | ||||
|
||||
// Test that serialization is equivalent to stringifying. | ||||
assert_eq!( | ||||
format!("\"{as_str}\""), | ||||
ser, | ||||
"{kind} does not match stringification/serialization" | ||||
); | ||||
} | ||||
} | ||||
} |
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Oh hmm, I think you'll also want to update the
JsonSchema
impl to match this.There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Just to confirm -- what about the JsonSchema implementation should we update? It's currently being derived, and is used as part of internal APIs, but I don't think it needs to match the serialization + to/from string implementations.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Updated the PR with a fixed JSON schema.
Basically the issue was that JSON schemas are meant to be a description of the serialization format, and they were out of sync since we'd manually implemented
Serialize
andDeserialize
. It was currently moot for us because we were usingreplace
, but it's a lurking bug that can lead to issues down the road.I've changed the schema to be just
string
, which is overly generic but is at least correct. A more sophisticated impl would be something likestring
with a validation regex that lists all the possibilities, but that seems like overkill given that we're usingreplace
anyway.