From e5b1067fadfd7ce6a351812311ca2194968fea01 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Wojciech=20Przytu=C5=82a?= Date: Mon, 7 Oct 2024 17:36:17 +0200 Subject: [PATCH 1/4] result: extract deser_table_spec_for_col_spec This refactor: 1) aids readability; 2) allows sharing the common logic with soon-to-be-added deser_col_specs_borrowed. --- scylla-cql/src/frame/response/result.rs | 102 +++++++++++++++--------- 1 file changed, 64 insertions(+), 38 deletions(-) diff --git a/scylla-cql/src/frame/response/result.rs b/scylla-cql/src/frame/response/result.rs index cd02e6d2a..2f216beae 100644 --- a/scylla-cql/src/frame/response/result.rs +++ b/scylla-cql/src/frame/response/result.rs @@ -721,6 +721,61 @@ fn mk_col_spec_parse_error( } } +/// Deserializes table spec of a column spec in the borrowed form. +/// +/// Checks for equality of table specs across columns, because the protocol +/// does not guarantee that and we want to be sure that the assumption +/// of them being all the same is correct. +/// To this end, the first column's table spec is written to `known_table_spec` +/// and compared with remaining columns' table spec. +/// +/// To avoid needless allocations, it is advised to pass `known_table_spec` +/// in the borrowed form, so that cloning it is cheap. +fn deser_table_spec_for_col_spec<'frame>( + buf: &'_ mut &'frame [u8], + global_table_spec_provided: bool, + known_table_spec: &'_ mut Option>, + col_idx: usize, +) -> StdResult, ColumnSpecParseError> { + let table_spec = match known_table_spec { + // If global table spec was provided, we simply clone it to each column spec. + Some(ref known_spec) if global_table_spec_provided => known_spec.clone(), + + // Else, we deserialize the table spec for a column and, if we already know some + // previous spec (i.e. that of the first column), we perform equality check + // against it. + Some(_) | None => { + let table_spec = + deser_table_spec(buf).map_err(|err| mk_col_spec_parse_error(col_idx, err))?; + + if let Some(ref known_spec) = known_table_spec { + // We assume that for each column, table spec is the same. + // As this is not guaranteed by the CQL protocol specification but only by how + // Cassandra and ScyllaDB work (no support for joins), we perform a sanity check here. + if known_spec.table_name != table_spec.table_name + || known_spec.ks_name != table_spec.ks_name + { + return Err(mk_col_spec_parse_error( + col_idx, + ColumnSpecParseErrorKind::TableSpecDiffersAcrossColumns( + known_spec.clone().into_owned(), + table_spec.into_owned(), + ), + )); + } + } else { + // Once we have read the first column spec, we save its table spec + // in order to verify its equality with other columns'. + *known_table_spec = Some(table_spec.clone()); + } + + table_spec + } + }; + + Ok(table_spec) +} + /// Deserializes col specs (part of ResultMetadata or PreparedMetadata) /// in the owned form. /// @@ -730,9 +785,9 @@ fn mk_col_spec_parse_error( /// /// To avoid needless allocations, it is advised to pass `global_table_spec` /// in the borrowed form, so that cloning it is cheap. -fn deser_col_specs( - buf: &mut &[u8], - global_table_spec: Option>, +fn deser_col_specs<'frame>( + buf: &'_ mut &'frame [u8], + global_table_spec: Option>, col_count: usize, ) -> StdResult>, ColumnSpecParseError> { let global_table_spec_provided = global_table_spec.is_some(); @@ -740,41 +795,12 @@ fn deser_col_specs( let mut col_specs = Vec::with_capacity(col_count); for col_idx in 0..col_count { - let table_spec = match known_table_spec { - // If global table spec was provided, we simply clone it to each column spec. - Some(ref known_spec) if global_table_spec_provided => known_spec.clone(), - - // Else, we deserialize the table spec for a column and, if we already know some - // previous spec (i.e. that of the first column), we perform equality check - // against it. - Some(_) | None => { - let table_spec = - deser_table_spec(buf).map_err(|err| mk_col_spec_parse_error(col_idx, err))?; - - if let Some(ref known_spec) = known_table_spec { - // We assume that for each column, table spec is the same. - // As this is not guaranteed by the CQL protocol specification but only by how - // Cassandra and ScyllaDB work (no support for joins), we perform a sanity check here. - if known_spec.table_name != table_spec.table_name - || known_spec.ks_name != table_spec.ks_name - { - return Err(mk_col_spec_parse_error( - col_idx, - ColumnSpecParseErrorKind::TableSpecDiffersAcrossColumns( - known_spec.clone().into_owned(), - table_spec.into_owned(), - ), - )); - } - } else { - // Once we have read the first column spec, we save its table spec - // in order to verify its equality with other columns'. - known_table_spec = Some(table_spec.clone()); - } - - table_spec - } - }; + let table_spec = deser_table_spec_for_col_spec( + buf, + global_table_spec_provided, + &mut known_table_spec, + col_idx, + )?; let name = types::read_string(buf) .map_err(|err| mk_col_spec_parse_error(col_idx, err))? From 4f9c860b0d2e581768283bfb9bd80526a0de0852 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Wojciech=20Przytu=C5=82a?= Date: Fri, 11 Oct 2024 07:52:43 +0200 Subject: [PATCH 2/4] result: deser_col_specs as ownership-generic macro Similarly to what has been recently done with `deser_cql_type`, `deser_col_specs` is made a macro to avoid code duplication between owned and borrowed variant of that function. For now, to avoid warnings, borrowed variants of `deser_cql_type` and `deser_col_specs` are prefixed with an underscore. This will change once they are actually used. --- scylla-cql/src/frame/response/result.rs | 94 +++++++++++++++---------- 1 file changed, 56 insertions(+), 38 deletions(-) diff --git a/scylla-cql/src/frame/response/result.rs b/scylla-cql/src/frame/response/result.rs index 2f216beae..ab85cfa3c 100644 --- a/scylla-cql/src/frame/response/result.rs +++ b/scylla-cql/src/frame/response/result.rs @@ -693,11 +693,10 @@ macro_rules! generate_deser_type { }; } -generate_deser_type!(deser_type_owned, 'static, |buf| types::read_string(buf).map(ToOwned::to_owned)); - -// This is going to be used for deserializing borrowed result metadata. generate_deser_type!(_deser_type_borrowed, 'frame, types::read_string); +generate_deser_type!(deser_type_owned, 'static, |buf| types::read_string(buf).map(ToOwned::to_owned)); + /// Deserializes a table spec, be it per-column one or a global one, /// in the borrowed form. /// @@ -776,41 +775,59 @@ fn deser_table_spec_for_col_spec<'frame>( Ok(table_spec) } -/// Deserializes col specs (part of ResultMetadata or PreparedMetadata) -/// in the owned form. -/// -/// Checks for equality of table specs across columns, because the protocol -/// does not guarantee that and we want to be sure that the assumption -/// of them being all the same is correct. -/// -/// To avoid needless allocations, it is advised to pass `global_table_spec` -/// in the borrowed form, so that cloning it is cheap. -fn deser_col_specs<'frame>( - buf: &'_ mut &'frame [u8], - global_table_spec: Option>, - col_count: usize, -) -> StdResult>, ColumnSpecParseError> { - let global_table_spec_provided = global_table_spec.is_some(); - let mut known_table_spec = global_table_spec; - - let mut col_specs = Vec::with_capacity(col_count); - for col_idx in 0..col_count { - let table_spec = deser_table_spec_for_col_spec( - buf, - global_table_spec_provided, - &mut known_table_spec, - col_idx, - )?; - - let name = types::read_string(buf) - .map_err(|err| mk_col_spec_parse_error(col_idx, err))? - .to_owned(); - let typ = deser_type_owned(buf).map_err(|err| mk_col_spec_parse_error(col_idx, err))?; - col_specs.push(ColumnSpec::owned(name, typ, table_spec.into_owned())); - } - Ok(col_specs) +macro_rules! generate_deser_col_specs { + ($deser_col_specs: ident, $l: lifetime, $deser_type: ident, $make_col_spec: expr $(,)?) => { + /// Deserializes col specs (part of ResultMetadata or PreparedMetadata) + /// in the form mentioned by its name. + /// + /// Checks for equality of table specs across columns, because the protocol + /// does not guarantee that and we want to be sure that the assumption + /// of them being all the same is correct. + /// + /// To avoid needless allocations, it is advised to pass `global_table_spec` + /// in the borrowed form, so that cloning it is cheap. + fn $deser_col_specs<'frame>( + buf: &mut &'frame [u8], + global_table_spec: Option>, + col_count: usize, + ) -> StdResult>, ColumnSpecParseError> { + let global_table_spec_provided = global_table_spec.is_some(); + let mut known_table_spec = global_table_spec; + + let mut col_specs = Vec::with_capacity(col_count); + for col_idx in 0..col_count { + let table_spec = deser_table_spec_for_col_spec( + buf, + global_table_spec_provided, + &mut known_table_spec, + col_idx, + )?; + + let name = + types::read_string(buf).map_err(|err| mk_col_spec_parse_error(col_idx, err))?; + let typ = $deser_type(buf).map_err(|err| mk_col_spec_parse_error(col_idx, err))?; + let col_spec = $make_col_spec(name, typ, table_spec); + col_specs.push(col_spec); + } + Ok(col_specs) + } + }; } +generate_deser_col_specs!( + _deser_col_specs_borrowed, + 'frame, + _deser_type_borrowed, + ColumnSpec::borrowed, +); + +generate_deser_col_specs!( + deser_col_specs_owned, + 'static, + deser_type_owned, + |name: &str, typ, table_spec: TableSpec| ColumnSpec::owned(name.to_owned(), typ, table_spec.into_owned()), +); + fn deser_result_metadata( buf: &mut &[u8], ) -> StdResult<(ResultMetadata<'static>, PagingStateResponse), ResultMetadataParseError> { @@ -826,6 +843,7 @@ fn deser_result_metadata( let raw_paging_state = has_more_pages .then(|| types::read_bytes(buf).map_err(ResultMetadataParseError::PagingStateParseError)) .transpose()?; + let paging_state = PagingStateResponse::new_from_raw_bytes(raw_paging_state); let col_specs = if no_metadata { @@ -835,7 +853,7 @@ fn deser_result_metadata( .then(|| deser_table_spec(buf)) .transpose()?; - deser_col_specs(buf, global_table_spec, col_count)? + deser_col_specs_owned(buf, global_table_spec, col_count)? }; let metadata = ResultMetadata { @@ -873,7 +891,7 @@ fn deser_prepared_metadata( .then(|| deser_table_spec(buf)) .transpose()?; - let col_specs = deser_col_specs(buf, global_table_spec, col_count)?; + let col_specs = deser_col_specs_owned(buf, global_table_spec, col_count)?; Ok(PreparedMetadata { flags, From 413573c1abde9cbf9cc066c19db21a465557ef35 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Wojciech=20Przytu=C5=82a?= Date: Thu, 19 Sep 2024 17:35:44 +0200 Subject: [PATCH 3/4] RowsParseError: add variant for TypeCheckError When parsing rows, type check is a distinct phase in the new deserialization framework. To support propagation of errors related to type checking, a corresponding variant is added to RowsParseError. --- scylla-cql/src/frame/frame_errors.rs | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/scylla-cql/src/frame/frame_errors.rs b/scylla-cql/src/frame/frame_errors.rs index 37f940e35..94e455bb7 100644 --- a/scylla-cql/src/frame/frame_errors.rs +++ b/scylla-cql/src/frame/frame_errors.rs @@ -14,7 +14,7 @@ pub use super::request::{ use super::response::result::TableSpec; use super::response::CqlResponseKind; use super::TryFromPrimitiveError; -use crate::types::deserialize::DeserializationError; +use crate::types::deserialize::{DeserializationError, TypeCheckError}; use thiserror::Error; /// An error returned by `parse_response_body_extensions`. @@ -320,6 +320,8 @@ pub enum RowsParseError { }, #[error("Malformed rows count: {0}")] RowsCountParseError(LowLevelDeserializationError), + #[error("Data type check prior to deserialization failed: {0}")] + IncomingDataTypeCheckError(#[from] TypeCheckError), #[error("Data deserialization failed: {0}")] DataDeserializationError(#[from] DeserializationError), } From 5cb42fac07da174648da8e4e68fda8e83640ab37 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Wojciech=20Przytu=C5=82a?= Date: Thu, 26 Sep 2024 15:09:21 +0200 Subject: [PATCH 4/4] errors: impl From for QueryError RowsParseError is going to be a user-facing error type, because it is going to be returned from new QueryResult API. For convenient conversion into QueryError, a shortcut From impl is added. --- scylla/src/transport/errors.rs | 14 +++++++++++++- 1 file changed, 13 insertions(+), 1 deletion(-) diff --git a/scylla/src/transport/errors.rs b/scylla/src/transport/errors.rs index f6b31b6c9..8ef4a9943 100644 --- a/scylla/src/transport/errors.rs +++ b/scylla/src/transport/errors.rs @@ -19,7 +19,7 @@ use scylla_cql::{ CqlAuthChallengeParseError, CqlAuthSuccessParseError, CqlAuthenticateParseError, CqlErrorParseError, CqlEventParseError, CqlRequestSerializationError, CqlResponseParseError, CqlResultParseError, CqlSupportedParseError, - FrameBodyExtensionsParseError, FrameHeaderParseError, + FrameBodyExtensionsParseError, FrameHeaderParseError, RowsParseError, }, request::CqlRequestKind, response::CqlResponseKind, @@ -178,6 +178,18 @@ impl From for QueryError { } } +impl From for QueryError { + fn from(err: RowsParseError) -> Self { + let err: CqlResultParseError = err.into(); + let err: CqlResponseParseError = err.into(); + let err: RequestError = err.into(); + let err: UserRequestError = err.into(); + let err: QueryError = err.into(); + + err + } +} + /// Error that occurred during session creation #[derive(Error, Debug, Clone)] #[non_exhaustive]