From 205e40d0e702631d5a41cb6542cc2625a8c8d854 Mon Sep 17 00:00:00 2001 From: Tai Le Manh Date: Tue, 12 Nov 2024 08:28:28 +0700 Subject: [PATCH 1/6] [arrow-cast] Support cast numeric to string view Signed-off-by: Tai Le Manh --- arrow-cast/src/cast/mod.rs | 114 +++++++++++++++++++++++++++------- arrow-cast/src/cast/string.rs | 16 +++++ 2 files changed, 109 insertions(+), 21 deletions(-) diff --git a/arrow-cast/src/cast/mod.rs b/arrow-cast/src/cast/mod.rs index f7059be170f4..e5f9f9db16df 100644 --- a/arrow-cast/src/cast/mod.rs +++ b/arrow-cast/src/cast/mod.rs @@ -175,15 +175,19 @@ pub fn can_cast_types(from_type: &DataType, to_type: &DataType) -> bool { // unsigned integer to decimal (UInt8 | UInt16 | UInt32 | UInt64, Decimal128(_, _)) | (UInt8 | UInt16 | UInt32 | UInt64, Decimal256(_, _)) | + // unsigned integer to string + (UInt8 | UInt16 | UInt32 | UInt64, Utf8View | Utf8 | LargeUtf8) | // signed numeric to decimal (Null | Int8 | Int16 | Int32 | Int64 | Float32 | Float64, Decimal128(_, _)) | (Null | Int8 | Int16 | Int32 | Int64 | Float32 | Float64, Decimal256(_, _)) | + // signed numeric to string + (Int8 | Int16 | Int32 | Int64 | Float16 | Float32 | Float64, Utf8View | Utf8 | LargeUtf8) | // decimal to unsigned numeric (Decimal128(_, _) | Decimal256(_, _), UInt8 | UInt16 | UInt32 | UInt64) | // decimal to signed numeric (Decimal128(_, _) | Decimal256(_, _), Null | Int8 | Int16 | Int32 | Int64 | Float32 | Float64) => true, - // decimal to Utf8 - (Decimal128(_, _) | Decimal256(_, _), Utf8 | LargeUtf8) => true, + // decimal to string + (Decimal128(_, _) | Decimal256(_, _), Utf8View | Utf8 | LargeUtf8) => true, // Utf8 to decimal (Utf8 | LargeUtf8, Decimal128(_, _) | Decimal256(_, _)) => true, (Struct(from_fields), Struct(to_fields)) => { @@ -917,6 +921,7 @@ pub fn cast_with_options( Float64 => cast_decimal_to_float::(array, |x| { x as f64 / 10_f64.powi(*scale as i32) }), + Utf8View => value_to_string_view(array, cast_options), Utf8 => value_to_string::(array, cast_options), LargeUtf8 => value_to_string::(array, cast_options), Null => Ok(new_null_array(to_type, array.len())), @@ -982,6 +987,7 @@ pub fn cast_with_options( Float64 => cast_decimal_to_float::(array, |x| { x.to_f64().unwrap() / 10_f64.powi(*scale as i32) }), + Utf8View => value_to_string_view(array, cast_options), Utf8 => value_to_string::(array, cast_options), LargeUtf8 => value_to_string::(array, cast_options), Null => Ok(new_null_array(to_type, array.len())), @@ -1462,6 +1468,9 @@ pub fn cast_with_options( (BinaryView, _) => Err(ArrowError::CastError(format!( "Casting from {from_type:?} to {to_type:?} not supported", ))), + (from_type, Utf8View) if from_type.is_primitive() => { + value_to_string_view(array, cast_options) + } (from_type, LargeUtf8) if from_type.is_primitive() => { value_to_string::(array, cast_options) } @@ -2485,12 +2494,11 @@ where #[cfg(test)] mod tests { + use super::*; use arrow_buffer::{Buffer, IntervalDayTime, NullBuffer}; use chrono::NaiveDate; use half::f16; - use super::*; - macro_rules! generate_cast_test_case { ($INPUT_ARRAY: expr, $OUTPUT_TYPE_ARRAY: ident, $OUTPUT_TYPE: expr, $OUTPUT_VALUES: expr) => { let output = @@ -3708,6 +3716,40 @@ mod tests { assert_eq!(10.0, c.value(3)); } + #[test] + fn test_cast_int_to_utf8view() { + assert!(can_cast_types(&DataType::Int8, &DataType::Utf8View)); + assert!(can_cast_types(&DataType::Int16, &DataType::Utf8View)); + assert!(can_cast_types(&DataType::Int32, &DataType::Utf8View)); + assert!(can_cast_types(&DataType::Int64, &DataType::Utf8View)); + + let array = Int32Array::from(vec![None, Some(8), Some(9), Some(10)]); + let arr = cast(&array, &DataType::Utf8View).unwrap(); + assert_eq!(4, arr.len()); + assert_eq!(1, arr.null_count()); + let c = arr.as_string_view(); + assert!(c.is_null(0)); + assert_eq!("8", c.value(1)); + assert_eq!("9", c.value(2)); + assert_eq!("10", c.value(3)); + } + + #[test] + fn test_cast_float_to_utf8view() { + assert!(can_cast_types(&DataType::Float16, &DataType::Utf8View)); + assert!(can_cast_types(&DataType::Float32, &DataType::Utf8View)); + assert!(can_cast_types(&DataType::Float64, &DataType::Utf8View)); + + let array = Float32Array::from(vec![Some(8.64), Some(9.81), None]); + let arr = cast(&array, &DataType::Utf8View).unwrap(); + assert_eq!(3, arr.len()); + assert_eq!(1, arr.null_count()); + let c = arr.as_string_view(); + assert_eq!("8.64", c.value(0)); + assert_eq!("9.81", c.value(1)); + assert!(c.is_null(2)); + } + #[test] fn test_cast_utf8_to_i32() { let array = StringArray::from(vec!["5", "6", "seven", "8", "9.1"]); @@ -9114,7 +9156,22 @@ mod tests { } #[test] - fn test_cast_decimal_to_utf8() { + fn test_cast_decimal_to_string() { + macro_rules! assert_decimal_values { + ($array:expr) => { + let c = $array; + assert_eq!("1123.454", c.value(0)); + assert_eq!("2123.456", c.value(1)); + assert_eq!("-3123.453", c.value(2)); + assert_eq!("-3123.456", c.value(3)); + assert_eq!("0.000", c.value(4)); + assert_eq!("0.123", c.value(5)); + assert_eq!("1234.567", c.value(6)); + assert_eq!("-1234.567", c.value(7)); + assert!(c.is_null(8)); + }; + } + fn test_decimal_to_string( output_type: DataType, array: PrimitiveArray, @@ -9122,18 +9179,19 @@ mod tests { let b = cast(&array, &output_type).unwrap(); assert_eq!(b.data_type(), &output_type); - let c = b.as_string::(); - - assert_eq!("1123.454", c.value(0)); - assert_eq!("2123.456", c.value(1)); - assert_eq!("-3123.453", c.value(2)); - assert_eq!("-3123.456", c.value(3)); - assert_eq!("0.000", c.value(4)); - assert_eq!("0.123", c.value(5)); - assert_eq!("1234.567", c.value(6)); - assert_eq!("-1234.567", c.value(7)); - assert!(c.is_null(8)); + match b.data_type() { + DataType::Utf8View => { + let c = b.as_string_view(); + assert_decimal_values!(c); + } + DataType::Utf8 | DataType::LargeUtf8 => { + let c = b.as_string::(); + assert_decimal_values!(c); + } + _ => (), + } } + let array128: Vec> = vec![ Some(1123454), Some(2123456), @@ -9145,22 +9203,36 @@ mod tests { Some(-123456789), None, ]; + let array256: Vec> = array128 + .iter() + .map(|num| num.map(i256::from_i128)) + .collect(); - let array256: Vec> = array128.iter().map(|v| v.map(i256::from_i128)).collect(); + assert!(can_cast_types(&DataType::Decimal128(10, 4), &DataType::Utf8View)); + assert!(can_cast_types(&DataType::Decimal256(38, 10), &DataType::Utf8View)); - test_decimal_to_string::( + test_decimal_to_string::( + DataType::Utf8View, + create_decimal_array(array128.clone(), 7, 3).unwrap(), + ); + test_decimal_to_string::( DataType::Utf8, create_decimal_array(array128.clone(), 7, 3).unwrap(), ); - test_decimal_to_string::( + test_decimal_to_string::( DataType::LargeUtf8, create_decimal_array(array128, 7, 3).unwrap(), ); - test_decimal_to_string::( + + test_decimal_to_string::( + DataType::Utf8View, + create_decimal256_array(array256.clone(), 7, 3).unwrap(), + ); + test_decimal_to_string::( DataType::Utf8, create_decimal256_array(array256.clone(), 7, 3).unwrap(), ); - test_decimal_to_string::( + test_decimal_to_string::( DataType::LargeUtf8, create_decimal256_array(array256, 7, 3).unwrap(), ); diff --git a/arrow-cast/src/cast/string.rs b/arrow-cast/src/cast/string.rs index 7d0e7e21c859..36142848f45c 100644 --- a/arrow-cast/src/cast/string.rs +++ b/arrow-cast/src/cast/string.rs @@ -38,6 +38,22 @@ pub(crate) fn value_to_string( Ok(Arc::new(builder.finish())) } +pub(crate) fn value_to_string_view( + array: &dyn Array, + options: &CastOptions, +) -> Result { + let mut builder = StringViewBuilder::with_capacity(array.len()); + let formatter = ArrayFormatter::try_new(array, &options.format_options)?; + let nulls = array.nulls(); + for i in 0..array.len() { + match nulls.map(|x| x.is_null(i)).unwrap_or_default() { + false => builder.append_value(formatter.value(i).try_to_string()?), + true => builder.append_null(), + } + } + Ok(Arc::new(builder.finish())) +} + /// Parse UTF-8 pub(crate) fn parse_string( array: &dyn Array, From 2a937feb1bd63d0113bcb830e577e82c35e80436 Mon Sep 17 00:00:00 2001 From: Tai Le Manh Date: Tue, 12 Nov 2024 08:43:50 +0700 Subject: [PATCH 2/6] fix fmt error --- arrow-cast/src/cast/mod.rs | 18 ++++++++++-------- 1 file changed, 10 insertions(+), 8 deletions(-) diff --git a/arrow-cast/src/cast/mod.rs b/arrow-cast/src/cast/mod.rs index e5f9f9db16df..450cee42da57 100644 --- a/arrow-cast/src/cast/mod.rs +++ b/arrow-cast/src/cast/mod.rs @@ -175,13 +175,9 @@ pub fn can_cast_types(from_type: &DataType, to_type: &DataType) -> bool { // unsigned integer to decimal (UInt8 | UInt16 | UInt32 | UInt64, Decimal128(_, _)) | (UInt8 | UInt16 | UInt32 | UInt64, Decimal256(_, _)) | - // unsigned integer to string - (UInt8 | UInt16 | UInt32 | UInt64, Utf8View | Utf8 | LargeUtf8) | // signed numeric to decimal (Null | Int8 | Int16 | Int32 | Int64 | Float32 | Float64, Decimal128(_, _)) | (Null | Int8 | Int16 | Int32 | Int64 | Float32 | Float64, Decimal256(_, _)) | - // signed numeric to string - (Int8 | Int16 | Int32 | Int64 | Float16 | Float32 | Float64, Utf8View | Utf8 | LargeUtf8) | // decimal to unsigned numeric (Decimal128(_, _) | Decimal256(_, _), UInt8 | UInt16 | UInt32 | UInt64) | // decimal to signed numeric @@ -235,7 +231,7 @@ pub fn can_cast_types(from_type: &DataType, to_type: &DataType) -> bool { (Utf8 | LargeUtf8, Utf8View) => true, (BinaryView, Binary | LargeBinary | Utf8 | LargeUtf8 | Utf8View ) => true, (Utf8 | LargeUtf8, _) => to_type.is_numeric() && to_type != &Float16, - (_, Utf8 | LargeUtf8) => from_type.is_primitive(), + (_, Utf8View | Utf8 | LargeUtf8) => from_type.is_primitive(), (_, Binary | LargeBinary) => from_type.is_integer(), @@ -9157,6 +9153,15 @@ mod tests { #[test] fn test_cast_decimal_to_string() { + assert!(can_cast_types( + &DataType::Decimal128(10, 4), + &DataType::Utf8View + )); + assert!(can_cast_types( + &DataType::Decimal256(38, 10), + &DataType::Utf8View + )); + macro_rules! assert_decimal_values { ($array:expr) => { let c = $array; @@ -9208,9 +9213,6 @@ mod tests { .map(|num| num.map(i256::from_i128)) .collect(); - assert!(can_cast_types(&DataType::Decimal128(10, 4), &DataType::Utf8View)); - assert!(can_cast_types(&DataType::Decimal256(38, 10), &DataType::Utf8View)); - test_decimal_to_string::( DataType::Utf8View, create_decimal_array(array128.clone(), 7, 3).unwrap(), From 2f8f9c37fdfdd12dcd27c9eae9534f072e6ecea2 Mon Sep 17 00:00:00 2001 From: Tai Le Manh Date: Wed, 13 Nov 2024 01:59:19 +0700 Subject: [PATCH 3/6] Implement std::fmt::Write for StringViewBuilder Signed-off-by: Tai Le Manh --- arrow-array/src/builder/generic_bytes_view_builder.rs | 7 +++++++ arrow-cast/src/cast/string.rs | 2 +- 2 files changed, 8 insertions(+), 1 deletion(-) diff --git a/arrow-array/src/builder/generic_bytes_view_builder.rs b/arrow-array/src/builder/generic_bytes_view_builder.rs index d12c2b7db468..ab37b098f8bf 100644 --- a/arrow-array/src/builder/generic_bytes_view_builder.rs +++ b/arrow-array/src/builder/generic_bytes_view_builder.rs @@ -484,6 +484,13 @@ impl> Extend> /// ``` pub type StringViewBuilder = GenericByteViewBuilder; +impl std::fmt::Write for StringViewBuilder { + fn write_str(&mut self, s: &str) -> std::fmt::Result { + self.append_value(s); + Ok(()) + } +} + /// Array builder for [`BinaryViewArray`][crate::BinaryViewArray] /// /// Values can be appended using [`GenericByteViewBuilder::append_value`], and nulls with diff --git a/arrow-cast/src/cast/string.rs b/arrow-cast/src/cast/string.rs index 36142848f45c..44ba6460f9e7 100644 --- a/arrow-cast/src/cast/string.rs +++ b/arrow-cast/src/cast/string.rs @@ -47,8 +47,8 @@ pub(crate) fn value_to_string_view( let nulls = array.nulls(); for i in 0..array.len() { match nulls.map(|x| x.is_null(i)).unwrap_or_default() { - false => builder.append_value(formatter.value(i).try_to_string()?), true => builder.append_null(), + false => formatter.value(i).write(&mut builder)?, } } Ok(Arc::new(builder.finish())) From 74de9bcea9f8142b5bfd93bce3da105493ae98de Mon Sep 17 00:00:00 2001 From: Tai Le Manh Date: Fri, 15 Nov 2024 12:12:15 +0700 Subject: [PATCH 4/6] Update that current impl support only for numeric -> string view Signed-off-by: Tai Le Manh --- arrow-cast/src/cast/mod.rs | 163 +++++++++++++++++-------------------- 1 file changed, 74 insertions(+), 89 deletions(-) diff --git a/arrow-cast/src/cast/mod.rs b/arrow-cast/src/cast/mod.rs index 450cee42da57..0a1ae1fde7d0 100644 --- a/arrow-cast/src/cast/mod.rs +++ b/arrow-cast/src/cast/mod.rs @@ -231,7 +231,8 @@ pub fn can_cast_types(from_type: &DataType, to_type: &DataType) -> bool { (Utf8 | LargeUtf8, Utf8View) => true, (BinaryView, Binary | LargeBinary | Utf8 | LargeUtf8 | Utf8View ) => true, (Utf8 | LargeUtf8, _) => to_type.is_numeric() && to_type != &Float16, - (_, Utf8View | Utf8 | LargeUtf8) => from_type.is_primitive(), + (_, Utf8 | LargeUtf8) => from_type.is_primitive(), + (_, Utf8View) => from_type.is_numeric(), (_, Binary | LargeBinary) => from_type.is_integer(), @@ -1464,7 +1465,7 @@ pub fn cast_with_options( (BinaryView, _) => Err(ArrowError::CastError(format!( "Casting from {from_type:?} to {to_type:?} not supported", ))), - (from_type, Utf8View) if from_type.is_primitive() => { + (from_type, Utf8View) if from_type.is_numeric() => { value_to_string_view(array, cast_options) } (from_type, LargeUtf8) if from_type.is_primitive() => { @@ -5184,41 +5185,45 @@ mod tests { assert_eq!("2018-12-25T00:00:00", c.value(1)); } + // Cast Timestamp to Utf8View is not supported yet + // TODO: Implement casting from Timestamp to Utf8View + macro_rules! assert_cast_timestamp_to_string { + ($array:expr, $datatype:expr, $output_array_type: ty, $expected:expr) => {{ + let out = cast(&$array, &$datatype).unwrap(); + let actual = out + .as_any() + .downcast_ref::<$output_array_type>() + .unwrap() + .into_iter() + .collect::>(); + assert_eq!(actual, $expected); + }}; + ($array:expr, $datatype:expr, $output_array_type: ty, $options:expr, $expected:expr) => {{ + let out = cast_with_options(&$array, &$datatype, &$options).unwrap(); + let actual = out + .as_any() + .downcast_ref::<$output_array_type>() + .unwrap() + .into_iter() + .collect::>(); + assert_eq!(actual, $expected); + }}; + } + #[test] fn test_cast_timestamp_to_strings() { // "2018-12-25T00:00:02.001", "1997-05-19T00:00:03.005", None let array = TimestampMillisecondArray::from(vec![Some(864000003005), Some(1545696002001), None]); - let out = cast(&array, &DataType::Utf8).unwrap(); - let out = out - .as_any() - .downcast_ref::() - .unwrap() - .into_iter() - .collect::>(); - assert_eq!( - out, - vec![ - Some("1997-05-19T00:00:03.005"), - Some("2018-12-25T00:00:02.001"), - None - ] - ); - let out = cast(&array, &DataType::LargeUtf8).unwrap(); - let out = out - .as_any() - .downcast_ref::() - .unwrap() - .into_iter() - .collect::>(); - assert_eq!( - out, - vec![ - Some("1997-05-19T00:00:03.005"), - Some("2018-12-25T00:00:02.001"), - None - ] - ); + let expected = vec![ + Some("1997-05-19T00:00:03.005"), + Some("2018-12-25T00:00:02.001"), + None, + ]; + + // assert_cast_timestamp_to_string!(array, DataType::Utf8View, StringViewArray, expected); + assert_cast_timestamp_to_string!(array, DataType::Utf8, StringArray, expected); + assert_cast_timestamp_to_string!(array, DataType::LargeUtf8, LargeStringArray, expected); } #[test] @@ -5231,73 +5236,53 @@ mod tests { .with_timestamp_format(Some(ts_format)) .with_timestamp_tz_format(Some(ts_format)), }; + // "2018-12-25T00:00:02.001", "1997-05-19T00:00:03.005", None let array_without_tz = TimestampMillisecondArray::from(vec![Some(864000003005), Some(1545696002001), None]); - let out = cast_with_options(&array_without_tz, &DataType::Utf8, &cast_options).unwrap(); - let out = out - .as_any() - .downcast_ref::() - .unwrap() - .into_iter() - .collect::>(); - assert_eq!( - out, - vec![ - Some("1997-05-19 00:00:03.005000"), - Some("2018-12-25 00:00:02.001000"), - None - ] + let expected = vec![ + Some("1997-05-19 00:00:03.005000"), + Some("2018-12-25 00:00:02.001000"), + None, + ]; + // assert_cast_timestamp_to_string!(array_without_tz, DataType::Utf8View, StringViewArray, cast_options, expected); + assert_cast_timestamp_to_string!( + array_without_tz, + DataType::Utf8, + StringArray, + cast_options, + expected ); - let out = - cast_with_options(&array_without_tz, &DataType::LargeUtf8, &cast_options).unwrap(); - let out = out - .as_any() - .downcast_ref::() - .unwrap() - .into_iter() - .collect::>(); - assert_eq!( - out, - vec![ - Some("1997-05-19 00:00:03.005000"), - Some("2018-12-25 00:00:02.001000"), - None - ] + assert_cast_timestamp_to_string!( + array_without_tz, + DataType::LargeUtf8, + LargeStringArray, + cast_options, + expected ); let array_with_tz = TimestampMillisecondArray::from(vec![Some(864000003005), Some(1545696002001), None]) .with_timezone(tz.to_string()); - let out = cast_with_options(&array_with_tz, &DataType::Utf8, &cast_options).unwrap(); - let out = out - .as_any() - .downcast_ref::() - .unwrap() - .into_iter() - .collect::>(); - assert_eq!( - out, - vec![ - Some("1997-05-19 05:45:03.005000"), - Some("2018-12-25 05:45:02.001000"), - None - ] + let expected = vec![ + Some("1997-05-19 05:45:03.005000"), + Some("2018-12-25 05:45:02.001000"), + None, + ]; + // assert_cast_timestamp_to_string!(array_with_tz, DataType::Utf8View, StringViewArray, cast_options, expected); + assert_cast_timestamp_to_string!( + array_with_tz, + DataType::Utf8, + StringArray, + cast_options, + expected ); - let out = cast_with_options(&array_with_tz, &DataType::LargeUtf8, &cast_options).unwrap(); - let out = out - .as_any() - .downcast_ref::() - .unwrap() - .into_iter() - .collect::>(); - assert_eq!( - out, - vec![ - Some("1997-05-19 05:45:03.005000"), - Some("2018-12-25 05:45:02.001000"), - None - ] + assert_cast_timestamp_to_string!( + array_with_tz, + DataType::LargeUtf8, + LargeStringArray, + cast_options, + expected ); } From d65e228f60166dfcf2ac3b8ffcc55e13c9e9c705 Mon Sep 17 00:00:00 2001 From: Andrew Lamb Date: Fri, 22 Nov 2024 14:32:30 -0500 Subject: [PATCH 5/6] Update arrow-cast/src/cast/mod.rs --- arrow-cast/src/cast/mod.rs | 1 + 1 file changed, 1 insertion(+) diff --git a/arrow-cast/src/cast/mod.rs b/arrow-cast/src/cast/mod.rs index ef45e2052ca9..d1e313794f11 100644 --- a/arrow-cast/src/cast/mod.rs +++ b/arrow-cast/src/cast/mod.rs @@ -5223,6 +5223,7 @@ mod tests { // Cast Timestamp to Utf8View is not supported yet // TODO: Implement casting from Timestamp to Utf8View + // https://github.com/apache/arrow-rs/issues/6734 macro_rules! assert_cast_timestamp_to_string { ($array:expr, $datatype:expr, $output_array_type: ty, $expected:expr) => {{ let out = cast(&$array, &$datatype).unwrap(); From b90782789c47d9fbee24afd6267e92354aff7ab2 Mon Sep 17 00:00:00 2001 From: Andrew Lamb Date: Fri, 22 Nov 2024 14:41:58 -0500 Subject: [PATCH 6/6] Add documentation examples for `StringViewBuilder::write_str` --- .../src/builder/generic_bytes_view_builder.rs | 38 ++++++++++++++++--- 1 file changed, 33 insertions(+), 5 deletions(-) diff --git a/arrow-array/src/builder/generic_bytes_view_builder.rs b/arrow-array/src/builder/generic_bytes_view_builder.rs index ab37b098f8bf..3487727d71f9 100644 --- a/arrow-array/src/builder/generic_bytes_view_builder.rs +++ b/arrow-array/src/builder/generic_bytes_view_builder.rs @@ -466,22 +466,50 @@ impl> Extend> /// Array builder for [`StringViewArray`][crate::StringViewArray] /// /// Values can be appended using [`GenericByteViewBuilder::append_value`], and nulls with -/// [`GenericByteViewBuilder::append_null`] as normal. +/// [`GenericByteViewBuilder::append_null`]. /// -/// # Example +/// This builder also implements [`std::fmt::Write`] with any written data +/// included in the next appended value. This allows using [`std::fmt::Display`] +/// with standard Rust idioms like `write!` and `writeln!` to write data +/// directly to the builder without intermediate allocations. +/// +/// # Example writing strings with `append_value` /// ``` /// # use arrow_array::builder::StringViewBuilder; /// # use arrow_array::StringViewArray; /// let mut builder = StringViewBuilder::new(); -/// builder.append_value("hello"); -/// builder.append_null(); -/// builder.append_value("world"); +/// builder.append_value("hello"); // row 0 is a value +/// builder.append_null(); // row 1 is null +/// builder.append_value("world"); // row 2 is a value /// let array = builder.finish(); /// /// let expected = vec![Some("hello"), None, Some("world")]; /// let actual: Vec<_> = array.iter().collect(); /// assert_eq!(expected, actual); /// ``` +/// +/// /// # Example incrementally writing strings with `std::fmt::Write` +/// ``` +/// # use std::fmt::Write; +/// # use arrow_array::builder::StringViewBuilder; +/// let mut builder = StringViewBuilder::new(); +/// +/// // Write data in multiple `write!` calls +/// write!(builder, "foo").unwrap(); +/// write!(builder, "bar").unwrap(); +/// // The next call to append_value finishes the current string +/// // including all previously written strings. +/// builder.append_value("baz"); +/// +/// // Write second value with a single write call +/// write!(builder, "v2").unwrap(); +/// // finish the value by calling append_value with an empty string +/// builder.append_value(""); +/// +/// let array = builder.finish(); +/// assert_eq!(array.value(0), "foobarbaz"); +/// assert_eq!(array.value(1), "v2"); +/// ``` pub type StringViewBuilder = GenericByteViewBuilder; impl std::fmt::Write for StringViewBuilder {