From 7f09225f01b3945d268dd0469e58d83331f4a352 Mon Sep 17 00:00:00 2001 From: Mohammad Razeghi Date: Fri, 8 Dec 2023 00:17:54 +0100 Subject: [PATCH] Fixed issue where timestamp parser incorrectly accepted characters after 'Z --- arrow-cast/src/cast.rs | 24 ++++++++++++++++++++++++ arrow-cast/src/parse.rs | 2 +- 2 files changed, 25 insertions(+), 1 deletion(-) diff --git a/arrow-cast/src/cast.rs b/arrow-cast/src/cast.rs index 51acd36c3fe4..f5fbc61b8673 100644 --- a/arrow-cast/src/cast.rs +++ b/arrow-cast/src/cast.rs @@ -9449,4 +9449,28 @@ mod tests { let r: Vec<_> = a.as_string::().iter().map(|x| x.unwrap()).collect(); assert_eq!(r, &["[0, 1, 2]", "[0, null, 2]"]); } + #[test] + fn test_cast_string_to_timestamp_invalid_tz() { + // content after Z should be ignored + let bad_timestamp = "2023-12-05T21:58:10.45ZZTOP"; + let array = StringArray::from(vec![Some(bad_timestamp)]); + + let data_types = [ + DataType::Timestamp(TimeUnit::Second, None), + DataType::Timestamp(TimeUnit::Millisecond, None), + DataType::Timestamp(TimeUnit::Microsecond, None), + DataType::Timestamp(TimeUnit::Nanosecond, None), + ]; + + let cast_options = CastOptions { + safe: false, ..Default::default() + }; + + for dt in data_types { + assert_eq!( + cast_with_options(&array, &dt, &cast_options).unwrap_err().to_string(), + "Parser error: Invalid timezone \"ZZTOP\": only offset based timezones supported without chrono-tz feature" + ); + } + } } diff --git a/arrow-cast/src/parse.rs b/arrow-cast/src/parse.rs index 750f38006d33..3d2e47ed95a4 100644 --- a/arrow-cast/src/parse.rs +++ b/arrow-cast/src/parse.rs @@ -210,7 +210,7 @@ pub fn string_to_datetime(timezone: &T, s: &str) -> Result