Skip to content

Commit c9029c5

Browse files
kylebarron and alamb authored
Don't omit schema metadata when removing column (#5328)
* Don't omit schema metadata when removing column
* Add test
* Update arrow-schema/src/schema.rs

Co-authored-by: Andrew Lamb <andrew@nerdnetworks.org>

---------

Co-authored-by: Andrew Lamb <andrew@nerdnetworks.org>
1 parent 0b45993 commit c9029c5

File tree

2 files changed

+36
-1
lines changed

2 files changed

+36
-1
lines changed

arrow-array/src/record_batch.rs

+30 -1
Original file line number | Diff line number | Diff line change
@@ -355,7 +355,7 @@ impl RecordBatch {
355355
/// assert_eq!(batch.num_columns(), 1);
356356
/// ```
357357
pub fn remove_column(&mut self, index: usize) -> ArrayRef {
358-
let mut builder = SchemaBuilder::from(self.schema.fields());
358+
let mut builder = SchemaBuilder::from(self.schema.as_ref());
359359
builder.remove(index);
360360
self.schema = Arc::new(builder.finish());
361361
self.columns.remove(index)
@@ -618,6 +618,8 @@ where
618618

619619
#[cfg(test)]
620620
mod tests {
621+
use std::collections::HashMap;
622+
621623
use super::*;
622624
use crate::{BooleanArray, Int32Array, Int64Array, Int8Array, ListArray, StringArray};
623625
use arrow_buffer::{Buffer, ToByteSlice};
@@ -1155,4 +1157,31 @@ mod tests {
11551157
let size = get_size(reader);
11561158
assert_eq!(size, 0);
11571159
}
1160+
1161+
#[test]
1162+
fn test_remove_column_maintains_schema_metadata() {
1163+
let id_array = Int32Array::from(vec![1, 2, 3, 4, 5]);
1164+
let bool_array = BooleanArray::from(vec![true, false, false, true, true]);
1165+
1166+
let mut metadata = HashMap::new();
1167+
metadata.insert("foo".to_string(), "bar".to_string());
1168+
let schema = Schema::new(vec![
1169+
Field::new("id", DataType::Int32, false),
1170+
Field::new("bool", DataType::Boolean, false),
1171+
])
1172+
.with_metadata(metadata);
1173+
1174+
let mut batch = RecordBatch::try_new(
1175+
Arc::new(schema),
1176+
vec![Arc::new(id_array), Arc::new(bool_array)],
1177+
)
1178+
.unwrap();
1179+
1180+
let _removed_column = batch.remove_column(0);
1181+
assert_eq!(batch.schema().metadata().len(), 1);
1182+
assert_eq!(
1183+
batch.schema().metadata().get("foo").unwrap().as_str(),
1184+
"bar"
1185+
);
1186+
}
11581187
}

arrow-schema/src/schema.rs

+6
Original file line number | Diff line number | Diff line change
@@ -140,6 +140,12 @@ impl From<Fields> for SchemaBuilder {
140140
}
141141
}
142142

143+
impl From<&Schema> for SchemaBuilder {
144+
fn from(value: &Schema) -> Self {
145+
Self::from(value.clone())
146+
}
147+
}
148+
143149
impl From<Schema> for SchemaBuilder {
144150
fn from(value: Schema) -> Self {
145151
Self {

0 commit comments

Comments
 (0)