forked from apache/arrow-rs
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathunion_array.rs
84 lines (70 loc) · 2.85 KB
/
union_array.rs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
// Licensed to the Apache Software Foundation (ASF) under one
// or more contributor license agreements. See the NOTICE file
// distributed with this work for additional information
// regarding copyright ownership. The ASF licenses this file
// to you under the Apache License, Version 2.0 (the
// "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing,
// software distributed under the License is distributed on an
// "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, either express or implied. See the License for the
// specific language governing permissions and limitations
// under the License.
use std::{
iter::{repeat, repeat_with},
sync::Arc,
};
use arrow_array::{Array, ArrayRef, Int32Array, UnionArray};
use arrow_buffer::{NullBuffer, ScalarBuffer};
use arrow_schema::{DataType, Field, UnionFields};
use criterion::*;
use rand::{thread_rng, Rng};
/// Builds a 4096-element `Int32Array` holding random values together with a
/// validity mask that contains both valid and null slots.
fn array_with_nulls() -> ArrayRef {
    let mut rng = thread_rng();
    let values = ScalarBuffer::from_iter(repeat_with(|| rng.gen()).take(4096));

    // The first two slots are pinned to one valid and one null entry so the
    // mask is never all-valid or all-null; the remaining slots are random.
    let nulls: NullBuffer = [true, false]
        .into_iter()
        .chain(repeat_with(|| rng.gen()))
        .take(4096)
        .collect();

    // `values` is not used again, so it is moved instead of cloned.
    Arc::new(Int32Array::new(values, Some(nulls)))
}
/// Builds a 4096-element `Int32Array` holding random values and no null buffer.
fn array_without_nulls() -> ArrayRef {
    let mut rng = thread_rng();
    let values = ScalarBuffer::from_iter(repeat_with(|| rng.gen()).take(4096));

    // `values` is not used again, so it is moved instead of cloned.
    Arc::new(Int32Array::new(values, None))
}
fn criterion_benchmark(c: &mut Criterion) {
for with_nulls in 1..12 {
for without_nulls in [0, 1, 10] {
c.bench_function(
&format!("union logical nulls 4096 {with_nulls} children with nulls, {without_nulls} without nulls"),
|b| {
let type_ids = 0..with_nulls+without_nulls;
let fields = UnionFields::new(
type_ids.clone(),
type_ids.clone().map(|i| Field::new(format!("f{i}"), DataType::Int32, true)),
);
let array = UnionArray::try_new(
fields,
type_ids.cycle().take(4096).collect(),
None,
repeat(array_with_nulls())
.take(with_nulls as usize)
.chain(repeat(array_without_nulls()).take(without_nulls as usize))
.collect(),
)
.unwrap();
b.iter(|| black_box(array.logical_nulls()))
},
);
}
}
}
// Register `criterion_benchmark` under the `benches` group and generate the
// benchmark binary's entry point that runs that group.
criterion_group!(benches, criterion_benchmark);
criterion_main!(benches);