summaryrefslogtreecommitdiffstats
path: root/src/arrow/ruby/red-arrow/benchmark
diff options
context:
space:
mode:
authorDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-21 11:54:28 +0000
committerDaniel Baumann <daniel.baumann@progress-linux.org>2024-04-21 11:54:28 +0000
commite6918187568dbd01842d8d1d2c808ce16a894239 (patch)
tree64f88b554b444a49f656b6c656111a145cbbaa28 /src/arrow/ruby/red-arrow/benchmark
parentInitial commit. (diff)
downloadceph-e6918187568dbd01842d8d1d2c808ce16a894239.tar.xz
ceph-e6918187568dbd01842d8d1d2c808ce16a894239.zip
Adding upstream version 18.2.2.upstream/18.2.2
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'src/arrow/ruby/red-arrow/benchmark')
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/raw-records/boolean.yml65
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/raw-records/decimal128.yml68
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/raw-records/dictionary.yml75
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/raw-records/int64.yml67
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/raw-records/list.yml70
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/raw-records/string.yml65
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/raw-records/timestamp.yml75
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/values/boolean.yml37
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/values/decimal128.yml38
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/values/dictionary.yml46
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/values/int64.yml37
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/values/list.yml44
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/values/string.yml38
-rw-r--r--src/arrow/ruby/red-arrow/benchmark/values/timestamp.yml49
14 files changed, 774 insertions, 0 deletions
diff --git a/src/arrow/ruby/red-arrow/benchmark/raw-records/boolean.yml b/src/arrow/ruby/red-arrow/benchmark/raw-records/boolean.yml
new file mode 100644
index 000000000..5e2551e2c
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/raw-records/boolean.yml
@@ -0,0 +1,65 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the record batch used by the benchmark entries of this file.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_rows = 1000
+ n_columns = 10
+ type = :boolean # shared by every column
+
+ fields = {} # column name => type
+ arrays = {} # column name => n_rows generated values
+ n_columns.times do |i|
+ column_name = "column_#{i}"
+ fields[column_name] = type
+ arrays[column_name] = n_rows.times.map { Faker::Boolean.boolean }
+ end
+ record_batch = Arrow::RecordBatch.new(fields, arrays)
+
+ def pure_ruby_raw_records(record_batch) # Baseline: returns an array of rows, each row an array with one cell per column.
+ n_rows = record_batch.n_rows
+ n_columns = record_batch.n_columns
+ columns = record_batch.columns # fetched once, before the loops
+ records = []
+ i = 0 # row index
+ while i < n_rows
+ record = []
+ j = 0 # column index
+ while j < n_columns
+ record << columns[j][i] # cell of column j at row i
+ j += 1
+ end
+ records << record
+ i += 1
+ end
+ records # row-major result: records[i][j]
+ end
+benchmark: # Two entries run against the same record_batch.
+ pure_ruby: |- # baseline: the hand-written loop defined in the prelude
+ pure_ruby_raw_records(record_batch)
+ raw_records: |- # the raw_records call that the baseline is compared with
+ record_batch.raw_records
diff --git a/src/arrow/ruby/red-arrow/benchmark/raw-records/decimal128.yml b/src/arrow/ruby/red-arrow/benchmark/raw-records/decimal128.yml
new file mode 100644
index 000000000..367e7c713
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/raw-records/decimal128.yml
@@ -0,0 +1,68 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the record batch used by the benchmark entries of this file.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_rows = 1000
+ n_columns = 10
+ type = Arrow::Decimal128DataType.new(10, 5) # shared by every column; presumably (precision, scale) — confirm
+
+ fields = {} # column name => type
+ arrays = {} # column name => n_rows generated values
+ n_columns.times do |i|
+ column_name = "column_#{i}"
+ fields[column_name] = type
+ arrays[column_name] = n_rows.times.map do
+ Faker::Number.decimal(l_digits: 10, r_digits: 5) # NOTE(review): 10 + 5 generated digits against a (10, 5) type — confirm the values fit
+ end
+ end
+ record_batch = Arrow::RecordBatch.new(fields, arrays)
+
+ def pure_ruby_raw_records(record_batch) # Baseline: returns an array of rows whose cells are BigDecimal values.
+ n_rows = record_batch.n_rows
+ n_columns = record_batch.n_columns
+ columns = record_batch.columns # fetched once, before the loops
+ records = []
+ i = 0 # row index
+ while i < n_rows
+ record = []
+ j = 0 # column index
+ while j < n_columns
+ x = columns[j][i] # cell of column j at row i
+ record << BigDecimal(x.to_s) # goes through the cell's string form to build the BigDecimal
+ j += 1
+ end
+ records << record
+ i += 1
+ end
+ records # row-major result: records[i][j]
+ end
+benchmark: # Two entries run against the same record_batch.
+ pure_ruby: |- # baseline: the hand-written loop defined in the prelude
+ pure_ruby_raw_records(record_batch)
+ raw_records: |- # the raw_records call that the baseline is compared with
+ record_batch.raw_records()
diff --git a/src/arrow/ruby/red-arrow/benchmark/raw-records/dictionary.yml b/src/arrow/ruby/red-arrow/benchmark/raw-records/dictionary.yml
new file mode 100644
index 000000000..151bb412f
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/raw-records/dictionary.yml
@@ -0,0 +1,75 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the record batch used by the benchmark entries of this file.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_rows = 1000
+ n_columns = 10
+ type = Arrow::DictionaryDataType.new(:int8, :string, true) # int8 indices, string values; NOTE(review): third argument presumably marks the dictionary as ordered — confirm
+
+ fields = n_columns.times.map {|i| ["column_#{i}".to_sym, type] }.to_h
+ schema = Arrow::Schema.new(**fields) # field names are passed as keyword arguments
+ dictionary = Arrow::StringArray.new(
+ 100.times.map { Faker::Book.genre }.uniq.sort # 100 draws, deduplicated and sorted, so at most 100 entries
+ )
+ indices = Arrow::Int8Array.new(
+ n_rows.times.map {
+ Faker::Number.within(range: 0 ... dictionary.length) # exclusive upper bound keeps every index inside the dictionary
+ }
+ )
+ arrays = n_columns.times.map do # every column wraps the same indices and dictionary objects
+ Arrow::DictionaryArray.new(
+ type,
+ indices,
+ dictionary,
+ )
+ end
+ record_batch = Arrow::RecordBatch.new(schema, n_rows, arrays)
+
+ def pure_ruby_raw_records(record_batch) # Baseline: returns an array of rows whose cells are read from each column's indices.
+ n_rows = record_batch.n_rows
+ n_columns = record_batch.n_columns
+ columns = record_batch.columns # fetched once, before the loops
+ records = []
+ i = 0 # row index
+ while i < n_rows
+ record = []
+ j = 0 # column index
+ while j < n_columns
+ record << columns[j].data.indices[i] # index entry for row i; .data.indices is re-evaluated for every cell
+ j += 1
+ end
+ records << record
+ i += 1
+ end
+ records # row-major result: records[i][j]
+ end
+benchmark: # Two entries run against the same record_batch.
+ pure_ruby: |- # baseline: the hand-written loop defined in the prelude
+ pure_ruby_raw_records(record_batch)
+ raw_records: |- # the raw_records call that the baseline is compared with
+ record_batch.raw_records
diff --git a/src/arrow/ruby/red-arrow/benchmark/raw-records/int64.yml b/src/arrow/ruby/red-arrow/benchmark/raw-records/int64.yml
new file mode 100644
index 000000000..bd03ab942
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/raw-records/int64.yml
@@ -0,0 +1,67 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the record batch used by the benchmark entries of this file.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_rows = 1000
+ n_columns = 10
+ type = :int64 # shared by every column
+
+ fields = {} # column name => type
+ arrays = {} # column name => n_rows generated values
+ n_columns.times do |i|
+ column_name = "column_#{i}"
+ fields[column_name] = type
+ arrays[column_name] = n_rows.times.map do
+ Faker::Number.number(digits: 18).to_i # an 18-digit decimal number is below 2**63, so it fits a signed 64-bit integer
+ end
+ end
+ record_batch = Arrow::RecordBatch.new(fields, arrays)
+
+ def pure_ruby_raw_records(record_batch) # Baseline: returns an array of rows, each row an array with one cell per column.
+ n_rows = record_batch.n_rows
+ n_columns = record_batch.n_columns
+ columns = record_batch.columns # fetched once, before the loops
+ records = []
+ i = 0 # row index
+ while i < n_rows
+ record = []
+ j = 0 # column index
+ while j < n_columns
+ record << columns[j][i] # cell of column j at row i
+ j += 1
+ end
+ records << record
+ i += 1
+ end
+ records # row-major result: records[i][j]
+ end
+benchmark: # Two entries run against the same record_batch.
+ pure_ruby: |- # baseline: the hand-written loop defined in the prelude
+ pure_ruby_raw_records(record_batch)
+ raw_records: |- # the raw_records call that the baseline is compared with
+ record_batch.raw_records
diff --git a/src/arrow/ruby/red-arrow/benchmark/raw-records/list.yml b/src/arrow/ruby/red-arrow/benchmark/raw-records/list.yml
new file mode 100644
index 000000000..b9a526710
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/raw-records/list.yml
@@ -0,0 +1,70 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the record batch used by the benchmark entries of this file.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_rows = 1000
+ n_columns = 10
+ type = Arrow::ListDataType.new(name: "values", type: :double) # list type built from a :double field named "values"; shared by every column
+
+ fields = {} # column name => type
+ arrays = {} # column name => n_rows generated lists
+ n_columns.times do |i|
+ column_name = "column_#{i}"
+ fields[column_name] = type
+ arrays[column_name] = n_rows.times.map do
+ n_elements = Faker::Number.within(range: 1 ... 100) # exclusive upper bound: 1 to 99 elements per list
+ n_elements.times.map do
+ Faker::Number.normal(mean: 0, standard_deviation: 1e+6)
+ end
+ end
+ end
+ record_batch = Arrow::RecordBatch.new(fields, arrays)
+
+ def pure_ruby_raw_records(record_batch) # Baseline: returns an array of rows, each row an array with one cell per column.
+ n_rows = record_batch.n_rows
+ n_columns = record_batch.n_columns
+ columns = record_batch.columns # fetched once, before the loops
+ records = []
+ i = 0 # row index
+ while i < n_rows
+ record = []
+ j = 0 # column index
+ while j < n_columns
+ record << columns[j][i] # cell of column j at row i
+ j += 1
+ end
+ records << record
+ i += 1
+ end
+ records # row-major result: records[i][j]
+ end
+benchmark: # Two entries run against the same record_batch.
+ pure_ruby: |- # baseline: the hand-written loop defined in the prelude
+ pure_ruby_raw_records(record_batch)
+ raw_records: |- # the raw_records call that the baseline is compared with
+ record_batch.raw_records
diff --git a/src/arrow/ruby/red-arrow/benchmark/raw-records/string.yml b/src/arrow/ruby/red-arrow/benchmark/raw-records/string.yml
new file mode 100644
index 000000000..2854a376b
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/raw-records/string.yml
@@ -0,0 +1,65 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the record batch used by the benchmark entries of this file.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_rows = 1000
+ n_columns = 10
+ type = :string # shared by every column
+
+ fields = {} # column name => type
+ arrays = {} # column name => n_rows generated values
+ n_columns.times do |i|
+ column_name = "column_#{i}"
+ fields[column_name] = type
+ arrays[column_name] = n_rows.times.map { Faker::Name.name }
+ end
+ record_batch = Arrow::RecordBatch.new(fields, arrays)
+
+ def pure_ruby_raw_records(record_batch) # Baseline: returns an array of rows, each row an array with one cell per column.
+ n_rows = record_batch.n_rows
+ n_columns = record_batch.n_columns
+ columns = record_batch.columns # fetched once, before the loops
+ records = []
+ i = 0 # row index
+ while i < n_rows
+ record = []
+ j = 0 # column index
+ while j < n_columns
+ record << columns[j][i] # cell of column j at row i
+ j += 1
+ end
+ records << record
+ i += 1
+ end
+ records # row-major result: records[i][j]
+ end
+benchmark: # Two entries run against the same record_batch.
+ pure_ruby: |- # baseline: the hand-written loop defined in the prelude
+ pure_ruby_raw_records(record_batch)
+ raw_records: |- # the raw_records call that the baseline is compared with
+ record_batch.raw_records
diff --git a/src/arrow/ruby/red-arrow/benchmark/raw-records/timestamp.yml b/src/arrow/ruby/red-arrow/benchmark/raw-records/timestamp.yml
new file mode 100644
index 000000000..9b65b790a
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/raw-records/timestamp.yml
@@ -0,0 +1,75 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the record batch used by the benchmark entries of this file.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_rows = 1000
+ n_columns = 10
+ type = Arrow::TimestampDataType.new(:micro) # microsecond unit, matching the sec * 1_000_000 + micro values built below
+ base_timestamp = Time.at(Faker::Number.within(range: 0 ... 1_000_000_000)) # random anchor, given as seconds since the epoch
+ thirty_days_in_sec = 30*24*3600
+ timestamp_range = { # window of thirty days on either side of the anchor
+ from: base_timestamp - thirty_days_in_sec,
+ to: base_timestamp + thirty_days_in_sec,
+ }
+
+ fields = {} # column name => type
+ arrays = {} # column name => n_rows generated values
+ n_columns.times do |i|
+ column_name = "column_#{i}"
+ fields[column_name] = type
+ arrays[column_name] = n_rows.times.map do
+ sec = Faker::Time.between(**timestamp_range).to_i # double splat: from:/to: must arrive as keywords; a positional Hash raises ArgumentError on Ruby 3
+ micro = Faker::Number.within(range: 0 ... 1_000_000) # sub-second part, in microseconds
+ sec * 1_000_000 + micro # integer count of microseconds
+ end
+ end
+ record_batch = Arrow::RecordBatch.new(fields, arrays)
+
+ def pure_ruby_raw_records(record_batch) # Baseline: returns an array of rows, each row an array with one cell per column.
+ n_rows = record_batch.n_rows
+ n_columns = record_batch.n_columns
+ columns = record_batch.columns # fetched once, before the loops
+ records = []
+ i = 0 # row index
+ while i < n_rows
+ record = []
+ j = 0 # column index
+ while j < n_columns
+ record << columns[j][i] # cell of column j at row i
+ j += 1
+ end
+ records << record
+ i += 1
+ end
+ records # row-major result: records[i][j]
+ end
+benchmark: # Two entries run against the same record_batch.
+ pure_ruby: |- # baseline: the hand-written loop defined in the prelude
+ pure_ruby_raw_records(record_batch)
+ raw_records: |- # the raw_records call that the baseline is compared with
+ record_batch.raw_records
diff --git a/src/arrow/ruby/red-arrow/benchmark/values/boolean.yml b/src/arrow/ruby/red-arrow/benchmark/values/boolean.yml
new file mode 100644
index 000000000..45abff523
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/values/boolean.yml
@@ -0,0 +1,37 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the array that both benchmark entries read.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_values = 1000
+ values = n_values.times.map { Faker::Boolean.boolean }
+ array = Arrow::BooleanArray.new(values)
+benchmark: # Two entries run against the same array.
+ pure_ruby: |- # baseline: materializes the elements through collect/to_a
+ array.collect.to_a
+ values: |- # the values call that the baseline is compared with
+ array.values
diff --git a/src/arrow/ruby/red-arrow/benchmark/values/decimal128.yml b/src/arrow/ruby/red-arrow/benchmark/values/decimal128.yml
new file mode 100644
index 000000000..4a2a5bff5
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/values/decimal128.yml
@@ -0,0 +1,38 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the array that both benchmark entries read.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_values = 1000
+ type = Arrow::Decimal128DataType.new(10, 5) # presumably (precision, scale) — confirm
+ values = n_values.times.map { Faker::Number.decimal(l_digits: 10, r_digits: 5) } # NOTE(review): 10 + 5 generated digits against a (10, 5) type — confirm the values fit
+ array = Arrow::Decimal128Array.new(type, values)
+benchmark: # Two entries run against the same array.
+ pure_ruby: |- # baseline: materializes the elements through collect/to_a
+ array.collect.to_a
+ values: |- # the values call that the baseline is compared with
+ array.values
diff --git a/src/arrow/ruby/red-arrow/benchmark/values/dictionary.yml b/src/arrow/ruby/red-arrow/benchmark/values/dictionary.yml
new file mode 100644
index 000000000..5b4f20dc8
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/values/dictionary.yml
@@ -0,0 +1,46 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the dictionary array that both benchmark entries read.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_values = 1000
+ type = Arrow::DictionaryDataType.new(:int8, :string, true) # int8 indices, string values; NOTE(review): third argument presumably marks the dictionary as ordered — confirm
+
+ dictionary = Arrow::StringArray.new(
+ 100.times.map { Faker::Book.genre }.uniq.sort # 100 draws, deduplicated and sorted, so at most 100 entries
+ )
+ indices = Arrow::Int8Array.new(
+ n_values.times.map {
+ Faker::Number.within(range: 0 ... dictionary.length) # exclusive upper bound keeps every index inside the dictionary
+ }
+ )
+ array = Arrow::DictionaryArray.new(type, indices, dictionary)
+benchmark: # Two entries run against the same array.
+ pure_ruby: |- # baseline: reads one index entry per position; array.indices is called on every iteration
+ array.length.times.collect {|i| array.indices[i]}
+ values: |- # the values call that the baseline is compared with
+ array.values
diff --git a/src/arrow/ruby/red-arrow/benchmark/values/int64.yml b/src/arrow/ruby/red-arrow/benchmark/values/int64.yml
new file mode 100644
index 000000000..d9e89261a
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/values/int64.yml
@@ -0,0 +1,37 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the array that both benchmark entries read.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_values = 1000
+ values = n_values.times.map { Faker::Number.number(digits: 18).to_i } # an 18-digit decimal number is below 2**63, so it fits a signed 64-bit integer
+ array = Arrow::Int64Array.new(values)
+benchmark: # Two entries run against the same array.
+ pure_ruby: |- # baseline: materializes the elements through collect/to_a
+ array.collect.to_a
+ values: |- # the values call that the baseline is compared with
+ array.values
diff --git a/src/arrow/ruby/red-arrow/benchmark/values/list.yml b/src/arrow/ruby/red-arrow/benchmark/values/list.yml
new file mode 100644
index 000000000..2764c1a61
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/values/list.yml
@@ -0,0 +1,44 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the list array that both benchmark entries read.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_values = 1000
+ type = Arrow::ListDataType.new(name: "values", type: :double) # list type built from a :double field named "values"
+
+ values = n_values.times.map do
+ n_elements = Faker::Number.within(range: 1 ... 100) # exclusive upper bound: 1 to 99 elements per list
+ n_elements.times.map do
+ Faker::Number.normal(mean: 0, standard_deviation: 1e+6)
+ end
+ end
+ array = Arrow::ListArray.new(type, values)
+benchmark: # Two entries run against the same array.
+ pure_ruby: |- # baseline: materializes the elements through collect/to_a
+ array.collect.to_a
+ values: |- # the values call that the baseline is compared with
+ array.values
diff --git a/src/arrow/ruby/red-arrow/benchmark/values/string.yml b/src/arrow/ruby/red-arrow/benchmark/values/string.yml
new file mode 100644
index 000000000..8a40deaa0
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/values/string.yml
@@ -0,0 +1,38 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the array that both benchmark entries read.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_values = 1000
+
+ values = n_values.times.map { Faker::Name.name }
+ array = Arrow::StringArray.new(values)
+benchmark: # Two entries run against the same array.
+ pure_ruby: |- # baseline: materializes the elements through collect/to_a
+ array.collect.to_a
+ values: |- # the values call that the baseline is compared with
+ array.values
diff --git a/src/arrow/ruby/red-arrow/benchmark/values/timestamp.yml b/src/arrow/ruby/red-arrow/benchmark/values/timestamp.yml
new file mode 100644
index 000000000..4af46d1db
--- /dev/null
+++ b/src/arrow/ruby/red-arrow/benchmark/values/timestamp.yml
@@ -0,0 +1,49 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+contexts: # Execution contexts for this benchmark; only "master" is declared.
+ - name: master
+ prelude: | # Context-specific setup: prepends local directories to the load path.
+ $LOAD_PATH.unshift(File.expand_path("ext/arrow")) # relative path, so it resolves against the current working directory
+ $LOAD_PATH.unshift(File.expand_path("lib")) # unshifted last, so "lib" is searched before "ext/arrow"
+prelude: |- # Shared setup: builds the timestamp array that both benchmark entries read.
+ require "arrow"
+ require "faker"
+
+ state = ENV.fetch("FAKER_RANDOM_SEED", 17).to_i # seed comes from the environment when set, otherwise 17
+ Faker::Config.random = Random.new(state) # seeded generator for Faker's random data
+
+ n_values = 1000
+ type = Arrow::TimestampDataType.new(:micro) # microsecond unit, matching the sec * 1_000_000 + micro values built below
+ base_timestamp = Time.at(Faker::Number.within(range: 0 ... 1_000_000_000)) # random anchor, given as seconds since the epoch
+ thirty_days_in_sec = 30*24*3600
+ timestamp_range = { # window of thirty days on either side of the anchor
+ from: base_timestamp - thirty_days_in_sec,
+ to: base_timestamp + thirty_days_in_sec,
+ }
+
+ values = n_values.times.map do
+ sec = Faker::Time.between(**timestamp_range).to_i # double splat: from:/to: must arrive as keywords; a positional Hash raises ArgumentError on Ruby 3
+ micro = Faker::Number.within(range: 0 ... 1_000_000) # sub-second part, in microseconds
+ sec * 1_000_000 + micro # integer count of microseconds
+ end
+ array = Arrow::TimestampArray.new(type, values)
+benchmark: # Two entries run against the same array.
+ pure_ruby: |- # baseline: materializes the elements through collect/to_a
+ array.collect.to_a
+ values: |- # the values call that the baseline is compared with
+ array.values