Skip to content

Commit 9ab7bb0

Browse files
committed
clippy fixes
1 parent da66845 commit 9ab7bb0

File tree

5 files changed

+37
-46
lines changed

5 files changed

+37
-46
lines changed

parquet/benches/metadata.rs

Lines changed: 21 additions & 23 deletions
Original file line number | Diff line number | Diff line change
@@ -15,6 +15,8 @@
1515
// specific language governing permissions and limitations
1616
// under the License.
1717

18+
#[cfg(feature = "arrow")]
19+
use parquet::file::metadata::ParquetMetaData;
1820
use parquet::file::metadata::ParquetMetaDataReader;
1921
use rand::Rng;
2022
use thrift::protocol::TCompactOutputProtocol;
@@ -164,7 +166,7 @@ fn get_footer_bytes(data: Bytes) -> Bytes {
164166
}
165167

166168
#[cfg(feature = "arrow")]
167-
fn rewrite_file(bytes: Bytes) -> (Bytes, FileMetaData) {
169+
fn rewrite_file(bytes: Bytes) -> (Bytes, ParquetMetaData) {
168170
use arrow::array::RecordBatchReader;
169171
use parquet::arrow::{arrow_reader::ParquetRecordBatchReaderBuilder, ArrowWriter};
170172
use parquet::file::properties::{EnabledStatistics, WriterProperties};
@@ -242,40 +244,36 @@ fn criterion_benchmark(c: &mut Criterion) {
242244
#[cfg(feature = "arrow")]
243245
c.bench_function("page headers", |b| {
244246
b.iter(|| {
245-
metadata.row_groups.iter().for_each(|rg| {
246-
rg.columns.iter().for_each(|col| {
247-
if let Some(col_meta) = &col.meta_data {
248-
if let Some(dict_offset) = col_meta.dictionary_page_offset {
249-
parquet::thrift::bench_page_header(
250-
&file_bytes.slice(dict_offset as usize..),
251-
);
252-
}
247+
for rg in metadata.row_groups() {
248+
for col in rg.columns() {
249+
if let Some(dict_offset) = col.dictionary_page_offset() {
253250
parquet::thrift::bench_page_header(
254-
&file_bytes.slice(col_meta.data_page_offset as usize..),
251+
&file_bytes.slice(dict_offset as usize..),
255252
);
256253
}
257-
});
258-
});
254+
parquet::thrift::bench_page_header(
255+
&file_bytes.slice(col.data_page_offset() as usize..),
256+
);
257+
}
258+
}
259259
})
260260
});
261261

262262
#[cfg(feature = "arrow")]
263263
c.bench_function("page headers (no stats)", |b| {
264264
b.iter(|| {
265-
metadata.row_groups.iter().for_each(|rg| {
266-
rg.columns.iter().for_each(|col| {
267-
if let Some(col_meta) = &col.meta_data {
268-
if let Some(dict_offset) = col_meta.dictionary_page_offset {
269-
parquet::thrift::bench_page_header_no_stats(
270-
&file_bytes.slice(dict_offset as usize..),
271-
);
272-
}
265+
for rg in metadata.row_groups() {
266+
for col in rg.columns() {
267+
if let Some(dict_offset) = col.dictionary_page_offset() {
273268
parquet::thrift::bench_page_header_no_stats(
274-
&file_bytes.slice(col_meta.data_page_offset as usize..),
269+
&file_bytes.slice(dict_offset as usize..),
275270
);
276271
}
277-
});
278-
});
272+
parquet::thrift::bench_page_header_no_stats(
273+
&file_bytes.slice(col.data_page_offset() as usize..),
274+
);
275+
}
276+
}
279277
})
280278
});
281279
}

parquet/src/file/metadata/thrift_gen.rs

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1444,7 +1444,7 @@ impl WriteThrift for ColumnChunkMetaData {
14441444
// only write the ColumnMetaData if we haven't already encrypted it
14451445
if self.encrypted_column_metadata.is_none() {
14461446
writer.write_field_begin(FieldType::Struct, 3, last_field_id)?;
1447-
serialize_column_meta_data(&self, writer)?;
1447+
serialize_column_meta_data(self, writer)?;
14481448
last_field_id = 3;
14491449
}
14501450

@@ -1488,7 +1488,7 @@ impl WriteThrift for ColumnChunkMetaData {
14881488

14891489
// always write the ColumnMetaData
14901490
writer.write_field_begin(FieldType::Struct, 3, last_field_id)?;
1491-
serialize_column_meta_data(&self, writer)?;
1491+
serialize_column_meta_data(self, writer)?;
14921492
last_field_id = 3;
14931493

14941494
if let Some(offset_idx_off) = self.offset_index_offset() {

parquet/src/file/metadata/writer.rs

Lines changed: 10 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -433,8 +433,9 @@ impl<'a, W: Write> ParquetMetaDataWriter<'a, W> {
433433
fn convert_column_indexes(&self) -> Option<Vec<Vec<Option<ColumnIndexMetaData>>>> {
434434
// FIXME(ets): we're converting from ParquetColumnIndex to vec<vec<option>>,
435435
// but then converting back to ParquetColumnIndex in the end. need to unify this.
436-
if let Some(row_group_column_indexes) = self.metadata.column_index() {
437-
Some(
436+
self.metadata
437+
.column_index()
438+
.map(|row_group_column_indexes| {
438439
(0..self.metadata.row_groups().len())
439440
.map(|rg_idx| {
440441
let column_indexes = &row_group_column_indexes[rg_idx];
@@ -443,16 +444,14 @@ impl<'a, W: Write> ParquetMetaDataWriter<'a, W> {
443444
.map(|column_index| Some(column_index.clone()))
444445
.collect()
445446
})
446-
.collect(),
447-
)
448-
} else {
449-
None
450-
}
447+
.collect()
448+
})
451449
}
452450

453451
fn convert_offset_index(&self) -> Option<Vec<Vec<Option<OffsetIndexMetaData>>>> {
454-
if let Some(row_group_offset_indexes) = self.metadata.offset_index() {
455-
Some(
452+
self.metadata
453+
.offset_index()
454+
.map(|row_group_offset_indexes| {
456455
(0..self.metadata.row_groups().len())
457456
.map(|rg_idx| {
458457
let offset_indexes = &row_group_offset_indexes[rg_idx];
@@ -461,11 +460,8 @@ impl<'a, W: Write> ParquetMetaDataWriter<'a, W> {
461460
.map(|offset_index| Some(offset_index.clone()))
462461
.collect()
463462
})
464-
.collect(),
465-
)
466-
} else {
467-
None
468-
}
463+
.collect()
464+
})
469465
}
470466
}
471467

parquet/src/file/writer.rs

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -2098,7 +2098,7 @@ mod tests {
20982098
unenc_size,
20992099
meta_data.unencoded_byte_array_data_bytes().unwrap()
21002100
);
2101-
check_def_hist(&meta_data.definition_level_histogram().unwrap().values());
2101+
check_def_hist(meta_data.definition_level_histogram().unwrap().values());
21022102

21032103
// check that the read metadata is also correct
21042104
let options = ReadOptionsBuilder::new().with_page_index().build();

parquet/src/schema/types.rs

Lines changed: 3 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -1125,13 +1125,10 @@ pub(crate) fn num_nodes(tp: &TypePtr) -> usize {
11251125

11261126
pub(crate) fn count_nodes(tp: &TypePtr, n_nodes: &mut usize) {
11271127
*n_nodes += 1;
1128-
match tp.as_ref() {
1129-
Type::GroupType { ref fields, .. } => {
1130-
for f in fields {
1131-
count_nodes(f, n_nodes);
1132-
}
1128+
if let Type::GroupType { ref fields, .. } = tp.as_ref() {
1129+
for f in fields {
1130+
count_nodes(f, n_nodes);
11331131
}
1134-
_ => (),
11351132
}
11361133
}
11371134

0 commit comments

Comments
 (0)