1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
use std::convert::TryInto;
use parquet_format_async_temp::SchemaElement;
use crate::error::{ParquetError, Result};
use super::super::types::{
converted_to_group_converted, converted_to_primitive_converted, type_to_physical_type,
ParquetType,
};
impl ParquetType {
pub fn try_from_thrift(elements: &[&SchemaElement]) -> Result<ParquetType> {
let mut index = 0;
let mut schema_nodes = Vec::new();
while index < elements.len() {
let t = from_thrift_helper(elements, index)?;
index = t.0;
schema_nodes.push(t.1);
}
if schema_nodes.len() != 1 {
return Err(general_err!(
"Expected exactly one root node, but found {}",
schema_nodes.len()
));
}
Ok(schema_nodes.remove(0))
}
}
fn from_thrift_helper(elements: &[&SchemaElement], index: usize) -> Result<(usize, ParquetType)> {
let is_root_node = index == 0;
let element = elements[index];
let name = element.name.clone();
let converted_type = element.converted_type;
let logical_type = &element.logical_type;
let field_id = element.field_id;
match element.num_children {
None | Some(0) => {
let repetition = element
.repetition_type
.ok_or_else(|| {
general_err!("Repetition level must be defined for a primitive type")
})?
.try_into()
.unwrap();
let physical_type = element.type_.ok_or_else(|| {
general_err!("Physical type must be defined for a primitive type")
})?;
let length = element.type_length;
let physical_type = type_to_physical_type(&physical_type, length)?;
let converted_type = match converted_type {
Some(converted_type) => Some({
let maybe_decimal = match (element.precision, element.scale) {
(Some(precision), Some(scale)) => Some((precision, scale)),
(None, None) => None,
_ => {
return Err(general_err!(
"When precision or scale are defined, both must be defined"
))
}
};
converted_to_primitive_converted(&converted_type, maybe_decimal)?
}),
None => None,
};
let tp = ParquetType::try_from_primitive(
name,
physical_type,
repetition,
converted_type,
logical_type.clone(),
field_id,
)?;
Ok((index + 1, tp))
}
Some(n) => {
let repetition = element.repetition_type.map(|x| x.try_into().unwrap());
let mut fields = vec![];
let mut next_index = index + 1;
for _ in 0..n {
let child_result = from_thrift_helper(elements, next_index)?;
next_index = child_result.0;
fields.push(child_result.1);
}
let tp = if is_root_node {
ParquetType::new_root(name, fields)
} else {
let converted_type = match converted_type {
Some(converted_type) => Some(converted_to_group_converted(&converted_type)?),
None => None,
};
ParquetType::from_converted(name, fields, repetition, converted_type, field_id)
};
Ok((next_index, tp))
}
}
}