Skip to content

Commit 519cd3d

Browse files
committed
feat: support create table with map type
support cast improve check
1 parent 7e3a095 commit 519cd3d

File tree

15 files changed

+227
-37
lines changed

15 files changed

+227
-37
lines changed

e2e_test/batch/distribution_mode.slt

+1-1
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ SET RW_IMPLICIT_FLUSH TO true;
44
statement ok
55
SET QUERY_MODE TO distributed;
66

7-
include ./basic/*.slt.part
7+
include ./basic/**/*.slt.part
88
include ./duckdb/all.slt.part
99
include ./order/*.slt.part
1010
include ./join/*.slt.part

e2e_test/batch/local_mode.slt

+1-1
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ SET RW_IMPLICIT_FLUSH TO true;
44
statement ok
55
SET QUERY_MODE TO local;
66

7-
include ./basic/*.slt.part
7+
include ./basic/**/*.slt.part
88
include ./duckdb/all.slt.part
99
include ./order/*.slt.part
1010
include ./join/*.slt.part

e2e_test/batch/types/list.slt.part

-2
This file was deleted.

e2e_test/batch/types/map.slt.part

+120
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,120 @@
1+
statement ok
2+
SET RW_IMPLICIT_FLUSH TO true;
3+
4+
5+
statement error
6+
create table t (m map (float, float));
7+
----
8+
db error: ERROR: Failed to run the query
9+
10+
Caused by:
11+
invalid map key type: double precision
12+
13+
14+
query error
15+
select map_from_entries(array[1.0,2.0,3.0], array[1,2,3]);
16+
----
17+
db error: ERROR: Failed to run the query
18+
19+
Caused by these errors (recent errors listed first):
20+
1: Failed to bind expression: map_from_entries(ARRAY[1.0, 2.0, 3.0], ARRAY[1, 2, 3])
21+
2: Expr error
22+
3: invalid map key type: numeric
23+
24+
25+
query error
26+
select map_from_entries(array[1,1,3], array[1,2,3]);
27+
----
28+
db error: ERROR: Failed to run the query
29+
30+
Caused by these errors (recent errors listed first):
31+
1: Expr error
32+
2: error while evaluating expression `map('{1,1,3}', '{1,2,3}')`
33+
3: map keys must be unique
34+
35+
36+
query ?
37+
select map_from_entries(array[1,2,3], array[1,null,3]);
38+
----
39+
{"1":1,"2":NULL,"3":3}
40+
41+
42+
query error
43+
select map_from_entries(array[1,null,3], array[1,2,3]);
44+
----
45+
db error: ERROR: Failed to run the query
46+
47+
Caused by these errors (recent errors listed first):
48+
1: Expr error
49+
2: error while evaluating expression `map('{1,NULL,3}', '{1,2,3}')`
50+
3: map keys must not be NULL
51+
52+
53+
query error
54+
select map_from_entries(array[1,3], array[1,2,3]);
55+
----
56+
db error: ERROR: Failed to run the query
57+
58+
Caused by these errors (recent errors listed first):
59+
1: Expr error
60+
2: error while evaluating expression `map('{1,3}', '{1,2,3}')`
61+
3: map keys and values have different length
62+
63+
64+
query error
65+
select map_from_entries(array[1,2], array[1,2]) = map_from_entries(array[2,1], array[2,1]);
66+
----
67+
db error: ERROR: Failed to run the query
68+
69+
Caused by these errors (recent errors listed first):
70+
1: Failed to bind expression: map_from_entries(ARRAY[1, 2], ARRAY[1, 2]) = map_from_entries(ARRAY[2, 1], ARRAY[2, 1])
71+
2: function equal(map(integer,integer), map(integer,integer)) does not exist
72+
73+
74+
statement ok
75+
create table t (
76+
m1 map(varchar, float),
77+
m2 map(int, bool),
78+
m3 map(varchar, map(varchar, varchar)),
79+
l map(varchar,int)[],
80+
s struct<m map(varchar, struct<x int>)>,
81+
);
82+
83+
84+
statement ok
85+
insert into t values (
86+
map_from_entries(array['a','b','c'], array[1.0,2.0,3.0]::float[]),
87+
map_from_entries(array[1,2,3], array[true,false,true]),
88+
map_from_entries(array['a','b'],
89+
array[
90+
map_from_entries(array['a1'], array['a2']),
91+
map_from_entries(array['b1'], array['b2'])
92+
]
93+
),
94+
array[
95+
map_from_entries(array['a','b','c'], array[1,2,3]),
96+
map_from_entries(array['d','e','f'], array[4,5,6])
97+
],
98+
row(
99+
map_from_entries(array['a','b','c'], array[row(1),row(2),row(3)]::struct<x int>[])
100+
)
101+
);
102+
103+
# cast(map(character varying,integer)) -> map(character varying,double precision)
104+
query ?
105+
select map_from_entries(array['a','b','c'], array[1,2,3])::map(varchar,float);
106+
----
107+
{"a":1,"b":2,"c":3}
108+
109+
110+
statement ok
111+
insert into t(m1) values (map_from_entries(array['a','b','c'], array[1,2,3]));
112+
113+
query ????? rowsort
114+
select * from t;
115+
----
116+
{"a":1,"b":2,"c":3} NULL NULL NULL NULL
117+
{"a":1,"b":2,"c":3} {"1":t,"2":f,"3":t} {"a":{"a1":a2},"b":{"b1":b2}} {"{\"a\":1,\"b\":2,\"c\":3}","{\"d\":4,\"e\":5,\"f\":6}"} ("{""a"":(1),""b"":(2),""c"":(3)}")
118+
119+
statement ok
120+
drop table t;

e2e_test/batch/types/struct.slt.part

-1
This file was deleted.

src/expr/impl/src/scalar/cast.rs

+12-1
Original file line numberDiff line numberDiff line change
@@ -21,7 +21,7 @@ use itertools::Itertools;
2121
use risingwave_common::array::{ArrayImpl, DataChunk, ListRef, ListValue, StructRef, StructValue};
2222
use risingwave_common::cast;
2323
use risingwave_common::row::OwnedRow;
24-
use risingwave_common::types::{Int256, JsonbRef, ToText, F64};
24+
use risingwave_common::types::{Int256, JsonbRef, MapRef, MapValue, ToText, F64};
2525
use risingwave_common::util::iter_util::ZipEqFast;
2626
use risingwave_expr::expr::{build_func, Context, ExpressionBoxExt, InputRefExpression};
2727
use risingwave_expr::{function, ExprError, Result};
@@ -241,6 +241,17 @@ fn struct_cast(input: StructRef<'_>, ctx: &Context) -> Result<StructValue> {
241241
Ok(StructValue::new(fields))
242242
}
243243

244+
/// Cast array with `source_elem_type` into array with `target_elem_type` by casting each element.
245+
#[function("cast(anymap) -> anymap", type_infer = "panic")]
246+
fn map_cast(map: MapRef<'_>, ctx: &Context) -> Result<MapValue> {
247+
let new_ctx = Context {
248+
arg_types: vec![ctx.arg_types[0].clone().as_map().clone().into_list()],
249+
return_type: ctx.return_type.as_map().clone().into_list(),
250+
variadic: ctx.variadic,
251+
};
252+
list_cast(map.into_inner(), &new_ctx).map(MapValue::from_list_entries)
253+
}
254+
244255
#[cfg(test)]
245256
mod tests {
246257
use chrono::NaiveDateTime;

src/frontend/planner_test/tests/testdata/output/insert.yaml

+10-2
Original file line numberDiff line numberDiff line change
@@ -80,7 +80,11 @@
8080
sql: |
8181
create table t (v1 real, v2 int);
8282
insert into t values (22.33, true);
83-
binder_error: 'Bind error: cannot cast type "boolean" to "integer" in Assign context'
83+
binder_error: |
84+
failed to cast the 2nd column
85+
86+
Caused by:
87+
cannot cast type "boolean" to "integer" in Assign context
8488
- name: simple insert
8589
sql: |
8690
create table t (v1 int, v2 int);
@@ -175,7 +179,11 @@
175179
sql: |
176180
create table t (v1 timestamp, v2 real);
177181
insert into t select time '01:02:03', 4.5 from t;
178-
binder_error: 'Bind error: cannot cast type "time without time zone" to "timestamp without time zone" in Assign context'
182+
binder_error: |
183+
failed to cast the 1st column
184+
185+
Caused by:
186+
cannot cast type "time without time zone" to "timestamp without time zone" in Assign context
179187
- name: insert into select mismatch columns length
180188
sql: |
181189
create table t (v1 int, v2 real);

src/frontend/src/binder/expr/mod.rs

+6-1
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
1414

1515
use itertools::Itertools;
1616
use risingwave_common::catalog::{ColumnDesc, ColumnId, PG_CATALOG_SCHEMA_NAME};
17-
use risingwave_common::types::DataType;
17+
use risingwave_common::types::{DataType, MapType};
1818
use risingwave_common::util::iter_util::zip_eq_fast;
1919
use risingwave_common::{bail_no_function, bail_not_implemented, not_implemented};
2020
use risingwave_pb::plan_common::{AdditionalColumn, ColumnDescVersion};
@@ -999,6 +999,11 @@ pub fn bind_data_type(data_type: &AstDataType) -> Result<DataType> {
999999
.collect::<Result<Vec<_>>>()?,
10001000
types.iter().map(|f| f.name.real_value()).collect_vec(),
10011001
),
1002+
AstDataType::Map(kv) => {
1003+
let key = bind_data_type(&kv.0)?;
1004+
let value = bind_data_type(&kv.1)?;
1005+
DataType::Map(MapType::try_from_kv(key, value)?)
1006+
}
10021007
AstDataType::Custom(qualified_type_name) => {
10031008
let idents = qualified_type_name
10041009
.0

src/frontend/src/binder/insert.rs

+18-4
Original file line numberDiff line numberDiff line change
@@ -14,6 +14,7 @@
1414

1515
use std::collections::{BTreeMap, HashMap, HashSet};
1616

17+
use anyhow::Context;
1718
use itertools::Itertools;
1819
use risingwave_common::catalog::{ColumnCatalog, Schema, TableVersionId};
1920
use risingwave_common::types::DataType;
@@ -26,6 +27,7 @@ use crate::binder::{Binder, Clause};
2627
use crate::catalog::TableId;
2728
use crate::error::{ErrorCode, Result, RwError};
2829
use crate::expr::{ExprImpl, InputRef};
30+
use crate::handler::create_mv::ordinal;
2931
use crate::user::UserId;
3032

3133
#[derive(Debug, Clone)]
@@ -197,7 +199,7 @@ impl Binder {
197199
let bound_query;
198200
let cast_exprs;
199201

200-
let bounded_column_nums = match source.as_simple_values() {
202+
let bound_column_nums = match source.as_simple_values() {
201203
None => {
202204
bound_query = self.bind_query(source)?;
203205
let actual_types = bound_query.data_types();
@@ -234,7 +236,7 @@ impl Binder {
234236
cols_to_insert_in_table.len()
235237
};
236238

237-
let (err_msg, default_column_indices) = match num_target_cols.cmp(&bounded_column_nums) {
239+
let (err_msg, default_column_indices) = match num_target_cols.cmp(&bound_column_nums) {
238240
std::cmp::Ordering::Equal => (None, default_column_indices),
239241
std::cmp::Ordering::Greater => {
240242
if has_user_specified_columns {
@@ -248,7 +250,7 @@ impl Binder {
248250
// insert into t values (7)
249251
// this kind of usage is fine, null values will be provided
250252
// implicitly.
251-
(None, col_indices_to_insert.split_off(bounded_column_nums))
253+
(None, col_indices_to_insert.split_off(bound_column_nums))
252254
}
253255
}
254256
std::cmp::Ordering::Less => {
@@ -312,10 +314,22 @@ impl Binder {
312314
let msg = match expected_types.len().cmp(&exprs.len()) {
313315
std::cmp::Ordering::Less => "INSERT has more expressions than target columns",
314316
_ => {
317+
let expr_len = exprs.len();
315318
return exprs
316319
.into_iter()
317320
.zip_eq_fast(expected_types.iter().take(expr_num))
318-
.map(|(e, t)| e.cast_assign(t.clone()).map_err(Into::into))
321+
.enumerate()
322+
.map(|(i, (e, t))| {
323+
let res = e.cast_assign(t.clone());
324+
if expr_len > 1 {
325+
res.with_context(|| {
326+
format!("failed to cast the {} column", ordinal(i + 1))
327+
})
328+
.map_err(Into::into)
329+
} else {
330+
res.map_err(Into::into)
331+
}
332+
})
319333
.try_collect();
320334
}
321335
};

src/frontend/src/binder/select.rs

+2-2
Original file line numberDiff line numberDiff line change
@@ -714,8 +714,8 @@ fn data_type_to_alias(data_type: &AstDataType) -> Option<String> {
714714
AstDataType::Jsonb => "jsonb".to_string(),
715715
AstDataType::Array(ty) => return data_type_to_alias(ty),
716716
AstDataType::Custom(ty) => format!("{}", ty),
717-
AstDataType::Struct(_) => {
718-
// Note: Postgres doesn't have anonymous structs
717+
AstDataType::Struct(_) | AstDataType::Map(_) => {
718+
// Note: Postgres doesn't have maps and anonymous structs
719719
return None;
720720
}
721721
};

src/frontend/src/expr/type_inference/cast.rs

+12
Original file line numberDiff line numberDiff line change
@@ -114,6 +114,7 @@ pub fn align_array_and_element(
114114
pub fn cast_ok(source: &DataType, target: &DataType, allows: CastContext) -> bool {
115115
cast_ok_struct(source, target, allows)
116116
|| cast_ok_array(source, target, allows)
117+
|| cast_ok_map(source, target, allows)
117118
|| cast_ok_base(source, target, allows)
118119
}
119120

@@ -161,6 +162,17 @@ fn cast_ok_array(source: &DataType, target: &DataType, allows: CastContext) -> b
161162
}
162163
}
163164

165+
fn cast_ok_map(source: &DataType, target: &DataType, allows: CastContext) -> bool {
166+
match (source, target) {
167+
(DataType::Map(source_elem), DataType::Map(target_elem)) => cast_ok(
168+
&source_elem.clone().into_list(),
169+
&target_elem.clone().into_list(),
170+
allows,
171+
),
172+
_ => false,
173+
}
174+
}
175+
164176
pub fn cast_map_array() -> Vec<(DataTypeName, DataTypeName, CastContext)> {
165177
CAST_MAP
166178
.iter()

src/frontend/src/handler/create_mv.rs

+1-1
Original file line numberDiff line numberDiff line change
@@ -278,7 +278,7 @@ It only indicates the physical clustering of the data, which may improve the per
278278
))
279279
}
280280

281-
fn ordinal(i: usize) -> String {
281+
pub fn ordinal(i: usize) -> String {
282282
let s = i.to_string();
283283
let suffix = if s.ends_with('1') && !s.ends_with("11") {
284284
"st"

src/sqlparser/src/ast/data_type.rs

+5
Original file line numberDiff line numberDiff line change
@@ -70,6 +70,8 @@ pub enum DataType {
7070
Array(Box<DataType>),
7171
/// Structs
7272
Struct(Vec<StructField>),
73+
/// Map(key_type, value_type)
74+
Map(Box<(DataType, DataType)>),
7375
}
7476

7577
impl fmt::Display for DataType {
@@ -110,6 +112,9 @@ impl fmt::Display for DataType {
110112
DataType::Struct(defs) => {
111113
write!(f, "STRUCT<{}>", display_comma_separated(defs))
112114
}
115+
DataType::Map(kv) => {
116+
write!(f, "MAP({},{})", kv.0, kv.1)
117+
}
113118
}
114119
}
115120
}

src/sqlparser/src/parser.rs

+1-2
Original file line numberDiff line numberDiff line change
@@ -3632,8 +3632,7 @@ impl Parser<'_> {
36323632
.parse_next(self)
36333633
}
36343634

3635-
/// Parse a SQL datatype (in the context of a CREATE TABLE statement for example) and convert
3636-
/// into an array of that datatype if needed
3635+
/// Parse a SQL datatype (in the context of a CREATE TABLE statement for example)
36373636
pub fn parse_data_type(&mut self) -> PResult<DataType> {
36383637
parser_v2::data_type(self)
36393638
}

0 commit comments

Comments
 (0)