Files
greptimedb/tests-fuzz/src/context.rs
Weny Xu 7f47ce0e44 test: add repartition fuzz target with partition IR and translators (#7666)
* test: add repartition fuzz target with partition IR and translators

Signed-off-by: WenyXu <wenymedia@gmail.com>

* fix: fix unit tests

Signed-off-by: WenyXu <wenymedia@gmail.com>

* chore: apply suggestions

Signed-off-by: WenyXu <wenymedia@gmail.com>

---------

Signed-off-by: WenyXu <wenymedia@gmail.com>
2026-02-05 06:04:04 +00:00

426 lines
15 KiB
Rust

// Copyright 2023 Greptime Team
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
use std::sync::Arc;
use common_query::AddColumnLocation;
use datatypes::types::cast;
use rand::Rng;
use snafu::{OptionExt, ensure};
use crate::error::{self, Result};
use crate::generator::Random;
use crate::ir::alter_expr::{AlterTableOperation, AlterTableOption};
use crate::ir::create_expr::{ColumnOption, PartitionDef};
use crate::ir::partition_expr::SimplePartitions;
use crate::ir::repartition_expr::RepartitionExpr;
use crate::ir::{AlterTableExpr, Column, CreateTableExpr, Ident};
pub type TableContextRef = Arc<TableContext>;
/// TableContext stores table info.
#[derive(Debug, Clone)]
pub struct TableContext {
pub name: Ident,
pub columns: Vec<Column>,
// GreptimeDB specific options
pub partition: Option<PartitionDef>,
pub primary_keys: Vec<usize>,
pub table_options: Vec<AlterTableOption>,
}
impl From<&CreateTableExpr> for TableContext {
fn from(
CreateTableExpr {
table_name: name,
columns,
partition,
primary_keys,
..
}: &CreateTableExpr,
) -> Self {
Self {
name: name.clone(),
columns: columns.clone(),
partition: partition.clone(),
primary_keys: primary_keys.clone(),
table_options: vec![],
}
}
}
impl TableContext {
/// Returns the timestamp column
pub fn timestamp_column(&self) -> Option<Column> {
self.columns.iter().find(|c| c.is_time_index()).cloned()
}
/// Applies the [AlterTableExpr].
pub fn alter(mut self, expr: AlterTableExpr) -> Result<TableContext> {
match expr.alter_kinds {
AlterTableOperation::AddColumn { column, location } => {
ensure!(
!self.columns.iter().any(|col| col.name == column.name),
error::UnexpectedSnafu {
violated: format!("Column {} exists", column.name),
}
);
match location {
Some(AddColumnLocation::First) => {
let mut columns = Vec::with_capacity(self.columns.len() + 1);
columns.push(column);
columns.extend(self.columns);
self.columns = columns;
}
Some(AddColumnLocation::After { column_name }) => {
let index = self
.columns
.iter()
// TODO(weny): find a better way?
.position(|col| col.name.to_string() == column_name)
.context(error::UnexpectedSnafu {
violated: format!("Column: {column_name} not found"),
})?;
self.columns.insert(index + 1, column);
}
None => self.columns.push(column),
}
// Re-generates the primary_keys
self.primary_keys = self
.columns
.iter()
.enumerate()
.flat_map(|(idx, col)| {
if col.is_primary_key() {
Some(idx)
} else {
None
}
})
.collect();
Ok(self)
}
AlterTableOperation::DropColumn { name } => {
self.columns.retain(|col| col.name != name);
// Re-generates the primary_keys
self.primary_keys = self
.columns
.iter()
.enumerate()
.flat_map(|(idx, col)| {
if col.is_primary_key() {
Some(idx)
} else {
None
}
})
.collect();
Ok(self)
}
AlterTableOperation::RenameTable { new_table_name } => {
ensure!(
new_table_name != self.name,
error::UnexpectedSnafu {
violated: "The new table name is equal the current name",
}
);
self.name = new_table_name;
Ok(self)
}
AlterTableOperation::ModifyDataType { column } => {
if let Some(idx) = self.columns.iter().position(|col| col.name == column.name) {
self.columns[idx].column_type = column.column_type.clone();
for opt in self.columns[idx].options.iter_mut() {
if let ColumnOption::DefaultValue(value) = opt {
*value = cast(value.clone(), &column.column_type).unwrap();
}
}
}
Ok(self)
}
AlterTableOperation::SetTableOptions { options } => {
for option in options {
if let Some(idx) = self
.table_options
.iter()
.position(|opt| opt.key() == option.key())
{
self.table_options[idx] = option;
} else {
self.table_options.push(option);
}
}
Ok(self)
}
AlterTableOperation::UnsetTableOptions { keys } => {
self.table_options
.retain(|opt| !keys.contains(&opt.key().to_string()));
Ok(self)
}
}
}
pub fn repartition(mut self, expr: RepartitionExpr) -> Result<TableContext> {
match expr {
RepartitionExpr::Split(split) => {
let partition_def = self.partition.as_mut().expect("expected partition def");
let insert_pos = partition_def
.exprs
.iter()
.position(|expr| expr == &split.target)
.unwrap();
partition_def.exprs[insert_pos] = split.into[0].clone();
partition_def
.exprs
.insert(insert_pos + 1, split.into[1].clone());
}
RepartitionExpr::Merge(merge) => {
let partition_def = self.partition.as_mut().expect("expected partition def");
let removed_idx = partition_def
.exprs
.iter()
.position(|expr| expr == &merge.targets[0])
.unwrap();
let mut partitions = SimplePartitions::from_exprs(
partition_def.columns[0].clone(),
&partition_def.exprs,
)?;
partitions.remove_bound(removed_idx)?;
partition_def.exprs = partitions.generate()?;
}
}
Ok(self)
}
pub fn generate_unique_column_name<R: Rng>(
&self,
rng: &mut R,
generator: &dyn Random<Ident, R>,
) -> Ident {
let mut name = generator.generate(rng);
while self.columns.iter().any(|col| col.name.value == name.value) {
name = generator.generate(rng);
}
name
}
pub fn generate_unique_table_name<R: Rng>(
&self,
rng: &mut R,
generator: &dyn Random<Ident, R>,
) -> Ident {
let mut name = generator.generate(rng);
while self.name.value == name.value {
name = generator.generate(rng);
}
name
}
}
#[cfg(test)]
mod tests {
use common_query::AddColumnLocation;
use common_time::Duration;
use datatypes::data_type::ConcreteDataType;
use datatypes::value::Value;
use rand::SeedableRng;
use super::TableContext;
use crate::generator::Generator;
use crate::generator::create_expr::CreateTableExprGeneratorBuilder;
use crate::ir::alter_expr::{AlterTableOperation, AlterTableOption, Ttl};
use crate::ir::create_expr::ColumnOption;
use crate::ir::partition_expr::SimplePartitions;
use crate::ir::repartition_expr::{MergePartitionExpr, RepartitionExpr, SplitPartitionExpr};
use crate::ir::{AlterTableExpr, Column, Ident};
#[test]
fn test_table_context_alter() {
let table_ctx = TableContext {
name: "foo".into(),
columns: vec![],
partition: None,
primary_keys: vec![],
table_options: vec![],
};
// Add a column
let expr = AlterTableExpr {
table_name: "foo".into(),
alter_kinds: AlterTableOperation::AddColumn {
column: Column {
name: "a".into(),
column_type: ConcreteDataType::timestamp_microsecond_datatype(),
options: vec![ColumnOption::PrimaryKey],
},
location: None,
},
};
let table_ctx = table_ctx.alter(expr).unwrap();
assert_eq!(table_ctx.columns[0].name, Ident::new("a"));
assert_eq!(table_ctx.primary_keys, vec![0]);
// Add a column at first
let expr = AlterTableExpr {
table_name: "foo".into(),
alter_kinds: AlterTableOperation::AddColumn {
column: Column {
name: "b".into(),
column_type: ConcreteDataType::timestamp_microsecond_datatype(),
options: vec![ColumnOption::PrimaryKey],
},
location: Some(AddColumnLocation::First),
},
};
let table_ctx = table_ctx.alter(expr).unwrap();
assert_eq!(table_ctx.columns[0].name, Ident::new("b"));
assert_eq!(table_ctx.primary_keys, vec![0, 1]);
// Add a column after "b"
let expr = AlterTableExpr {
table_name: "foo".into(),
alter_kinds: AlterTableOperation::AddColumn {
column: Column {
name: "c".into(),
column_type: ConcreteDataType::timestamp_microsecond_datatype(),
options: vec![ColumnOption::PrimaryKey],
},
location: Some(AddColumnLocation::After {
column_name: "b".into(),
}),
},
};
let table_ctx = table_ctx.alter(expr).unwrap();
assert_eq!(table_ctx.columns[1].name, Ident::new("c"));
assert_eq!(table_ctx.primary_keys, vec![0, 1, 2]);
// Drop the column "b"
let expr = AlterTableExpr {
table_name: "foo".into(),
alter_kinds: AlterTableOperation::DropColumn { name: "b".into() },
};
let table_ctx = table_ctx.alter(expr).unwrap();
assert_eq!(table_ctx.columns[1].name, Ident::new("a"));
assert_eq!(table_ctx.primary_keys, vec![0, 1]);
// Set table options
let ttl_option = AlterTableOption::Ttl(Ttl::Duration(Duration::new_second(60)));
let expr = AlterTableExpr {
table_name: "foo".into(),
alter_kinds: AlterTableOperation::SetTableOptions {
options: vec![ttl_option.clone()],
},
};
let table_ctx = table_ctx.alter(expr).unwrap();
assert_eq!(table_ctx.table_options.len(), 1);
assert_eq!(table_ctx.table_options[0], ttl_option);
// Unset table options
let expr = AlterTableExpr {
table_name: "foo".into(),
alter_kinds: AlterTableOperation::UnsetTableOptions {
keys: vec![ttl_option.key().to_string()],
},
};
let table_ctx = table_ctx.alter(expr).unwrap();
assert_eq!(table_ctx.table_options.len(), 0);
}
#[test]
fn test_apply_split_partition_expr() {
let mut rng = rand_chacha::ChaCha8Rng::seed_from_u64(0);
let expr = CreateTableExprGeneratorBuilder::default()
.columns(10)
.partition(10)
.if_not_exists(true)
.engine("mito2")
.build()
.unwrap()
.generate(&mut rng)
.unwrap();
let mut table_ctx = TableContext::from(&expr);
// "age < 10"
// "age >= 10 AND age < 20"
// "age >= 20" (SPLIT) INTO (age >= 20 AND age < 30, age >= 30)
let partitions = SimplePartitions::new(
table_ctx.partition.as_ref().unwrap().columns[0].clone(),
vec![Value::from(10), Value::from(20)],
)
.generate()
.unwrap();
// "age < 10"
// "age >= 10 AND age < 20"
// "age >= 20" AND age < 30"
// "age >= 30"
let expected_exprs = SimplePartitions::new(
table_ctx.partition.as_ref().unwrap().columns[0].clone(),
vec![Value::from(10), Value::from(20), Value::from(30)],
)
.generate()
.unwrap();
table_ctx.partition.as_mut().unwrap().exprs = partitions.clone();
let table_ctx = table_ctx
.repartition(RepartitionExpr::Split(SplitPartitionExpr {
table_name: expr.table_name.clone(),
target: partitions.last().unwrap().clone(),
into: vec![expected_exprs[2].clone(), expected_exprs[3].clone()],
}))
.unwrap();
let partition_def = table_ctx.partition.as_ref().unwrap();
assert_eq!(partition_def.exprs, expected_exprs);
}
#[test]
fn test_apply_merge_partition_expr() {
let mut rng = rand_chacha::ChaCha8Rng::seed_from_u64(0);
let expr = CreateTableExprGeneratorBuilder::default()
.columns(10)
.partition(10)
.if_not_exists(true)
.engine("mito2")
.build()
.unwrap()
.generate(&mut rng)
.unwrap();
let mut table_ctx = TableContext::from(&expr);
// "age < 10"
// "age >= 10 AND age < 20" (MERGE)
// "age >= 20" (MERGE)
let partitions = SimplePartitions::new(
table_ctx.partition.as_ref().unwrap().columns[0].clone(),
vec![Value::from(10), Value::from(20)],
)
.generate()
.unwrap();
// "age < 10"
// "age >= 10
let expected_exprs = SimplePartitions::new(
table_ctx.partition.as_ref().unwrap().columns[0].clone(),
vec![Value::from(10)],
)
.generate()
.unwrap();
table_ctx.partition.as_mut().unwrap().exprs = partitions.clone();
let table_ctx = table_ctx
.repartition(RepartitionExpr::Merge(MergePartitionExpr {
table_name: expr.table_name.clone(),
targets: vec![partitions[1].clone(), partitions[2].clone()],
}))
.unwrap();
let partition_def = table_ctx.partition.as_ref().unwrap();
assert_eq!(partition_def.exprs, expected_exprs);
}
}