DDL语句 - 《clickhouse》

普通表
临时表
分区表
视图
分布式表
表操作

普通表

目前只有MergeTree、Merge和Distributed这三类表引擎支持ALTER查询,所以在进行alter操作的时候注意表的引擎。

所在建表的时候一般要求指定表的引擎

# 建表方式1
# 表引擎为MergeTree时需要指定主键primary key和排序order by 当两个字段一致时可以省略primary key关键字
create table student (
s_id Int8,
s_name String,
s_birth DateTime,
s_sex Int8
)
engine = MergeTree()
order by s_id;
# 建表方式2 - 复制student表的表结构
create table if not exists student_copy as student engine=MergeTree() order by s_id;
# 建表方式3 - 通过select查询的方式创建表, 同时也会导入查询的结果数据
create table if not exists student_select engine = MergeTree() primary key s_id order by s_id as select * from student;
insert into student values(s);

临时表

创建临时表的方法是在普通表的基础之上添加 temporary关键字，相比普通表而言，临时表需要注意一下三点特殊之处。

只支持Memory 表引擎
临时表不属于任何数据库
会话断开以后表删除 ,不会持久化
如果本地表和临时表冲突 , 临时表优先

# 临时表不需要指定引擎
create temporary table student (
s_id Int8,
s_name String,
s_birth DateTime,
s_sex Int8
);

分区表

目前只有MergeTree家族系列的表引擎才支持数据分区。分区的目的或概念和hive一致。

create table student_partition (
s_id Int8,
s_name String,
s_birth DateTime
)
engine = MergeTree()
partition by toDate(s_birth)
order by s_id;
insert into student_partition values
(1,'张三1','2021-07-07 01:13:12'),
(2,'张三2','2021-07-26 11:00:21'),
(3,'张三3','2021-07-25 11:00:21'),
(4,'张三4','2021-07-27 11:00:21'),
(5,'张三5','2021-07-25 11:00:21'),
(6,'张三6','2021-07-27 11:00:21');
# 查询分区状态
select table ,name , partition , path from system.parts where table = 'student_partition' ;
# 删除分区, 并且分区中分数据也会被删除
alter table student_partition drop partition '2021-07-27';
# 分区的卸载与装载，常用于分区数据的迁移和备份场景。
# 卸载 ：会将数据移动到表目录下的detached目录，同时clickhouse不会在管理这些数据。
alter table log2 detach partition '2021-07-27';
# 装载：会将分区移cdetached目录
alter table log2 attach partition '2021-07-27' ; # 装载以后数据就会被加载到表下

视图

视图分为普通视图和物化视图，其中物化视图拥有独立的存储，而普通视图只是一层简单的查询代理。

# 普通视图
# 普通视图不会存储任何数据，它只是一层单纯的 SELECT 查询映射，起着简化查询、明晰语义的作用，对查询性能不会有任何增强
create view student_view as select s_id*2,s_name,s_sex from student;
select * from student_view;
select * from student_view where s_sex = '男';
# 物化视图
# 物化视图支持表引擎，数据保存形式由它的表引擎决定，创建物化视图的完整语法如下所示
create materialized view mv_log engine=Log populate as select * from plog;
# 物化视图创建好之后，如果源表被写入新数据，那么物化视图也会同步更新
# 如果在创建视图时添加了populates关键字的话会把源表数据同步到物化视图中，不加则反之，并只会同步之后写入源表的数据
# 视图目前并不支持同步删除，如果在源表中删除了数据，物化视图的数据仍会保留
# 物化视图就是一种特殊的表

分布式表

不存储数据，是本地表的代理

# Distributed的参数
# ck_cluster:集群名称；
# my_db:库名；
# my_table:表名，要求各个实例中库名、表名相同；
# rand():选择路由分片的方式。或者指定分片
CREATE TABLE log_test_all (
     ts  DateTime,
     uid String,
     biz String
) ENGINE= Distributed(ck_cluster, my_db, my_table, rand());

表操作

# 查看建表语句
show create table student;
# 修改表结构
# 1.添加字段
alter table student add column age UInt32 [after s_name(在s_name字段后添加)];
# 2.修改字段
alter table student modify column age UInt8;
# 3.删除字段    
alter table student dorp column age;
# 4.字段添加/修改注释
alter table student comment column age '年龄';
# 5.修改表名或者移动表到另一个数据库
rename table student to student1/[数据库].student
# 删除表
drop table if exists student