CREATE TABLE `orders` (
`o_orderkey` int(11) NOT NULL COMMENT "",
`o_orderdate` date NOT NULL COMMENT "",
`o_custkey` int(11) NOT NULL COMMENT "",
`o_orderstatus` varchar(1) NOT NULL COMMENT "",
`o_totalprice` decimal64(15, 2) NOT NULL COMMENT "",
`o_orderpriority` varchar(15) NOT NULL COMMENT "",
`o_clerk` varchar(15) NOT NULL COMMENT "",
`o_shippriority` int(11) NOT NULL COMMENT "",
`o_comment` varchar(79) NOT NULL COMMENT ""
) ENGINE=OLAP
DUPLICATE KEY(`o_orderkey`, `o_orderdate`)
COMMENT "OLAP"
DISTRIBUTED BY HASH(`o_orderkey`) BUCKETS 96
PROPERTIES (
"replication_num" = "1",
"colocate_with" = "tpch2",
"in_memory" = "false",
"enable_persistent_index" = "false",
"replicated_storage" = "true",
"fast_schema_evolution" = "true",
"compression" = "LZ4"
);
mysql> select sum(o_totalprice) from (select o_totalprice from orders order by o_orderkey limit 5000, 100) as a;
+-------------------+
| sum(o_totalprice) |
+-------------------+
| 14504084.88 |
+-------------------+
1 row in set (0.08 sec)
mysql> select sum(o_totalprice) from (select o_totalprice from orders order by o_orderkey limit 5000, 100) as a;
+-------------------+
| sum(o_totalprice) |
+-------------------+
| 14504084.88 |
+-------------------+
1 row in set (0.09 sec)
mysql> select sum(o_totalprice) from (select o_totalprice from orders order by o_totalprice limit 5000, 100) as a;
+-------------------+
| sum(o_totalprice) |
+-------------------+
| 94215.72 |
+-------------------+
1 row in set (0.18 sec)
mysql> select sum(o_totalprice) from (select o_totalprice from orders order by o_totalprice limit 5000, 100) as a;
+-------------------+
| sum(o_totalprice) |
+-------------------+
| 94215.72 |
+-------------------+
1 row in set (0.14 sec)
mysql> select sum(o_totalprice) from (select o_totalprice from orders order by o_orderdate limit 5000, 100) as a;
+-------------------+
| sum(o_totalprice) |
+-------------------+
| 16296704.62 |
+-------------------+
1 row in set (0.17 sec)
mysql> select sum(o_totalprice) from (select o_totalprice from orders order by o_orderdate limit 5000, 100) as a;
+-------------------+
| sum(o_totalprice) |
+-------------------+
| 16303416.82 |
+-------------------+
1 row in set (0.15 sec)
从结果中可以看到,order by UPC 排序后累加的结果是一致的,4次结果都是19908,order by create_date 每次的结果都不相同21663,19344,18457, 15856,那么是什么原因导致的使用 order by create_date 排序,每次查询结果都有差异呢?
原因为 StarRocks 采用分布式存储数据,一条分页语句在查询执行过程中,一个 job 会把多个 task 任务分发到多个 BE 中并发的查询 tablet 中数据,最后进行数据的汇总,由于 order by 指定的列区分度低,导致查询时每个节点返回的数据顺序不一样,这样某条数据在第 N 页和 N+1 页查询都被命中,导致最终的排序结果不一样,所以最后累加的结果不一致。
解决方案:提高 order by 后指定列的区分度,在建表时我们新增了一个类似 MySQL 中 id 特性的字段,在分页查询时,除指定业务需要排序的列以外,另加上此 id 列,保证查询的数据整体是有序的。