Flink SQL 知其所以然之去重：不仅仅有 Count Distinct，还有强大的 Deduplication
-- Deduplication: for each id, keep only the first row when ordered by processing time.
-- `timestamp` is a reserved keyword in Flink SQL, so the column name is escaped with backticks.
SELECT
    id,
    `timestamp`,
    page,
    param1,
    param2,
    paramN
FROM (
    SELECT
        id,
        `timestamp`,
        page,
        param1,
        param2,
        paramN,
        -- proctime is the processing-time attribute, i.e. PROCTIME() in the source table
        ROW_NUMBER() OVER (PARTITION BY id ORDER BY proctime) AS rn
    FROM source_table
)
WHERE rn = 1
1.2.3.4.5.6.7.8.9.10.11.12.13.14.15.16.17.18.19.
THE END