sql分组后二次汇总(处理表重复记录查询和删除)的实现方法

程序员文章站 2022-03-02 23:30:02

--处理表重复记录(查询和删除) /*******************************************************************...

--处理表重复记录(查询和删除)
/******************************************************************************************************************************************************
1、num、name相同的重复值记录,没有大小关系只保留一条
2、name相同,id有大小关系时,保留大或小其中一个记录
整理人：中国风(roy)

日期:2008.06.06
******************************************************************************************************************************************************/

--1、用于查询重复处理记录(如果列没有大小关系时2000用生成自增列和临时表处理,sql2005用row_number函数处理)

--> --> (roy)生成測試數據

if not object_id('tempdb..#t') is null
 drop table #t
go
create table #t([id] int,[name] nvarchar(1),[memo] nvarchar(2))
insert #t
select 1,n'a',n'a1' union all
select 2,n'a',n'a2' union all
select 3,n'a',n'a3' union all
select 4,n'b',n'b1' union all
select 5,n'b',n'b2'
go

--i、name相同id最小的记录(推荐用1,2,3),方法3在sql05时，效率高于1、2
方法1:
select * from #t a where not exists(select 1 from #t where name=a.name and id<a.id)

方法2:
select a.* from #t a join (select min(id)id,name from #t group by name) b on a.name=b.name and a.id=b.id

方法3:
select * from #t a where id=(select min(id) from #t where name=a.name)

方法4:
select a.* from #t a join #t b on a.name=b.name and a.id>=b.id group by a.id,a.name,a.memo having count(1)=1

方法5:
select * from #t a group by id,name,memo having id=(select min(id)from #t where name=a.name)

方法6:
select * from #t a where (select count(1) from #t where name=a.name and id<a.id)=0

方法7:
select * from #t a where id=(select top 1 id from #t where name=a.name order by id)

方法8:
select * from #t a where id!>all(select id from #t where name=a.name)

方法9(注:id为唯一时可用):
select * from #t a where id in(select min(id) from #t group by name)

--sql2005:

方法10:
select id,name,memo from (select *,min(id)over(partition by name) as minid from #t a)t where id=minid

方法11:

select id,name,memo from (select *,row_number()over(partition by name order by id) as minid from #t a)t where minid=1

生成结果:
/*
id          name memo
----------- ---- ----
1           a    a1
4           b    b1

(2 行受影响)
*/

--ii、name相同id最大的记录,与min相反:
方法1:
select * from #t a where not exists(select 1 from #t where name=a.name and id>a.id)

方法2:
select a.* from #t a join (select max(id)id,name from #t group by name) b on a.name=b.name and a.id=b.id order by id

方法3:
select * from #t a where id=(select max(id) from #t where name=a.name) order by id

方法4:
select a.* from #t a join #t b on a.name=b.name and a.id<=b.id group by a.id,a.name,a.memo having count(1)=1

方法5:
select * from #t a group by id,name,memo having id=(select max(id)from #t where name=a.name)

方法6:
select * from #t a where (select count(1) from #t where name=a.name and id>a.id)=0

方法7:
select * from #t a where id=(select top 1 id from #t where name=a.name order by id desc)

方法8:
select * from #t a where id!<all(select id from #t where name=a.name)

方法9(注:id为唯一时可用):
select * from #t a where id in(select max(id) from #t group by name)

--sql2005:

方法10:
select id,name,memo from (select *,max(id)over(partition by name) as minid from #t a)t where id=minid

方法11:
select id,name,memo from (select *,row_number()over(partition by name order by id desc) as minid from #t a)t where minid=1

生成结果2:
/*
id          name memo
----------- ---- ----
3           a    a3
5           b    b2

(2 行受影响)
*/

--2、删除重复记录有大小关系时,保留大或小其中一个记录

--> --> (roy)生成測試數據

if not object_id('tempdb..#t') is null
drop table #t
go
create table #t([id] int,[name] nvarchar(1),[memo] nvarchar(2))
insert #t
select 1,n'a',n'a1' union all
select 2,n'a',n'a2' union all
select 3,n'a',n'a3' union all
select 4,n'b',n'b1' union all
select 5,n'b',n'b2'
go

--i、name相同id最小的记录(推荐用1,2,3),保留最小一条
方法1:
delete a from #t a where exists(select 1 from #t where name=a.name and id<a.id)

方法2:
delete a from #t a left join (select min(id)id,name from #t group by name) b on a.name=b.name and a.id=b.id where b.id is null

方法3:
delete a from #t a where id not in (select min(id) from #t where name=a.name)

方法4(注:id为唯一时可用):
delete a from #t a where id not in(select min(id)from #t group by name)

方法5:
delete a from #t a where (select count(1) from #t where name=a.name and id<a.id)>0

方法6:
delete a from #t a where id<>(select top 1 id from #t where name=a.name order by id)

方法7:
delete a from #t a where id>any(select id from #t where name=a.name)

select * from #t

生成结果:
/*
id          name memo
----------- ---- ----
1           a    a1
4           b    b1

(2 行受影响)
*/

--ii、name相同id保留最大的一条记录:

方法1:
delete a from #t a where exists(select 1 from #t where name=a.name and id>a.id)

方法2:
delete a from #t a left join (select max(id)id,name from #t group by name) b on a.name=b.name and a.id=b.id where b.id is null

方法3:
delete a from #t a where id not in (select max(id) from #t where name=a.name)

方法4(注:id为唯一时可用):
delete a from #t a where id not in(select max(id)from #t group by name)

方法5:
delete a from #t a where (select count(1) from #t where name=a.name and id>a.id)>0

方法6:
delete a from #t a where id<>(select top 1 id from #t where name=a.name order by id desc)

方法7:
delete a from #t a where id<any(select id from #t where name=a.name)

select * from #t
/*
id          name memo
----------- ---- ----
3           a    a3
5           b    b2

(2 行受影响)
*/

--3、删除重复记录没有大小关系时，处理重复值

--> --> (roy)生成測試數據

if not object_id('tempdb..#t') is null
drop table #t
go
create table #t([num] int,[name] nvarchar(1))
insert #t
select 1,n'a' union all
select 1,n'a' union all
select 1,n'a' union all
select 2,n'b' union all
select 2,n'b'
go

方法1:
if object_id('tempdb..#') is not null
drop table #
select distinct * into # from #t--排除重复记录结果集生成临时表#

truncate table #t--清空表

insert #t select * from # --把临时表#插入到表#t中

--查看结果
select * from #t

/*
num         name
----------- ----
1           a
2           b

(2 行受影响)
*/

--重新执行测试数据后用方法2
方法2:

alter table #t add id int identity--新增标识列
go
delete a from #t a where exists(select 1 from #t where num=a.num and name=a.name and id>a.id)--只保留一条记录
go
alter table #t drop column id--删除标识列

--查看结果
select * from #t

/*
num         name
----------- ----
1           a
2           b

(2 行受影响)

--重新执行测试数据后用方法3
方法3:
declare roy_cursor cursor local for
select count(1)-1,num,name from #t group by num,name having count(1)>1
declare @con int,@num int,@name nvarchar(1)
open roy_cursor
fetch next from roy_cursor into @con,@num,@name
while @@fetch_status=0
begin
    set rowcount @con;
    delete #t where num=@num and name=@name
    set rowcount 0;
    fetch next from roy_cursor into @con,@num,@name
end
close roy_cursor
deallocate roy_cursor

--查看结果
select * from #t
/*
num         name
----------- ----
1           a
2           b

(2 行受影响)

上一篇： PHP全栈开发工程师学习路线图（各编程语言的关系和学习顺序图解）

下一篇：聊聊Navicat统计的行数竟然和表实际行数不一致的问题