Home > mailing lists

Selecting and deleting duplicate rows - Mailing list pgsql-sql

From	Clark Evans
Subject	Selecting and deleting duplicate rows
Date	March 30, 1999 15:36:57
Msg-id	37013500.DFF0A64A@manhattanproject.com Whole thread Raw
In response to	regexp strangeness (Andrew Merrill <andrew@compclass.com>)
List	pgsql-sql

Tree view

This is a question I've seen a few times, and
had to research, so I figured I'd share the
answer.


-------------------------------------------------


-- Rebuild the demo table from scratch.  The drop reports an error on the
-- very first run, when the table does not exist yet.
drop table test;
--
create table test ( a text, b text );
--  unique values: one row for each (a, b) combination
insert into test (a, b) values ('x', 'y');
insert into test (a, b) values ('x', 'x');
insert into test (a, b) values ('y', 'y');
insert into test (a, b) values ('y', 'x');
-- duplicate values: a second copy of each combination
insert into test (a, b) values ('x', 'y');
insert into test (a, b) values ('x', 'x');
insert into test (a, b) values ('y', 'y');
insert into test (a, b) values ('y', 'x');
-- a third copy of ('x', 'y'), so one combination occurs three times
insert into test (a, b) values ('x', 'y');
--
-- Show the starting contents together with each row's oid.
-- NOTE(review): every query in this script reads the system column oid;
--               confirm the target server still exposes it on user tables
--               (PostgreSQL 12 and later no longer do).
--
select oid, a, b from test;
--
-- select duplicate rows
--
-- A row is reported when another row with the same (a, b) pair and a
-- lower oid exists, so the lowest-oid copy of each pair is not listed.
-- Rows holding NULL in a or b are never reported, because an equality
-- comparison against NULL is not true.
--
select o.oid, o.a, o.b
  from test o
 where exists ( select 'x'
                  from test i
                 where i.a = o.a
                   and i.b = o.b
                   and i.oid < o.oid );
 
--
-- delete duplicate rows
--
-- A row is removed when a twin with the same (a, b) pair and a lower oid
-- exists, which leaves exactly the lowest-oid row of every pair.
--
-- Note: this script assumes a PostgreSQL version that doesn't support
--       an alias on the table named in the from clause of a delete,
--       so the outer row is referenced through the bare table name.
--
delete from test
 where exists ( select 'x'
                  from test twin
                 where twin.oid < test.oid
                   and twin.a = test.a
                   and twin.b = test.b );

--
-- Check the result: each (a, b) pair should now appear once.
--

select oid, a, b
  from test;

--
-- Delete duplicates with respect to a only, ignoring the value in b.
-- The previous delete kept the row with the lowest oid in each group;
-- here the comparison is flipped to >, so a row is removed whenever a
-- peer with the same a and a higher oid exists.  That keeps the row
-- with the highest oid for every value of a.
--

delete from test
 where exists ( select 'x'
                  from test peer
                 where peer.oid > test.oid
                   and peer.a = test.a );


--
-- Check the result: each value of a should now appear once.
--

select oid, a, b
  from test;

pgsql-sql by date:

From: Andrew Merrill
Date: 30 March 1999, 13:13:16
Subject: Re: [SQL] indexing a datetime by date

From: Chairudin Sentosa
Date: 30 March 1999, 23:34:20
Subject: TO_CHAR or TO_DATE

Selecting and deleting duplicate rows - Mailing list pgsql-sql

Previous

Next