zoukankan      html  css  js  c++  java
  • SQL查询和删除重复字段的内容

    --例如: 
    id           NAME         VALUE 
    1               a                 pp 
    2               a                 pp 
    3               b                 iii 
    4               b                 pp 
    5               b                 pp 
    6               c                 pp 
    7               c                 pp 
    8               c                 iii 
    --id是主键 
    --要求得到这样的结果 
    id           NAME         VALUE 
    1               a                 pp 
    3               b                 iii 
    4               b                 pp 
    6               c                 pp 
    8               c                 iii
    
    --方法1
    DELETE YourTable
    WHERE  [id] NOT   IN (SELECT MAX([id])
                          FROM   YourTable
                          GROUP BY
                                 (NAME + VALUE)) 
           
    --方法2
    
    DELETE a
    FROM   表 a
           LEFT   JOIN (
                    SELECT id = MIN(id)
                    FROM   表
                    GROUP BY
                           NAME,
                           VALUE
                )b
                ON  a.id = b.id
    WHERE  b.id IS NULL 
           
           
           
    --查询及删除重复记录的SQL语句
    --查询及删除重复记录的SQL语句
    --1、查找表中多余的重复记录,重复记录是根据单个字段(peopleId)来判断
    
    SELECT *
    FROM   people
    WHERE  peopleId IN (SELECT peopleId
                        FROM   people
                        GROUP BY
                               peopleId
                        HAVING COUNT(peopleId) > 1)
    --2、删除表中多余的重复记录,重复记录是根据单个字段(peopleId)来判断,只留有rowid最小的记录
    
    DELETE 
    FROM   people
    WHERE  peopleId IN (SELECT peopleId
                        FROM   people
                        GROUP BY
                               peopleId
                        HAVING COUNT(peopleId) > 1)
           AND rowid NOT IN (SELECT MIN(rowid)
                             FROM   people
                             GROUP BY
                                    peopleId
                             HAVING COUNT(peopleId) > 1)
    --3、查找表中多余的重复记录(多个字段)
    
    SELECT *
    FROM   vitae a
    WHERE  (a.peopleId, a.seq) IN (SELECT peopleId,
                                          seq
                                   FROM   vitae
                                   GROUP BY
                                          peopleId,
                                          seq
                                   HAVING COUNT(*) > 1)
    --4、删除表中多余的重复记录(多个字段),只留有rowid最小的记录
    
    DELETE 
    FROM   vitae a
    WHERE  (a.peopleId, a.seq) IN (SELECT peopleId,
                                          seq
                                   FROM   vitae
                                   GROUP BY
                                          peopleId,
                                          seq
                                   HAVING COUNT(*) > 1)
           AND rowid NOT IN (SELECT MIN(rowid)
                             FROM   vitae
                             GROUP BY
                                    peopleId,
                                    seq
                             HAVING COUNT(*) > 1)
               
    --5、查找表中多余的重复记录(多个字段),不包含rowid最小的记录
    
    SELECT *
    FROM   vitae a
    WHERE  (a.peopleId, a.seq) IN (SELECT peopleId,
                                          seq
                                   FROM   vitae
                                   GROUP BY
                                          peopleId,
                                          seq
                                   HAVING COUNT(*) > 1)
           AND rowid NOT IN (SELECT MIN(rowid)
                             FROM   vitae
                             GROUP BY
                                    peopleId,
                                    seq
                             HAVING COUNT(*) > 1)
    --(二)
    --比方说
    --在A表中存在一个字段“name”,
    --而且不同记录之间的“name”值有可能会相同,
    --现在就是需要查询出在该表中的各记录之间,“name”值存在重复的项;
    
    SELECT NAME,
           COUNT(*)
    FROM   A
    GROUP BY
           NAME
    HAVING COUNT(*) > 1
    
    --如果还查性别也相同大则如下:
    
    SELECT NAME,
           sex,
           COUNT(*)
    FROM   A
    GROUP BY
           NAME,
           sex
    HAVING COUNT(*) > 1(三)
    --方法一
    
    DECLARE @max     integer,
            @id      integer
    
    DECLARE cur_rows CURSOR LOCAL 
    FOR
        SELECT 主字段,
               COUNT(*)
        FROM   表名
        GROUP BY
               主字段
        HAVING COUNT(*) > ; 1
    
    OPEN cur_rows
    FETCH cur_rows INTO @id,@max
    WHILE @@fetch_status = 0
    BEGIN
        SELECT @max = @max -1
        SET ROWCOUNT @max
        DELETE 
        FROM   表名
        WHERE  主字段 = @id
        
        FETCH cur_rows INTO @id,@max
    END
    CLOSE cur_rows
    SET ROWCOUNT 0
        
    --方法二
    --"重复记录"有两个意义上的重复记录,一是完全重复的记录,也即所有字段均重复的记录,二是部分关键字段重复的记录,比如Name字段重复,而其他字段不一定重复或都重复可以忽略。
    --1、对于第一种重复,比较容易解决,使用
    
    SELECT DISTINCT * 
    FROM   tableName
    --就可以得到无重复记录的结果集。
    --如果该表需要删除重复的记录(重复记录保留1条),可以按以下方法删除
    
    SELECT DISTINCT * INTO #Tmp
    FROM   tableName
    
    DROP TABLE tableName
    SELECT * INTO tableName
    FROM   #Tmp
    
    DROP TABLE #Tmp
    --发生这种重复的原因是表设计不周产生的,增加唯一索引列即可解决。
    --2、这类重复问题通常要求保留重复记录中的第一条记录,操作方法如下
    --假设有重复的字段为Name,Address,要求得到这两个字段唯一的结果集
    SELECT IDENTITY(INT, 1, 1)  AS autoID,
           * INTO #Tmp
    FROM                           tableName
    
    SELECT MIN(autoID) AS autoID INTO #Tmp2
    FROM   #Tmp
    GROUP BY
           NAME,
           autoID
    
    SELECT *
    FROM   #Tmp
    WHERE  autoID IN (SELECT autoID
                      FROM   #tmp2)
    --最后一个select即得到了Name,Address不重复的结果集(但多了一个autoID字段,实际写时可以写在select子句中省去此列)(四)
    --查询重复
    
    SELECT *
    FROM   tablename
    WHERE  id IN (SELECT id
                  FROM   tablename
                  GROUP BY
                         id
                  HAVING COUNT(id) > 1)

  • 相关阅读:
    Java 虚拟机部分面试题
    Java 多线程部分面试题
    Java IO部分面试题
    Java 集合框架部分面试题
    Java 面向对象面试题
    Java 多线程同步的五种方法
    Python操作redis
    Python操作mysql
    Python操作mongodb
    数据处理的全过程---(获取数据-清洗数据-数据建模-数据可视化)
  • 原文地址:https://www.cnblogs.com/smartsmile/p/6234264.html
Copyright © 2011-2022 走看看