--合并结果集 --1.union all SELECT * FROM emp WHERE empno=7369 UNION ALL--单纯合并 SELECT * FROM emp WHERE empno=7369; --2.union SELECT * FROM emp WHERE empno=7369 UNION --将重复结果集合并 SELECT * FROM emp WHERE empno=7369; --------------使用命令窗口执行,查看union与or的执行计划 SQL> alter session set "_b_tree_bitmap_plans" = FALSE; SQL> explain plan for select empno,ename from emp where empno =7788 or ename='SCOTT'; SQL> select * from table(dbms_xplan.display); SQL> explain plan for select empno,ename from emp where empno=7788 UNION select empno,ename from emp where ename = 'SCOTT'; SQL> select * from table(dbms_xplan.display); --可见union会使用索引 --union会强制将结果集进行合并,从而使数据出现错误 SQL> select empno,deptno from emp where mgr=7698 order by 1; EMPNO DEPTNO ----- ------ 7499 30 7521 30 7654 30 7844 30 7900 30 SQL> select empno,deptno from emp where job='SALESMAN' order by 1; EMPNO DEPTNO ----- ------ 7499 30 7521 30 7654 30 7844 30 --从上面两条语句看出有4条结果重复,看看union和or的区别 SQL> select deptno from emp where mgr=7698 or job='SALESMAN'; DEPTNO ------ 30 30 30 30 30 SQL> select deptno from emp where mgr=7698 2 union 3 select deptno from emp where job='SALESMAN'; DEPTNO ------ 30 /************************************************************************************************************************************** * 结论: * 1.不仅两个数据集间重复的数据会被去重,而且单个数据集里重复的数据也会被去重; * 2.有重复数据的数据集用union后得到的数据与预期会不一致; * 3.可以这样,select deptno from (select empno,deptno from emp where mgr=7698 union select empno,deptno from emp where job='SALESMAN') * 或者将empno改为rowid也行。 **************************************************************************************************************************************/ --4.[inner] join与= SELECT e.empno,e.ename,d.dname,d.loc FROM emp e INNER JOIN dept d ON (e.deptno=d.deptno) WHERE e.deptno=10; SELECT e.empno,e.ename,d.dname,d.loc FROM emp e,dept d WHERE e.deptno=d.deptno AND e.deptno=10;--以上两句结果相同,但join是SQL-92标准,可以清晰反应表与表之间的关联关系,推荐使用join --5.in、exists和inner join CREATE TABLE emp2 AS--创建相关table SELECT ename,job,sal,comm FROM emp WHERE job = 'CLERK'; --6.要求查询与emp2相匹配的emp中的数据,可以使用in、exists或inner join SELECT * FROM emp WHERE (ename,job,sal) IN (SELECT ename,job,sal FROM emp2); SELECT * FROM emp a WHERE EXISTS (SELECT NULL FROM emp2 b WHERE b.ename=a.ename AND b.job=a.job AND b.sal=a.sal); SELECT * FROM emp a INNER JOIN emp2 b ON (b.ename=a.ename AND b.job=a.job AND b.sal=a.sal); /******************************************************************************************************** * 结论: * 1.以上三条语句可以返回相同条数的结果集; * 2.通过查看plan可以看出,exists和in都使用了HASH JOIN SEMI(哈希半连接)而inner join使用了哈希连接; * 3.exists和in的执行效率是一样的,如果不确定,可以通过查看plan来判断,不要死记硬背。 ********************************************************************************************************/ --7.内、左、右、外连接 --建立测试表 --左表 DROP TABLE L; CREATE TABLE L AS SELECT 'L_1' AS str,'1' AS v FROM dual UNION ALL SELECT 'L_2','2' AS v FROM dual UNION ALL SELECT 'L_3','3' AS v FROM dual UNION ALL SELECT 'L_4','4' AS v FROM dual; --右表 DROP TABLE R; CREATE TABLE R AS SELECT 'R_3' AS str,'3' AS v,1 AS STATUS FROM dual UNION ALL SELECT 'R_4','4' AS v,0 AS STATUS FROM dual UNION ALL SELECT 'R_5','5' AS v,0 AS STATUS FROM dual UNION ALL SELECT 'R_6','6' AS v,0 AS STATUS FROM dual; --INNER JOIN SELECT l.str AS l_str,r.str AS r_str FROM l INNER JOIN r ON l.v=r.v ORDER BY 1,2; SELECT l.str AS l_str,r.str AS r_str FROM l,r WHERE l.v=r.v ORDER BY 1,2; --LEFT JOIN SELECT l.str AS l_str,r.str AS r_str FROM l LEFT JOIN r ON l.v=r.v ORDER BY 1,2; SELECT l.str AS l_str,r.str AS r_str FROM l,r WHERE l.v=r.v(+) ORDER BY 1,2; --RIGHT JOIN SELECT l.str AS l_str,r.str AS r_str FROM l RIGHT JOIN r ON l.v=r.v ORDER BY 1,2; SELECT l.str AS l_str,r.str AS r_str FROM l,r WHERE l.v(+)=r.v ORDER BY 1,2; --FULL JOIN SELECT l.str AS l_str,r.str AS r_str FROM l FULL JOIN r ON l.v=r.v ORDER BY 1,2; --8.自连接 SELECT a.empno,a.ename,b.ename mgr,a.deptno FROM emp a,emp b WHERE a.mgr=b.empno(+) ORDER BY a.empno; --9.NOT IN,NOT EXISTS和LEFT JOIN SELECT * FROM DEPT WHERE DEPTNO NOT IN(SELECT DEPTNO FROM EMP WHERE EMP.DEPTNO IS NOT NULL); SELECT * FROM DEPT WHERE NOT EXISTS (SELECT NULL FROM EMP WHERE EMP.DEPTNO = DEPT.DEPTNO); SELECT DEPT.* FROM DEPT LEFT JOIN EMP ON EMP.DEPTNO=DEPT.DEPTNO WHERE EMP.DEPTNO IS NULL; --10.外连接中的条件 --沿用7的测试表,查询左表所有内容,使用V关联右表,但只显示右表中STATUS为1的值,期望结果如下: STR STR --- --- L_1 L_2 L_3 R_3 L_4 --错误写法: SELECT L.STR,R.STR FROM L LEFT JOIN R ON(L.V=R.V) WHERE R.STATUS=1 ORDER BY 1; PLAN_TABLE_OUTPUT -------------------------------------------------------------------------------- Plan hash value: 688663707 ---------------------------------------------------------------------------- | Id | Operation | Name | Rows | Bytes | Cost (%CPU)| Time | ---------------------------------------------------------------------------- | 0 | SELECT STATEMENT | | 1 | 27 | 8 (25)| 00:00:01 | | 1 | SORT ORDER BY | | 1 | 27 | 8 (25)| 00:00:01 | |* 2 | HASH JOIN | | 1 | 27 | 7 (15)| 00:00:01 | |* 3 | TABLE ACCESS FULL| R | 1 | 21 | 3 (0)| 00:00:01 | | 4 | TABLE ACCESS FULL| L | 4 | 24 | 3 (0)| 00:00:01 | ---------------------------------------------------------------------------- Predicate Information (identified by operation id): --------------------------------------------------- 2 - access("L"."V"="R"."V") 3 - filter("R"."STATUS"=1) Note ----- PLAN_TABLE_OUTPUT -------------------------------------------------------------------------------- - dynamic sampling used for this statement 21 rows selected --正确写法: SELECT L.STR,R.STR FROM L LEFT JOIN R ON (L.V=R.V AND R.STATUS=1) ORDER BY 1; PLAN_TABLE_OUTPUT -------------------------------------------------------------------------------- Plan hash value: 2310059642 ---------------------------------------------------------------------------- | Id | Operation | Name | Rows | Bytes | Cost (%CPU)| Time | ---------------------------------------------------------------------------- | 0 | SELECT STATEMENT | | 4 | 108 | 8 (25)| 00:00:01 | | 1 | SORT ORDER BY | | 4 | 108 | 8 (25)| 00:00:01 | |* 2 | HASH JOIN OUTER | | 4 | 108 | 7 (15)| 00:00:01 | | 3 | TABLE ACCESS FULL| L | 4 | 24 | 3 (0)| 00:00:01 | |* 4 | TABLE ACCESS FULL| R | 1 | 21 | 3 (0)| 00:00:01 | ---------------------------------------------------------------------------- Predicate Information (identified by operation id): --------------------------------------------------- 2 - access("L"."V"="R"."V"(+)) 4 - filter("R"."STATUS"(+)=1) Note ----- PLAN_TABLE_OUTPUT -------------------------------------------------------------------------------- - dynamic sampling used for this statement 21 rows selected /*外层条件不要随便加,会影响结果集*/ --11.检测两个表中的数据及对应数据的条数是否相同 CREATE OR REPLACE VIEW V AS SELECT * FROM EMP WHERE DEPTNO != 10 UNION ALL SELECT * FROM EMP WHERE ENAME='SCOTT'; --要求查处视图V与表EMP中不同的数据(注意:视图中'SCOTT'有两行数据,而EMP表中只有一条数据) --分析:除了EMP表中DEPTNO为10的数据,还有ENAME为SCOTT的数据与V中不一致,因为EMP表中只有一条而V中有两条 SELECT * FROM (SELECT EMPNO,ENAME,COUNT(*) AS CNT FROM V GROUP BY EMPNO,ENAME) V --加一列统计条数用以区分不同 FULL JOIN (SELECT EMPNO,ENAME,COUNT(*) AS CNT FROM EMP GROUP BY EMPNO,ENAME) E ON V.EMPNO=E.EMPNO AND V.CNT=E.CNT WHERE V.EMPNO IS NULL OR E.EMPNO IS NULL; EMPNO ENAME CNT EMPNO ENAME CNT ---------- ---------- ---------- ----- ---------- ---------- 7788 SCOTT 2 7782 CLARK 1 7839 KING 1 7788 SCOTT 1 7934 MILLER 1 --12.聚集与内连接 CREATE TABLE EMP_BONUS (EMPNO INT,RECEIVED DATE,TYPE INT); INSERT INTO EMP_BONUS VALUES (7934,DATE '2005-5-17',1); INSERT INTO EMP_BONUS VALUES (7934,DATE '2005-2-15',2); INSERT INTO EMP_BONUS VALUES (7839,DATE '2005-5-17',3); INSERT INTO EMP_BONUS VALUES (7782,DATE '2005-5-17',1); --要求返回上述员工的工资及奖金,奖金根据TYPE来定,TYPE为1,奖金为10%... SELECT E.DEPTNO,E.EMPNO,E.ENAME,E.SAL,B.TYPE*0.1*E.SAL AS BONUS FROM EMP E,EMP_BONUS B WHERE E.EMPNO(+)=B.EMPNO; DEPTNO EMPNO ENAME SAL BONUS ------ ----- ---------- --------- ---------- 10 7934 MILLER 1300.00 130 10 7934 MILLER 1300.00 260 10 7839 KING 5000.00 1500 10 7782 CLARK 2450.00 245 --若此时想要计算6月份部门为10的总工资 --错误做法: SELECT E.DEPTNO,SUM(E.SAL) TOTAL_SAL,SUM(B.TYPE*0.1*E.SAL) AS TOTAL_BONUS FROM EMP E,EMP_BONUS B WHERE E.EMPNO(+)=B.EMPNO GROUP BY E.DEPTNO; DEPTNO TOTAL_SAL TOTAL_BONUS ------ ---------- ----------- 10 10050 2135 --原因,MILLER的工资和奖金都重复计算了,因为他5月份已经降职了,所以有两条不同的TYPE对应他的相关信息! --正确做法: SELECT E.DEPTNO,SUM(E.SAL) TOTAL_SAL,SUM(B.TYPE*0.1*E.SAL) AS TOTAL_BONUS FROM EMP E INNER JOIN (SELECT EB.EMPNO,EB.TYPE,EB.RECEIVED FROM EMP_BONUS EB INNER JOIN (SELECT MAX(C.EMPNO) EMPNO,MAX(C.RECEIVED) RECEIVED FROM EMP_BONUS C GROUP BY C.EMPNO) EBG --先统计出员工最新的职位变更时间 ON EB.EMPNO=EBG.EMPNO AND EB.RECEIVED=EBG.RECEIVED) B ON E.EMPNO=B.EMPNO GROUP BY E.DEPTNO; DEPTNO TOTAL_SAL TOTAL_BONUS ------ ---------- ----------- 10 8750 1875 --13.聚集与外连接 SELECT E.DEPTNO,SUM(E.SAL) TOTAL_SAL,SUM(B.TYPE*0.1*E.SAL) AS TOTAL_BONUS FROM EMP E LEFT JOIN --只改此处为LEFT JOIN即可 (SELECT EB.EMPNO,EB.TYPE,EB.RECEIVED FROM EMP_BONUS EB INNER JOIN (SELECT MAX(C.EMPNO) EMPNO,MAX(C.RECEIVED) RECEIVED FROM EMP_BONUS C GROUP BY C.EMPNO) EBG --先统计出员工最新的职位变更时间 ON EB.EMPNO=EBG.EMPNO AND EB.RECEIVED=EBG.RECEIVED) B ON E.EMPNO=B.EMPNO GROUP BY E.DEPTNO ORDER BY 1; DEPTNO TOTAL_SAL TOTAL_BONUS ------ ---------- ----------- 10 8750 1875 20 10875 30 9400 --14.多表查询时的空值处理 --要求返回比ALLEN提成低的员工 --错误做法: SELECT E.ENAME,E.COMM FROM EMP E WHERE E.COMM<(SELECT COMM FROM EMP WHERE ENAME='ALLEN'); ENAME COMM ---------- --------- TURNER 0.00 --错误原因:有些员工的COMM一项为NULL,但并未返回 --正确做法: SELECT E.ENAME,E.COMM FROM EMP E WHERE COALESCE(E.COMM,0)<(SELECT COMM FROM EMP WHERE ENAME='ALLEN'); ENAME COMM ---------- --------- SMITH JONES BLAKE CLARK SCOTT KING TURNER 0.00 ADAMS JAMES FORD MILLER