您的位置:首页 > 数据库 > Oracle

Oracle查询优化-多表查询

2016-11-13 14:55 429 查看
--合并结果集
--1.union all
SELECT * FROM emp WHERE empno=7369
UNION ALL--单纯合并
SELECT * FROM emp WHERE empno=7369;
--2.union
SELECT * FROM emp WHERE empno=7369
UNION --将重复结果集合并
SELECT * FROM emp WHERE empno=7369;
--------------使用命令窗口执行,查看union与or的执行计划
SQL> alter session set "_b_tree_bitmap_plans" = FALSE;
SQL> explain plan for select empno,ename from emp where empno =7788 or ename='SCOTT';
SQL> select * from table(dbms_xplan.display);
SQL> explain plan for select empno,ename from emp where empno=7788 UNION select empno,ename from emp where ename = 'SCOTT';
SQL> select * from table(dbms_xplan.display);
--可见union会使用索引
--union会强制将结果集进行合并,从而使数据出现错误
SQL> select empno,deptno from emp where mgr=7698 order by 1;

EMPNO DEPTNO
----- ------
7499     30
7521     30
7654     30
7844     30
7900     30

SQL> select empno,deptno from emp where job='SALESMAN' order by 1;

EMPNO DEPTNO
----- ------
7499     30
7521     30
7654     30
7844     30
--从上面两条语句看出有4条结果重复,看看union和or的区别
SQL> select deptno from emp where mgr=7698 or job='SALESMAN';

DEPTNO
------
30
30
30
30
30

SQL> select deptno from emp where mgr=7698
2  union
3  select deptno from emp where job='SALESMAN';

DEPTNO
------
30
/**************************************************************************************************************************************
* 结论:
* 1.不仅两个数据集间重复的数据会被去重,而且单个数据集里重复的数据也会被去重;
* 2.有重复数据的数据集用union后得到的数据与预期会不一致;
* 3.可以这样,select deptno from (select empno,deptno from emp where mgr=7698 union select empno,deptno from emp where job='SALESMAN')
*   或者将empno改为rowid也行。
**************************************************************************************************************************************/
--4.[inner] join与=
SELECT e.empno,e.ename,d.dname,d.loc
FROM emp e
INNER JOIN dept d ON (e.deptno=d.deptno)
WHERE e.deptno=10;
SELECT e.empno,e.ename,d.dname,d.loc
FROM emp e,dept d
WHERE e.deptno=d.deptno
AND e.deptno=10;--以上两句结果相同,但join是SQL-92标准,可以清晰反应表与表之间的关联关系,推荐使用join
--5.in、exists和inner join
CREATE TABLE emp2 AS--创建相关table
SELECT ename,job,sal,comm FROM emp WHERE job = 'CLERK';
--6.要求查询与emp2相匹配的emp中的数据,可以使用in、exists或inner join
SELECT * FROM emp WHERE (ename,job,sal) IN (SELECT ename,job,sal FROM emp2);
SELECT * FROM emp a WHERE EXISTS (SELECT NULL FROM emp2 b WHERE b.ename=a.ename
AND b.job=a.job
AND b.sal=a.sal);
SELECT * FROM emp a
INNER JOIN emp2 b
ON (b.ename=a.ename
AND b.job=a.job
AND b.sal=a.sal);
/********************************************************************************************************
* 结论:
* 1.以上三条语句可以返回相同条数的结果集;
* 2.通过查看plan可以看出,exists和in都使用了HASH JOIN SEMI(哈希半连接)而inner join使用了哈希连接;
* 3.exists和in的执行效率是一样的,如果不确定,可以通过查看plan来判断,不要死记硬背。
********************************************************************************************************/
--7.内、左、右、外连接
--建立测试表
--左表
DROP TABLE L;
CREATE TABLE L AS SELECT 'L_1' AS str,'1' AS v FROM dual UNION ALL
SELECT 'L_2','2' AS v FROM dual UNION ALL
SELECT 'L_3','3' AS v FROM dual UNION ALL
SELECT 'L_4','4' AS v FROM dual;
--右表
DROP TABLE R;
CREATE TABLE R AS
SELECT 'R_3' AS str,'3' AS v,1 AS STATUS FROM dual UNION ALL
SELECT 'R_4','4' AS v,0 AS STATUS FROM dual UNION ALL
SELECT 'R_5','5' AS v,0 AS STATUS FROM dual UNION ALL
SELECT 'R_6','6' AS v,0 AS STATUS FROM dual;
--INNER JOIN
SELECT l.str AS l_str,r.str AS r_str
FROM l
INNER JOIN r ON l.v=r.v
ORDER BY 1,2;
SELECT l.str AS l_str,r.str AS r_str
FROM l,r
WHERE l.v=r.v
ORDER BY 1,2;
--LEFT JOIN
SELECT l.str AS l_str,r.str AS r_str
FROM l
LEFT JOIN r ON l.v=r.v
ORDER BY 1,2;
SELECT l.str AS l_str,r.str AS r_str
FROM l,r
WHERE l.v=r.v(+)
ORDER BY 1,2;
--RIGHT JOIN
SELECT l.str AS l_str,r.str AS r_str
FROM l
RIGHT JOIN r ON l.v=r.v
ORDER BY 1,2;
SELECT l.str AS l_str,r.str AS r_str
FROM l,r
WHERE l.v(+)=r.v
ORDER BY 1,2;
--FULL JOIN
SELECT l.str AS l_str,r.str AS r_str
FROM l
FULL JOIN r ON l.v=r.v
ORDER BY 1,2;
--8.自连接
SELECT a.empno,a.ename,b.ename mgr,a.deptno FROM emp a,emp b WHERE a.mgr=b.empno(+) ORDER BY a.empno;
--9.NOT IN,NOT EXISTS和LEFT JOIN
SELECT * FROM DEPT WHERE DEPTNO NOT IN(SELECT DEPTNO FROM EMP WHERE EMP.DEPTNO IS NOT NULL);
SELECT * FROM DEPT WHERE NOT EXISTS (SELECT NULL FROM EMP WHERE EMP.DEPTNO = DEPT.DEPTNO);
SELECT DEPT.* FROM DEPT LEFT JOIN EMP ON EMP.DEPTNO=DEPT.DEPTNO WHERE EMP.DEPTNO IS NULL;
--10.外连接中的条件
--沿用7的测试表,查询左表所有内容,使用V关联右表,但只显示右表中STATUS为1的值,期望结果如下:
STR STR
--- ---
L_1
L_2
L_3 R_3
L_4
--错误写法:
SELECT L.STR,R.STR FROM L LEFT JOIN R ON(L.V=R.V) WHERE R.STATUS=1 ORDER BY 1;
PLAN_TABLE_OUTPUT
--------------------------------------------------------------------------------
Plan hash value: 688663707
----------------------------------------------------------------------------
| Id  | Operation           | Name | Rows  | Bytes | Cost (%CPU)| Time     |
----------------------------------------------------------------------------
|   0 | SELECT STATEMENT    |      |     1 |    27 |     8  (25)| 00:00:01 |
|   1 |  SORT ORDER BY      |      |     1 |    27 |     8  (25)| 00:00:01 |
|*  2 |   HASH JOIN         |      |     1 |    27 |     7  (15)| 00:00:01 |
|*  3 |    TABLE ACCESS FULL| R    |     1 |    21 |     3   (0)| 00:00:01 |
|   4 |    TABLE ACCESS FULL| L    |     4 |    24 |     3   (0)| 00:00:01 |
----------------------------------------------------------------------------
Predicate Information (identified by operation id):
---------------------------------------------------
2 - access("L"."V"="R"."V")
3 - filter("R"."STATUS"=1)
Note
-----

PLAN_TABLE_OUTPUT
--------------------------------------------------------------------------------
- dynamic sampling used for this statement

21 rows selected
--正确写法:
SELECT L.STR,R.STR FROM L LEFT JOIN R ON (L.V=R.V AND R.STATUS=1) ORDER BY 1;
PLAN_TABLE_OUTPUT
--------------------------------------------------------------------------------
Plan hash value: 2310059642
----------------------------------------------------------------------------
| Id  | Operation           | Name | Rows  | Bytes | Cost (%CPU)| Time     |
----------------------------------------------------------------------------
|   0 | SELECT STATEMENT    |      |     4 |   108 |     8  (25)| 00:00:01 |
|   1 |  SORT ORDER BY      |      |     4 |   108 |     8  (25)| 00:00:01 |
|*  2 |   HASH JOIN OUTER   |      |     4 |   108 |     7  (15)| 00:00:01 |
|   3 |    TABLE ACCESS FULL| L    |     4 |    24 |     3   (0)| 00:00:01 |
|*  4 |    TABLE ACCESS FULL| R    |     1 |    21 |     3   (0)| 00:00:01 |
----------------------------------------------------------------------------
Predicate Information (identified by operation id):
---------------------------------------------------
2 - access("L"."V"="R"."V"(+))
4 - filter("R"."STATUS"(+)=1)
Note
-----

PLAN_TABLE_OUTPUT
--------------------------------------------------------------------------------
- dynamic sampling used for this statement

21 rows selected
/*外层条件不要随便加,会影响结果集*/
--11.检测两个表中的数据及对应数据的条数是否相同
CREATE OR REPLACE VIEW V AS
SELECT * FROM EMP WHERE DEPTNO != 10
UNION ALL
SELECT * FROM EMP WHERE ENAME='SCOTT';
--要求查处视图V与表EMP中不同的数据(注意:视图中'SCOTT'有两行数据,而EMP表中只有一条数据)
--分析:除了EMP表中DEPTNO为10的数据,还有ENAME为SCOTT的数据与V中不一致,因为EMP表中只有一条而V中有两条
SELECT *
FROM (SELECT EMPNO,ENAME,COUNT(*) AS CNT FROM V GROUP BY EMPNO,ENAME) V --加一列统计条数用以区分不同
FULL JOIN (SELECT EMPNO,ENAME,COUNT(*) AS CNT FROM EMP GROUP BY EMPNO,ENAME) E
ON V.EMPNO=E.EMPNO AND V.CNT=E.CNT
WHERE V.EMPNO IS NULL OR E.EMPNO IS NULL;
EMPNO ENAME             CNT EMPNO ENAME             CNT
---------- ---------- ---------- ----- ---------- ----------
7788 SCOTT               2
7782 CLARK               1
7839 KING                1
7788 SCOTT               1
7934 MILLER              1
--12.聚集与内连接
CREATE TABLE EMP_BONUS (EMPNO INT,RECEIVED DATE,TYPE INT);
INSERT INTO EMP_BONUS VALUES (7934,DATE '2005-5-17',1);
INSERT INTO EMP_BONUS VALUES (7934,DATE '2005-2-15',2);
INSERT INTO EMP_BONUS VALUES (7839,DATE '2005-5-17',3);
INSERT INTO EMP_BONUS VALUES (7782,DATE '2005-5-17',1);
--要求返回上述员工的工资及奖金,奖金根据TYPE来定,TYPE为1,奖金为10%...
SELECT E.DEPTNO,E.EMPNO,E.ENAME,E.SAL,B.TYPE*0.1*E.SAL AS BONUS
FROM EMP E,EMP_BONUS B
WHERE E.EMPNO(+)=B.EMPNO;
DEPTNO EMPNO ENAME            SAL      BONUS
------ ----- ---------- --------- ----------
10  7934 MILLER       1300.00        130
10  7934 MILLER       1300.00        260
10  7839 KING         5000.00       1500
10  7782 CLARK        2450.00        245
--若此时想要计算6月份部门为10的总工资
--错误做法:
SELECT E.DEPTNO,SUM(E.SAL) TOTAL_SAL,SUM(B.TYPE*0.1*E.SAL) AS TOTAL_BONUS
FROM EMP E,EMP_BONUS B
WHERE E.EMPNO(+)=B.EMPNO
GROUP BY E.DEPTNO;
DEPTNO  TOTAL_SAL TOTAL_BONUS
------ ---------- -----------
10      10050        2135
--原因,MILLER的工资和奖金都重复计算了,因为他5月份已经降职了,所以有两条不同的TYPE对应他的相关信息!
--正确做法:
SELECT E.DEPTNO,SUM(E.SAL) TOTAL_SAL,SUM(B.TYPE*0.1*E.SAL) AS TOTAL_BONUS
FROM EMP E
INNER JOIN
(SELECT EB.EMPNO,EB.TYPE,EB.RECEIVED
FROM EMP_BONUS EB
INNER JOIN
(SELECT MAX(C.EMPNO) EMPNO,MAX(C.RECEIVED) RECEIVED FROM EMP_BONUS C GROUP BY C.EMPNO) EBG --先统计出员工最新的职位变更时间
ON EB.EMPNO=EBG.EMPNO AND EB.RECEIVED=EBG.RECEIVED) B
ON E.EMPNO=B.EMPNO
GROUP BY E.DEPTNO;
DEPTNO  TOTAL_SAL TOTAL_BONUS
------ ---------- -----------
10       8750        1875
--13.聚集与外连接
SELECT E.DEPTNO,SUM(E.SAL) TOTAL_SAL,SUM(B.TYPE*0.1*E.SAL) AS TOTAL_BONUS
FROM EMP E
LEFT JOIN --只改此处为LEFT JOIN即可
(SELECT EB.EMPNO,EB.TYPE,EB.RECEIVED
FROM EMP_BONUS EB
INNER JOIN
(SELECT MAX(C.EMPNO) EMPNO,MAX(C.RECEIVED) RECEIVED FROM EMP_BONUS C GROUP BY C.EMPNO) EBG --先统计出员工最新的职位变更时间
ON EB.EMPNO=EBG.EMPNO AND EB.RECEIVED=EBG.RECEIVED) B
ON E.EMPNO=B.EMPNO
GROUP BY E.DEPTNO
ORDER BY 1;
DEPTNO  TOTAL_SAL TOTAL_BONUS
------ ---------- -----------
10       8750        1875
20      10875
30       9400
--14.多表查询时的空值处理
--要求返回比ALLEN提成低的员工
--错误做法:
SELECT E.ENAME,E.COMM
FROM EMP E
WHERE E.COMM<(SELECT COMM FROM EMP WHERE ENAME='ALLEN');
ENAME           COMM
---------- ---------
TURNER          0.00
--错误原因:有些员工的COMM一项为NULL,但并未返回
--正确做法:
SELECT E.ENAME,E.COMM
FROM EMP E
WHERE COALESCE(E.COMM,0)<(SELECT COMM FROM EMP WHERE ENAME='ALLEN');
ENAME           COMM
---------- ---------
SMITH
JONES
BLAKE
CLARK
SCOTT
KING
TURNER          0.00
ADAMS
JAMES
FORD
MILLER
内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签: