Added parallel example.

jonheller1 · Jun 30, 2015 · b46e187 · b46e187
1 parent 13bd66d
commit b46e187
Showing 1 changed file with 192 additions and 16 deletions.
diff --git a/SQL_Monitoring_tutorial.sql b/SQL_Monitoring_tutorial.sql
@@ -2,14 +2,15 @@
 -- This SQL Monitoring tutorial demonstrates how to use Real-Time SQL Monitoring
 -- and when Historical SQL Monitoring can help.
 --
--- This tutorial assumes you are familiar with basic Oracle tuning concepts,
+-- This tutorial assumes you are familiar with basic Oracle tuning concepts
 -- like explain plans, join methods, etc.
 --
 -- This worksheet should be run in pieces in an IDE like PL/SQL Developer, Toad,
 -- or SQL Developer.  (Sorry, SQL*Plus - you're not good enough for SQL tuning.)
 --
 -- Scenario #1 shows a cardinality (rows) estimate problem.
 -- Scenario #2 shows a downgraded parallel query problem.
+--
 --------------------------------------------------------------------------------
 
 
@@ -23,6 +24,7 @@ drop table small_table;
 drop table medium_table;
 drop table large_table;
 
+
 --#1b: Create simple tables of different sizes, then gather statistics.
 create table small_table (a number);
 create table medium_table(a number);
@@ -37,13 +39,15 @@ begin
 end;
 /
 
+
 --#1c: Simulate a statistics mistake.  Although Oracle has default tasks to
 --gather statistics at night, it is important to manually gather statistics
 --after a large data load.  It's a common mistake in a data warehouse to
 --load a table but forget to manually gather statistics when the job is done.
 insert into small_table  select level+1 from dual connect by level <= 100000;
 commit;
 
+
 --#1d: Run this statement to count the rows.  This will run for hours or days
 --because of the bad optimizer statistics.  While it's running, go to step #1e
 --in a separate session.
@@ -61,6 +65,7 @@ begin
 end;
 /
 
+
 --#1e: In a separate session, find the SQL_ID of the slow statement.
 --The first step for tuning is to find what's slow.  This is much harder than
 --most people realize.  If you're lucky, what's slow is a single SQL statement,
@@ -73,17 +78,19 @@ from gv$sql
 where users_executing > 0
 order by elapsed_time desc;
 
+
 --#1f: Run Real-Time SQL Monitoring on the slow statement.
 --There are multiple "types".  I prefer "text" but you may want to try "active".
 select dbms_sqltune.report_sql_monitor(
     sql_id => '70zg7uquwa4vj',
     type   => 'text'
 ) from dual;
 
---#1g: Take a brief look at the sample output.
-SQL Monitoring Report
 
+--#1g: Look at the sample output.
 /*
+SQL Monitoring Report
+
 SQL Text
 ------------------------------
 select count(*) unique_string_to_search_for from small_table st join medium_table mt on st.a = mt.a join large_table lt on mt.a = lt.a
@@ -157,13 +164,13 @@ one row when it really has much more.  This implies the statistics are incorrect
 for that table and need to be re-gathered.
 */
 
+
 --#1i: Run Historical SQL Monitoring on the results.
 select hist_sql_mon.hist_sql_mon(
 	p_sql_id => '70zg7uquwa4vj',
 	p_start_time_filter => sysdate - interval '1' hour,
 	p_end_time_filter => sysdate
 ) from dual;
-
 /*
 Historical SQL Monitoring 1.2.1 (when Real-Time SQL Monitoring does not work)
 
@@ -224,16 +231,7 @@ conclusion - the statistics are wrong for SMALL_TABLE.
 --#2: Downgraded Parallel Query.
 --------------------------------------------------------------------------------
 
-
---#2: TODO
---#2a: Simulate a parallelism problem.
---Open a separate session in your IDE, run this, but don't retreive all results.
---This simulates a long-running parallel query that uses all parallel resources.
---You may need to run this multiple times depending on parallel limitations.
-select /*+ parallel(1000) */ * from dba_objects;
-
-
---Use all but 2 of the parallel threads.
+--#2a: Run this in a separate session to use all but two parallel servers.
 --(This assumes no other parallel operations are running, there is no parallel
 -- queueing, resource manager restrictions, profile restrictions, etc.)	
 declare
@@ -248,7 +246,7 @@ begin
 	where name = 'parallel_max_servers';
 
 	--Open a parallel cursor that uses all but 2 of the threads.
-	open parallel_cursor for 'select /*+ parallel('||v_dop||') */ 1 a from small_table';
+	open parallel_cursor for 'select /*+ parallel('||v_dop||') */ 1 a from large_table';
 
 	--Get the first row and pause, using all the parallel servers.
 	loop
@@ -258,8 +256,186 @@ begin
 end;
 /
 
---TODO
 
+--#2b: With #2a still running, run this large parallel query in another session.
+declare
+	v_count number;
+begin
+	--Dynamic SQL is used so the SQL_ID stays the same as the one hard-coded in #2c.
+	execute immediate '
+		select /*+ parallel(8) */ count(*)
+		from large_table
+		cross join (select level from dual connect by level <= 10000)
+	'
+	into v_count;
+end;
+/
+
+
+--#2c: Run Real-Time SQL Monitoring, as a text report, on the statement from #2b.
+select dbms_sqltune.report_sql_monitor(
+    sql_id => 'aq8x1pk2kmmgs',
+    type   => 'text'
+) from dual;
 
+--#2d: Examine the output.
+/*
+SQL Monitoring Report
 
+SQL Text
+------------------------------
+select /* parallel(8) / count(*) from large_table cross join (select level from dual connect by level <= 10000)
+
+Global Information
+------------------------------
+ Status              :  DONE (ALL ROWS)                   
+ Instance ID         :  1                                 
+ Session             :  JHELLER (374:57213)               
+ SQL ID              :  aq8x1pk2kmmgs                     
+ SQL Execution ID    :  16777217                          
+ Execution Started   :  06/29/2015 20:56:47               
+ First Refresh Time  :  06/29/2015 20:56:47               
+ Last Refresh Time   :  06/29/2015 20:59:12               
+ Duration            :  145s                              
+ Module/Action       :  PL/SQL Developer/SQL Window - New 
+ Service             :  orcl12                            
+ Program             :  plsqldev.exe                      
+ DOP Downgrade       :  75%                               
+ Fetch Calls         :  1                                 
+
+Global Stats
+===========================================================================
+| Elapsed |   Cpu   |    IO    |  Other   | Fetch | Buffer | Read | Read  |
+| Time(s) | Time(s) | Waits(s) | Waits(s) | Calls |  Gets  | Reqs | Bytes |
+===========================================================================
+|     281 |     278 |     0.30 |     2.21 |     1 |   1783 |  127 |  12MB |
+===========================================================================
+
+Parallel Execution Details (DOP=2 , Servers Requested=8 , Servers Allocated=2)
+====================================================================================================================
+|      Name      | Type  | Server# | Elapsed |   Cpu   |    IO    |  Other   | Buffer | Read | Read  | Wait Events |
+|                |       |         | Time(s) | Time(s) | Waits(s) | Waits(s) |  Gets  | Reqs | Bytes | (sample #)  |
+====================================================================================================================
+| PX Coordinator | QC    |         |    0.03 |    0.03 |          |          |     13 |      |     . |             |
+| p004           | Set 1 |       1 |     145 |     144 |     0.14 |     1.02 |    886 |   64 |   6MB |             |
+| p005           | Set 1 |       2 |     135 |     134 |     0.15 |     1.19 |    884 |   63 |   6MB |             |
+====================================================================================================================
+
+SQL Plan Monitoring Details (Plan Hash Value=3411683413)
+===========================================================================================================================================================================
+| Id |                Operation                |    Name     |  Rows   | Cost |   Time    | Start  | Execs |   Rows   | Read | Read  |  Mem  | Activity | Activity Detail |
+|    |                                         |             | (Estim) |      | Active(s) | Active |       | (Actual) | Reqs | Bytes | (Max) |   (%)    |   (# samples)   |
+===========================================================================================================================================================================
+|  0 | SELECT STATEMENT                        |             |         |      |         1 |   +145 |     1 |        1 |      |       |       |          |                 |
+|  1 |   SORT AGGREGATE                        |             |       1 |      |         1 |   +145 |     1 |        1 |      |       |       |          |                 |
+|  2 |    PX COORDINATOR                       |             |         |      |         1 |   +145 |     3 |        2 |      |       |       |          |                 |
+|  3 |     PX SEND QC (RANDOM)                 | :TQ10001    |       1 |      |         1 |   +145 |     2 |        2 |      |       |       |          |                 |
+|  4 |      SORT AGGREGATE                     |             |       1 |      |       145 |     +1 |     2 |        2 |      |       |       |          |                 |
+|  5 |       MERGE JOIN CARTESIAN              |             |      1M |  401 |       144 |     +2 |     2 |       9G |      |       |       |          |                 |
+|  6 |        BUFFER SORT                      |             |         |      |       144 |     +2 |     2 |    20000 |      |       |  485K |          |                 |
+|  7 |         PX RECEIVE                      |             |       1 |    2 |         1 |     +2 |     2 |    20000 |      |       |       |          |                 |
+|  8 |          PX SEND BROADCAST              | :TQ10000    |       1 |    2 |         1 |   +135 |     1 |        2 |      |       |       |          |                 |
+|  9 |           VIEW                          |             |       1 |    2 |         1 |   +135 |     1 |    10000 |      |       |       |          |                 |
+| 10 |            CONNECT BY WITHOUT FILTERING |             |         |      |         1 |   +135 |     1 |    10000 |      |       |       |          |                 |
+| 11 |             FAST DUAL                   |             |       1 |    2 |         1 |   +135 |     1 |        1 |      |       |       |          |                 |
+| 12 |        BUFFER SORT                      |             |      1M |  401 |       146 |     +1 | 20000 |       9G |      |       |   24M |          |                 |
+| 13 |         PX BLOCK ITERATOR               |             |      1M |   62 |         1 |     +2 |     2 |       1M |      |       |       |          |                 |
+| 14 |          TABLE ACCESS FULL              | LARGE_TABLE |      1M |   62 |         1 |     +2 |    34 |       1M |  127 |  12MB |       |          |                 |
+===========================================================================================================================================================================*/
+
+--#2e: Interpret results.
+/*
+
+The Real-Time SQL Monitoring report makes it very easy to spot the problem.
+Note these two lines from the output:
+
+...
+ DOP Downgrade       :  75%                               
+...
+Parallel Execution Details (DOP=2 , Servers Requested=8 , Servers Allocated=2)
+...
+
+
+One session was hogging the parallel servers, so the real query could only use
+2 of the 8 parallel servers it requested (a 75% downgrade).  This kind of
+downgrading can be disastrous for data warehouses.
+
+Unfortunately, there is no way in Oracle to tell *why* it was downgraded.
+
+*/
+
+
+--#2f: Run Historical SQL Monitoring on the same SQL_ID, covering the last hour.
+select hist_sql_mon.hist_sql_mon(
+	p_sql_id => 'aq8x1pk2kmmgs',
+	p_start_time_filter => sysdate - interval '1' hour,
+	p_end_time_filter => sysdate
+) from dual;
+
+/*
+Historical SQL Monitoring 1.2.1 (when Real-Time SQL Monitoring does not work)
+
+Monitoring Metadata
+------------------------------ 
+ Report Created Date : 2015-06-29 21:03:03
+ Report Created by   : JHELLER
+ SQL_ID              : aq8x1pk2kmmgs
+ SQL_TEXT            :  select /* parallel(8) / count(*) from large_table cross join (select level from dual connec
+ P_START_TIME_FILTER : 2015-06-29 20:03:03
+ P_END_TIME_FILTER   : 2015-06-29 21:03:03
+
+
+Plan hash value: 3411683413
+Start Time     : 2015-06-29 20:56:21
+End Time       : 2015-06-29 20:59:12
+Source         : Data came from DBA_HIST_ACTIVE_SESS_HISTORY only.
+
+--------------------------------------------------------------------------------------------------------------------------===============================================================
+| Id  | Operation                             | Name        | Rows  | Cost (%CPU)| Time     |    TQ  |IN-OUT| PQ Distrib | Activity (%) | Activity Detail (# samples|# distinct samples)|
+--------------------------------------------------------------------------------------------------------------------------===============================================================
+|   0 | SELECT STATEMENT                      |             |       |   401 (100)|          |        |      |            |              |                                               |
+|   1 |  SORT AGGREGATE                       |             |     1 |            |          |        |      |            |              |                                               |
+|   2 |   PX COORDINATOR                      |             |       |            |          |        |      |            |              |                                               |
+|   3 |    PX SEND QC (RANDOM)                | :TQ10001    |     1 |            |          |  Q1,01 | P->S | QC (RAND)  |              |                                               |
+|   4 |     SORT AGGREGATE                    |             |     1 |            |          |  Q1,01 | PCWP |            |         5.71 | Cpu (2|2)                                     |
+|   5 |      MERGE JOIN CARTESIAN             |             |  1000K|   401   (1)| 00:00:01 |  Q1,01 | PCWP |            |              |                                               |
+|   6 |       BUFFER SORT                     |             |       |            |          |  Q1,01 | PCWC |            |              |                                               |
+|   7 |        PX RECEIVE                     |             |     1 |     2   (0)| 00:00:01 |  Q1,01 | PCWP |            |              |                                               |
+|   8 |         PX SEND BROADCAST             | :TQ10000    |     1 |     2   (0)| 00:00:01 |        | S->P | BROADCAST  |              |                                               |
+|   9 |          VIEW                         |             |     1 |     2   (0)| 00:00:01 |        |      |            |              |                                               |
+|  10 |           CONNECT BY WITHOUT FILTERING|             |       |            |          |        |      |            |              |                                               |
+|  11 |            FAST DUAL                  |             |     1 |     2   (0)| 00:00:01 |        |      |            |              |                                               |
+|  12 |       BUFFER SORT                     |             |  1000K|   401   (1)| 00:00:01 |  Q1,01 | PCWP |            |        94.29 | Cpu (33|18)                                   |
+|  13 |        PX BLOCK ITERATOR              |             |  1000K|    62   (0)| 00:00:01 |  Q1,01 | PCWC |            |              |                                               |
+|* 14 |         TABLE ACCESS FULL             | LARGE_TABLE |  1000K|    62   (0)| 00:00:01 |  Q1,01 | PCWP |            |              |                                               |
+--------------------------------------------------------------------------------------------------------------------------===============================================================
+
+Predicate Information (identified by operation id):
+---------------------------------------------------
+
+  14 - access(:Z>=:Z AND :Z<=:Z)
+
+Note
+-----
+   - Degree of Parallelism is 8 because of hint
+
+*/
+
+
+--#2g: Interpret results.
+/*
+
+The requested and actual degree of parallelism are not recorded and are not
+available in the Historical SQL Monitoring results.  But it is possible to infer
+the effective degree of parallelism by looking at the ratio of "# samples" over
+the "# distinct samples".  For example, Plan ID #12 had 18 time periods with at
+least one sample, and a total of 33 samples.  On average, there were
+33 / 18 = 1.8333 sessions active for that operation.
+
+This number closely matches the real DOP of 2.  However, the numbers will never
+perfectly match for several reasons.  Even if nothing else were running, it's
+likely that the effective DOP would not be 8.  It's hard to say what the ideal
+number would be, but in practice 2 out of 8 is too low and implies a problem.
+
+*/