Home » RDBMS Server » Performance Tuning » Bulk update performance issue (Oracle 11g, Windows XP)
Bulk update performance issue [message #525335] Sat, 01 October 2011 03:03 Go to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
Hi,

I have a table with 8726387 records.

There is this procedure to update a column of the same table, from derived values of another column of the same table.

I have index on columns used in WHERE clause except the on which update is happening. I am checking for any duplicate values in the column which is getting updated, since the requirement is to rollup column values in the child hierarchy and update the column against the parent , with comma separated row values of child records.

I am using a LIMIT of 100000 to BULK FETCH in each iteration.

I am using PLSQL records, and bulk fetching it into a ref cursor and updating using FOR ALL statment.

This is taking 5 hours 40 minutes to update 8726387 records.

Attached is the Update statement, script for table creation and insertion, explain plan etc.,

Kindly suggest how can we improve this, since I think 8726387 is not too high for Oracle. I am doubting it could be a DB issue of Buffer of the REF CURSOR being full and not able to complete.


 /* Formatted on 10/1/2011 12:23:31 PM (QP5 v5.139.911.3011) */
CREATE TABLE itemexcption
(
   item_id         VARCHAR2 (40),
   part            VARCHAR2 (50),
   sub_part        VARCHAR2 (40),
   reason          VARCHAR2 (4000),
   rolled_reason   VARCHAR2 (4000)
)
CREATE index itemidx on itemexcption (item_id);

CREATE INDEX partidx
   ON itemexcption (part);

CREATE INDEX subpartidx
   ON itemexcption (sub_part);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM1',
             NULL,
             NULL,
             4);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM1',
             'PART1',
             NULL,
             2);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM1',
             'PART2',
             NULL,
             3);


INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM1',
             'PART1',
             'SUBPART1',
             1);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM1',
             'PART1',
             'SUBPART2',
             2);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM1',
             'PART2',
             NULL,
             1);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM1',
             'PART2',
             'SUBPART1',
             1);


INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM1',
             'PART2',
             'SUBPART2',
             3);


INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM2',
             NULL,
             NULL,
             2);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM2',
             NULL,
             NULL,
             2);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM2',
             'PART1',
             NULL,
             1);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM2',
             'PART2',
             NULL,
             3);


INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM2',
             'PART1',
             'SUBPART1',
             4);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM2',
             'PART1',
             'SUBPART2',
             1);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM2',
             'PART2',
             NULL,
             3);

INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM2',
             'PART2',
             'SUBPART1',
             2);


INSERT INTO itemexcption (item_id,
                          part,
                          sub_part,
                          reason)
     VALUES ('ITEM2',
             'PART2',
             'SUBPART2',
             4);


COMMIT;

SELECT * FROM ITMEXCPTION

----------------------------------------------------------

ITEM    PART   SUBPART       REASON           ROLLED_REASON
ITEM1	PART1		       2	
ITEM1	PART2		       3	
ITEM1	PART1	SUBPART1       1	
ITEM1	PART1	SUBPART2       2	
ITEM1	PART2		       1	
ITEM1	PART2	SUBPART1       1	
ITEM1	PART2	SUBPART2       3	
ITEM2			       2	
ITEM2	PART1		       1	
ITEM2	PART2		       3	
ITEM2			       2	
ITEM2	PART1	SUBPART1       4	
ITEM2	PART1	SUBPART2       1	
ITEM2	PART2		       3	
ITEM2	PART2	SUBPART1       2	
ITEM2	PART2	SUBPART2       4	

---------------------------------------------------------


Procedure for updating is working fine as I have tested with a lesser data set. Problem is with performance of this UPDATE and the time it takes to update the entire table.

The output for above is given below. (i.e, ROLLED_REASON column after updation )

ROLLED_REASON is rolled up and updated only for PARENT i.e., ITEM and PART ie., here ITEM1 will have 4,2,3,1 since PARTs and SUBPARTS under ITEM1 have these distinct values. There is no order for this updation. It can be 1,2,3,4 or any order as this is from a BULK update.

Similiarly PART1 under ITEM1 will have 2,1 since SUBPARTs under PART1 have these distinct values in Column REASON.

After updation the result will look like below.


select * from itemexcption order by item_id, part nulls first, sub_part nulls first;

----------------------------------------------------------

ITEM    PART   SUBPART       REASON           ROLLED_REASON
-----------------------------------------------------------
ITEM1			      4	              1,2,3,4,
ITEM1	PART1		      2	              1,2,4,
ITEM1	PART1	SUBPART1      1	
ITEM1	PART1	SUBPART2      2	
ITEM1	PART2		      3	              1,2,3,4,
ITEM1	PART2		      1	              1,2,3,4,
ITEM1	PART2	SUBPART1      1	
ITEM1	PART2	SUBPART2      3	
ITEM2			      2     	      1,2,3,4,
ITEM2			      2	              1,2,3,4,
ITEM2	PART1		      1	              1,2,4,
ITEM2	PART1	SUBPAR1	      4 	
ITEM2	PART1	SUBPART2      1	
ITEM2	PART2		      3	              1,2,3,4,
ITEM2	PART2		      3	              1,2,3,4,
ITEM2	PART2	SUBPART1      2	
ITEM2	PART2	SUBPART2      4	
---------------------------------------------------------



Script for this updation is given below.


DECLARE
   TYPE item_rec IS RECORD (
      item       itemexcption.item_id%TYPE,
      rsncodes   itemexcption.reason%TYPE
   );

   TYPE item_tab IS TABLE OF item_rec;

   v_limit   NUMBER := 500;
   l_start   NUMBER;

   mod_rec   item_tab;
   itm_rec   item_tab;

   TYPE itemrec IS REF CURSOR;

   rec      itemrec;
   rec1      itemrec;
   
BEGIN

   l_start := DBMS_UTILITY.get_time;


   UPDATE itemexcption
     SET rolled_reason = NULL
   WHERE rolled_reason IS NOT NULL;

   COMMIT;

   

   /***** Reason  Code updation Against the PARTs******************************************************/

   OPEN rec FOR
      SELECT part, reason
        FROM (SELECT b.part part,
                     b.reason reason,                       ROW_NUMBER ()
                     OVER (PARTITION BY b.part, b.reason      ORDER BY b.part)
                        rn
                FROM itemexcption b
               WHERE b.reason IS NOT NULL)
       WHERE rn = 1;  /** For getting distinct values against PART****/


   LOOP
      FETCH rec
      BULK COLLECT INTO mod_rec
      LIMIT 100000;

      FORALL i IN mod_rec.FIRST .. mod_rec.LAST
      SAVE EXCEPTIONS
         UPDATE                                                /* bulk bind */
               itemexcption a
            SET a.rolled_reason=
                   a.rolled_reason || mod_rec (i).rsncodes || ','
          WHERE mod_rec (i).item = a.PART AND a.SUB_PART IS NULL
        AND    (a.rolled_reason IS NULL OR  a.rolled_reason  not like '%'||mod_rec(i).rsncodes||'%'  );

         COMMIT;

      EXIT WHEN rec%NOTFOUND;
   END LOOP;

   CLOSE rec;

   COMMIT;


   /***** Reason  Code updation Against the ITEMs******************************************************/

   OPEN rec FOR
      SELECT item_id, reason
        FROM (SELECT b.item_id item_id,
                     b.reason reason,                       ROW_NUMBER ()
                     OVER (PARTITION BY b.item_id, b.reason      ORDER BY b.item_id)
                        rn
                FROM itemexcption b
               WHERE b.reason IS NOT NULL)
       WHERE rn = 1;  /** For getting distinct values against PART****/


   LOOP
      FETCH rec
      BULK COLLECT INTO itm_rec
      LIMIT 100000;

      FORALL i IN itm_rec.FIRST .. itm_rec.LAST
      SAVE EXCEPTIONS
         UPDATE                                                /* bulk bind */
               itemexcption a
            SET a.rolled_reason=
                   a.rolled_reason || itm_rec (i).rsncodes || ','
          WHERE itm_rec (i).item = a.ITEM_ID AND a.PART IS NULL
        AND  ( a.rolled_reason IS NULL OR  a.rolled_reason not like '%'||itm_rec(i).rsncodes||'%'  );

         COMMIT;

      EXIT WHEN rec%NOTFOUND;
   END LOOP;

   CLOSE rec;

   COMMIT;

EXCEPTION
   WHEN OTHERS
   THEN
      DBMS_OUTPUT.put_line ('Exception' || SQLERRM);
END; 


-----------

This took 2 hours to update 21,48,725 records.

Any suggestions, what can be wrong in the proc.

[Updated on: Sat, 01 October 2011 03:33]

Report message to a moderator

Re: Bulk update performance issue [message #525344 is a reply to message #525335] Sat, 01 October 2011 05:04 Go to previous messageGo to next message
ThomasG
Messages: 3211
Registered: April 2005
Location: Heilbronn, Germany
Senior Member
Well, the main problem is that ROLLED_REASON shouldn't be stored in the first place.

You can use STRAGG or other methods to calculate it in on the fly the select.

If you absolutely insist on storing it, you can also use that select to do a straight SQL update of the entire table without using a procedure.
Re: Bulk update performance issue [message #525346 is a reply to message #525344] Sat, 01 October 2011 05:37 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
It needs to be stored in table since this is a datawarehousing environment.

I did'nt understand your statment that it should'nt be stored. How is storage going to be a problem for Oracle, in that case are you suggesting updating 8 million records is something Oracle is not capable of doing ?

Even Single SQL statement for updating is taking a long time.
Re: Bulk update performance issue [message #525377 is a reply to message #525346] Sat, 01 October 2011 12:58 Go to previous messageGo to next message
jbrpub
Messages: 1
Registered: October 2011
Location: France
Junior Member
if it's possible, try with a "WHERE CURRENT OF"
Re: Bulk update performance issue [message #525378 is a reply to message #525346] Sat, 01 October 2011 12:58 Go to previous messageGo to next message
BlackSwan
Messages: 26766
Registered: January 2009
Location: SoCal
Senior Member
Since NOBODY can optimize SQL just by looking at it, we need a few more details.
http://www.orafaq.com/forum/m/433888/136107/#msg_433888
Please refer to URL above & be sure to provide the details requested:
Re: Bulk update performance issue [message #525390 is a reply to message #525378] Sun, 02 October 2011 04:13 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
Hard luck. Tried many options available in Oracle, it did'nt work.

Finally we decided to go for another DB, i.e. SQL Server.

Loaded same volume (8 million ) of data in SQL Server and it completed in 1 hour 25 minuts. Where Oracle had taken 5 hours and 40 minutes to complete the job.

Lessons learnt.: Oracle is good, if you are playing with a low volume of data. Otherwise it will never going to work. Telling this after spending more than a week trying many options avaiable in Oracle.
Re: Bulk update performance issue [message #525391 is a reply to message #525390] Sun, 02 October 2011 04:14 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
Thanks to everyone who had given suggestions.
Re: Bulk update performance issue [message #525394 is a reply to message #525378] Sun, 02 October 2011 05:24 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
Table creation script, insert script and other details are already pasted in the query.

Please find the explain plan below.
---------------------------------------


Explain Plan
----------------------
UPDATE STATEMENT  ALL_ROWSCost: 6  						
	8 UPDATE ADMIN_COSTPL_OWNER.ITEMEXCPTION
		7 TABLE ACCESS BY INDEX ROWID TABLE ADMIN_COSTPL_OWNER.ITEMEXCPTION Cost: 6  Bytes: 19  Cardinality: 1  				
			6 BITMAP CONVERSION TO ROWIDS  			
				5 BITMAP AND  		
					2 BITMAP CONVERSION FROM ROWIDS  	
						1 INDEX RANGE SCAN INDEX ADMIN_COSTPL_OWNER.ITEM_MOD_IDX Cost: 3  Cardinality: 14  
					4 BITMAP CONVERSION FROM ROWIDS  	
						3 INDEX RANGE SCAN INDEX ADMIN_COSTPL_OWNER.ITEM_SKU_IDX Cost: 3  Cardinality: 14  
Re: Bulk update performance issue [message #525416 is a reply to message #525394] Sun, 02 October 2011 14:21 Go to previous messageGo to next message
Barbara Boehmer
Messages: 9090
Registered: November 2002
Location: California, USA
Senior Member
I believe it would be more efficient to do your aggregation in the select, so that you would only have to do one update per row, instead of one update for each reason per row. Please see the demonstration below in which I changed your select and update statements.

SCOTT@orcl_11gR2> column item_id       format a8
SCOTT@orcl_11gR2> column part	       format a8
SCOTT@orcl_11gR2> column sub_part      format a8
SCOTT@orcl_11gR2> column reason        format a8
SCOTT@orcl_11gR2> column rolled_reason format a8
SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4
ITEM1    PART1             2
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3
ITEM1    PART2             1
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2
ITEM2                      2
ITEM2    PART1             1
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3
ITEM2    PART2             3
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2> DECLARE
  2  	TYPE item_rec IS RECORD (
  3  	   item       itemexcption.item_id%TYPE,
  4  	   rsncodes   itemexcption.reason%TYPE
  5  	);
  6  	TYPE item_tab IS TABLE OF item_rec;
  7  	mod_rec   item_tab;
  8  	itm_rec   item_tab;
  9  	TYPE itemrec IS REF CURSOR;
 10  	rec	  itemrec;
 11  	rec1	  itemrec;
 12  BEGIN
 13  	UPDATE itemexcption
 14  	  SET rolled_reason = NULL
 15  	WHERE rolled_reason IS NOT NULL;
 16  	COMMIT;
 17  	/***** Reason  Code updation Against the PARTs******************************************************/
 18  	OPEN rec FOR
 19  	   select part,
 20  		  listagg (reason, ',') within group (order by reason) reason
 21  	   from   (select distinct part, reason
 22  		   from   itemexcption
 23  		   where  part is not null)
 24  	   group  by part;
 25  	LOOP
 26  	   FETCH rec
 27  	   BULK COLLECT INTO mod_rec
 28  	   LIMIT 100000;
 29  	   FORALL i IN mod_rec.FIRST .. mod_rec.LAST
 30  	   SAVE EXCEPTIONS
 31  	      update itemexcption a
 32  	      set    a.rolled_reason = mod_rec(i).rsncodes
 33  	      where  a.part = mod_rec(i).item
 34  	      and    a.sub_part is null;
 35  	   EXIT WHEN rec%NOTFOUND;
 36  	END LOOP;
 37  	CLOSE rec;
 38  	COMMIT;
 39  	/***** Reason  Code updation Against the ITEMs******************************************************/
 40  	OPEN rec FOR
 41  	   select item_id,
 42  		  listagg (reason, ',') within group (order by reason) reason
 43  	   from   (select distinct item_id, reason
 44  		   from   itemexcption
 45  		   where  item_id is not null)
 46  	   group  by item_id;
 47  	LOOP
 48  	   FETCH rec
 49  	   BULK COLLECT INTO itm_rec
 50  	   LIMIT 100000;
 51  	   FORALL i IN itm_rec.FIRST .. itm_rec.LAST
 52  	   SAVE EXCEPTIONS
 53  	      update itemexcption a
 54  	      set    a.rolled_reason = itm_rec(i).rsncodes
 55  	      where  a.item_id = itm_rec(i).item
 56  	      and    a.part is null;
 57  	   EXIT WHEN rec%NOTFOUND;
 58  	END LOOP;
 59  	CLOSE rec;
 60  	COMMIT;
 61  END;
 62  /

PL/SQL procedure successfully completed.

SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4        1,2,3,4
ITEM1    PART1             2        1,2,4
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3        1,2,3,4
ITEM1    PART2             1        1,2,3,4
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2        1,2,3,4
ITEM2                      2        1,2,3,4
ITEM2    PART1             1        1,2,4
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3        1,2,3,4
ITEM2    PART2             3        1,2,3,4
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2>

Re: Bulk update performance issue [message #525421 is a reply to message #525416] Mon, 03 October 2011 00:11 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
Hi Barbara,

Thanks for your solution. But we have 11g Release 1, so listagg won't work ?

   SELECT item_id,  max(sys_connect_by_path(reason,',')) rsn_code
   FROM  (SELECT  item_id,                           reason,
              dense_rank() OVER (PARTITION BY item_id ORDER BY  reason ) rn
              FROM  itemexcption b
              WHERE b.part IS NOT NULL AND b.item_id IS NOT NULL AND b.reason IS NOT NULL                )
     GROUP BY item_id    CONNECT BY rn = PRIOR rn+1 AND item_id= PRIOR item_id    START WITH rn = 1;



Is dense_rank recommended in this scenario, for performance reasons?
Re: Bulk update performance issue [message #525433 is a reply to message #525421] Mon, 03 October 2011 01:46 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
Barbara,

Also your query have COMMIT outside the LOOP and after closing the cursor.

Will it result in a exclusive lock on the table and the query getting stuck, since the selection and update is on the same table (If we have large no. of rows ie., 8 million etc.,)

Should'nt we COMMIT as soon as UPDATE statement, inside the LOOP itself.

Thanks,

Nirmal
Re: Bulk update performance issue [message #525522 is a reply to message #525433] Mon, 03 October 2011 12:01 Go to previous messageGo to next message
Barbara Boehmer
Messages: 9090
Registered: November 2002
Location: California, USA
Senior Member
If you can't use listagg, then you can use the undocumented wm_concat, as demonstrated below, or any of various other string aggregation techniques. It should be better to do your aggregation in the select, so that it drastically reduces the number of updates. Your method with dense_rank does not do that.

With normal loops, it is unadvisable to commit within the loop, as you may get a snapshot too old error or some such thing. However, forall is a little different and if your system lacks the capacity to process as many rows as you have all at once, then you can decrease the limits (1000 is a typical number) and commit after each update within the forall if you like. Ideally, if your system could handle it, the most efficient method would be to do it all in one sql update statement without any pl/sql.

SCOTT@orcl_11gR2> column item_id       format a8
SCOTT@orcl_11gR2> column part	       format a8
SCOTT@orcl_11gR2> column sub_part      format a8
SCOTT@orcl_11gR2> column reason        format a8
SCOTT@orcl_11gR2> column rolled_reason format a8
SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4
ITEM1    PART1             2
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3
ITEM1    PART2             1
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2
ITEM2                      2
ITEM2    PART1             1
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3
ITEM2    PART2             3
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2> DECLARE
  2  	TYPE item_rec IS RECORD (
  3  	   item       itemexcption.item_id%TYPE,
  4  	   rsncodes   itemexcption.reason%TYPE
  5  	);
  6  	TYPE item_tab IS TABLE OF item_rec;
  7  	mod_rec   item_tab;
  8  	itm_rec   item_tab;
  9  	TYPE itemrec IS REF CURSOR;
 10  	rec	  itemrec;
 11  	rec1	  itemrec;
 12  BEGIN
 13  	UPDATE itemexcption
 14  	  SET rolled_reason = NULL
 15  	WHERE rolled_reason IS NOT NULL;
 16  	COMMIT;
 17  	/***** Reason  Code updation Against the PARTs******************************************************/
 18  	OPEN rec FOR
 19  	   select part, wm_concat (reason) reason
 20  	   from   (select distinct part, reason
 21  		   from   itemexcption
 22  		   where  part is not null)
 23  	   group  by part;
 24  	LOOP
 25  	   FETCH rec
 26  	   BULK COLLECT INTO mod_rec
 27  	   LIMIT 1000;
 28  	   FORALL i IN mod_rec.FIRST .. mod_rec.LAST
 29  	   SAVE EXCEPTIONS
 30  	      update itemexcption a
 31  	      set    a.rolled_reason = mod_rec(i).rsncodes
 32  	      where  a.part = mod_rec(i).item
 33  	      and    a.sub_part is null;
 34  	   COMMIT;
 35  	   EXIT WHEN rec%NOTFOUND;
 36  	END LOOP;
 37  	CLOSE rec;
 38  	COMMIT;
 39  	/***** Reason  Code updation Against the ITEMs******************************************************/
 40  	OPEN rec FOR
 41  	   select item_id, wm_concat (reason)
 42  	   from   (select distinct item_id, reason
 43  		   from   itemexcption
 44  		   where  item_id is not null)
 45  	   group  by item_id;
 46  	LOOP
 47  	   FETCH rec
 48  	   BULK COLLECT INTO itm_rec
 49  	   LIMIT 1000;
 50  	   FORALL i IN itm_rec.FIRST .. itm_rec.LAST
 51  	   SAVE EXCEPTIONS
 52  	      update itemexcption a
 53  	      set    a.rolled_reason = itm_rec(i).rsncodes
 54  	      where  a.item_id = itm_rec(i).item
 55  	      and    a.part is null;
 56  	   COMMIT;
 57  	   EXIT WHEN rec%NOTFOUND;
 58  	END LOOP;
 59  	CLOSE rec;
 60  	COMMIT;
 61  END;
 62  /

PL/SQL procedure successfully completed.

SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4        4,1,2,3
ITEM1    PART1             2        2,4,1
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3        1,4,2,3
ITEM1    PART2             1        1,4,2,3
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2        1,2,3,4
ITEM2                      2        1,2,3,4
ITEM2    PART1             1        2,4,1
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3        1,4,2,3
ITEM2    PART2             3        1,4,2,3
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2>

Re: Bulk update performance issue [message #525524 is a reply to message #525522] Mon, 03 October 2011 12:15 Go to previous messageGo to next message
Barbara Boehmer
Messages: 9090
Registered: November 2002
Location: California, USA
Senior Member
You might try using just sql update statements, as deonstrated below, and see if your system can handle it. You might be surprised. If not, there are parameters and such that can be increased.

SCOTT@orcl_11gR2> column item_id       format a8
SCOTT@orcl_11gR2> column part	       format a8
SCOTT@orcl_11gR2> column sub_part      format a8
SCOTT@orcl_11gR2> column reason        format a8
SCOTT@orcl_11gR2> column rolled_reason format a8
SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4
ITEM1    PART1             2
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3
ITEM1    PART2             1
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2
ITEM2                      2
ITEM2    PART1             1
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3
ITEM2    PART2             3
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2> UPDATE itemexcption
  2    SET rolled_reason = NULL
  3  WHERE rolled_reason IS NOT NULL;

0 rows updated.

SCOTT@orcl_11gR2> COMMIT;

Commit complete.

SCOTT@orcl_11gR2> update itemexcption a
  2  set    a.rolled_reason =
  3  	    (select rsncodes
  4  	     from   (select part, wm_concat (reason) rsncodes
  5  		     from   (select distinct part, reason
  6  			     from   itemexcption
  7  			     where  part is not null)
  8  		     group  by part) i
  9  	     where  a.part = i.part)
 10  where  a.sub_part is null;

9 rows updated.

SCOTT@orcl_11gR2> COMMIT;

Commit complete.

SCOTT@orcl_11gR2> update itemexcption a
  2  set    a.rolled_reason =
  3  	    (select rsncodes
  4  	     from   (select item_id, wm_concat (reason) rsncodes
  5  		     from   (select distinct item_id, reason
  6  			     from   itemexcption
  7  			     where  item_id is not null)
  8  		     group  by item_id) i
  9  	     where  a.item_id = i.item_id)
 10  where  a.part is null;

3 rows updated.

SCOTT@orcl_11gR2> COMMIT;

Commit complete.

SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4        1,4,3,2
ITEM1    PART1             2        1,4,2
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3        1,4,3,2
ITEM1    PART2             1        1,4,3,2
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2        1,4,3,2
ITEM2                      2        1,4,3,2
ITEM2    PART1             1        1,4,2
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3        1,4,3,2
ITEM2    PART2             3        1,4,3,2
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2>

Re: Bulk update performance issue [message #525525 is a reply to message #525524] Mon, 03 October 2011 12:23 Go to previous messageGo to next message
Barbara Boehmer
Messages: 9090
Registered: November 2002
Location: California, USA
Senior Member
You might also try adding the following before doing any updates.

create index item_reason
on itemexcption (item_id, reason)
/
create index part_reason
on itemexcption (part, reason)
/
exec dbms_stats.gather_table_stats (user, 'ITEMEXCPTION')

Re: Bulk update performance issue [message #525552 is a reply to message #525525] Mon, 03 October 2011 13:34 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member

SELECT item_id,  max(sys_connect_by_path(reason,',')) rsn_code
   FROM  (SELECT  item_id,                           reason,
              dense_rank() OVER (PARTITION BY item_id ORDER BY  reason ) rn
              FROM  itemexcption b
              WHERE b.part IS NOT NULL AND b.item_id IS NOT NULL AND b.reason IS NOT NULL                )
     GROUP BY item_id    CONNECT BY rn = PRIOR rn+1 AND item_id= PRIOR item_id    START WITH rn = 1;





Barbara, Thanks a ton for your suggestions.
Since listagg is not available in R1 and wm_concat is undocumented we cannot use it.

But the dense_rank() above is used in conjunction with sys_connect_by_path , thus concatenating and reducint the rows to process.. What do you think about the same.

Your suggestion about sql statement is good.
I would like to try that as well , and let you know if this works for me.

Thanks a lot again.

Re: Bulk update performance issue [message #525561 is a reply to message #525552] Mon, 03 October 2011 13:50 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
Also I would like to know
Quote:

as deonstrated below, and see if your system can handle it


What is the ideal situation where we can decide whether system can handle it or not ?
Re: Bulk update performance issue [message #525563 is a reply to message #525552] Mon, 03 October 2011 14:07 Go to previous messageGo to next message
Barbara Boehmer
Messages: 9090
Registered: November 2002
Location: California, USA
Senior Member
I glanced at your dense_rank too quickly and thought that you had just replaced the row_number in your previous code with dense_rank and missed the sys_connect_by_path. That should work fine with either method as demonstrated below.

SCOTT@orcl_11gR2> column item_id       format a8
SCOTT@orcl_11gR2> column part	       format a8
SCOTT@orcl_11gR2> column sub_part      format a8
SCOTT@orcl_11gR2> column reason        format a8
SCOTT@orcl_11gR2> column rolled_reason format a8
SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4
ITEM1    PART1             2
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3
ITEM1    PART2             1
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2
ITEM2                      2
ITEM2    PART1             1
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3
ITEM2    PART2             3
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2> DECLARE
  2  	TYPE item_rec IS RECORD (
  3  	   item       itemexcption.item_id%TYPE,
  4  	   rsncodes   itemexcption.reason%TYPE
  5  	);
  6  	TYPE item_tab IS TABLE OF item_rec;
  7  	mod_rec   item_tab;
  8  	itm_rec   item_tab;
  9  	TYPE itemrec IS REF CURSOR;
 10  	rec	  itemrec;
 11  	rec1	  itemrec;
 12  BEGIN
 13  	UPDATE itemexcption
 14  	  SET rolled_reason = NULL
 15  	WHERE rolled_reason IS NOT NULL;
 16  	COMMIT;
 17  	/***** Reason  Code updation Against the PARTs******************************************************/
 18  	OPEN rec FOR
 19  	   select part,
 20  		  ltrim (max (sys_connect_by_path (reason, ',')), ',') rsn_codes
 21  	   from   (select part, reason,
 22  			  dense_rank () over
 23  			    (partition by part order by reason) rn
 24  		   from   itemexcption
 25  		   where  part is not null)
 26  	   start  with rn = 1
 27  	   connect by rn = prior rn + 1
 28  	   group  by part;
 29  	LOOP
 30  	   FETCH rec
 31  	   BULK COLLECT INTO mod_rec
 32  	   LIMIT 1000;
 33  	   FORALL i IN mod_rec.FIRST .. mod_rec.LAST
 34  	   SAVE EXCEPTIONS
 35  	      update itemexcption a
 36  	      set    a.rolled_reason = mod_rec(i).rsncodes
 37  	      where  a.part = mod_rec(i).item
 38  	      and    a.sub_part is null;
 39  	   COMMIT;
 40  	   EXIT WHEN rec%NOTFOUND;
 41  	END LOOP;
 42  	CLOSE rec;
 43  	COMMIT;
 44  	/***** Reason  Code updation Against the ITEMs******************************************************/
 45  	OPEN rec FOR
 46  	   select item_id,
 47  		  ltrim (max (sys_connect_by_path (reason, ',')), ',') rsn_codes
 48  	   from   (select item_id, reason,
 49  			  dense_rank () over
 50  			    (partition by item_id order by reason) rn
 51  		   from   itemexcption
 52  		   where  item_id is not null)
 53  	   start  with rn = 1
 54  	   connect by rn = prior rn + 1
 55  	   group  by item_id;
 56  	LOOP
 57  	   FETCH rec
 58  	   BULK COLLECT INTO itm_rec
 59  	   LIMIT 1000;
 60  	   FORALL i IN itm_rec.FIRST .. itm_rec.LAST
 61  	   SAVE EXCEPTIONS
 62  	      update itemexcption a
 63  	      set    a.rolled_reason = itm_rec(i).rsncodes
 64  	      where  a.item_id = itm_rec(i).item
 65  	      and    a.part is null;
 66  	   COMMIT;
 67  	   EXIT WHEN rec%NOTFOUND;
 68  	END LOOP;
 69  	CLOSE rec;
 70  	COMMIT;
 71  END;
 72  /

PL/SQL procedure successfully completed.

SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4        1,2,3,4
ITEM1    PART1             2        1,2,4
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3        1,2,4,4
ITEM1    PART2             1        1,2,4,4
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2        1,2,3,4
ITEM2                      2        1,2,3,4
ITEM2    PART1             1        1,2,4
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3        1,2,4,4
ITEM2    PART2             3        1,2,4,4
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2>


SCOTT@orcl_11gR2> column item_id       format a8
SCOTT@orcl_11gR2> column part	       format a8
SCOTT@orcl_11gR2> column sub_part      format a8
SCOTT@orcl_11gR2> column reason        format a8
SCOTT@orcl_11gR2> column rolled_reason format a8
SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4
ITEM1    PART1             2
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3
ITEM1    PART2             1
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2
ITEM2                      2
ITEM2    PART1             1
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3
ITEM2    PART2             3
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2> UPDATE itemexcption
  2  SET rolled_reason = NULL
  3  WHERE rolled_reason IS NOT NULL;

0 rows updated.

SCOTT@orcl_11gR2> COMMIT;

Commit complete.

SCOTT@orcl_11gR2> update itemexcption a
  2  set    a.rolled_reason =
  3  	    (select rsncodes
  4  	     from   (select part,
  5  			    ltrim (max (sys_connect_by_path (reason, ',')), ',') rsncodes
  6  		     from   (select part, reason,
  7  				    dense_rank() over
  8  				      (partition by part order by reason) rn
  9  			     from   itemexcption
 10  			     where  part is not null)
 11  		     start with rn = 1
 12  		     connect by rn = prior rn + 1
 13  		     group  by part) i
 14  	     where  a.part = i.part)
 15  where  a.sub_part is null;

9 rows updated.

SCOTT@orcl_11gR2> COMMIT;

Commit complete.

SCOTT@orcl_11gR2> update itemexcption a
  2  set    a.rolled_reason =
  3  	    (select rsncodes
  4  	     from   (select item_id,
  5  			    ltrim (max (sys_connect_by_path (reason, ',')), ',') rsncodes
  6  		     from   (select item_id, reason,
  7  				    dense_rank() over
  8  				      (partition by item_id order by reason) rn
  9  			     from   itemexcption
 10  			     where  item_id is not null)
 11  		     start with rn = 1
 12  		     connect by rn = prior rn + 1
 13  		     group  by item_id) i
 14  	     where  a.item_id = i.item_id)
 15  where  a.part is null;

3 rows updated.

SCOTT@orcl_11gR2> COMMIT;

Commit complete.

SCOTT@orcl_11gR2> select *
  2  from   itemexcption
  3  order  by item_id, part nulls first, sub_part nulls first
  4  /

ITEM_ID  PART     SUB_PART REASON   ROLLED_R
-------- -------- -------- -------- --------
ITEM1                      4        1,2,3,4
ITEM1    PART1             2        1,2,4
ITEM1    PART1    SUBPART1 1
ITEM1    PART1    SUBPART2 2
ITEM1    PART2             3        1,2,4,4
ITEM1    PART2             1        1,2,4,4
ITEM1    PART2    SUBPART1 1
ITEM1    PART2    SUBPART2 3
ITEM2                      2        1,2,3,4
ITEM2                      2        1,2,3,4
ITEM2    PART1             1        1,2,4
ITEM2    PART1    SUBPART1 4
ITEM2    PART1    SUBPART2 1
ITEM2    PART2             3        1,2,4,4
ITEM2    PART2             3        1,2,4,4
ITEM2    PART2    SUBPART1 2
ITEM2    PART2    SUBPART2 4

17 rows selected.

SCOTT@orcl_11gR2>

Re: Bulk update performance issue [message #525564 is a reply to message #525561] Mon, 03 October 2011 14:10 Go to previous messageGo to next message
Barbara Boehmer
Messages: 9090
Registered: November 2002
Location: California, USA
Senior Member
nirmalnarayanans wrote on Mon, 03 October 2011 11:50
Also I would like to know
Quote:

as deonstrated below, and see if your system can handle it


What is the ideal situation where we can decide whether system can handle it or not ?


A simple SQL update is generally faster than PL/SQL. However, when you are processing that many rows, you need to make sure that your system has enough memory to handle it with overflowing. I would just test it as is and see what happens. If it completes then you do not need to do anything. If you get an error message, then base your actions on the error message.
Re: Bulk update performance issue [message #525862 is a reply to message #525564] Thu, 06 October 2011 06:26 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member

 46  	   select item_id,
 47  		  ltrim (max (sys_connect_by_path (reason, ',')), ',') rsn_codes
 48  	   from   (select item_id, reason,
 49  			  dense_rank () over
 50  			    (partition by item_id order by reason) rn
 51  		   from   itemexcption
 52  		   where  item_id is not null)
 53  	   start  with rn = 1
 54  	   connect by rn = prior rn + 1
 55  	   group  by item_id;



The above code is giving an issue with sys_connect_by_path in the following scenario.

For a certain item_id='0700-0787' has got duplicate values against of 500 records with reason=1 and with same part and sub_part as null. Total no. of records for this item is 700

The distinct values of reason is 1,2,4 against this item_id.

If I run the query on this 500 recordset alone the sys_connect_by_path rollups correctly to 1,2,4 for Rolled_reason.

But since this 700 records is subset of a large table with 8 million records, where lot of item_ids have duplicate records like this against them, sys_connect_by_path is failing.

Against this item_id mentioned above the Rolled_reason values was only 1. It did'nt roll up 1,2,4 as final value.

Is this because sys_connect_by_path has some short comings working against large data set ? Is this a bug with sys_connect_by_path.

Anyone came across such issue.

You need to test this with a large table with lot of duplicate records, to encounter this issue.
Re: Bulk update performance issue [message #525875 is a reply to message #525862] Thu, 06 October 2011 07:26 Go to previous messageGo to next message
Barbara Boehmer
Messages: 9090
Registered: November 2002
Location: California, USA
Senior Member
Any sql varchar2 column result is going to be limited to 4000 characters, no matter what aggregation technique you use. So, that may not work for you.
Re: Bulk update performance issue [message #525879 is a reply to message #525390] Thu, 06 October 2011 08:16 Go to previous messageGo to next message
Roachcoach
Messages: 1576
Registered: May 2010
Location: UK
Senior Member
nirmalnarayanans wrote on Sun, 02 October 2011 10:13
Hard luck. Tried many options available in Oracle, it did'nt work.

Finally we decided to go for another DB, i.e. SQL Server.

Loaded same volume (8 million ) of data in SQL Server and it completed in 1 hour 25 minuts. Where Oracle had taken 5 hours and 40 minutes to complete the job.

Lessons learnt.: Oracle is good, if you are playing with a low volume of data. Otherwise it will never going to work. Telling this after spending more than a week trying many options avaiable in Oracle.


8 million rows is tiny....

Your hardware needs better hamsters Smile
Re: Bulk update performance issue [message #525880 is a reply to message #525875] Thu, 06 October 2011 08:17 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
Barbara,

When I said there are duplicate records, the distinct value in this column can be only 4, i.e, 1,2, 3,4. so there is no chance the length can go beyond 8 characters.

But since the sys_connect_by_path has to loop through so many duplicate records, it is not able to connect to the second distinct, even though the inner query with dense_rank() gets these 4 distinct values.

for eg. this is how the data will be

  item_id   part  sub_part reason
  ---------------------------------
   0070787                   4
   0070787  part1            1
   0070787  part1            1
   0070787  part1            1
   0070787  part1   subpart  1
   0070787  part1   subpart  1
   0070787  part1   subpart  1
   0070787  part1   subpart  1
   0070787  part1   subpart  1
   0070787  part1            1
   0070787  part2            1
   0070787  part2            1
   0070787  part2            1
   0070787  part2            1
   0070787  part2            1
   0070787  part3            2
   0070787  part3            2
   0070787  part3            2
   0070787  part3            2
   0070787  part3            2

like this the records are repeated with values (1 or 2 or 3 or 4)  for 500 times ( n times for 1, n times for 2 like that..)

the query

 46  	   select item_id,
 47  		  ltrim (max (sys_connect_by_path (reason, ',')), ',') rsn_codes
 48  	   from   (select item_id, reason,
 49  			  dense_rank () over
 50  			    (partition by item_id order by reason) rn
 51  		   from   itemexcption
 52  		   where  item_id is not null)
 53  	   start  with rn = 1
 54  	   connect by rn = prior rn + 1
 55  	   group  by item_id;




The dense_rank is getting the distinct values, i.e, 4,1,2
but since the table has around 8 million records with reason ( 1 or 2 or 3 or 4 ) maximum length of rollup will be 8 ( i.e., length of rolled up value 1,2,3,4, ). To get this max string of 8 characters it sys_connect_by_path has to loop through the entire table. Here it fails and just gets the value as 4, which is incorrect rollup of the values returned by dense_rank ( i.e., 4,1,2 )..

I think this is where sys_connect_by_path failing. It may be a bug.

To verify this I extracted only 500 records into another table from the big table, and run the same query on the table with small data set.

It rolled up correctly to 4,1,2, this time.

Re: Bulk update performance issue [message #525881 is a reply to message #525879] Thu, 06 October 2011 08:21 Go to previous messageGo to next message
ninan
Messages: 163
Registered: June 2011
Location: Noida
Senior Member
Hardware in the sense the Oracle Server.

How can I know the configuration of the Oracle Server.

If I get the DB information will if help you suggest , if this is a problem with DB Configuration.

Can you please help me with the query to get the DB Configuration information ?
Re: Bulk update performance issue [message #525886 is a reply to message #525881] Thu, 06 October 2011 08:54 Go to previous messageGo to next message
Roachcoach
Messages: 1576
Registered: May 2010
Location: UK
Senior Member
Ask your sysadmin

The below operations, whilst not identical to yours, were run on a laptop with 4 cores - bog standard work issue - not a fancy one. Took approximately 30-40 minutes all in, the update took about 17 minutes.

create table t nologging as select * from dba_objects
/

create table t2 nologging as select * from dba_objects
/

select count(*) from t
/

alter session enable parallel dml
/

begin
for i in 1..150 loop
insert /*+ append parallel(2)*/ into t select * from t2;
commit;
end loop;
end;
/

select count(*) from t
/

alter table t add test_col number
/

update t set test_col = (object_id * dbms_random.value() )
/


10,965,921 rows updated.



As I say - not identical to yours - but 8 million rows isn't huge.
Re: Bulk update performance issue [message #528677 is a reply to message #525886] Wed, 26 October 2011 06:48 Go to previous messageGo to next message
Kevin Meade
Messages: 2103
Registered: December 1999
Location: Connecticut USA
Senior Member
Quote:
Lessons learnt.: Oracle is good, if you are playing with a low volume of data. Otherwise it will never going to work. Telling this after spending more than a week trying many options avaiable in Oracle.


If you really concluded this then maybe you are better off on SQLSERVER because you clearly don't appreciate what it is you have. SQLSERVER is a toy database compared to Oracle and Oracle will outperform SQLSERVER and any other database in terms of capacity, scalability, functionality, and speed in almost every situation. However, any database can only do so much to fix bad code.

Without spending lots of time trying to decipher your code, I would suggest the following, which is pretty much what everyone else is saying:

1) you should construct the solution set as a set of rows first using a query
2) then update your table based on the solution set

This approach is warranted by the nature of your hierarchical requirements and your need to update the table you are reading. It allows you to avoid performance costs of things likes going to the rollback segment to rebuild blocks because you are updating the same table you are reading.

Additionally you should consider that your app may be flawed in design because of its need to carry redundant data. This is one reason why the suggestion has been put forth to query the data you need when you need it rather than update ahead of time.

Good luck on SQLSERVER. Kevin
Re: Bulk update performance issue [message #529072 is a reply to message #528677] Fri, 28 October 2011 10:06 Go to previous messageGo to next message
Vackar
Messages: 81
Registered: October 2007
Member
Kevin Meade wrote on Wed, 26 October 2011 06:48
Quote:
Lessons learnt.: Oracle is good, if you are playing with a low volume of data. Otherwise it will never going to work. Telling this after spending more than a week trying many options avaiable in Oracle.


If you really concluded this then maybe you are better off on SQLSERVER because you clearly don't appreciate what it is you have. SQLSERVER is a toy database compared to Oracle and Oracle will outperform SQLSERVER and any other database in terms of capacity, scalability, functionality, and speed in almost every situation. However, any database can only do so much to fix bad code.

....
Good luck on SQLSERVER. Kevin


I'd have to agree with that. Generally when queries are taking hours, it's becuase you're doing something silly with your code. Fix that 'silly' thing and nothing will beat Oracle - I've yet to come accross a real world example of any RDBMS solution outperforming Oracle.
Re: Bulk update performance issue [message #529221 is a reply to message #529072] Sat, 29 October 2011 19:54 Go to previous message
Kevin Meade
Messages: 2103
Registered: December 1999
Location: Connecticut USA
Senior Member
The problem with your update may be those bitmap indexes. Your update is updating I am guessing half of the rows in the table or more. I have seen great abuse of bitmap indexes. Most people don't understand what they are really for and how to use them.

For this update I would do something like the following. I have not checked any of the sql for syntax, I leave that to you.

Quote:
1) do not allow the query to use any of the bitmap indexes on the itemexcption table. This is killing you. Just doing this may be enough to get the speed you want.

2) use SQL like the following. Substitute the appropriate string concatenation method for your version of Oracle. NOTICE THE APPROACH

A) first build your answer set
B) then update the table
C) you can even create a new table

Unless you are working on some slow machines, or have other issues, this update should get done in 10 minutes or less. If you don't like the idea of creating an answerset first, then rewrite the updates as you see fit once you demonstrate the timings you want using these methods.

You should see your query doing FULL TABLE SCANS and variations of HASH JOINS in order to query the data. If you are using indexes for a query that looks at everything, the stop that.

Good luck, Kevin

with
      itemexcption as (
                        select 'ITEM1' item_id,'' part,'' subpart,'4' reason from dual union all
                        select 'ITEM1' item_id,'PART1' part,'' subpart,'2' reason from dual union all
                        select 'ITEM1','PART2','','3' from dual union all
                        select 'ITEM1','PART1','SUBPART1','1' from dual union all
                        select 'ITEM1','PART1','SUBPART2','2' from dual union all
                        select 'ITEM1','PART2','','1' from dual union all
                        select 'ITEM1','PART2','SUBPART1','1' from dual union all
                        select 'ITEM1','PART2','SUBPART2','3' from dual
                      )
select *
from itemexcption
order by item_id,part nulls first,subpart nulls first,reason
/

with
      itemexcption as (
                        select 'ITEM1' item_id,'' part,'' subpart,'4' reason from dual union all
                        select 'ITEM1' item_id,'PART1' part,'' subpart,'2' reason from dual union all
                        select 'ITEM1','PART2','','3' from dual union all
                        select 'ITEM1','PART1','SUBPART1','1' from dual union all
                        select 'ITEM1','PART1','SUBPART2','2' from dual union all
                        select 'ITEM1','PART2','','1' from dual union all
                        select 'ITEM1','PART2','SUBPART1','1' from dual union all
                        select 'ITEM1','PART2','SUBPART2','3' from dual
                      )
   , distinct_list as (
                        select distinct item_id,reason
                        from itemexcption
                      )
select *
from distinct_list
/

with
      itemexcption as (
                        select 'ITEM1' item_id,'' part,'' subpart,'4' reason from dual union all
                        select 'ITEM1' item_id,'PART1' part,'' subpart,'2' reason from dual union all
                        select 'ITEM1','PART2','','3' from dual union all
                        select 'ITEM1','PART1','SUBPART1','1' from dual union all
                        select 'ITEM1','PART1','SUBPART2','2' from dual union all
                        select 'ITEM1','PART2','','1' from dual union all
                        select 'ITEM1','PART2','SUBPART1','1' from dual union all
                        select 'ITEM1','PART2','SUBPART2','3' from dual
                      )
   , distinct_list as (
                        select distinct item_id,reason
                        from itemexcption
                      )
--
-- substitute the best available string aggregation method for your version of Oracle
-- try to stay away from PLSQL functions if possible
--
   , solution_11g as (
                       select item_id,listagg(reason,',') within group (order by reason) rolled_reason
                       from distinct_list
                       group by item_id
                     )
select *
from solution_11g 
/


create table kev_item_temp
nologging
as
with
     distinct_list as (
                        select distinct item_id,reason
                        from itemexcption
                        where item_id is not null
                      )
   , solution_11g as (
                       select item_id,listagg(reason,',') within group (order by reason) rolled_reason
                       from distinct_list
                       group by item_id
                     )
select *
from solution_11g 
/

update itemexcption set
        rolled_reason = (
                          select rolled_reason
                          from kev_item_temp
                          where kev_item_temp.item_id = itemexcption.item_id
                        )
where part is null
/


create table kev_item_part_temp
nologging
as
with
     distinct_list as (
                        select distinct item_id,part,reason
                        from itemexcption
                        where part is not null
                      )
   , solution_11g as (
                       select item_id,part,listagg(reason,',') within group (order by reason) rolled_reason
                       from distinct_list
                       group by item_id,part
                     )
select *
from solution_11g 
/

update itemexcption set
        rolled_reason = (
                          select rolled_reason
                          from kev_item_part_temp
                          where kev_item_part_temp.item_id = itemexcption.item_id
                          and kev_item_part_temp.part_id = itemexcption.part_id
                        )
where subpart is null
/

create table new_itemexcption
nologging
as
select   itemexcption.item_id
       , itemexcption.part
       , itemexcption.reason
       , case when itemexcption.part is not null 
                then kev_item_part_temp.rolled_reason 
              else kev_item_temp.rolled_reason 
         end rolled_reason
from   itemexcption
     , kev_item_temp
     , kev_item_part_temp
where itemexcption.item_id = kev_item_temp.item_id
and itemexcption.item_id = kev_item_part_temp.item_id(+)
and itemexcption.part = kev_item_part_temp.part_id(+)
and subpart is null
/

[Updated on: Sun, 30 October 2011 01:33] by Moderator

Report message to a moderator

Previous Topic: buffer busy wait
Next Topic: Parallelism in queries
Goto Forum:
  


Current Time: Tue Apr 23 07:52:30 CDT 2024