On Wed, Feb 11, 2009 at 02:37:21PM -0600, David DeWitt wrote: > So that Erik Paulson can participate let's do this as a conf call. > > Phone number is > > >866-500-6738 > > >Participant code is: 3383288 > > Thanks > David This might be useful - here's the exact sequence of events I run to setup the database: db2 create database cacm on '/scratch.1/db2data/cacm' dbpath on '/scratch.1/db2data/cacm' db2 connect to cacm db2 create bufferpool cacmbuffer size 16384 pagesize 32K numblockpages 14741 blocksize 64 db2 create tablespace cacmts pagesize 32K managed by automatic storage extentsize 64 bufferpool cacmbuffer db2 'CREATE TABLE Rankings( pageRank INT, pageURL VARCHAR(100), avgDuration INT) in cacmts distribute by hash(pageURL)' db2 'create index rankindx on Rankings(pageRank) CLUSTER' db2 disconnect cacm /common/tmp/epaulson/load_rankings_data.pl pssh -p 5 -t 6000 -h /common/tmp/epaulson/machines-152-200 -o /tmp/rankings-loads /common/tmp/epaulson/load_rankings_data.pl db2 connect to cacm db2 'CREATE TABLE UserVisits( sourceIPAddr VARCHAR(16), destinationURL VARCHAR(100), visitDate DATE, adRevenue FLOAT, UserAgent VARCHAR(64), cCode CHAR(3), lCode CHAR(6), sKeyword VARCHAR(32), avgTimeOnSite INT) in cacmts distribute by hash(destinationURL)' db2 'create index uvindx on UserVisits(visitDate) cluster' db2 disconnect cacm pssh -p 5 -t 6000 -h /common/tmp/epaulson/machines-152-200 -o /tmp/uservists-loads /common/tmp/epaulson/load_uservisits_data.pl /common/tmp/epaulson/load_uservisits_data.pl db2 update db cfg for cacm using sortheap 131072 pssh -p 1 -h /common/tmp/epaulson/machines-152-200 -o /tmp/sortupdate -t 600 db2 update db cfg for cacm using sortheap 131072 db2 update db cfg for cacm using sheapthres_shr 131072 pssh -p 1 -h /common/tmp/epaulson/machines-152-200 -o /tmp/sortupdate -t 600 db2 update db cfg for cacm using sheapthres_shr 131072 db2 connect to cacm db2 alter table UserVisits compress yes db2 alter table Rankings compress yes db2 create system temporary tablespace tmptbsp pagesize 32K managed by automatic storage extentsize 64 bufferpool cacmbuffer date ; db2 reorg table rankings use tmptbsp ; date ; db2 reorg table uservisits use tmptbsp ; date date; db2 reorg indexes all for table UserVisits; date; db2 reorg indexes all for table Rankings; date db2 runstats on table db2inst1.UserVisits for indexes all; db2 runstats on table db2inst1.Rankings for indexes all; db2 'create table data (attr1 char(10), attr2 char(90)) in cacmts' db2 disconnect cacm #make sure grepdata is the right size /common/tmp/epaulson/load_grep_data.pl date; pssh -p 5 -t 6000 -h /common/tmp/epaulson/machines-152-200 -o /tmp/grepdata-loads /common/tmp/epaulson/load_grep_data.pl db2 connect to cacm db2 alter table data compress yes date; db2 reorg table data use tmptbsp; date load_uservisits: #!/bin/sh db2 connect to cacm db2 load from '/scratch.1/arasin/MRData/UserVisits.dat' of del modified by anyorder NOCHARDEL COLDEL\| insert into UserVisits\(sourceIPAddr, destinationURL, visitDate, adRevenue, UserAgent, cCode, lCode, sKeyword, avgTimeOnSite\); db2 disconnect cacm load_rankings: #!/bin/sh db2 connect to cacm db2 load from '/scratch.1/arasin/MRData/Rankings.dat' of del modified by anyorder NOCHARDEL COLDEL\| insert into Rankings\(pageRank, pageURL, avgDuration\); db2 disconnect cacm