CSC662
CSC662 Data mining, Data
warehouse and Visualization . . ก !
""#$$ "#%$ &'ก# ()
2 Data
*+(
,--ก.-
Call center
Weather
Contact lenses
Irises
CPU performance
Labor negotiations
Soybean classification
3 Data
* :&/%-:&/)ก0#%,%&/
)ก0#%,%&/
"-# %",ก$
$)1%-
,--ก.- CSC662
4 Data
CallCenterPivot.xls: 25975 ระเบียน : 24 ลักษณะประจำ
ก2-%ก,3ก0,4!(ก5$
/)ก-0)6"5$ &ก-0))-,3ก0(1(3 %(1 ) 3 $" 1999 73 25 .)" 1999 )ก1 ,--"*ก"7*(&68ก)-1"" ก)-ก"6 )--ก&ก1""
ก2-1, transactional --61"1(6,
",ก$1-)ก0#%,%&/
Call center
5 Data
)ก0#%,%&/,9$)/")! -)3ก6()ก"*
OnHoldMins ก2-&/ก"7*( &68ก)-1""
"1,9&/&-ก(*
ServiceTimeMins ก2-&/ก")--ก &ก1""
&2& "1,9&/&-ก(*
)ก0#%,%&/*&%7ก,9ก1"* ()ก" ,%ก"
5$ 7/ก" $(ก )ก0#%
,4!(-8*+:-$$)+- "5)-5,4!( )- %)-
"78)ก
$) Call center
6 Data
CallID ()-)3กกก-ก
CustomerType (),%ก"
AppType (),ก
ProbType (),4!(
ArrivalBinID()
AppName *,ก
SuiteName *,ก/)ก)+
CustomerName *ก"%-6
$ Call center ( ๑ )
7 Data
Region ()-)3กกก-ก
State ):ก"1
Industry )ก0#%$(กก"
ProbName *,4!(
Complexity ,"5)-5,4!(&),9%)- Easy Medium Difficult
WeeklyHourBin ())(3),(
Date )
DOW ())(3),(
$ Call center ( ๒ )
8 Data
Hour )
Week ),(
Month *
Year ,;
Quarter ก1*
StaffLevel %)-"78)ก
$)11 1, 5, 4, 2, 1, Access, MS Office, M Research, Midwest, MI, Consulting, Basic use, Easy, 1, 10/3/1999, 1, 1, 41, 10, 1999, 4, 4, 0, 15.42
$ Call center ( ๓ )
9 Data
weather.nominal.arff, weather.arff: 14 ระเบียน : 5 ลักษณะประจำ
,9$ 8*3ก0)+$.ก/(*
$ก("$)ก&)ก1)ก',%(3
outlook 8ก
temperature #( ,9&/ weather.arff
humidity "*+ ,9&/ weather.arff
windy 88)
play ,9)ก0#%,%&/, ("1"* yes (* no
-# 61ก(6,%61,ก$
$)1 1 rainy, mild, high, TRUE, no
Weather
10 Data
contact-lenses.arff: 24 ระเบียน : 5 ลักษณะประจำ
6&กก&<)$&$ก)-&)ก08 $1+7ก ,&"6617/6,&6
age -กก1)-ก$&
spectacle-prescrip ก1ก
astigmatism -ก",ก$ก%&ก$
tear-prod-rate -ก)$ก$+/$
contact-lenses )ก0#%,%&/, ("1 none, soft, hard "-# %61,ก$
$)1 1 young, myope, no, normal, soft
Contact lenses
11 Data
iris.arff: 150 ระเบียน : 5 ลักษณะประจำ
-)3ก8). 68). "* iris setosa, iris versicolor, iris virginica 6&ก R. A. Fisher -)3ก)ก-+%ก)- ก 8*/$)8). 6+
sepallength "ก-+
sepalwidth "กก-+
petallength "ก-ก
petalwidth "กก-ก
class )ก0#%,%&/, ("1"* setosa, versicolor, virginica "-# %61,ก$
$)1 1 7.2, 3.2, 6.0, 1.8, Iris-virginica
Irises
12 Data
cpu.arff: 209 ระเบียน : 7 ลักษณะประจำ
-)3ก"2)8). ก,%$"2(1 ,% *+(1"&/()ก (1"&/" 1ก$$1
MYCT "2(1,%
MMIN ,#(1"&/()ก$/
MMAX ,#(1"&/()ก
CACH ,#(1"&/"
CHMIN ,#(1"&/"$/
CHMAX ,#(1"&/"
class )ก0#%,%&/, ("1,9&/$2
CPU performance
13 Data
"-#
$1%)ก0#%,%&/ก$ก$1ก)
)ก0#%,%&/, ("1",,
$)1 1
29.0, 8000.0, 32000.0, 32.0, 8.0, 32.0, 253.0
23.0, 16000.0, 64000.0, 64.0, 16.0, 32.0, 749.0
23.0, 32000.0, 64000.0, 128.0, 32.0, 64.0, 1238.0
CPU performance (cont.)
14 Data
labor.arff: 57 ระเบียน : 17 ลักษณะประจำ
&กก$ก)!!,%",; 1987 % 1988 )!!/ก).ก&%-ก1$)&ก 500 ก )!!/
&7*1/2&(*61/2&-)3ก)ก0#%,%&/ class
duration %%)!!
wage-increase-first-year "1&83+,;ก
wage-increase-second-year "1&83+,;
wage-increase-third-year "1&83+,;
cost-of-living-adjustment "1&1,%&/),)-ก
working-hours &/)/$1),(
Labor negotiations
15 Data
pension *ก0#
standby-pay &1
shift-differential $1
education-allowance "1ก3ก0
statutory-holidays )(
vacation ก8)ก
longterm-disability-assistance ก1(*1"8ก
%%
contribution-to-dental-plan )$ก
bereavement-assistance ก1(*<ก<&กก!
contribution-to-health-plan 8
class )ก0#%,%&/, (" bad/good
Labor negotiations
16 Data
61"-# $1)ก0#%,%&/, ("-#
61,ก$
$)1 1
2.0, 2.5, 2.5, ?, ?, 38.0, empl_contr, ?, ?, ?, 10.0, average, ?, ?, ?, ?, bad
2.0, 4.5, 4.0, ?, ?, 40.0, ?, ?, 2.0, no, 10.0, below_average, no, half, ?, half, bad
Labor negotiations
17 Data
soybean.arff: 683 ระเบียน : 36 ลักษณะประจำ
ก-ก"$7)(*6&ก/&"$7) (*8ก2-)ก0#%,%&/ 35 )ก0#% "$7))+( 19
date *ก
plant-stand )ก0#%/$
precip )ก0#%ก*,-ก)-,ก$
temp #(
hail ก(2-
crop-hist ,%)$ก,ก
area-damaged 8*+(
severity "
Soybean classification
18 Data
seed-tmt ก&)ก28).
germination )ก0#%ก$-$&ก2
plant-growth ก$/$7)
leaves )ก0#%-
leafspots-halo &---,9
leafspots-marg &--
leaf-shread )ก0#%--- shread
leaf-malf )ก0#%--- malf
leaf-mild )ก0#%--- mild
stem )ก0#%ก1/$
lodging )ก0#%ก,ก,
Soybean classification
19 Data
stem-cankers )ก0#%/$1,9"
canker-lesion 1,9"
fruiting-bodies 1
external-decay )ก0#%กก
mycelium ก,ก= mycelium
int-discolor ,6,
sclerotia ก,ก= sclerotia
fruit-pods ,1
fruit-spots &
seed )ก0#%2
mold-growth )ก0#%ก$ mold
Soybean classification
20 Data
seed-discolor ",ก$2
seed-size 2
shriveling )ก0#%ก+/
roots ก
class )ก0#%,%&/, ( 19"1
61-# %61,ก$
$)1 1 october, normal, gt-norm, norm, yes, same-lst-yr, low-areas, pot-severe, none, 90-100, abnorm, abnorm, absent, dna, dna, absent, absent, absent, abnorm, no, above-sec-nde, brown, present, firm-and-dry, absent, none, absent, norm, dna, norm, absent, absent, norm, absent, norm, diaporthe-stem-canker