Demo 0 | Demo 1 | Demo 2 | Demo 3 | Demo 4 | Demo 5 | Code | Matt Smith

Demo 2

Array
(
    [1] => data
    [2] => mining
    [4] => wikipedia
    [5] => data
    [6] => mining
    [8] => wikipedia
    [10] => free
    [11] => encyclopedia
    [12] => jump
    [14] => navigation
    [15] => search
    [19] => confused
    [21] => analytics
    [22] => information
    [23] => extraction
    [25] => data
    [26] => analysis
    [27] => machine
    [28] => learning
    [30] => data
    [31] => mining
    [32] => problems
    [33] => classification
    [34] => clustering
    [35] => regression
    [36] => anomaly
    [37] => detection
    [38] => association
    [39] => rules
    [40] => reinforcement
    [41] => learning
    [42] => structured
    [43] => prediction
    [44] => feature
    [45] => engineering
    [46] => feature
    [47] => learning
    [48] => online
    [49] => learning
    [50] => semi-supervised
    [51] => learning
    [52] => unsupervised
    [53] => learning
    [54] => learning
    [56] => rank
    [57] => grammar
    [58] => induction
    [59] => supervised
    [60] => learning
    [61] => classification
    [62] => regression
    [63] => decision
    [64] => trees
    [65] => ensembles
    [66] => bagging
    [67] => boosting
    [68] => random
    [69] => forest
    [70] => k
    [71] => -nn
    [72] => linear
    [73] => regression
    [74] => naive
    [75] => bayes
    [76] => neural
    [77] => networks
    [78] => logistic
    [79] => regression
    [80] => perceptron
    [81] => relevance
    [82] => vector
    [83] => machine
    [84] => rvm
    [85] => support
    [86] => vector
    [87] => machine
    [88] => svm
    [89] => clustering
    [90] => birch
    [91] => cure
    [92] => hierarchical
    [93] => k
    [94] => -means
    [95] => expectation
    [96] => maximization
    [97] => em
    [98] => dbscan
    [99] => optics
    [100] => mean-shift
    [101] => dimensionality
    [102] => reduction
    [103] => factor
    [104] => analysis
    [105] => cca
    [106] => ica
    [107] => lda
    [108] => nmf
    [109] => pca
    [110] => t-sne
    [111] => structured
    [112] => prediction
    [113] => graphical
    [114] => models
    [115] => bayes
    [116] => net
    [117] => crf
    [118] => hmm
    [119] => anomaly
    [120] => detection
    [121] => k
    [122] => -nn
    [123] => local
    [124] => outlier
    [125] => factor
    [126] => neural
    [127] => nets
    [128] => autoencoder
    [129] => deep
    [130] => learning
    [131] => multilayer
    [132] => perceptron
    [133] => rnn
    [134] => restricted
    [135] => boltzmann
    [136] => machine
    [137] => som
    [138] => convolutional
    [139] => neural
    [140] => network
    [141] => reinforcement
    [142] => learning
    [143] => q-learning
    [144] => sarsa
    [145] => temporal
    [146] => difference
    [147] => td
    [148] => theory
    [149] => bias-variance
    [150] => dilemma
    [151] => computational
    [152] => learning
    [153] => theory
    [154] => empirical
    [155] => risk
    [156] => minimization
    [157] => occam
    [158] => learning
    [159] => pac
    [160] => learning
    [161] => statistical
    [162] => learning
    [163] => vc
    [164] => theory
    [165] => machine-learning
    [166] => venues
    [167] => nips
    [168] => icml
    [169] => ml
    [170] => jmlr
    [171] => arxiv
    [172] => cs
    [173] => lg
    [174] => related
    [175] => articles
    [176] => list
    [178] => datasets
    [180] => machine-learning
    [181] => research
    [182] => outline
    [184] => machine
    [185] => learning
    [186] => machine
    [187] => learning
    [188] => portal
    [189] => v
    [190] => t
    [191] => e
    [192] => data
    [193] => mining
    [196] => computing
    [197] => process
    [199] => discovering
    [200] => patterns
    [202] => large
    [203] => data
    [204] => sets
    [205] => involving
    [206] => methods
    [209] => intersection
    [211] => machine
    [212] => learning
    [213] => statistics
    [215] => database
    [216] => systems
    [217] => 1
    [221] => essential
    [222] => process
    [224] => intelligent
    [225] => methods
    [227] => applied
    [229] => extract
    [230] => data
    [231] => patterns
    [232] => 1
    [233] => 2
    [237] => interdisciplinary
    [238] => subfield
    [240] => computer
    [241] => science
    [242] => 1
    [243] => 3
    [244] => 4
    [247] => goal
    [250] => data
    [251] => mining
    [252] => process
    [255] => extract
    [256] => information
    [259] => data
    [260] => set
    [262] => transform
    [266] => understandable
    [267] => structure
    [271] => 1
    [275] => raw
    [276] => analysis
    [277] => step
    [279] => involves
    [280] => database
    [282] => data
    [283] => management
    [284] => aspects
    [285] => data
    [286] => pre-processing
    [287] => model
    [289] => inference
    [290] => considerations
    [291] => interestingness
    [292] => metrics
    [293] => complexity
    [294] => considerations
    [295] => post-processing
    [297] => discovered
    [298] => structures
    [299] => visualization
    [301] => online
    [302] => updating
    [303] => 1
    [304] => data
    [305] => mining
    [308] => analysis
    [309] => step
    [312] => knowledge
    [313] => discovery
    [315] => databases
    [316] => process
    [318] => kdd
    [319] => 5
    [321] => term
    [324] => misnomer
    [327] => goal
    [330] => extraction
    [332] => patterns
    [334] => knowledge
    [336] => large
    [337] => amounts
    [339] => data
    [342] => extraction
    [343] => mining
    [345] => data
    [347] => 6
    [352] => buzzword
    [353] => 7
    [356] => frequently
    [357] => applied
    [360] => form
    [362] => large-scale
    [363] => data
    [365] => information
    [366] => processing
    [367] => collection
    [368] => extraction
    [369] => warehousing
    [370] => analysis
    [372] => statistics
    [377] => application
    [379] => computer
    [380] => decision
    [381] => support
    [382] => system
    [383] => including
    [384] => artificial
    [385] => intelligence
    [386] => machine
    [387] => learning
    [389] => business
    [390] => intelligence
    [392] => book
    [393] => data
    [394] => mining
    [395] => practical
    [396] => machine
    [397] => learning
    [398] => tools
    [400] => techniques
    [402] => java
    [403] => 8
    [405] => covers
    [407] => machine
    [408] => learning
    [409] => material
    [411] => originally
    [414] => named
    [416] => practical
    [417] => machine
    [418] => learning
    [421] => term
    [422] => data
    [423] => mining
    [426] => added
    [428] => marketing
    [429] => reasons
    [430] => 9
    [434] => general
    [435] => terms
    [436] => large
    [437] => scale
    [438] => data
    [439] => analysis
    [441] => analytics
    [444] => referring
    [446] => actual
    [447] => methods
    [448] => artificial
    [449] => intelligence
    [451] => machine
    [452] => learning
    [457] => actual
    [458] => data
    [459] => mining
    [460] => task
    [463] => semi-automatic
    [465] => automatic
    [466] => analysis
    [468] => large
    [469] => quantities
    [471] => data
    [473] => extract
    [474] => previously
    [475] => unknown
    [476] => interesting
    [477] => patterns
    [480] => groups
    [482] => data
    [483] => records
    [484] => cluster
    [485] => analysis
    [486] => unusual
    [487] => records
    [488] => anomaly
    [489] => detection
    [491] => dependencies
    [492] => association
    [493] => rule
    [494] => mining
    [495] => sequential
    [496] => pattern
    [497] => mining
    [500] => involves
    [502] => database
    [503] => techniques
    [506] => spatial
    [507] => indices
    [509] => patterns
    [516] => kind
    [518] => summary
    [521] => input
    [522] => data
    [529] => analysis
    [534] => machine
    [535] => learning
    [537] => predictive
    [538] => analytics
    [542] => data
    [543] => mining
    [544] => step
    [546] => identify
    [547] => multiple
    [548] => groups
    [551] => data
    [558] => obtain
    [560] => accurate
    [561] => prediction
    [562] => results
    [565] => decision
    [566] => support
    [567] => system
    [570] => data
    [571] => collection
    [572] => data
    [573] => preparation
    [575] => result
    [576] => interpretation
    [578] => reporting
    [580] => part
    [583] => data
    [584] => mining
    [585] => step
    [588] => belong
    [592] => kdd
    [593] => process
    [595] => additional
    [596] => steps
    [598] => related
    [599] => terms
    [600] => data
    [601] => dredging
    [602] => data
    [603] => fishing
    [605] => data
    [606] => snooping
    [607] => refer
    [612] => data
    [613] => mining
    [614] => methods
    [616] => sample
    [617] => parts
    [620] => larger
    [621] => population
    [622] => data
    [623] => set
    [630] => small
    [632] => reliable
    [633] => statistical
    [634] => inferences
    [637] => made
    [640] => validity
    [643] => patterns
    [644] => discovered
    [646] => methods
    [652] => creating
    [654] => hypotheses
    [656] => test
    [659] => larger
    [660] => data
    [661] => populations
    [662] => contents
    [663] => 1
    [664] => etymology
    [665] => 2
    [666] => background
    [667] => 3
    [668] => process
    [669] => 3
    [670] => 1
    [671] => pre-processing
    [672] => 3
    [673] => 2
    [674] => data
    [675] => mining
    [676] => 3
    [677] => 3
    [678] => results
    [679] => validation
    [680] => 4
    [681] => research
    [682] => 5
    [683] => standards
    [684] => 6
    [685] => notable
    [687] => 7
    [688] => privacy
    [689] => concerns
    [691] => ethics
    [692] => 7
    [693] => 1
    [694] => situation
    [696] => europe
    [697] => 7
    [698] => 2
    [699] => situation
    [702] => united
    [703] => states
    [704] => 8
    [705] => copyright
    [706] => law
    [707] => 8
    [708] => 1
    [709] => situation
    [711] => europe
    [712] => 8
    [713] => 2
    [714] => situation
    [717] => united
    [718] => states
    [719] => 9
    [720] => software
    [721] => 9
    [722] => 1
    [723] => free
    [724] => open-source
    [725] => data
    [726] => mining
    [727] => software
    [729] => applications
    [730] => 9
    [731] => 2
    [732] => proprietary
    [733] => data-mining
    [734] => software
    [736] => applications
    [737] => 9
    [738] => 3
    [739] => marketplace
    [740] => surveys
    [741] => 10
    [744] => 11
    [745] => references
    [746] => 12
    [748] => reading
    [749] => 13
    [750] => external
    [751] => links
    [752] => etymology
    [753] => edit
    [756] => 1960s
    [757] => statisticians
    [759] => terms
    [761] => data
    [762] => fishing
    [764] => data
    [765] => dredging
    [767] => refer
    [771] => considered
    [773] => bad
    [774] => practice
    [776] => analyzing
    [777] => data
    [780] => a-priori
    [781] => hypothesis
    [783] => term
    [784] => data
    [785] => mining
    [786] => appeared
    [788] => 1990
    [791] => database
    [792] => community
    [795] => short
    [796] => time
    [798] => 1980s
    [800] => phrase
    [801] => database
    [802] => mining
    [809] => trademarked
    [811] => hnc
    [813] => san
    [814] => diego-based
    [815] => company
    [817] => pitch
    [819] => database
    [820] => mining
    [821] => workstation
    [822] => 10
    [823] => researchers
    [825] => turned
    [827] => data
    [828] => mining
    [830] => terms
    [832] => include
    [833] => data
    [834] => archaeology
    [835] => information
    [836] => harvesting
    [837] => information
    [838] => discovery
    [839] => knowledge
    [840] => extraction
    [842] => gregory
    [843] => piatetsky-shapiro
    [844] => coined
    [846] => term
    [847] => knowledge
    [848] => discovery
    [850] => databases
    [854] => workshop
    [858] => topic
    [859] => kdd-1989
    [862] => term
    [865] => popular
    [867] => ai
    [869] => machine
    [870] => learning
    [871] => community
    [874] => term
    [875] => data
    [876] => mining
    [879] => popular
    [882] => business
    [884] => press
    [885] => communities
    [886] => 11
    [889] => terms
    [890] => data
    [891] => mining
    [893] => knowledge
    [894] => discovery
    [897] => interchangeably
    [900] => academic
    [901] => community
    [903] => major
    [904] => forums
    [906] => research
    [907] => started
    [909] => 1995
    [913] => international
    [914] => conference
    [916] => data
    [917] => mining
    [919] => knowledge
    [920] => discovery
    [921] => kdd-95
    [923] => started
    [925] => montreal
    [927] => aaai
    [928] => sponsorship
    [931] => co-chaired
    [933] => usama
    [934] => fayyad
    [936] => ramasamy
    [937] => uthurusamy
    [939] => year
    [942] => 1996
    [943] => usama
    [944] => fayyad
    [945] => launched
    [947] => journal
    [949] => kluwer
    [950] => called
    [951] => data
    [952] => mining
    [954] => knowledge
    [955] => discovery
    [958] => founding
    [959] => editor-in-chief
    [962] => started
    [964] => sigkddd
    [965] => newsletter
    [966] => sigkdd
    [967] => explorations
    [968] => 12
    [970] => kdd
    [971] => international
    [972] => conference
    [975] => primary
    [976] => highest
    [977] => quality
    [978] => conference
    [980] => data
    [981] => mining
    [984] => acceptance
    [985] => rate
    [987] => research
    [988] => paper
    [989] => submissions
    [991] => 18
    [993] => journal
    [994] => data
    [995] => mining
    [997] => knowledge
    [998] => discovery
    [1001] => primary
    [1002] => research
    [1003] => journal
    [1006] => field
    [1007] => background
    [1008] => edit
    [1010] => manual
    [1011] => extraction
    [1013] => patterns
    [1015] => data
    [1017] => occurred
    [1019] => centuries
    [1020] => early
    [1021] => methods
    [1023] => identifying
    [1024] => patterns
    [1026] => data
    [1027] => include
    [1028] => bayes'
    [1029] => theorem
    [1030] => 1700s
    [1032] => regression
    [1033] => analysis
    [1034] => 1800s
    [1036] => proliferation
    [1037] => ubiquity
    [1039] => increasing
    [1040] => power
    [1042] => computer
    [1043] => technology
    [1045] => dramatically
    [1046] => increased
    [1047] => data
    [1048] => collection
    [1049] => storage
    [1051] => manipulation
    [1052] => ability
    [1054] => data
    [1055] => sets
    [1057] => grown
    [1059] => size
    [1061] => complexity
    [1062] => direct
    [1063] => hands-on
    [1064] => data
    [1065] => analysis
    [1067] => increasingly
    [1069] => augmented
    [1071] => indirect
    [1072] => automated
    [1073] => data
    [1074] => processing
    [1075] => aided
    [1078] => discoveries
    [1080] => computer
    [1081] => science
    [1084] => neural
    [1085] => networks
    [1086] => cluster
    [1087] => analysis
    [1088] => genetic
    [1089] => algorithms
    [1090] => 1950s
    [1091] => decision
    [1092] => trees
    [1094] => decision
    [1095] => rules
    [1096] => 1960s
    [1098] => support
    [1099] => vector
    [1100] => machines
    [1101] => 1990s
    [1102] => data
    [1103] => mining
    [1106] => process
    [1108] => applying
    [1110] => methods
    [1113] => intention
    [1115] => uncovering
    [1116] => hidden
    [1117] => patterns
    [1118] => 13
    [1120] => large
    [1121] => data
    [1122] => sets
    [1124] => bridges
    [1126] => gap
    [1128] => applied
    [1129] => statistics
    [1131] => artificial
    [1132] => intelligence
    [1135] => provide
    [1137] => mathematical
    [1138] => background
    [1140] => database
    [1141] => management
    [1143] => exploiting
    [1146] => data
    [1148] => stored
    [1150] => indexed
    [1152] => databases
    [1154] => execute
    [1156] => actual
    [1157] => learning
    [1159] => discovery
    [1160] => algorithms
    [1162] => efficiently
    [1163] => allowing
    [1165] => methods
    [1168] => applied
    [1171] => larger
    [1172] => data
    [1173] => sets
    [1174] => process
    [1175] => edit
    [1177] => knowledge
    [1178] => discovery
    [1180] => databases
    [1181] => kdd
    [1182] => process
    [1184] => commonly
    [1185] => defined
    [1188] => stages
    [1189] => 1
    [1190] => selection
    [1191] => 2
    [1192] => pre-processing
    [1193] => 3
    [1194] => transformation
    [1195] => 4
    [1196] => data
    [1197] => mining
    [1198] => 5
    [1199] => interpretation
    [1200] => evaluation
    [1201] => 5
    [1203] => exists
    [1207] => variations
    [1210] => theme
    [1214] => cross
    [1215] => industry
    [1216] => standard
    [1217] => process
    [1219] => data
    [1220] => mining
    [1221] => crisp-dm
    [1223] => defines
    [1225] => phases
    [1226] => 1
    [1227] => business
    [1228] => understanding
    [1229] => 2
    [1230] => data
    [1231] => understanding
    [1232] => 3
    [1233] => data
    [1234] => preparation
    [1235] => 4
    [1236] => modeling
    [1237] => 5
    [1238] => evaluation
    [1239] => 6
    [1240] => deployment
    [1243] => simplified
    [1244] => process
    [1247] => 1
    [1248] => pre-processing
    [1249] => 2
    [1250] => data
    [1251] => mining
    [1253] => 3
    [1254] => results
    [1255] => validation
    [1256] => polls
    [1257] => conducted
    [1259] => 2002
    [1260] => 2004
    [1261] => 2007
    [1263] => 2014
    [1264] => show
    [1267] => crisp-dm
    [1268] => methodology
    [1271] => leading
    [1272] => methodology
    [1275] => data
    [1276] => miners
    [1277] => 14
    [1281] => data
    [1282] => mining
    [1283] => standard
    [1284] => named
    [1287] => polls
    [1289] => semma
    [1291] => 3
    [1292] => 4
    [1293] => times
    [1296] => people
    [1297] => reported
    [1299] => crisp-dm
    [1301] => teams
    [1303] => researchers
    [1305] => published
    [1306] => reviews
    [1308] => data
    [1309] => mining
    [1310] => process
    [1311] => models
    [1312] => 15
    [1313] => 16
    [1315] => azevedo
    [1317] => santos
    [1318] => conducted
    [1320] => comparison
    [1322] => crisp-dm
    [1324] => semma
    [1326] => 2008
    [1327] => 17
    [1328] => pre-processing
    [1329] => edit
    [1331] => data
    [1332] => mining
    [1333] => algorithms
    [1338] => target
    [1339] => data
    [1340] => set
    [1343] => assembled
    [1345] => data
    [1346] => mining
    [1349] => uncover
    [1350] => patterns
    [1352] => present
    [1355] => data
    [1357] => target
    [1358] => data
    [1359] => set
    [1362] => large
    [1367] => patterns
    [1369] => remaining
    [1370] => concise
    [1374] => mined
    [1377] => acceptable
    [1378] => time
    [1379] => limit
    [1381] => common
    [1382] => source
    [1384] => data
    [1387] => data
    [1388] => mart
    [1390] => data
    [1391] => warehouse
    [1392] => pre-processing
    [1394] => essential
    [1396] => analyze
    [1398] => multivariate
    [1399] => data
    [1400] => sets
    [1402] => data
    [1403] => mining
    [1405] => target
    [1406] => set
    [1409] => cleaned
    [1410] => data
    [1411] => cleaning
    [1412] => removes
    [1414] => observations
    [1416] => noise
    [1420] => missing
    [1421] => data
    [1422] => data
    [1423] => mining
    [1424] => edit
    [1425] => data
    [1426] => mining
    [1427] => involves
    [1429] => common
    [1430] => classes
    [1432] => tasks
    [1433] => 5
    [1434] => anomaly
    [1435] => detection
    [1436] => outlier
    [1437] => change
    [1438] => deviation
    [1439] => detection
    [1441] => identification
    [1443] => unusual
    [1444] => data
    [1445] => records
    [1449] => interesting
    [1451] => data
    [1452] => errors
    [1454] => require
    [1456] => investigation
    [1457] => association
    [1458] => rule
    [1459] => learning
    [1460] => dependency
    [1461] => modelling
    [1462] => searches
    [1464] => relationships
    [1466] => variables
    [1470] => supermarket
    [1472] => gather
    [1473] => data
    [1475] => customer
    [1476] => purchasing
    [1477] => habits
    [1479] => association
    [1480] => rule
    [1481] => learning
    [1483] => supermarket
    [1485] => determine
    [1487] => products
    [1489] => frequently
    [1490] => bought
    [1495] => information
    [1497] => marketing
    [1498] => purposes
    [1502] => referred
    [1505] => market
    [1506] => basket
    [1507] => analysis
    [1508] => clustering
    [1511] => task
    [1513] => discovering
    [1514] => groups
    [1516] => structures
    [1519] => data
    [1527] => similar
    [1531] => structures
    [1534] => data
    [1535] => classification
    [1538] => task
    [1540] => generalizing
    [1542] => structure
    [1544] => apply
    [1547] => data
    [1551] => e-mail
    [1552] => program
    [1554] => attempt
    [1556] => classify
    [1558] => e-mail
    [1560] => legitimate
    [1563] => spam
    [1564] => regression
    [1565] => attempts
    [1567] => find
    [1569] => function
    [1571] => models
    [1573] => data
    [1577] => error
    [1581] => estimating
    [1583] => relationships
    [1585] => data
    [1587] => datasets
    [1588] => summarization
    [1589] => providing
    [1592] => compact
    [1593] => representation
    [1596] => data
    [1597] => set
    [1598] => including
    [1599] => visualization
    [1601] => report
    [1602] => generation
    [1603] => results
    [1604] => validation
    [1605] => edit
    [1609] => data
    [1610] => produced
    [1612] => data
    [1613] => dredging
    [1616] => bot
    [1617] => operated
    [1619] => statistician
    [1620] => tyler
    [1621] => vigen
    [1622] => apparently
    [1623] => showing
    [1625] => close
    [1626] => link
    [1630] => word
    [1631] => winning
    [1633] => spelling
    [1634] => bee
    [1635] => competition
    [1638] => number
    [1640] => people
    [1643] => united
    [1644] => states
    [1645] => killed
    [1647] => venomous
    [1648] => spiders
    [1650] => similarity
    [1652] => trends
    [1656] => coincidence
    [1657] => data
    [1658] => mining
    [1660] => unintentionally
    [1662] => misused
    [1666] => produce
    [1667] => results
    [1672] => significant
    [1678] => predict
    [1679] => future
    [1680] => behaviour
    [1684] => reproduced
    [1688] => sample
    [1690] => data
    [1692] => bear
    [1697] => results
    [1699] => investigating
    [1702] => hypotheses
    [1705] => performing
    [1706] => proper
    [1707] => statistical
    [1708] => hypothesis
    [1709] => testing
    [1711] => simple
    [1712] => version
    [1715] => problem
    [1717] => machine
    [1718] => learning
    [1722] => overfitting
    [1726] => problem
    [1728] => arise
    [1731] => phases
    [1734] => process
    [1738] => train
    [1739] => test
    [1740] => split
    [1743] => applicable
    [1750] => sufficient
    [1752] => prevent
    [1755] => happening
    [1756] => 18
    [1758] => section
    [1760] => missing
    [1761] => information
    [1763] => non-classification
    [1764] => tasks
    [1766] => data
    [1767] => mining
    [1770] => covers
    [1771] => machine
    [1772] => learning
    [1774] => expand
    [1776] => section
    [1778] => include
    [1780] => information
    [1782] => details
    [1784] => exist
    [1787] => talk
    [1788] => page
    [1789] => september
    [1790] => 2011
    [1792] => final
    [1793] => step
    [1795] => knowledge
    [1796] => discovery
    [1798] => data
    [1801] => verify
    [1804] => patterns
    [1805] => produced
    [1808] => data
    [1809] => mining
    [1810] => algorithms
    [1811] => occur
    [1814] => wider
    [1815] => data
    [1816] => set
    [1819] => patterns
    [1820] => found
    [1823] => data
    [1824] => mining
    [1825] => algorithms
    [1827] => necessarily
    [1828] => valid
    [1831] => common
    [1834] => data
    [1835] => mining
    [1836] => algorithms
    [1838] => find
    [1839] => patterns
    [1842] => training
    [1843] => set
    [1847] => present
    [1850] => general
    [1851] => data
    [1852] => set
    [1855] => called
    [1856] => overfitting
    [1858] => overcome
    [1861] => evaluation
    [1864] => test
    [1865] => set
    [1867] => data
    [1871] => data
    [1872] => mining
    [1873] => algorithm
    [1876] => trained
    [1878] => learned
    [1879] => patterns
    [1881] => applied
    [1884] => test
    [1885] => set
    [1888] => resulting
    [1889] => output
    [1891] => compared
    [1894] => desired
    [1895] => output
    [1899] => data
    [1900] => mining
    [1901] => algorithm
    [1904] => distinguish
    [1905] => spam
    [1907] => legitimate
    [1908] => emails
    [1911] => trained
    [1914] => training
    [1915] => set
    [1917] => sample
    [1918] => e-mails
    [1920] => trained
    [1922] => learned
    [1923] => patterns
    [1926] => applied
    [1929] => test
    [1930] => set
    [1932] => e-mails
    [1939] => trained
    [1941] => accuracy
    [1944] => patterns
    [1948] => measured
    [1952] => e-mails
    [1954] => correctly
    [1955] => classify
    [1957] => number
    [1959] => statistical
    [1960] => methods
    [1965] => evaluate
    [1967] => algorithm
    [1970] => roc
    [1971] => curves
    [1974] => learned
    [1975] => patterns
    [1978] => meet
    [1980] => desired
    [1981] => standards
    [1982] => subsequently
    [1987] => re-evaluate
    [1989] => change
    [1991] => pre-processing
    [1993] => data
    [1994] => mining
    [1995] => steps
    [1998] => learned
    [1999] => patterns
    [2001] => meet
    [2003] => desired
    [2004] => standards
    [2007] => final
    [2008] => step
    [2011] => interpret
    [2013] => learned
    [2014] => patterns
    [2016] => turn
    [2019] => knowledge
    [2020] => research
    [2021] => edit
    [2023] => premier
    [2024] => professional
    [2025] => body
    [2028] => field
    [2031] => association
    [2033] => computing
    [2034] => machinery
    [2035] => 's
    [2036] => acm
    [2037] => special
    [2038] => interest
    [2039] => group
    [2040] => sig
    [2042] => knowledge
    [2043] => discovery
    [2045] => data
    [2046] => mining
    [2047] => sigkdd
    [2048] => 19
    [2049] => 20
    [2051] => 1989
    [2053] => acm
    [2054] => sig
    [2056] => hosted
    [2058] => annual
    [2059] => international
    [2060] => conference
    [2062] => published
    [2064] => proceedings
    [2065] => 21
    [2068] => 1999
    [2071] => published
    [2073] => biannual
    [2074] => academic
    [2075] => journal
    [2076] => titled
    [2077] => sigkdd
    [2078] => explorations
    [2079] => 22
    [2080] => computer
    [2081] => science
    [2082] => conferences
    [2084] => data
    [2085] => mining
    [2086] => include
    [2087] => cikm
    [2088] => conference
    [2089] => acm
    [2090] => conference
    [2092] => information
    [2094] => knowledge
    [2095] => management
    [2096] => european
    [2097] => conference
    [2099] => machine
    [2100] => learning
    [2102] => principles
    [2104] => practice
    [2106] => knowledge
    [2107] => discovery
    [2109] => databases
    [2110] => kdd
    [2111] => conference
    [2112] => acm
    [2113] => sigkdd
    [2114] => conference
    [2116] => knowledge
    [2117] => discovery
    [2119] => data
    [2120] => mining
    [2121] => data
    [2122] => mining
    [2123] => topics
    [2126] => present
    [2129] => data
    [2130] => management
    [2131] => database
    [2132] => conferences
    [2136] => icde
    [2137] => conference
    [2138] => sigmod
    [2139] => conference
    [2141] => international
    [2142] => conference
    [2145] => large
    [2146] => data
    [2147] => bases
    [2148] => standards
    [2149] => edit
    [2154] => efforts
    [2156] => define
    [2157] => standards
    [2160] => data
    [2161] => mining
    [2162] => process
    [2166] => 1999
    [2167] => european
    [2168] => cross
    [2169] => industry
    [2170] => standard
    [2171] => process
    [2173] => data
    [2174] => mining
    [2175] => crisp-dm
    [2176] => 1
    [2177] => 0
    [2180] => 2004
    [2181] => java
    [2182] => data
    [2183] => mining
    [2184] => standard
    [2185] => jdm
    [2186] => 1
    [2187] => 0
    [2188] => development
    [2190] => successors
    [2193] => processes
    [2194] => crisp-dm
    [2195] => 2
    [2196] => 0
    [2198] => jdm
    [2199] => 2
    [2200] => 0
    [2202] => active
    [2204] => 2006
    [2207] => stalled
    [2209] => jdm
    [2210] => 2
    [2211] => 0
    [2213] => withdrawn
    [2215] => reaching
    [2217] => final
    [2218] => draft
    [2220] => exchanging
    [2222] => extracted
    [2223] => models
    [2229] => predictive
    [2230] => analytics
    [2232] => key
    [2233] => standard
    [2236] => predictive
    [2237] => model
    [2238] => markup
    [2239] => language
    [2240] => pmml
    [2244] => xml
    [2245] => -based
    [2246] => language
    [2247] => developed
    [2250] => data
    [2251] => mining
    [2252] => group
    [2253] => dmg
    [2255] => supported
    [2257] => exchange
    [2258] => format
    [2261] => data
    [2262] => mining
    [2263] => applications
    [2267] => suggests
    [2270] => covers
    [2271] => prediction
    [2272] => models
    [2275] => data
    [2276] => mining
    [2277] => task
    [2279] => high
    [2280] => importance
    [2282] => business
    [2283] => applications
    [2285] => extensions
    [2287] => cover
    [2290] => subspace
    [2291] => clustering
    [2294] => proposed
    [2295] => independently
    [2298] => dmg
    [2299] => 23
    [2300] => notable
    [2302] => edit
    [2303] => main
    [2304] => article
    [2305] => examples
    [2307] => data
    [2308] => mining
    [2311] => category
    [2312] => applied
    [2313] => data
    [2314] => mining
    [2315] => data
    [2316] => mining
    [2322] => digital
    [2323] => data
    [2325] => today
    [2326] => notable
    [2327] => examples
    [2329] => data
    [2330] => mining
    [2333] => found
    [2335] => business
    [2336] => medicine
    [2337] => science
    [2339] => surveillance
    [2340] => privacy
    [2341] => concerns
    [2343] => ethics
    [2344] => edit
    [2347] => term
    [2348] => data
    [2349] => mining
    [2354] => ethical
    [2355] => implications
    [2362] => mining
    [2364] => information
    [2366] => relation
    [2368] => peoples'
    [2369] => behavior
    [2370] => ethical
    [2373] => 24
    [2375] => ways
    [2378] => data
    [2379] => mining
    [2386] => cases
    [2388] => contexts
    [2389] => raise
    [2390] => questions
    [2392] => privacy
    [2393] => legality
    [2395] => ethics
    [2396] => 25
    [2399] => data
    [2400] => mining
    [2401] => government
    [2403] => commercial
    [2404] => data
    [2405] => sets
    [2407] => national
    [2408] => security
    [2410] => law
    [2411] => enforcement
    [2412] => purposes
    [2417] => total
    [2418] => information
    [2419] => awareness
    [2420] => program
    [2423] => advise
    [2425] => raised
    [2426] => privacy
    [2427] => concerns
    [2428] => 26
    [2429] => 27
    [2430] => data
    [2431] => mining
    [2432] => requires
    [2433] => data
    [2434] => preparation
    [2437] => uncover
    [2438] => information
    [2440] => patterns
    [2443] => compromise
    [2444] => confidentiality
    [2446] => privacy
    [2447] => obligations
    [2449] => common
    [2454] => occur
    [2457] => data
    [2458] => aggregation
    [2459] => data
    [2460] => aggregation
    [2461] => involves
    [2462] => combining
    [2463] => data
    [2465] => possibly
    [2468] => sources
    [2473] => facilitates
    [2474] => analysis
    [2479] => make
    [2480] => identification
    [2482] => private
    [2483] => individual-level
    [2484] => data
    [2485] => deducible
    [2488] => apparent
    [2489] => 28
    [2493] => data
    [2494] => mining
    [2496] => se
    [2499] => result
    [2502] => preparation
    [2504] => data
    [2509] => purposes
    [2512] => analysis
    [2514] => threat
    [2517] => individual's
    [2518] => privacy
    [2521] => play
    [2524] => data
    [2526] => compiled
    [2529] => data
    [2530] => miner
    [2535] => access
    [2538] => newly
    [2539] => compiled
    [2540] => data
    [2541] => set
    [2546] => identify
    [2547] => specific
    [2548] => individuals
    [2552] => data
    [2554] => originally
    [2555] => anonymous
    [2556] => 29
    [2557] => 30
    [2558] => 31
    [2561] => recommended
    [2564] => individual
    [2566] => made
    [2567] => aware
    [2572] => data
    [2574] => collected
    [2575] => 28
    [2577] => purpose
    [2580] => data
    [2581] => collection
    [2585] => data
    [2586] => mining
    [2587] => projects
    [2590] => data
    [2599] => mine
    [2601] => data
    [2605] => data
    [2608] => derivatives
    [2610] => status
    [2612] => security
    [2613] => surrounding
    [2614] => access
    [2617] => data
    [2619] => collected
    [2620] => data
    [2623] => updated
    [2624] => data
    [2628] => modified
    [2633] => anonymous
    [2636] => individuals
    [2639] => readily
    [2641] => identified
    [2642] => 28
    [2645] => de-identified
    [2646] => anonymized
    [2647] => data
    [2648] => sets
    [2650] => potentially
    [2653] => information
    [2656] => identification
    [2658] => individuals
    [2660] => occurred
    [2662] => journalists
    [2666] => find
    [2668] => individuals
    [2669] => based
    [2672] => set
    [2674] => search
    [2675] => histories
    [2678] => inadvertently
    [2679] => released
    [2681] => aol
    [2682] => 32
    [2684] => inadvertent
    [2685] => revelation
    [2687] => personally
    [2688] => identifiable
    [2689] => information
    [2690] => leading
    [2693] => provider
    [2694] => violates
    [2695] => fair
    [2696] => information
    [2697] => practices
    [2699] => indiscretion
    [2702] => financial
    [2703] => emotional
    [2705] => bodily
    [2706] => harm
    [2710] => individual
    [2713] => instance
    [2715] => privacy
    [2716] => violation
    [2718] => patrons
    [2720] => walgreens
    [2721] => filed
    [2723] => lawsuit
    [2726] => company
    [2728] => 2011
    [2730] => selling
    [2731] => prescription
    [2732] => information
    [2734] => data
    [2735] => mining
    [2736] => companies
    [2739] => turn
    [2740] => provided
    [2742] => data
    [2744] => pharmaceutical
    [2745] => companies
    [2746] => 33
    [2747] => situation
    [2749] => europe
    [2750] => edit
    [2751] => europe
    [2754] => strong
    [2755] => privacy
    [2756] => laws
    [2758] => efforts
    [2760] => underway
    [2763] => strengthen
    [2765] => rights
    [2768] => consumers
    [2771] => u
    [2772] => s
    [2773] => -e
    [2774] => u
    [2775] => safe
    [2776] => harbor
    [2777] => principles
    [2779] => effectively
    [2780] => expose
    [2781] => european
    [2782] => users
    [2784] => privacy
    [2785] => exploitation
    [2787] => u
    [2788] => s
    [2789] => companies
    [2792] => consequence
    [2794] => edward
    [2795] => snowden
    [2796] => 's
    [2797] => global
    [2798] => surveillance
    [2799] => disclosure
    [2803] => increased
    [2804] => discussion
    [2806] => revoke
    [2808] => agreement
    [2813] => data
    [2816] => fully
    [2817] => exposed
    [2820] => national
    [2821] => security
    [2822] => agency
    [2824] => attempts
    [2826] => reach
    [2828] => agreement
    [2830] => failed
    [2831] => citation
    [2832] => needed
    [2833] => situation
    [2836] => united
    [2837] => states
    [2838] => edit
    [2841] => united
    [2842] => states
    [2843] => privacy
    [2844] => concerns
    [2847] => addressed
    [2851] => congress
    [2854] => passage
    [2856] => regulatory
    [2857] => controls
    [2861] => health
    [2862] => insurance
    [2863] => portability
    [2865] => accountability
    [2866] => act
    [2867] => hipaa
    [2869] => hipaa
    [2870] => requires
    [2871] => individuals
    [2873] => give
    [2875] => informed
    [2876] => consent
    [2878] => information
    [2880] => provide
    [2883] => intended
    [2884] => present
    [2886] => future
    [2891] => article
    [2893] => biotech
    [2894] => business
    [2895] => week
    [2896] => '
    [2898] => n
    [2899] => practice
    [2900] => hipaa
    [2903] => offer
    [2905] => greater
    [2906] => protection
    [2909] => longstanding
    [2910] => regulations
    [2913] => research
    [2914] => arena
    [2915] => '
    [2918] => aahc
    [2920] => importantly
    [2922] => rule's
    [2923] => goal
    [2925] => protection
    [2927] => informed
    [2928] => consent
    [2930] => approach
    [2932] => level
    [2934] => incomprehensibility
    [2936] => average
    [2937] => individuals
    [2938] => 34
    [2940] => underscores
    [2942] => necessity
    [2944] => data
    [2945] => anonymity
    [2947] => data
    [2948] => aggregation
    [2950] => mining
    [2951] => practices
    [2952] => u
    [2953] => s
    [2954] => information
    [2955] => privacy
    [2956] => legislation
    [2959] => hipaa
    [2962] => family
    [2963] => educational
    [2964] => rights
    [2966] => privacy
    [2967] => act
    [2968] => ferpa
    [2969] => applies
    [2973] => specific
    [2974] => areas
    [2978] => law
    [2979] => addresses
    [2982] => data
    [2983] => mining
    [2986] => majority
    [2988] => businesses
    [2991] => u
    [2992] => s
    [2995] => controlled
    [2998] => legislation
    [2999] => copyright
    [3000] => law
    [3001] => edit
    [3002] => situation
    [3004] => europe
    [3005] => edit
    [3006] => due
    [3009] => lack
    [3011] => flexibilities
    [3013] => european
    [3014] => copyright
    [3016] => database
    [3017] => law
    [3019] => mining
    [3021] => in-copyright
    [3022] => works
    [3025] => web
    [3026] => mining
    [3029] => permission
    [3032] => copyright
    [3033] => owner
    [3036] => legal
    [3039] => database
    [3041] => pure
    [3042] => data
    [3044] => europe
    [3051] => copyright
    [3053] => database
    [3054] => rights
    [3056] => exist
    [3058] => data
    [3059] => mining
    [3061] => subject
    [3063] => regulations
    [3066] => database
    [3067] => directive
    [3070] => recommendation
    [3073] => hargreaves
    [3074] => review
    [3076] => led
    [3079] => uk
    [3080] => government
    [3082] => amend
    [3084] => copyright
    [3085] => law
    [3087] => 2014
    [3088] => 35
    [3091] => content
    [3092] => mining
    [3095] => limitation
    [3097] => exception
    [3101] => country
    [3104] => world
    [3109] => japan
    [3111] => introduced
    [3113] => exception
    [3115] => 2009
    [3117] => data
    [3118] => mining
    [3120] => due
    [3123] => restriction
    [3126] => copyright
    [3127] => directive
    [3129] => uk
    [3130] => exception
    [3133] => content
    [3134] => mining
    [3136] => non-commercial
    [3137] => purposes
    [3138] => uk
    [3139] => copyright
    [3140] => law
    [3146] => provision
    [3149] => overridden
    [3151] => contractual
    [3152] => terms
    [3154] => conditions
    [3156] => european
    [3157] => commission
    [3158] => facilitated
    [3159] => stakeholder
    [3160] => discussion
    [3162] => text
    [3164] => data
    [3165] => mining
    [3167] => 2013
    [3170] => title
    [3172] => licences
    [3174] => europe
    [3175] => 36
    [3177] => focus
    [3180] => solution
    [3183] => legal
    [3184] => issue
    [3186] => licences
    [3189] => limitations
    [3191] => exceptions
    [3192] => led
    [3194] => representatives
    [3196] => universities
    [3197] => researchers
    [3198] => libraries
    [3199] => civil
    [3200] => society
    [3201] => groups
    [3203] => open
    [3204] => access
    [3205] => publishers
    [3207] => leave
    [3209] => stakeholder
    [3210] => dialogue
    [3213] => 2013
    [3214] => 37
    [3215] => situation
    [3218] => united
    [3219] => states
    [3220] => edit
    [3222] => contrast
    [3224] => europe
    [3226] => flexible
    [3227] => nature
    [3230] => copyright
    [3231] => law
    [3235] => fair
    [3237] => means
    [3239] => content
    [3240] => mining
    [3242] => america
    [3247] => fair
    [3249] => countries
    [3252] => israel
    [3253] => taiwan
    [3255] => south
    [3256] => korea
    [3258] => viewed
    [3261] => legal
    [3263] => content
    [3264] => mining
    [3266] => transformative
    [3272] => supplant
    [3274] => original
    [3275] => work
    [3278] => viewed
    [3281] => lawful
    [3283] => fair
    [3288] => part
    [3291] => google
    [3292] => book
    [3293] => settlement
    [3295] => presiding
    [3296] => judge
    [3299] => case
    [3300] => ruled
    [3302] => google's
    [3303] => digitisation
    [3304] => project
    [3306] => in-copyright
    [3307] => books
    [3309] => lawful
    [3311] => part
    [3315] => transformative
    [3319] => digitisation
    [3320] => project
    [3321] => displayed
    [3325] => text
    [3327] => data
    [3328] => mining
    [3329] => 38
    [3330] => software
    [3331] => edit
    [3334] => category
    [3335] => data
    [3336] => mining
    [3338] => machine
    [3339] => learning
    [3340] => software
    [3341] => free
    [3342] => open-source
    [3343] => data
    [3344] => mining
    [3345] => software
    [3347] => applications
    [3348] => edit
    [3351] => applications
    [3355] => free
    [3356] => open
    [3357] => source
    [3358] => licenses
    [3359] => public
    [3360] => access
    [3362] => application
    [3363] => source
    [3364] => code
    [3368] => carrot2
    [3369] => text
    [3371] => search
    [3372] => results
    [3373] => clustering
    [3374] => framework
    [3375] => chemicalize
    [3376] => org
    [3378] => chemical
    [3379] => structure
    [3380] => miner
    [3382] => web
    [3383] => search
    [3384] => engine
    [3385] => elki
    [3387] => university
    [3388] => research
    [3389] => project
    [3391] => advanced
    [3392] => cluster
    [3393] => analysis
    [3395] => outlier
    [3396] => detection
    [3397] => methods
    [3398] => written
    [3401] => java
    [3402] => language
    [3403] => gate
    [3405] => natural
    [3406] => language
    [3407] => processing
    [3409] => language
    [3410] => engineering
    [3411] => tool
    [3412] => knime
    [3414] => konstanz
    [3415] => information
    [3416] => miner
    [3418] => user
    [3419] => friendly
    [3421] => comprehensive
    [3422] => data
    [3423] => analytics
    [3424] => framework
    [3425] => massive
    [3426] => online
    [3427] => analysis
    [3428] => moa
    [3430] => real-time
    [3431] => big
    [3432] => data
    [3433] => stream
    [3434] => mining
    [3436] => concept
    [3437] => drift
    [3438] => tool
    [3441] => java
    [3442] => programming
    [3443] => language
    [3444] => mepx
    [3446] => cross
    [3447] => platform
    [3448] => tool
    [3450] => regression
    [3452] => classification
    [3453] => problems
    [3454] => based
    [3457] => genetic
    [3458] => programming
    [3459] => variant
    [3460] => ml-flex
    [3462] => software
    [3463] => package
    [3465] => enables
    [3466] => users
    [3468] => integrate
    [3470] => third-party
    [3471] => machine-learning
    [3472] => packages
    [3473] => written
    [3476] => programming
    [3477] => language
    [3478] => execute
    [3479] => classification
    [3480] => analyses
    [3482] => parallel
    [3484] => multiple
    [3485] => computing
    [3486] => nodes
    [3488] => produce
    [3489] => html
    [3490] => reports
    [3492] => classification
    [3493] => results
    [3494] => mlpack
    [3495] => library
    [3497] => collection
    [3499] => ready-to-use
    [3500] => machine
    [3501] => learning
    [3502] => algorithms
    [3503] => written
    [3506] => c
    [3507] => language
    [3508] => nltk
    [3509] => natural
    [3510] => language
    [3511] => toolkit
    [3513] => suite
    [3515] => libraries
    [3517] => programs
    [3519] => symbolic
    [3521] => statistical
    [3522] => natural
    [3523] => language
    [3524] => processing
    [3525] => nlp
    [3528] => python
    [3529] => language
    [3530] => opennn
    [3531] => open
    [3532] => neural
    [3533] => networks
    [3534] => library
    [3535] => orange
    [3537] => component-based
    [3538] => data
    [3539] => mining
    [3541] => machine
    [3542] => learning
    [3543] => software
    [3544] => suite
    [3545] => written
    [3548] => python
    [3549] => language
    [3550] => r
    [3552] => programming
    [3553] => language
    [3555] => software
    [3556] => environment
    [3558] => statistical
    [3559] => computing
    [3560] => data
    [3561] => mining
    [3563] => graphics
    [3566] => part
    [3569] => gnu
    [3570] => project
    [3571] => scikit-learn
    [3574] => open
    [3575] => source
    [3576] => machine
    [3577] => learning
    [3578] => library
    [3581] => python
    [3582] => programming
    [3583] => language
    [3584] => torch
    [3586] => open
    [3587] => source
    [3588] => deep
    [3589] => learning
    [3590] => library
    [3593] => lua
    [3594] => programming
    [3595] => language
    [3597] => scientific
    [3598] => computing
    [3599] => framework
    [3601] => wide
    [3602] => support
    [3604] => machine
    [3605] => learning
    [3606] => algorithms
    [3607] => uima
    [3609] => uima
    [3610] => unstructured
    [3611] => information
    [3612] => management
    [3613] => architecture
    [3616] => component
    [3617] => framework
    [3619] => analyzing
    [3620] => unstructured
    [3621] => content
    [3624] => text
    [3625] => audio
    [3627] => video
    [3628] => originally
    [3629] => developed
    [3631] => ibm
    [3632] => weka
    [3634] => suite
    [3636] => machine
    [3637] => learning
    [3638] => software
    [3639] => applications
    [3640] => written
    [3643] => java
    [3644] => programming
    [3645] => language
    [3646] => proprietary
    [3647] => data-mining
    [3648] => software
    [3650] => applications
    [3651] => edit
    [3654] => applications
    [3658] => proprietary
    [3659] => licenses
    [3660] => angoss
    [3661] => knowledgestudio
    [3662] => data
    [3663] => mining
    [3664] => tool
    [3665] => clarabridge
    [3666] => text
    [3667] => analytics
    [3668] => product
    [3669] => kxen
    [3670] => modeler
    [3671] => data
    [3672] => mining
    [3673] => tool
    [3674] => provided
    [3676] => kxen
    [3678] => lionsolver
    [3680] => integrated
    [3681] => software
    [3682] => application
    [3684] => data
    [3685] => mining
    [3686] => business
    [3687] => intelligence
    [3689] => modeling
    [3691] => implements
    [3693] => learning
    [3695] => intelligent
    [3696] => optimization
    [3697] => lion
    [3698] => approach
    [3699] => megaputer
    [3700] => intelligence
    [3701] => data
    [3703] => text
    [3704] => mining
    [3705] => software
    [3707] => called
    [3708] => polyanalyst
    [3709] => microsoft
    [3710] => analysis
    [3711] => services
    [3712] => data
    [3713] => mining
    [3714] => software
    [3715] => provided
    [3717] => microsoft
    [3718] => netowl
    [3719] => suite
    [3721] => multilingual
    [3722] => text
    [3724] => entity
    [3725] => analytics
    [3726] => products
    [3728] => enable
    [3729] => data
    [3730] => mining
    [3731] => opentext
    [3732] => big
    [3733] => data
    [3734] => analytics
    [3735] => visual
    [3736] => data
    [3737] => mining
    [3738] => predictive
    [3739] => analysis
    [3741] => open
    [3742] => text
    [3743] => corporation
    [3744] => oracle
    [3745] => data
    [3746] => mining
    [3747] => data
    [3748] => mining
    [3749] => software
    [3751] => oracle
    [3752] => corporation
    [3753] => pseven
    [3754] => platform
    [3756] => automation
    [3758] => engineering
    [3759] => simulation
    [3761] => analysis
    [3762] => multidisciplinary
    [3763] => optimization
    [3765] => data
    [3766] => mining
    [3767] => provided
    [3769] => datadvance
    [3770] => qlucore
    [3771] => omics
    [3772] => explorer
    [3773] => data
    [3774] => mining
    [3775] => software
    [3776] => rapidminer
    [3778] => environment
    [3780] => machine
    [3781] => learning
    [3783] => data
    [3784] => mining
    [3785] => experiments
    [3786] => sas
    [3787] => enterprise
    [3788] => miner
    [3789] => data
    [3790] => mining
    [3791] => software
    [3792] => provided
    [3795] => sas
    [3796] => institute
    [3797] => spss
    [3798] => modeler
    [3799] => data
    [3800] => mining
    [3801] => software
    [3802] => provided
    [3804] => ibm
    [3805] => statistica
    [3806] => data
    [3807] => miner
    [3808] => data
    [3809] => mining
    [3810] => software
    [3811] => provided
    [3813] => statsoft
    [3814] => tanagra
    [3815] => visualisation-oriented
    [3816] => data
    [3817] => mining
    [3818] => software
    [3821] => teaching
    [3822] => vertica
    [3823] => data
    [3824] => mining
    [3825] => software
    [3826] => provided
    [3828] => hewlett-packard
    [3829] => marketplace
    [3830] => surveys
    [3831] => edit
    [3833] => researchers
    [3835] => organizations
    [3837] => conducted
    [3838] => reviews
    [3840] => data
    [3841] => mining
    [3842] => tools
    [3844] => surveys
    [3846] => data
    [3847] => miners
    [3849] => identify
    [3853] => strengths
    [3855] => weaknesses
    [3858] => software
    [3859] => packages
    [3862] => provide
    [3864] => overview
    [3867] => behaviors
    [3868] => preferences
    [3870] => views
    [3872] => data
    [3873] => miners
    [3877] => reports
    [3878] => include
    [3879] => hurwitz
    [3880] => victory
    [3881] => index
    [3882] => report
    [3884] => advanced
    [3885] => analytics
    [3888] => market
    [3889] => research
    [3890] => assessment
    [3891] => tool
    [3893] => highlights
    [3896] => diverse
    [3899] => advanced
    [3900] => analytics
    [3901] => technology
    [3904] => vendors
    [3906] => make
    [3908] => applications
    [3910] => recent-research
    [3911] => rexer
    [3912] => analytics
    [3913] => data
    [3914] => miner
    [3915] => surveys
    [3916] => 2007
    [3917] => 2015
    [3918] => 39
    [3919] => 2011
    [3920] => wiley
    [3921] => interdisciplinary
    [3922] => reviews
    [3923] => data
    [3924] => mining
    [3926] => knowledge
    [3927] => discovery
    [3928] => 40
    [3929] => forrester
    [3930] => research
    [3931] => 2010
    [3932] => predictive
    [3933] => analytics
    [3935] => data
    [3936] => mining
    [3937] => solutions
    [3938] => report
    [3939] => 41
    [3940] => gartner
    [3941] => 2008
    [3942] => magic
    [3943] => quadrant
    [3944] => report
    [3945] => 42
    [3946] => robert
    [3948] => nisbet's
    [3949] => 2006
    [3951] => part
    [3952] => series
    [3954] => articles
    [3955] => data
    [3956] => mining
    [3957] => tools
    [3963] => crm
    [3964] => 43
    [3965] => haughton
    [3967] => al
    [3968] => 's
    [3969] => 2003
    [3970] => review
    [3972] => data
    [3973] => mining
    [3974] => software
    [3975] => packages
    [3978] => american
    [3979] => statistician
    [3980] => 44
    [3981] => goebel
    [3982] => gruenwald
    [3983] => 1999
    [3985] => survey
    [3987] => data
    [3988] => mining
    [3990] => knowledge
    [3991] => discovery
    [3992] => software
    [3993] => tools
    [3995] => sigkdd
    [3996] => explorations
    [3997] => 45
    [4000] => edit
    [4001] => methods
    [4002] => agent
    [4003] => mining
    [4004] => anomaly
    [4005] => outlier
    [4006] => change
    [4007] => detection
    [4008] => association
    [4009] => rule
    [4010] => learning
    [4011] => bayesian
    [4012] => networks
    [4013] => classification
    [4014] => cluster
    [4015] => analysis
    [4016] => decision
    [4017] => trees
    [4018] => ensemble
    [4019] => learning
    [4020] => factor
    [4021] => analysis
    [4022] => genetic
    [4023] => algorithms
    [4024] => intention
    [4025] => mining
    [4026] => learning
    [4027] => classifier
    [4028] => system
    [4029] => multilinear
    [4030] => subspace
    [4031] => learning
    [4032] => neural
    [4033] => networks
    [4034] => regression
    [4035] => analysis
    [4036] => sequence
    [4037] => mining
    [4038] => structured
    [4039] => data
    [4040] => analysis
    [4041] => support
    [4042] => vector
    [4043] => machines
    [4044] => text
    [4045] => mining
    [4046] => time
    [4047] => series
    [4048] => analysis
    [4049] => application
    [4050] => domains
    [4051] => analytics
    [4052] => behavior
    [4053] => informatics
    [4054] => big
    [4055] => data
    [4056] => bioinformatics
    [4057] => business
    [4058] => intelligence
    [4059] => data
    [4060] => analysis
    [4061] => data
    [4062] => warehouse
    [4063] => decision
    [4064] => support
    [4065] => system
    [4066] => domain
    [4067] => driven
    [4068] => data
    [4069] => mining
    [4070] => drug
    [4071] => discovery
    [4072] => exploratory
    [4073] => data
    [4074] => analysis
    [4075] => predictive
    [4076] => analytics
    [4077] => web
    [4078] => mining
    [4079] => application
    [4080] => examples
    [4081] => main
    [4082] => article
    [4083] => examples
    [4085] => data
    [4086] => mining
    [4089] => category
    [4090] => applied
    [4091] => data
    [4092] => mining
    [4093] => automatic
    [4094] => number
    [4095] => plate
    [4096] => recognition
    [4099] => united
    [4100] => kingdom
    [4101] => customer
    [4102] => analytics
    [4103] => educational
    [4104] => data
    [4105] => mining
    [4106] => national
    [4107] => security
    [4108] => agency
    [4109] => quantitative
    [4110] => structure
    [4111] => activity
    [4112] => relationship
    [4113] => surveillance
    [4114] => mass
    [4115] => surveillance
    [4116] => e
    [4117] => g
    [4118] => stellar
    [4119] => wind
    [4120] => related
    [4121] => topics
    [4122] => data
    [4123] => mining
    [4126] => analyzing
    [4127] => data
    [4129] => information
    [4131] => extracting
    [4132] => information
    [4135] => data
    [4137] => data
    [4138] => integration
    [4139] => data
    [4140] => transformation
    [4141] => electronic
    [4142] => discovery
    [4143] => information
    [4144] => extraction
    [4145] => information
    [4146] => integration
    [4147] => named-entity
    [4148] => recognition
    [4149] => profiling
    [4150] => information
    [4151] => science
    [4152] => psychometrics
    [4153] => social
    [4154] => media
    [4155] => mining
    [4156] => surveillance
    [4157] => capitalism
    [4158] => web
    [4159] => scraping
    [4161] => resources
    [4162] => international
    [4163] => journal
    [4165] => data
    [4166] => warehousing
    [4168] => mining
    [4169] => references
    [4170] => edit
    [4172] => b
    [4173] => c
    [4174] => d
    [4175] => e
    [4176] => data
    [4177] => mining
    [4178] => curriculum
    [4179] => acm
    [4180] => sigkdd
    [4181] => 2006-04-30
    [4182] => retrieved
    [4183] => 2014-01-27
    [4184] => han
    [4185] => kamber
    [4186] => pei
    [4187] => jaiwei
    [4188] => micheline
    [4189] => jian
    [4190] => june
    [4191] => 9
    [4192] => 2011
    [4193] => data
    [4194] => mining
    [4195] => concepts
    [4197] => techniques
    [4198] => 3rd
    [4199] => ed
    [4200] => morgan
    [4201] => kaufmann
    [4202] => isbn
    [4203] => 978-0-12-381479-1
    [4204] => cs1
    [4205] => maint
    [4206] => multiple
    [4207] => names
    [4208] => authors
    [4209] => list
    [4210] => link
    [4211] => clifton
    [4212] => christopher
    [4213] => 2010
    [4214] => encyclop
    [4215] => dia
    [4216] => britannica
    [4217] => definition
    [4219] => data
    [4220] => mining
    [4221] => retrieved
    [4222] => 2010-12-09
    [4223] => hastie
    [4224] => trevor
    [4225] => tibshirani
    [4226] => robert
    [4227] => friedman
    [4228] => jerome
    [4229] => 2009
    [4231] => elements
    [4233] => statistical
    [4234] => learning
    [4235] => data
    [4236] => mining
    [4237] => inference
    [4239] => prediction
    [4240] => retrieved
    [4241] => 2012-08-07
    [4243] => b
    [4244] => c
    [4245] => fayyad
    [4246] => usama
    [4247] => piatetsky-shapiro
    [4248] => gregory
    [4249] => smyth
    [4250] => padhraic
    [4251] => 1996
    [4253] => data
    [4254] => mining
    [4256] => knowledge
    [4257] => discovery
    [4259] => databases
    [4260] => pdf
    [4261] => retrieved
    [4262] => 17
    [4263] => december
    [4264] => 2008
    [4265] => han
    [4266] => jiawei
    [4267] => kamber
    [4268] => micheline
    [4269] => 2001
    [4270] => data
    [4271] => mining
    [4272] => concepts
    [4274] => techniques
    [4275] => morgan
    [4276] => kaufmann
    [4277] => p
    [4278] => 5
    [4279] => isbn
    [4280] => 978-1-55860-489-6
    [4282] => data
    [4283] => mining
    [4288] => appropriately
    [4289] => named
    [4290] => knowledge
    [4291] => mining
    [4293] => data
    [4298] => long
    [4300] => e
    [4301] => g
    [4302] => okairp
    [4303] => 2005
    [4304] => fall
    [4305] => conference
    [4306] => arizona
    [4307] => state
    [4308] => university
    [4311] => datamining
    [4312] => witten
    [4313] => ian
    [4314] => h
    [4315] => frank
    [4316] => eibe
    [4317] => hall
    [4318] => mark
    [4320] => 30
    [4321] => january
    [4322] => 2011
    [4323] => data
    [4324] => mining
    [4325] => practical
    [4326] => machine
    [4327] => learning
    [4328] => tools
    [4330] => techniques
    [4331] => 3
    [4332] => ed
    [4333] => elsevier
    [4334] => isbn
    [4335] => 978-0-12-374856-0
    [4336] => bouckaert
    [4337] => remco
    [4338] => r
    [4339] => frank
    [4340] => eibe
    [4341] => hall
    [4342] => mark
    [4344] => holmes
    [4345] => geoffrey
    [4346] => pfahringer
    [4347] => bernhard
    [4348] => reutemann
    [4349] => peter
    [4350] => witten
    [4351] => ian
    [4352] => h
    [4353] => 2010
    [4354] => weka
    [4355] => experiences
    [4358] => java
    [4359] => open-source
    [4360] => project
    [4361] => journal
    [4363] => machine
    [4364] => learning
    [4365] => research
    [4366] => 11
    [4367] => 2533
    [4368] => 2541
    [4370] => original
    [4371] => title
    [4372] => practical
    [4373] => machine
    [4374] => learning
    [4376] => changed
    [4378] => term
    [4379] => data
    [4380] => mining
    [4382] => added
    [4383] => primarily
    [4385] => marketing
    [4386] => reasons
    [4387] => mena
    [4388] => jes
    [4389] => s
    [4390] => 2011
    [4391] => machine
    [4392] => learning
    [4393] => forensics
    [4395] => law
    [4396] => enforcement
    [4397] => security
    [4399] => intelligence
    [4400] => boca
    [4401] => raton
    [4402] => fl
    [4403] => crc
    [4404] => press
    [4405] => taylor
    [4406] => francis
    [4407] => group
    [4408] => isbn
    [4409] => 978-1-4398-6069-4
    [4410] => piatetsky-shapiro
    [4411] => gregory
    [4412] => parker
    [4413] => gary
    [4414] => 2011
    [4415] => lesson
    [4416] => data
    [4417] => mining
    [4419] => knowledge
    [4420] => discovery
    [4422] => introduction
    [4423] => introduction
    [4425] => data
    [4426] => mining
    [4427] => kd
    [4428] => nuggets
    [4429] => retrieved
    [4430] => 30
    [4431] => august
    [4432] => 2012
    [4433] => fayyad
    [4434] => usama
    [4435] => 15
    [4436] => june
    [4437] => 1999
    [4439] => editorial
    [4441] => editor-in-chief
    [4442] => sigkdd
    [4443] => explorations
    [4444] => 13
    [4445] => 1
    [4446] => 102
    [4447] => doi
    [4448] => 10
    [4449] => 1145
    [4450] => 2207243
    [4451] => 2207269
    [4452] => retrieved
    [4453] => 27
    [4454] => december
    [4455] => 2010
    [4456] => kantardzic
    [4457] => mehmed
    [4458] => 2003
    [4459] => data
    [4460] => mining
    [4461] => concepts
    [4462] => models
    [4463] => methods
    [4465] => algorithms
    [4466] => john
    [4467] => wiley
    [4468] => sons
    [4469] => isbn
    [4470] => 0-471-22852-4
    [4471] => oclc
    [4472] => 50055336
    [4473] => gregory
    [4474] => piatetsky-shapiro
    [4475] => 2002
    [4476] => kdnuggets
    [4477] => methodology
    [4478] => poll
    [4479] => gregory
    [4480] => piatetsky-shapiro
    [4481] => 2004
    [4482] => kdnuggets
    [4483] => methodology
    [4484] => poll
    [4485] => gregory
    [4486] => piatetsky-shapiro
    [4487] => 2007
    [4488] => kdnuggets
    [4489] => methodology
    [4490] => poll
    [4491] => gregory
    [4492] => piatetsky-shapiro
    [4493] => 2014
    [4494] => kdnuggets
    [4495] => methodology
    [4496] => poll
    [4497] => scar
    [4498] => marb
    [4499] => n
    [4500] => gonzalo
    [4501] => mariscal
    [4503] => javier
    [4504] => segovia
    [4505] => 2009
    [4507] => data
    [4508] => mining
    [4509] => knowledge
    [4510] => discovery
    [4511] => process
    [4512] => model
    [4514] => data
    [4515] => mining
    [4517] => knowledge
    [4518] => discovery
    [4520] => real
    [4521] => life
    [4522] => applications
    [4523] => book
    [4524] => edited
    [4526] => julio
    [4527] => ponce
    [4529] => adem
    [4530] => karahoca
    [4531] => isbn
    [4532] => 978-3-902613-53-0
    [4533] => pp
    [4534] => 438
    [4535] => 453
    [4536] => february
    [4537] => 2009
    [4538] => i-tech
    [4539] => vienna
    [4540] => austria
    [4541] => lukasz
    [4542] => kurgan
    [4544] => petr
    [4545] => musilek
    [4546] => 2006
    [4548] => survey
    [4550] => knowledge
    [4551] => discovery
    [4553] => data
    [4554] => mining
    [4555] => process
    [4556] => models
    [4558] => knowledge
    [4559] => engineering
    [4560] => review
    [4561] => volume
    [4562] => 21
    [4563] => issue
    [4564] => 1
    [4565] => march
    [4566] => 2006
    [4567] => pp
    [4568] => 1
    [4569] => 24
    [4570] => cambridge
    [4571] => university
    [4572] => press
    [4574] => york
    [4575] => ny
    [4576] => usa
    [4577] => doi
    [4578] => 10
    [4579] => 1017
    [4580] => s0269888906000737
    [4581] => azevedo
    [4584] => santos
    [4585] => m
    [4586] => f
    [4587] => kdd
    [4588] => semma
    [4590] => crisp-dm
    [4592] => parallel
    [4593] => overview
    [4594] => archived
    [4595] => 2013-01-09
    [4598] => wayback
    [4599] => machine
    [4601] => proceedings
    [4604] => iadis
    [4605] => european
    [4606] => conference
    [4608] => data
    [4609] => mining
    [4610] => 2008
    [4611] => pp
    [4612] => 182
    [4613] => 185
    [4614] => hawkins
    [4615] => douglas
    [4616] => m
    [4617] => 2004
    [4619] => problem
    [4621] => overfitting
    [4622] => journal
    [4624] => chemical
    [4625] => information
    [4627] => computer
    [4628] => sciences
    [4629] => 44
    [4630] => 1
    [4631] => 1
    [4632] => 12
    [4633] => doi
    [4634] => 10
    [4635] => 1021
    [4636] => ci0342472
    [4637] => microsoft
    [4638] => academic
    [4639] => search
    [4640] => top
    [4641] => conferences
    [4643] => data
    [4644] => mining
    [4645] => microsoft
    [4646] => academic
    [4647] => search
    [4648] => google
    [4649] => scholar
    [4650] => top
    [4651] => publications
    [4653] => data
    [4654] => mining
    [4655] => analysis
    [4656] => google
    [4657] => scholar
    [4658] => proceedings
    [4659] => international
    [4660] => conferences
    [4662] => knowledge
    [4663] => discovery
    [4665] => data
    [4666] => mining
    [4667] => acm
    [4669] => york
    [4670] => sigkdd
    [4671] => explorations
    [4672] => acm
    [4674] => york
    [4675] => g
    [4676] => nnemann
    [4677] => stephan
    [4678] => kremer
    [4679] => hardy
    [4680] => seidl
    [4681] => thomas
    [4682] => 2011
    [4684] => extension
    [4687] => pmml
    [4688] => standard
    [4690] => subspace
    [4691] => clustering
    [4692] => models
    [4693] => proceedings
    [4696] => 2011
    [4697] => workshop
    [4699] => predictive
    [4700] => markup
    [4701] => language
    [4702] => modeling
    [4704] => pmml
    [4705] => '11
    [4706] => p
    [4707] => 48
    [4708] => doi
    [4709] => 10
    [4710] => 1145
    [4711] => 2023598
    [4712] => 2023605
    [4713] => isbn
    [4714] => 978-1-4503-0837-3
    [4715] => seltzer
    [4716] => william
    [4718] => promise
    [4720] => pitfalls
    [4722] => data
    [4723] => mining
    [4724] => ethical
    [4725] => issues
    [4726] => pdf
    [4727] => pitts
    [4728] => chip
    [4729] => 15
    [4730] => march
    [4731] => 2007
    [4733] => end
    [4735] => illegal
    [4736] => domestic
    [4737] => spying
    [4739] => count
    [4742] => washington
    [4743] => spectator
    [4744] => archived
    [4747] => original
    [4749] => 2007-10-29
    [4750] => taipale
    [4751] => kim
    [4753] => 15
    [4754] => december
    [4755] => 2003
    [4756] => data
    [4757] => mining
    [4759] => domestic
    [4760] => security
    [4761] => connecting
    [4763] => dots
    [4765] => make
    [4766] => sense
    [4768] => data
    [4769] => columbia
    [4770] => science
    [4772] => technology
    [4773] => law
    [4774] => review
    [4775] => 5
    [4776] => 2
    [4777] => oclc
    [4778] => 45263753
    [4779] => ssrn
    [4780] => 546782
    [4781] => resig
    [4782] => john
    [4783] => teredesai
    [4784] => ankur
    [4785] => 2004
    [4787] => framework
    [4789] => mining
    [4790] => instant
    [4791] => messaging
    [4792] => services
    [4793] => proceedings
    [4796] => 2004
    [4797] => siam
    [4798] => dm
    [4799] => conference
    [4801] => b
    [4802] => c
    [4806] => dig
    [4807] => privacy
    [4808] => implications
    [4810] => data
    [4811] => mining
    [4812] => aggregation
    [4813] => archived
    [4814] => 2008-12-17
    [4817] => wayback
    [4818] => machine
    [4819] => nascio
    [4820] => research
    [4822] => september
    [4823] => 2004
    [4824] => ohm
    [4825] => paul
    [4827] => build
    [4829] => database
    [4831] => ruin
    [4832] => harvard
    [4833] => business
    [4834] => review
    [4835] => darwin
    [4836] => bond-graham
    [4837] => iron
    [4838] => cagebook
    [4841] => logical
    [4842] => end
    [4844] => facebook's
    [4845] => patents
    [4846] => counterpunch
    [4847] => org
    [4848] => 2013
    [4849] => 12
    [4850] => 03
    [4851] => darwin
    [4852] => bond-graham
    [4853] => inside
    [4855] => tech
    [4856] => industry's
    [4857] => startup
    [4858] => conference
    [4859] => counterpunch
    [4860] => org
    [4861] => 2013
    [4862] => 09
    [4863] => 11
    [4864] => aol
    [4865] => search
    [4866] => data
    [4867] => identified
    [4868] => individuals
    [4869] => securityfocus
    [4870] => august
    [4871] => 2006
    [4872] => kshetri
    [4873] => nir
    [4874] => 2014
    [4875] => big
    [4876] => data
    [4877] => s
    [4878] => impact
    [4880] => privacy
    [4881] => security
    [4883] => consumer
    [4884] => welfare
    [4885] => telecommunications
    [4886] => policy
    [4887] => 38
    [4888] => 11
    [4889] => 1134
    [4890] => 1145
    [4891] => doi
    [4892] => 10
    [4893] => 1016
    [4894] => j
    [4895] => telpol
    [4896] => 2014
    [4897] => 10
    [4898] => 002
    [4899] => biotech
    [4900] => business
    [4901] => week
    [4902] => editors
    [4903] => june
    [4904] => 30
    [4905] => 2008
    [4906] => biomedicine
    [4907] => hipaa
    [4908] => privacy
    [4909] => rule
    [4910] => impedes
    [4911] => biomedical
    [4912] => research
    [4913] => biotech
    [4914] => business
    [4915] => week
    [4916] => retrieved
    [4917] => 17
    [4918] => november
    [4919] => 2009
    [4921] => lexisnexis
    [4922] => academic
    [4923] => uk
    [4924] => researchers
    [4926] => data
    [4927] => mining
    [4931] => uk
    [4932] => copyright
    [4933] => laws
    [4934] => archived
    [4935] => june
    [4936] => 9
    [4937] => 2014
    [4940] => wayback
    [4941] => machine
    [4942] => out-law
    [4944] => retrieved
    [4945] => 14
    [4946] => november
    [4947] => 2014
    [4948] => licences
    [4950] => europe
    [4952] => structured
    [4953] => stakeholder
    [4954] => dialogue
    [4955] => 2013
    [4956] => european
    [4957] => commission
    [4958] => retrieved
    [4959] => 14
    [4960] => november
    [4961] => 2014
    [4962] => text
    [4964] => data
    [4965] => mining
    [4967] => importance
    [4972] => change
    [4974] => europe
    [4975] => association
    [4977] => european
    [4978] => research
    [4979] => libraries
    [4980] => retrieved
    [4981] => 14
    [4982] => november
    [4983] => 2014
    [4984] => judge
    [4985] => grants
    [4986] => summary
    [4987] => judgment
    [4989] => favor
    [4991] => google
    [4992] => books
    [4994] => fair
    [4996] => victory
    [4997] => lexology
    [4999] => antonelli
    [5000] => law
    [5002] => retrieved
    [5003] => 14
    [5004] => november
    [5005] => 2014
    [5006] => karl
    [5007] => rexer
    [5008] => heather
    [5009] => allen
    [5010] => paul
    [5011] => gearan
    [5012] => 2011
    [5013] => understanding
    [5014] => data
    [5015] => miners
    [5016] => analytics
    [5017] => magazine
    [5019] => june
    [5020] => 2011
    [5021] => informs
    [5022] => institute
    [5024] => operations
    [5025] => research
    [5028] => management
    [5029] => sciences
    [5030] => mikut
    [5031] => ralf
    [5032] => reischl
    [5033] => markus
    [5034] => september
    [5035] => october
    [5036] => 2011
    [5037] => data
    [5038] => mining
    [5039] => tools
    [5040] => wiley
    [5041] => interdisciplinary
    [5042] => reviews
    [5043] => data
    [5044] => mining
    [5046] => knowledge
    [5047] => discovery
    [5048] => 1
    [5049] => 5
    [5050] => 431
    [5051] => 445
    [5052] => doi
    [5053] => 10
    [5054] => 1002
    [5055] => widm
    [5056] => 24
    [5057] => retrieved
    [5058] => october
    [5059] => 21
    [5060] => 2011
    [5061] => kobielus
    [5062] => james
    [5064] => forrester
    [5065] => wave
    [5066] => predictive
    [5067] => analytics
    [5069] => data
    [5070] => mining
    [5071] => solutions
    [5072] => q1
    [5073] => 2010
    [5074] => forrester
    [5075] => research
    [5076] => 1
    [5077] => july
    [5078] => 2008
    [5079] => herschel
    [5080] => gareth
    [5081] => magic
    [5082] => quadrant
    [5084] => customer
    [5085] => data-mining
    [5086] => applications
    [5087] => gartner
    [5089] => 1
    [5090] => july
    [5091] => 2008
    [5092] => nisbet
    [5093] => robert
    [5095] => 2006
    [5096] => data
    [5097] => mining
    [5098] => tools
    [5104] => crm
    [5105] => part
    [5106] => 1
    [5107] => information
    [5108] => management
    [5109] => special
    [5110] => reports
    [5111] => january
    [5112] => 2006
    [5113] => haughton
    [5114] => dominique
    [5115] => deichmann
    [5116] => joel
    [5117] => eshghi
    [5118] => abdolreza
    [5119] => sayek
    [5120] => selin
    [5121] => teebagy
    [5122] => nicholas
    [5124] => topi
    [5125] => heikki
    [5126] => 2003
    [5128] => review
    [5130] => software
    [5131] => packages
    [5133] => data
    [5134] => mining
    [5136] => american
    [5137] => statistician
    [5138] => vol
    [5139] => 57
    [5141] => 4
    [5142] => pp
    [5143] => 290
    [5144] => 309
    [5145] => goebel
    [5146] => michael
    [5147] => gruenwald
    [5148] => le
    [5149] => 1999
    [5151] => survey
    [5153] => data
    [5154] => mining
    [5156] => knowledge
    [5157] => discovery
    [5158] => software
    [5159] => tools
    [5160] => sigkdd
    [5161] => explorations
    [5162] => vol
    [5163] => 1
    [5164] => issue
    [5165] => 1
    [5166] => pp
    [5167] => 20
    [5168] => 33
    [5170] => reading
    [5171] => edit
    [5172] => cabena
    [5173] => peter
    [5174] => hadjnian
    [5175] => pablo
    [5176] => stadler
    [5177] => rolf
    [5178] => verhees
    [5179] => jaap
    [5180] => zanasi
    [5181] => alessandro
    [5182] => 1997
    [5183] => discovering
    [5184] => data
    [5185] => mining
    [5187] => concept
    [5189] => implementation
    [5190] => prentice
    [5191] => hall
    [5192] => isbn
    [5193] => 0-13-743980-6
    [5194] => m
    [5195] => s
    [5196] => chen
    [5197] => j
    [5198] => han
    [5199] => p
    [5200] => s
    [5201] => yu
    [5202] => 1996
    [5203] => data
    [5204] => mining
    [5206] => overview
    [5209] => database
    [5210] => perspective
    [5211] => knowledge
    [5213] => data
    [5214] => engineering
    [5215] => ieee
    [5216] => transactions
    [5218] => 8
    [5219] => 6
    [5220] => 866
    [5221] => 883
    [5222] => feldman
    [5223] => ronen
    [5224] => sanger
    [5225] => james
    [5226] => 2007
    [5228] => text
    [5229] => mining
    [5230] => handbook
    [5231] => cambridge
    [5232] => university
    [5233] => press
    [5234] => isbn
    [5235] => 978-0-521-83657-9
    [5236] => guo
    [5237] => yike
    [5239] => grossman
    [5240] => robert
    [5241] => editors
    [5242] => 1999
    [5243] => high
    [5244] => performance
    [5245] => data
    [5246] => mining
    [5247] => scaling
    [5248] => algorithms
    [5249] => applications
    [5251] => systems
    [5252] => kluwer
    [5253] => academic
    [5254] => publishers
    [5255] => han
    [5256] => jiawei
    [5257] => micheline
    [5258] => kamber
    [5260] => jian
    [5261] => pei
    [5262] => data
    [5263] => mining
    [5264] => concepts
    [5266] => techniques
    [5267] => morgan
    [5268] => kaufmann
    [5269] => 2006
    [5270] => hastie
    [5271] => trevor
    [5272] => tibshirani
    [5273] => robert
    [5275] => friedman
    [5276] => jerome
    [5277] => 2001
    [5279] => elements
    [5281] => statistical
    [5282] => learning
    [5283] => data
    [5284] => mining
    [5285] => inference
    [5287] => prediction
    [5288] => springer
    [5289] => isbn
    [5290] => 0-387-95284-5
    [5291] => liu
    [5292] => bing
    [5293] => 2007
    [5294] => web
    [5295] => data
    [5296] => mining
    [5297] => exploring
    [5298] => hyperlinks
    [5299] => contents
    [5301] => usage
    [5302] => data
    [5303] => springer
    [5304] => isbn
    [5305] => 3-540-37881-2
    [5306] => murphy
    [5307] => chris
    [5308] => 16
    [5310] => 2011
    [5312] => data
    [5313] => mining
    [5314] => free
    [5315] => speech
    [5316] => informationweek
    [5317] => umb
    [5318] => 12
    [5319] => nisbet
    [5320] => robert
    [5321] => elder
    [5322] => john
    [5323] => miner
    [5324] => gary
    [5325] => 2009
    [5326] => handbook
    [5328] => statistical
    [5329] => analysis
    [5330] => data
    [5331] => mining
    [5332] => applications
    [5333] => academic
    [5334] => press
    [5335] => elsevier
    [5336] => isbn
    [5337] => 978-0-12-374765-5
    [5338] => poncelet
    [5339] => pascal
    [5340] => masseglia
    [5341] => florent
    [5343] => teisseire
    [5344] => maguelonne
    [5345] => editors
    [5346] => october
    [5347] => 2007
    [5348] => data
    [5349] => mining
    [5350] => patterns
    [5352] => methods
    [5354] => applications
    [5355] => information
    [5356] => science
    [5357] => reference
    [5358] => isbn
    [5359] => 978-1-59904-162-9
    [5360] => tan
    [5361] => pang-ning
    [5362] => steinbach
    [5363] => michael
    [5365] => kumar
    [5366] => vipin
    [5367] => 2005
    [5368] => introduction
    [5370] => data
    [5371] => mining
    [5372] => isbn
    [5373] => 0-321-32136-7
    [5374] => theodoridis
    [5375] => sergios
    [5377] => koutroumbas
    [5378] => konstantinos
    [5379] => 2009
    [5380] => pattern
    [5381] => recognition
    [5382] => 4th
    [5383] => edition
    [5384] => academic
    [5385] => press
    [5386] => isbn
    [5387] => 978-1-59749-272-0
    [5388] => weiss
    [5389] => sholom
    [5390] => m
    [5392] => indurkhya
    [5393] => nitin
    [5394] => 1998
    [5395] => predictive
    [5396] => data
    [5397] => mining
    [5398] => morgan
    [5399] => kaufmann
    [5400] => witten
    [5401] => ian
    [5402] => h
    [5403] => frank
    [5404] => eibe
    [5405] => hall
    [5406] => mark
    [5408] => 30
    [5409] => january
    [5410] => 2011
    [5411] => data
    [5412] => mining
    [5413] => practical
    [5414] => machine
    [5415] => learning
    [5416] => tools
    [5418] => techniques
    [5419] => 3
    [5420] => ed
    [5421] => elsevier
    [5422] => isbn
    [5423] => 978-0-12-374856-0
    [5426] => free
    [5427] => weka
    [5428] => software
    [5429] => ye
    [5430] => nong
    [5431] => 2003
    [5433] => handbook
    [5435] => data
    [5436] => mining
    [5437] => mahwah
    [5438] => nj
    [5439] => lawrence
    [5440] => erlbaum
    [5441] => external
    [5442] => links
    [5443] => edit
    [5444] => wikimedia
    [5445] => commons
    [5447] => media
    [5448] => related
    [5450] => data
    [5451] => mining
    [5452] => knowledge
    [5453] => discovery
    [5454] => software
    [5456] => curlie
    [5457] => based
    [5459] => dmoz
    [5460] => data
    [5461] => mining
    [5462] => tool
    [5463] => vendors
    [5465] => curlie
    [5466] => based
    [5468] => dmoz
    [5469] => v
    [5470] => t
    [5471] => e
    [5472] => data
    [5473] => storage
    [5474] => analysis
    [5475] => cleansing
    [5476] => compression
    [5477] => corruption
    [5478] => curation
    [5479] => editing
    [5480] => farming
    [5481] => fusion
    [5482] => integration
    [5483] => integrity
    [5484] => loss
    [5485] => mining
    [5486] => pre-processing
    [5487] => quality
    [5488] => reduction
    [5489] => scraping
    [5490] => scrubbing
    [5491] => security
    [5492] => validation
    [5493] => warehouse
    [5494] => wrangling
    [5495] => munging
    [5496] => protection
    [5497] => privacy
    [5498] => v
    [5499] => t
    [5500] => e
    [5501] => data
    [5502] => warehouse
    [5503] => creating
    [5505] => data
    [5506] => warehouse
    [5507] => concepts
    [5508] => database
    [5509] => dimension
    [5510] => dimensional
    [5511] => modeling
    [5512] => fact
    [5513] => olap
    [5514] => star
    [5515] => schema
    [5516] => aggregate
    [5517] => variants
    [5518] => anchor
    [5519] => modeling
    [5520] => column-oriented
    [5521] => dbms
    [5522] => data
    [5523] => vault
    [5524] => modeling
    [5525] => holap
    [5526] => molap
    [5527] => rolap
    [5528] => operational
    [5529] => data
    [5530] => store
    [5531] => elements
    [5532] => data
    [5533] => dictionary
    [5534] => metadata
    [5535] => data
    [5536] => mart
    [5537] => sixth
    [5538] => normal
    [5539] => form
    [5540] => surrogate
    [5541] => key
    [5542] => fact
    [5543] => fact
    [5544] => table
    [5545] => early-arriving
    [5546] => fact
    [5547] => measure
    [5548] => dimension
    [5549] => dimension
    [5550] => table
    [5551] => degenerate
    [5552] => slowly
    [5553] => changing
    [5554] => filling
    [5555] => extract-transform-load
    [5556] => etl
    [5557] => extract
    [5558] => transform
    [5559] => load
    [5562] => data
    [5563] => warehouse
    [5564] => concepts
    [5565] => business
    [5566] => intelligence
    [5567] => dashboard
    [5568] => data
    [5569] => mining
    [5570] => decision
    [5571] => support
    [5572] => system
    [5573] => dss
    [5574] => olap
    [5575] => cube
    [5576] => data
    [5577] => warehouse
    [5578] => automation
    [5579] => languages
    [5580] => data
    [5581] => mining
    [5582] => extensions
    [5583] => dmx
    [5584] => multidimensional
    [5585] => expressions
    [5586] => mdx
    [5587] => xml
    [5589] => analysis
    [5590] => xmla
    [5591] => tools
    [5592] => business
    [5593] => intelligence
    [5594] => software
    [5595] => reporting
    [5596] => software
    [5597] => spreadsheet
    [5598] => related
    [5599] => people
    [5600] => bill
    [5601] => inmon
    [5602] => ralph
    [5603] => kimball
    [5604] => products
    [5605] => comparison
    [5607] => olap
    [5608] => servers
    [5609] => data
    [5610] => warehousing
    [5611] => products
    [5614] => producers
    [5615] => v
    [5616] => t
    [5617] => e
    [5618] => major
    [5619] => fields
    [5621] => computer
    [5622] => science
    [5623] => note
    [5625] => template
    [5626] => roughly
    [5629] => 2012
    [5630] => acm
    [5631] => computing
    [5632] => classification
    [5633] => system
    [5634] => hardware
    [5635] => printed
    [5636] => circuit
    [5637] => board
    [5638] => peripheral
    [5639] => integrated
    [5640] => circuit
    [5641] => very-large-scale
    [5642] => integration
    [5643] => energy
    [5644] => consumption
    [5645] => electronic
    [5646] => design
    [5647] => automation
    [5648] => computer
    [5649] => systems
    [5650] => organization
    [5651] => computer
    [5652] => architecture
    [5653] => embedded
    [5654] => system
    [5655] => real-time
    [5656] => computing
    [5657] => dependability
    [5658] => networks
    [5659] => network
    [5660] => architecture
    [5661] => network
    [5662] => protocol
    [5663] => network
    [5664] => components
    [5665] => network
    [5666] => scheduler
    [5667] => network
    [5668] => performance
    [5669] => evaluation
    [5670] => network
    [5671] => service
    [5672] => software
    [5673] => organization
    [5674] => interpreter
    [5675] => middleware
    [5676] => virtual
    [5677] => machine
    [5678] => operating
    [5679] => system
    [5680] => software
    [5681] => quality
    [5682] => software
    [5683] => notations
    [5685] => tools
    [5686] => programming
    [5687] => paradigm
    [5688] => programming
    [5689] => language
    [5690] => compiler
    [5691] => domain-specific
    [5692] => language
    [5693] => modeling
    [5694] => language
    [5695] => software
    [5696] => framework
    [5697] => integrated
    [5698] => development
    [5699] => environment
    [5700] => software
    [5701] => configuration
    [5702] => management
    [5703] => software
    [5704] => library
    [5705] => software
    [5706] => repository
    [5707] => software
    [5708] => development
    [5709] => software
    [5710] => development
    [5711] => process
    [5712] => requirements
    [5713] => analysis
    [5714] => software
    [5715] => design
    [5716] => software
    [5717] => construction
    [5718] => software
    [5719] => deployment
    [5720] => software
    [5721] => maintenance
    [5722] => programming
    [5723] => team
    [5724] => open-source
    [5725] => model
    [5726] => theory
    [5728] => computation
    [5729] => model
    [5731] => computation
    [5732] => formal
    [5733] => language
    [5734] => automata
    [5735] => theory
    [5736] => computational
    [5737] => complexity
    [5738] => theory
    [5739] => logic
    [5740] => semantics
    [5741] => algorithms
    [5742] => algorithm
    [5743] => design
    [5744] => analysis
    [5746] => algorithms
    [5747] => randomized
    [5748] => algorithm
    [5749] => computational
    [5750] => geometry
    [5751] => mathematics
    [5753] => computing
    [5754] => discrete
    [5755] => mathematics
    [5756] => probability
    [5757] => statistics
    [5758] => mathematical
    [5759] => software
    [5760] => information
    [5761] => theory
    [5762] => mathematical
    [5763] => analysis
    [5764] => numerical
    [5765] => analysis
    [5766] => information
    [5767] => systems
    [5768] => database
    [5769] => management
    [5770] => system
    [5771] => information
    [5772] => storage
    [5773] => systems
    [5774] => enterprise
    [5775] => information
    [5776] => system
    [5777] => social
    [5778] => information
    [5779] => systems
    [5780] => geographic
    [5781] => information
    [5782] => system
    [5783] => decision
    [5784] => support
    [5785] => system
    [5786] => process
    [5787] => control
    [5788] => system
    [5789] => multimedia
    [5790] => information
    [5791] => system
    [5792] => data
    [5793] => mining
    [5794] => digital
    [5795] => library
    [5796] => computing
    [5797] => platform
    [5798] => digital
    [5799] => marketing
    [5800] => world
    [5801] => wide
    [5802] => web
    [5803] => information
    [5804] => retrieval
    [5805] => security
    [5806] => cryptography
    [5807] => formal
    [5808] => methods
    [5809] => security
    [5810] => services
    [5811] => intrusion
    [5812] => detection
    [5813] => system
    [5814] => hardware
    [5815] => security
    [5816] => network
    [5817] => security
    [5818] => information
    [5819] => security
    [5820] => application
    [5821] => security
    [5822] => human
    [5823] => computer
    [5824] => interaction
    [5825] => interaction
    [5826] => design
    [5827] => social
    [5828] => computing
    [5829] => ubiquitous
    [5830] => computing
    [5831] => visualization
    [5832] => accessibility
    [5833] => concurrency
    [5834] => concurrent
    [5835] => computing
    [5836] => parallel
    [5837] => computing
    [5838] => distributed
    [5839] => computing
    [5840] => multithreading
    [5841] => multiprocessing
    [5842] => artificial
    [5843] => intelligence
    [5844] => natural
    [5845] => language
    [5846] => processing
    [5847] => knowledge
    [5848] => representation
    [5850] => reasoning
    [5851] => computer
    [5852] => vision
    [5853] => automated
    [5854] => planning
    [5856] => scheduling
    [5857] => search
    [5858] => methodology
    [5859] => control
    [5860] => method
    [5861] => philosophy
    [5863] => artificial
    [5864] => intelligence
    [5865] => distributed
    [5866] => artificial
    [5867] => intelligence
    [5868] => machine
    [5869] => learning
    [5870] => supervised
    [5871] => learning
    [5872] => unsupervised
    [5873] => learning
    [5874] => reinforcement
    [5875] => learning
    [5876] => multi-task
    [5877] => learning
    [5878] => cross-validation
    [5879] => graphics
    [5880] => animation
    [5881] => rendering
    [5882] => image
    [5883] => manipulation
    [5884] => graphics
    [5885] => processing
    [5886] => unit
    [5887] => mixed
    [5888] => reality
    [5889] => virtual
    [5890] => reality
    [5891] => image
    [5892] => compression
    [5893] => solid
    [5894] => modeling
    [5895] => applied
    [5896] => computing
    [5897] => e-commerce
    [5898] => enterprise
    [5899] => software
    [5900] => computational
    [5901] => mathematics
    [5902] => computational
    [5903] => physics
    [5904] => computational
    [5905] => chemistry
    [5906] => computational
    [5907] => biology
    [5908] => computational
    [5909] => social
    [5910] => science
    [5911] => computational
    [5912] => engineering
    [5913] => computational
    [5914] => healthcare
    [5915] => digital
    [5916] => art
    [5917] => electronic
    [5918] => publishing
    [5919] => cyberwarfare
    [5920] => electronic
    [5921] => voting
    [5922] => video
    [5923] => game
    [5924] => word
    [5925] => processing
    [5926] => operations
    [5927] => research
    [5928] => educational
    [5929] => technology
    [5930] => document
    [5931] => management
    [5932] => book
    [5933] => category
    [5934] => portal
    [5935] => wikiproject
    [5936] => commons
    [5937] => authority
    [5938] => control
    [5939] => gnd
    [5940] => 4428654-5
    [5941] => ndl
    [5942] => 00948240
    [5943] => retrieved
    [5945] => https
    [5947] => wikipedia
    [5948] => org
    [5949] => w
    [5950] => index
    [5951] => php
    [5952] => title
    [5953] => data
    [5954] => mining
    [5955] => oldid
    [5956] => 814776161
    [5957] => categories
    [5958] => data
    [5959] => mining
    [5960] => formal
    [5961] => sciences
    [5962] => hidden
    [5963] => categories
    [5964] => cs1
    [5965] => maint
    [5966] => multiple
    [5967] => names
    [5968] => authors
    [5969] => list
    [5970] => webarchive
    [5971] => template
    [5972] => wayback
    [5973] => links
    [5974] => articles
    [5977] => expanded
    [5979] => september
    [5980] => 2011
    [5982] => articles
    [5984] => unsourced
    [5985] => statements
    [5986] => articles
    [5988] => unsourced
    [5989] => statements
    [5991] => april
    [5992] => 2014
    [5993] => articles
    [5995] => dmoz
    [5996] => links
    [5997] => wikipedia
    [5998] => articles
    [6000] => gnd
    [6001] => identifiers
    [6002] => navigation
    [6003] => menu
    [6004] => personal
    [6005] => tools
    [6007] => logged
    [6009] => talk
    [6010] => contributions
    [6011] => create
    [6012] => account
    [6013] => log
    [6015] => namespaces
    [6016] => article
    [6017] => talk
    [6018] => variants
    [6019] => views
    [6020] => read
    [6021] => edit
    [6022] => view
    [6023] => history
    [6025] => search
    [6026] => navigation
    [6027] => main
    [6028] => page
    [6029] => contents
    [6030] => featured
    [6031] => content
    [6032] => current
    [6033] => events
    [6034] => random
    [6035] => article
    [6036] => donate
    [6038] => wikipedia
    [6039] => wikipedia
    [6040] => store
    [6041] => interaction
    [6044] => wikipedia
    [6045] => community
    [6046] => portal
    [6047] => recent
    [6049] => contact
    [6050] => page
    [6051] => tools
    [6053] => links
    [6055] => related
    [6057] => upload
    [6058] => file
    [6059] => special
    [6060] => pages
    [6061] => permanent
    [6062] => link
    [6063] => page
    [6064] => information
    [6065] => wikidata
    [6066] => item
    [6067] => cite
    [6069] => page
    [6070] => print
    [6071] => export
    [6072] => create
    [6074] => book
    [6075] => download
    [6077] => pdf
    [6078] => printable
    [6079] => version
    [6082] => projects
    [6083] => wikimedia
    [6084] => commons
    [6085] => languages
    [6086] => az
    [6087] => rbaycanca
    [6088] => catal
    [6089] => e
    [6090] => tina
    [6091] => dansk
    [6092] => deutsch
    [6093] => eesti
    [6094] => espa
    [6095] => ol
    [6096] => euskara
    [6097] => fran
    [6098] => ais
    [6099] => hrvatski
    [6100] => bahasa
    [6101] => indonesia
    [6102] => italiano
    [6103] => latvie
    [6104] => u
    [6105] => magyar
    [6106] => nederlands
    [6107] => norsk
    [6108] => polski
    [6109] => portugu
    [6110] => s
    [6111] => rom
    [6112] => n
    [6113] => shqip
    [6114] => simple
    [6115] => english
    [6116] => sloven
    [6117] => ina
    [6118] => sloven
    [6119] => ina
    [6120] => srpski
    [6121] => srpskohrvatski
    [6122] => basa
    [6123] => sunda
    [6124] => suomi
    [6125] => svenska
    [6126] => t
    [6127] => rk
    [6128] => e
    [6129] => ti
    [6130] => ng
    [6131] => vi
    [6132] => t
    [6133] => edit
    [6134] => links
    [6136] => page
    [6139] => edited
    [6141] => 10
    [6142] => december
    [6143] => 2017
    [6145] => 21
    [6146] => 46
    [6147] => text
    [6152] => creative
    [6153] => commons
    [6154] => attribution-sharealike
    [6155] => license
    [6156] => additional
    [6157] => terms
    [6159] => apply
    [6163] => site
    [6165] => agree
    [6168] => terms
    [6172] => privacy
    [6173] => policy
    [6174] => wikipedia
    [6177] => registered
    [6178] => trademark
    [6181] => wikimedia
    [6182] => foundation
    [6185] => non-profit
    [6186] => organization
    [6187] => privacy
    [6188] => policy
    [6190] => wikipedia
    [6191] => disclaimers
    [6192] => contact
    [6193] => wikipedia
    [6194] => developers
    [6195] => cookie
    [6196] => statement
    [6197] => mobile
    [6198] => view
)
======================
Text: data mining - wikipedia data mining from wikipedia the free encyclopedia...
Total Keywords: 4345
======================

Demo2.php

<?php

// Demo 2: extract keywords from a remote page and dump them all as an array.
$miner = new TextMiner();

// Register the Wikipedia article as the input source, then run the miner.
$miner->addFile("http://en.wikipedia.org/wiki/Data_mining");
$miner->process();

// Dump the complete keyword list.
$keywords = $miner->getKeywords();
printa($keywords);

// Emit the summary.
// NOTE(review): printSummary() is not visible here; if it prints directly
// instead of returning a string, this echo is redundant -- confirm.
echo $miner->printSummary();

?>