Demo 0 | Demo 1 | Demo 2 | Demo 3 | Demo 4 | Demo 5 | Code | Matt Smith

Demo 2

Array
(
    [1] => data
    [2] => mining
    [4] => wikipedia
    [5] => data
    [6] => mining
    [8] => wikipedia
    [10] => free
    [11] => encyclopedia
    [12] => jump
    [14] => navigation
    [15] => search
    [19] => confused
    [21] => analytics
    [22] => information
    [23] => extraction
    [25] => data
    [26] => analysis
    [27] => machine
    [28] => learning
    [30] => data
    [31] => mining
    [32] => problems
    [33] => classification
    [34] => clustering
    [35] => regression
    [36] => anomaly
    [37] => detection
    [38] => association
    [39] => rules
    [40] => reinforcement
    [41] => learning
    [42] => structured
    [43] => prediction
    [44] => feature
    [45] => engineering
    [46] => feature
    [47] => learning
    [48] => online
    [49] => learning
    [50] => semi-supervised
    [51] => learning
    [52] => unsupervised
    [53] => learning
    [54] => learning
    [56] => rank
    [57] => grammar
    [58] => induction
    [59] => supervised
    [60] => learning
    [61] => classification
    [62] => regression
    [63] => decision
    [64] => trees
    [65] => ensembles
    [66] => bagging
    [67] => boosting
    [68] => random
    [69] => forest
    [70] => k
    [71] => -nn
    [72] => linear
    [73] => regression
    [74] => naive
    [75] => bayes
    [76] => neural
    [77] => networks
    [78] => logistic
    [79] => regression
    [80] => perceptron
    [81] => relevance
    [82] => vector
    [83] => machine
    [84] => rvm
    [85] => support
    [86] => vector
    [87] => machine
    [88] => svm
    [89] => clustering
    [90] => birch
    [91] => hierarchical
    [92] => k
    [93] => -means
    [94] => expectation
    [95] => maximization
    [96] => em
    [97] => dbscan
    [98] => optics
    [99] => mean-shift
    [100] => dimensionality
    [101] => reduction
    [102] => factor
    [103] => analysis
    [104] => cca
    [105] => ica
    [106] => lda
    [107] => nmf
    [108] => pca
    [109] => t-sne
    [110] => structured
    [111] => prediction
    [112] => graphical
    [113] => models
    [114] => bayes
    [115] => net
    [116] => crf
    [117] => hmm
    [118] => anomaly
    [119] => detection
    [120] => k
    [121] => -nn
    [122] => local
    [123] => outlier
    [124] => factor
    [125] => neural
    [126] => nets
    [127] => autoencoder
    [128] => deep
    [129] => learning
    [130] => multilayer
    [131] => perceptron
    [132] => rnn
    [133] => restricted
    [134] => boltzmann
    [135] => machine
    [136] => som
    [137] => convolutional
    [138] => neural
    [139] => network
    [140] => reinforcement
    [141] => learning
    [142] => q-learning
    [143] => sarsa
    [144] => temporal
    [145] => difference
    [146] => td
    [147] => theory
    [148] => bias-variance
    [149] => dilemma
    [150] => computational
    [151] => learning
    [152] => theory
    [153] => empirical
    [154] => risk
    [155] => minimization
    [156] => occam
    [157] => learning
    [158] => pac
    [159] => learning
    [160] => statistical
    [161] => learning
    [162] => vc
    [163] => theory
    [164] => machine-learning
    [165] => venues
    [166] => nips
    [167] => icml
    [168] => ml
    [169] => jmlr
    [170] => arxiv
    [171] => cs
    [172] => lg
    [173] => related
    [174] => articles
    [175] => list
    [177] => datasets
    [179] => machine-learning
    [180] => research
    [181] => outline
    [183] => machine
    [184] => learning
    [185] => machine
    [186] => learning
    [187] => portal
    [188] => v
    [189] => t
    [190] => e
    [191] => data
    [192] => mining
    [195] => computing
    [196] => process
    [198] => discovering
    [199] => patterns
    [201] => large
    [202] => data
    [203] => sets
    [204] => involving
    [205] => methods
    [208] => intersection
    [210] => machine
    [211] => learning
    [212] => statistics
    [214] => database
    [215] => systems
    [216] => 1
    [218] => essential
    [219] => process
    [221] => intelligent
    [222] => methods
    [224] => applied
    [226] => extract
    [227] => data
    [228] => patterns
    [229] => 1
    [230] => 2
    [234] => interdisciplinary
    [235] => subfield
    [237] => computer
    [238] => science
    [239] => 1
    [240] => 3
    [241] => 4
    [244] => goal
    [247] => data
    [248] => mining
    [249] => process
    [252] => extract
    [253] => information
    [256] => data
    [257] => set
    [259] => transform
    [263] => understandable
    [264] => structure
    [268] => 1
    [272] => raw
    [273] => analysis
    [274] => step
    [276] => involves
    [277] => database
    [279] => data
    [280] => management
    [281] => aspects
    [282] => data
    [283] => pre-processing
    [284] => model
    [286] => inference
    [287] => considerations
    [288] => interestingness
    [289] => metrics
    [290] => complexity
    [291] => considerations
    [292] => post-processing
    [294] => discovered
    [295] => structures
    [296] => visualization
    [298] => online
    [299] => updating
    [300] => 1
    [301] => data
    [302] => mining
    [305] => analysis
    [306] => step
    [309] => knowledge
    [310] => discovery
    [312] => databases
    [313] => process
    [315] => kdd
    [316] => 5
    [318] => term
    [321] => misnomer
    [324] => goal
    [327] => extraction
    [329] => patterns
    [331] => knowledge
    [333] => large
    [334] => amounts
    [336] => data
    [339] => extraction
    [340] => mining
    [342] => data
    [344] => 6
    [349] => buzzword
    [350] => 7
    [353] => frequently
    [354] => applied
    [357] => form
    [359] => large-scale
    [360] => data
    [362] => information
    [363] => processing
    [364] => collection
    [365] => extraction
    [366] => warehousing
    [367] => analysis
    [369] => statistics
    [374] => application
    [376] => computer
    [377] => decision
    [378] => support
    [379] => system
    [380] => including
    [381] => artificial
    [382] => intelligence
    [383] => machine
    [384] => learning
    [386] => business
    [387] => intelligence
    [389] => book
    [390] => data
    [391] => mining
    [392] => practical
    [393] => machine
    [394] => learning
    [395] => tools
    [397] => techniques
    [399] => java
    [400] => 8
    [402] => covers
    [404] => machine
    [405] => learning
    [406] => material
    [408] => originally
    [411] => named
    [413] => practical
    [414] => machine
    [415] => learning
    [418] => term
    [419] => data
    [420] => mining
    [423] => added
    [425] => marketing
    [426] => reasons
    [427] => 9
    [431] => general
    [432] => terms
    [433] => large
    [434] => scale
    [435] => data
    [436] => analysis
    [438] => analytics
    [441] => referring
    [443] => actual
    [444] => methods
    [445] => artificial
    [446] => intelligence
    [448] => machine
    [449] => learning
    [454] => actual
    [455] => data
    [456] => mining
    [457] => task
    [460] => semi-automatic
    [462] => automatic
    [463] => analysis
    [465] => large
    [466] => quantities
    [468] => data
    [470] => extract
    [471] => previously
    [472] => unknown
    [473] => interesting
    [474] => patterns
    [477] => groups
    [479] => data
    [480] => records
    [481] => cluster
    [482] => analysis
    [483] => unusual
    [484] => records
    [485] => anomaly
    [486] => detection
    [488] => dependencies
    [489] => association
    [490] => rule
    [491] => mining
    [492] => sequential
    [493] => pattern
    [494] => mining
    [497] => involves
    [499] => database
    [500] => techniques
    [503] => spatial
    [504] => indices
    [506] => patterns
    [513] => kind
    [515] => summary
    [518] => input
    [519] => data
    [526] => analysis
    [531] => machine
    [532] => learning
    [534] => predictive
    [535] => analytics
    [539] => data
    [540] => mining
    [541] => step
    [543] => identify
    [544] => multiple
    [545] => groups
    [548] => data
    [555] => obtain
    [557] => accurate
    [558] => prediction
    [559] => results
    [562] => decision
    [563] => support
    [564] => system
    [567] => data
    [568] => collection
    [569] => data
    [570] => preparation
    [572] => result
    [573] => interpretation
    [575] => reporting
    [577] => part
    [580] => data
    [581] => mining
    [582] => step
    [585] => belong
    [589] => kdd
    [590] => process
    [592] => additional
    [593] => steps
    [595] => related
    [596] => terms
    [597] => data
    [598] => dredging
    [599] => data
    [600] => fishing
    [602] => data
    [603] => snooping
    [604] => refer
    [609] => data
    [610] => mining
    [611] => methods
    [613] => sample
    [614] => parts
    [617] => larger
    [618] => population
    [619] => data
    [620] => set
    [627] => small
    [629] => reliable
    [630] => statistical
    [631] => inferences
    [634] => made
    [637] => validity
    [640] => patterns
    [641] => discovered
    [643] => methods
    [649] => creating
    [651] => hypotheses
    [653] => test
    [656] => larger
    [657] => data
    [658] => populations
    [659] => contents
    [660] => 1
    [661] => etymology
    [662] => 2
    [663] => background
    [664] => 3
    [665] => process
    [666] => 3
    [667] => 1
    [668] => pre-processing
    [669] => 3
    [670] => 2
    [671] => data
    [672] => mining
    [673] => 3
    [674] => 3
    [675] => results
    [676] => validation
    [677] => 4
    [678] => research
    [679] => 5
    [680] => standards
    [681] => 6
    [682] => notable
    [684] => 7
    [685] => privacy
    [686] => concerns
    [688] => ethics
    [689] => 7
    [690] => 1
    [691] => situation
    [693] => europe
    [694] => 7
    [695] => 2
    [696] => situation
    [699] => united
    [700] => states
    [701] => 8
    [702] => copyright
    [703] => law
    [704] => 8
    [705] => 1
    [706] => situation
    [708] => europe
    [709] => 8
    [710] => 2
    [711] => situation
    [714] => united
    [715] => states
    [716] => 9
    [717] => software
    [718] => 9
    [719] => 1
    [720] => free
    [721] => open-source
    [722] => data
    [723] => mining
    [724] => software
    [726] => applications
    [727] => 9
    [728] => 2
    [729] => proprietary
    [730] => data-mining
    [731] => software
    [733] => applications
    [734] => 9
    [735] => 3
    [736] => marketplace
    [737] => surveys
    [738] => 10
    [741] => 11
    [742] => references
    [743] => 12
    [745] => reading
    [746] => 13
    [747] => external
    [748] => links
    [749] => etymology
    [750] => edit
    [753] => 1960s
    [754] => statisticians
    [756] => terms
    [758] => data
    [759] => fishing
    [761] => data
    [762] => dredging
    [764] => refer
    [768] => considered
    [770] => bad
    [771] => practice
    [773] => analyzing
    [774] => data
    [777] => a-priori
    [778] => hypothesis
    [780] => term
    [781] => data
    [782] => mining
    [783] => appeared
    [785] => 1990
    [788] => database
    [789] => community
    [792] => short
    [793] => time
    [795] => 1980s
    [797] => phrase
    [798] => database
    [799] => mining
    [806] => trademarked
    [808] => hnc
    [810] => san
    [811] => diego-based
    [812] => company
    [814] => pitch
    [816] => database
    [817] => mining
    [818] => workstation
    [819] => 10
    [820] => researchers
    [822] => turned
    [824] => data
    [825] => mining
    [827] => terms
    [829] => include
    [830] => data
    [831] => archaeology
    [832] => information
    [833] => harvesting
    [834] => information
    [835] => discovery
    [836] => knowledge
    [837] => extraction
    [839] => gregory
    [840] => piatetsky-shapiro
    [841] => coined
    [843] => term
    [844] => knowledge
    [845] => discovery
    [847] => databases
    [851] => workshop
    [855] => topic
    [856] => kdd-1989
    [859] => term
    [862] => popular
    [864] => ai
    [866] => machine
    [867] => learning
    [868] => community
    [871] => term
    [872] => data
    [873] => mining
    [876] => popular
    [879] => business
    [881] => press
    [882] => communities
    [883] => 11
    [886] => terms
    [887] => data
    [888] => mining
    [890] => knowledge
    [891] => discovery
    [894] => interchangeably
    [897] => academic
    [898] => community
    [900] => major
    [901] => forums
    [903] => research
    [904] => started
    [906] => 1995
    [910] => international
    [911] => conference
    [913] => data
    [914] => mining
    [916] => knowledge
    [917] => discovery
    [918] => kdd-95
    [920] => started
    [922] => montreal
    [924] => aaai
    [925] => sponsorship
    [928] => co-chaired
    [930] => usama
    [931] => fayyad
    [933] => ramasamy
    [934] => uthurusamy
    [936] => year
    [939] => 1996
    [940] => usama
    [941] => fayyad
    [942] => launched
    [944] => journal
    [946] => kluwer
    [947] => called
    [948] => data
    [949] => mining
    [951] => knowledge
    [952] => discovery
    [955] => founding
    [956] => editor-in-chief
    [959] => started
    [961] => sigkddd
    [962] => newsletter
    [963] => sigkdd
    [964] => explorations
    [965] => 12
    [967] => kdd
    [968] => international
    [969] => conference
    [972] => primary
    [973] => highest
    [974] => quality
    [975] => conference
    [977] => data
    [978] => mining
    [981] => acceptance
    [982] => rate
    [984] => research
    [985] => paper
    [986] => submissions
    [988] => 18
    [990] => journal
    [991] => data
    [992] => mining
    [994] => knowledge
    [995] => discovery
    [998] => primary
    [999] => research
    [1000] => journal
    [1003] => field
    [1004] => background
    [1005] => edit
    [1007] => manual
    [1008] => extraction
    [1010] => patterns
    [1012] => data
    [1014] => occurred
    [1016] => centuries
    [1017] => early
    [1018] => methods
    [1020] => identifying
    [1021] => patterns
    [1023] => data
    [1024] => include
    [1025] => bayes'
    [1026] => theorem
    [1027] => 1700s
    [1029] => regression
    [1030] => analysis
    [1031] => 1800s
    [1033] => proliferation
    [1034] => ubiquity
    [1036] => increasing
    [1037] => power
    [1039] => computer
    [1040] => technology
    [1042] => dramatically
    [1043] => increased
    [1044] => data
    [1045] => collection
    [1046] => storage
    [1048] => manipulation
    [1049] => ability
    [1051] => data
    [1052] => sets
    [1054] => grown
    [1056] => size
    [1058] => complexity
    [1059] => direct
    [1060] => hands-on
    [1061] => data
    [1062] => analysis
    [1064] => increasingly
    [1066] => augmented
    [1068] => indirect
    [1069] => automated
    [1070] => data
    [1071] => processing
    [1072] => aided
    [1075] => discoveries
    [1077] => computer
    [1078] => science
    [1081] => neural
    [1082] => networks
    [1083] => cluster
    [1084] => analysis
    [1085] => genetic
    [1086] => algorithms
    [1087] => 1950s
    [1088] => decision
    [1089] => trees
    [1091] => decision
    [1092] => rules
    [1093] => 1960s
    [1095] => support
    [1096] => vector
    [1097] => machines
    [1098] => 1990s
    [1099] => data
    [1100] => mining
    [1103] => process
    [1105] => applying
    [1107] => methods
    [1110] => intention
    [1112] => uncovering
    [1113] => hidden
    [1114] => patterns
    [1115] => 13
    [1117] => large
    [1118] => data
    [1119] => sets
    [1121] => bridges
    [1123] => gap
    [1125] => applied
    [1126] => statistics
    [1128] => artificial
    [1129] => intelligence
    [1132] => provide
    [1134] => mathematical
    [1135] => background
    [1137] => database
    [1138] => management
    [1140] => exploiting
    [1143] => data
    [1145] => stored
    [1147] => indexed
    [1149] => databases
    [1151] => execute
    [1153] => actual
    [1154] => learning
    [1156] => discovery
    [1157] => algorithms
    [1159] => efficiently
    [1160] => allowing
    [1162] => methods
    [1165] => applied
    [1168] => larger
    [1169] => data
    [1170] => sets
    [1171] => process
    [1172] => edit
    [1174] => knowledge
    [1175] => discovery
    [1177] => databases
    [1178] => kdd
    [1179] => process
    [1181] => commonly
    [1182] => defined
    [1185] => stages
    [1186] => 1
    [1187] => selection
    [1188] => 2
    [1189] => pre-processing
    [1190] => 3
    [1191] => transformation
    [1192] => 4
    [1193] => data
    [1194] => mining
    [1195] => 5
    [1196] => interpretation
    [1197] => evaluation
    [1198] => 5
    [1200] => exists
    [1204] => variations
    [1207] => theme
    [1211] => cross
    [1212] => industry
    [1213] => standard
    [1214] => process
    [1216] => data
    [1217] => mining
    [1218] => crisp-dm
    [1220] => defines
    [1222] => phases
    [1223] => 1
    [1224] => business
    [1225] => understanding
    [1226] => 2
    [1227] => data
    [1228] => understanding
    [1229] => 3
    [1230] => data
    [1231] => preparation
    [1232] => 4
    [1233] => modeling
    [1234] => 5
    [1235] => evaluation
    [1236] => 6
    [1237] => deployment
    [1240] => simplified
    [1241] => process
    [1244] => 1
    [1245] => pre-processing
    [1246] => 2
    [1247] => data
    [1248] => mining
    [1250] => 3
    [1251] => results
    [1252] => validation
    [1253] => polls
    [1254] => conducted
    [1256] => 2002
    [1257] => 2004
    [1258] => 2007
    [1260] => 2014
    [1261] => show
    [1264] => crisp-dm
    [1265] => methodology
    [1268] => leading
    [1269] => methodology
    [1272] => data
    [1273] => miners
    [1274] => 14
    [1278] => data
    [1279] => mining
    [1280] => standard
    [1281] => named
    [1284] => polls
    [1286] => semma
    [1288] => 3
    [1289] => 4
    [1290] => times
    [1293] => people
    [1294] => reported
    [1296] => crisp-dm
    [1298] => teams
    [1300] => researchers
    [1302] => published
    [1303] => reviews
    [1305] => data
    [1306] => mining
    [1307] => process
    [1308] => models
    [1309] => 15
    [1310] => 16
    [1312] => azevedo
    [1314] => santos
    [1315] => conducted
    [1317] => comparison
    [1319] => crisp-dm
    [1321] => semma
    [1323] => 2008
    [1324] => 17
    [1325] => pre-processing
    [1326] => edit
    [1328] => data
    [1329] => mining
    [1330] => algorithms
    [1335] => target
    [1336] => data
    [1337] => set
    [1340] => assembled
    [1342] => data
    [1343] => mining
    [1346] => uncover
    [1347] => patterns
    [1349] => present
    [1352] => data
    [1354] => target
    [1355] => data
    [1356] => set
    [1359] => large
    [1364] => patterns
    [1366] => remaining
    [1367] => concise
    [1371] => mined
    [1374] => acceptable
    [1375] => time
    [1376] => limit
    [1378] => common
    [1379] => source
    [1381] => data
    [1384] => data
    [1385] => mart
    [1387] => data
    [1388] => warehouse
    [1389] => pre-processing
    [1391] => essential
    [1393] => analyze
    [1395] => multivariate
    [1396] => data
    [1397] => sets
    [1399] => data
    [1400] => mining
    [1402] => target
    [1403] => set
    [1406] => cleaned
    [1407] => data
    [1408] => cleaning
    [1409] => removes
    [1411] => observations
    [1413] => noise
    [1417] => missing
    [1418] => data
    [1419] => data
    [1420] => mining
    [1421] => edit
    [1422] => data
    [1423] => mining
    [1424] => involves
    [1426] => common
    [1427] => classes
    [1429] => tasks
    [1430] => 5
    [1431] => anomaly
    [1432] => detection
    [1433] => outlier
    [1434] => change
    [1435] => deviation
    [1436] => detection
    [1438] => identification
    [1440] => unusual
    [1441] => data
    [1442] => records
    [1446] => interesting
    [1448] => data
    [1449] => errors
    [1451] => require
    [1453] => investigation
    [1454] => association
    [1455] => rule
    [1456] => learning
    [1457] => dependency
    [1458] => modelling
    [1459] => searches
    [1461] => relationships
    [1463] => variables
    [1467] => supermarket
    [1469] => gather
    [1470] => data
    [1472] => customer
    [1473] => purchasing
    [1474] => habits
    [1476] => association
    [1477] => rule
    [1478] => learning
    [1480] => supermarket
    [1482] => determine
    [1484] => products
    [1486] => frequently
    [1487] => bought
    [1492] => information
    [1494] => marketing
    [1495] => purposes
    [1499] => referred
    [1502] => market
    [1503] => basket
    [1504] => analysis
    [1505] => clustering
    [1508] => task
    [1510] => discovering
    [1511] => groups
    [1513] => structures
    [1516] => data
    [1524] => similar
    [1528] => structures
    [1531] => data
    [1532] => classification
    [1535] => task
    [1537] => generalizing
    [1539] => structure
    [1541] => apply
    [1544] => data
    [1548] => e-mail
    [1549] => program
    [1551] => attempt
    [1553] => classify
    [1555] => e-mail
    [1557] => legitimate
    [1560] => spam
    [1561] => regression
    [1562] => attempts
    [1564] => find
    [1566] => function
    [1568] => models
    [1570] => data
    [1574] => error
    [1578] => estimating
    [1580] => relationships
    [1582] => data
    [1584] => datasets
    [1585] => summarization
    [1586] => providing
    [1589] => compact
    [1590] => representation
    [1593] => data
    [1594] => set
    [1595] => including
    [1596] => visualization
    [1598] => report
    [1599] => generation
    [1600] => results
    [1601] => validation
    [1602] => edit
    [1606] => data
    [1607] => produced
    [1609] => data
    [1610] => dredging
    [1613] => bot
    [1614] => operated
    [1616] => statistician
    [1617] => tyler
    [1618] => vigen
    [1619] => apparently
    [1620] => showing
    [1622] => close
    [1623] => link
    [1627] => word
    [1628] => winning
    [1630] => spelling
    [1631] => bee
    [1632] => competition
    [1635] => number
    [1637] => people
    [1640] => united
    [1641] => states
    [1642] => killed
    [1644] => venomous
    [1645] => spiders
    [1647] => similarity
    [1649] => trends
    [1653] => coincidence
    [1654] => data
    [1655] => mining
    [1657] => unintentionally
    [1659] => misused
    [1663] => produce
    [1664] => results
    [1669] => significant
    [1675] => predict
    [1676] => future
    [1677] => behaviour
    [1681] => reproduced
    [1685] => sample
    [1687] => data
    [1689] => bear
    [1694] => results
    [1696] => investigating
    [1699] => hypotheses
    [1702] => performing
    [1703] => proper
    [1704] => statistical
    [1705] => hypothesis
    [1706] => testing
    [1708] => simple
    [1709] => version
    [1712] => problem
    [1714] => machine
    [1715] => learning
    [1719] => overfitting
    [1723] => problem
    [1725] => arise
    [1728] => phases
    [1731] => process
    [1735] => train
    [1736] => test
    [1737] => split
    [1740] => applicable
    [1747] => sufficient
    [1749] => prevent
    [1752] => happening
    [1753] => 18
    [1755] => section
    [1757] => missing
    [1758] => information
    [1760] => non-classification
    [1761] => tasks
    [1763] => data
    [1764] => mining
    [1767] => covers
    [1768] => machine
    [1769] => learning
    [1771] => expand
    [1773] => section
    [1775] => include
    [1777] => information
    [1779] => details
    [1781] => exist
    [1784] => talk
    [1785] => page
    [1786] => september
    [1787] => 2011
    [1789] => final
    [1790] => step
    [1792] => knowledge
    [1793] => discovery
    [1795] => data
    [1798] => verify
    [1801] => patterns
    [1802] => produced
    [1805] => data
    [1806] => mining
    [1807] => algorithms
    [1808] => occur
    [1811] => wider
    [1812] => data
    [1813] => set
    [1816] => patterns
    [1817] => found
    [1820] => data
    [1821] => mining
    [1822] => algorithms
    [1824] => necessarily
    [1825] => valid
    [1828] => common
    [1831] => data
    [1832] => mining
    [1833] => algorithms
    [1835] => find
    [1836] => patterns
    [1839] => training
    [1840] => set
    [1844] => present
    [1847] => general
    [1848] => data
    [1849] => set
    [1852] => called
    [1853] => overfitting
    [1855] => overcome
    [1858] => evaluation
    [1861] => test
    [1862] => set
    [1864] => data
    [1868] => data
    [1869] => mining
    [1870] => algorithm
    [1873] => trained
    [1875] => learned
    [1876] => patterns
    [1878] => applied
    [1881] => test
    [1882] => set
    [1885] => resulting
    [1886] => output
    [1888] => compared
    [1891] => desired
    [1892] => output
    [1896] => data
    [1897] => mining
    [1898] => algorithm
    [1901] => distinguish
    [1902] => spam
    [1904] => legitimate
    [1905] => emails
    [1908] => trained
    [1911] => training
    [1912] => set
    [1914] => sample
    [1915] => e-mails
    [1917] => trained
    [1919] => learned
    [1920] => patterns
    [1923] => applied
    [1926] => test
    [1927] => set
    [1929] => e-mails
    [1936] => trained
    [1938] => accuracy
    [1941] => patterns
    [1945] => measured
    [1949] => e-mails
    [1951] => correctly
    [1952] => classify
    [1954] => number
    [1956] => statistical
    [1957] => methods
    [1962] => evaluate
    [1964] => algorithm
    [1967] => roc
    [1968] => curves
    [1971] => learned
    [1972] => patterns
    [1975] => meet
    [1977] => desired
    [1978] => standards
    [1979] => subsequently
    [1984] => re-evaluate
    [1986] => change
    [1988] => pre-processing
    [1990] => data
    [1991] => mining
    [1992] => steps
    [1995] => learned
    [1996] => patterns
    [1998] => meet
    [2000] => desired
    [2001] => standards
    [2004] => final
    [2005] => step
    [2008] => interpret
    [2010] => learned
    [2011] => patterns
    [2013] => turn
    [2016] => knowledge
    [2017] => research
    [2018] => edit
    [2020] => premier
    [2021] => professional
    [2022] => body
    [2025] => field
    [2028] => association
    [2030] => computing
    [2031] => machinery
    [2032] => 's
    [2033] => acm
    [2034] => special
    [2035] => interest
    [2036] => group
    [2037] => sig
    [2039] => knowledge
    [2040] => discovery
    [2042] => data
    [2043] => mining
    [2044] => sigkdd
    [2045] => 19
    [2046] => 20
    [2048] => 1989
    [2050] => acm
    [2051] => sig
    [2053] => hosted
    [2055] => annual
    [2056] => international
    [2057] => conference
    [2059] => published
    [2061] => proceedings
    [2062] => 21
    [2065] => 1999
    [2068] => published
    [2070] => biannual
    [2071] => academic
    [2072] => journal
    [2073] => titled
    [2074] => sigkdd
    [2075] => explorations
    [2076] => 22
    [2077] => computer
    [2078] => science
    [2079] => conferences
    [2081] => data
    [2082] => mining
    [2083] => include
    [2084] => cikm
    [2085] => conference
    [2086] => acm
    [2087] => conference
    [2089] => information
    [2091] => knowledge
    [2092] => management
    [2093] => dmin
    [2094] => conference
    [2095] => international
    [2096] => conference
    [2098] => data
    [2099] => mining
    [2100] => dmkd
    [2101] => conference
    [2102] => research
    [2103] => issues
    [2105] => data
    [2106] => mining
    [2108] => knowledge
    [2109] => discovery
    [2110] => dsaa
    [2111] => conference
    [2112] => ieee
    [2113] => international
    [2114] => conference
    [2116] => data
    [2117] => science
    [2119] => advanced
    [2120] => analytics
    [2121] => ecdm
    [2122] => conference
    [2123] => european
    [2124] => conference
    [2126] => data
    [2127] => mining
    [2128] => ecml-pkdd
    [2129] => conference
    [2130] => european
    [2131] => conference
    [2133] => machine
    [2134] => learning
    [2136] => principles
    [2138] => practice
    [2140] => knowledge
    [2141] => discovery
    [2143] => databases
    [2144] => edm
    [2145] => conference
    [2146] => international
    [2147] => conference
    [2149] => educational
    [2150] => data
    [2151] => mining
    [2152] => infocom
    [2153] => conference
    [2154] => ieee
    [2155] => infocom
    [2156] => icdm
    [2157] => conference
    [2158] => ieee
    [2159] => international
    [2160] => conference
    [2162] => data
    [2163] => mining
    [2164] => kdd
    [2165] => conference
    [2166] => acm
    [2167] => sigkdd
    [2168] => conference
    [2170] => knowledge
    [2171] => discovery
    [2173] => data
    [2174] => mining
    [2175] => mldm
    [2176] => conference
    [2177] => machine
    [2178] => learning
    [2180] => data
    [2181] => mining
    [2183] => pattern
    [2184] => recognition
    [2185] => pakdd
    [2186] => conference
    [2188] => annual
    [2189] => pacific-asia
    [2190] => conference
    [2192] => knowledge
    [2193] => discovery
    [2195] => data
    [2196] => mining
    [2197] => paw
    [2198] => conference
    [2199] => predictive
    [2200] => analytics
    [2201] => world
    [2202] => sdm
    [2203] => conference
    [2204] => siam
    [2205] => international
    [2206] => conference
    [2208] => data
    [2209] => mining
    [2210] => siam
    [2211] => sstd
    [2212] => symposium
    [2213] => symposium
    [2215] => spatial
    [2217] => temporal
    [2218] => databases
    [2219] => wsdm
    [2220] => conference
    [2221] => acm
    [2222] => conference
    [2224] => web
    [2225] => search
    [2227] => data
    [2228] => mining
    [2229] => data
    [2230] => mining
    [2231] => topics
    [2234] => present
    [2237] => data
    [2238] => management
    [2239] => database
    [2240] => conferences
    [2244] => icde
    [2245] => conference
    [2246] => sigmod
    [2247] => conference
    [2249] => international
    [2250] => conference
    [2253] => large
    [2254] => data
    [2255] => bases
    [2256] => standards
    [2257] => edit
    [2262] => efforts
    [2264] => define
    [2265] => standards
    [2268] => data
    [2269] => mining
    [2270] => process
    [2274] => 1999
    [2275] => european
    [2276] => cross
    [2277] => industry
    [2278] => standard
    [2279] => process
    [2281] => data
    [2282] => mining
    [2283] => crisp-dm
    [2284] => 1
    [2285] => 0
    [2288] => 2004
    [2289] => java
    [2290] => data
    [2291] => mining
    [2292] => standard
    [2293] => jdm
    [2294] => 1
    [2295] => 0
    [2296] => development
    [2298] => successors
    [2301] => processes
    [2302] => crisp-dm
    [2303] => 2
    [2304] => 0
    [2306] => jdm
    [2307] => 2
    [2308] => 0
    [2310] => active
    [2312] => 2006
    [2315] => stalled
    [2317] => jdm
    [2318] => 2
    [2319] => 0
    [2321] => withdrawn
    [2323] => reaching
    [2325] => final
    [2326] => draft
    [2328] => exchanging
    [2330] => extracted
    [2331] => models
    [2337] => predictive
    [2338] => analytics
    [2340] => key
    [2341] => standard
    [2344] => predictive
    [2345] => model
    [2346] => markup
    [2347] => language
    [2348] => pmml
    [2352] => xml
    [2353] => -based
    [2354] => language
    [2355] => developed
    [2358] => data
    [2359] => mining
    [2360] => group
    [2361] => dmg
    [2363] => supported
    [2365] => exchange
    [2366] => format
    [2369] => data
    [2370] => mining
    [2371] => applications
    [2375] => suggests
    [2378] => covers
    [2379] => prediction
    [2380] => models
    [2383] => data
    [2384] => mining
    [2385] => task
    [2387] => high
    [2388] => importance
    [2390] => business
    [2391] => applications
    [2393] => extensions
    [2395] => cover
    [2398] => subspace
    [2399] => clustering
    [2402] => proposed
    [2403] => independently
    [2406] => dmg
    [2407] => 23
    [2408] => notable
    [2410] => edit
    [2411] => main
    [2412] => article
    [2413] => examples
    [2415] => data
    [2416] => mining
    [2419] => category
    [2420] => applied
    [2421] => data
    [2422] => mining
    [2423] => data
    [2424] => mining
    [2430] => digital
    [2431] => data
    [2433] => today
    [2434] => notable
    [2435] => examples
    [2437] => data
    [2438] => mining
    [2441] => found
    [2443] => business
    [2444] => medicine
    [2445] => science
    [2447] => surveillance
    [2448] => privacy
    [2449] => concerns
    [2451] => ethics
    [2452] => edit
    [2455] => term
    [2456] => data
    [2457] => mining
    [2462] => ethical
    [2463] => implications
    [2470] => mining
    [2472] => information
    [2474] => relation
    [2476] => peoples'
    [2477] => behavior
    [2478] => ethical
    [2481] => 24
    [2483] => ways
    [2486] => data
    [2487] => mining
    [2494] => cases
    [2496] => contexts
    [2497] => raise
    [2498] => questions
    [2500] => privacy
    [2501] => legality
    [2503] => ethics
    [2504] => 25
    [2507] => data
    [2508] => mining
    [2509] => government
    [2511] => commercial
    [2512] => data
    [2513] => sets
    [2515] => national
    [2516] => security
    [2518] => law
    [2519] => enforcement
    [2520] => purposes
    [2525] => total
    [2526] => information
    [2527] => awareness
    [2528] => program
    [2531] => advise
    [2533] => raised
    [2534] => privacy
    [2535] => concerns
    [2536] => 26
    [2537] => 27
    [2538] => data
    [2539] => mining
    [2540] => requires
    [2541] => data
    [2542] => preparation
    [2545] => uncover
    [2546] => information
    [2548] => patterns
    [2551] => compromise
    [2552] => confidentiality
    [2554] => privacy
    [2555] => obligations
    [2557] => common
    [2562] => occur
    [2565] => data
    [2566] => aggregation
    [2567] => data
    [2568] => aggregation
    [2569] => involves
    [2570] => combining
    [2571] => data
    [2573] => possibly
    [2576] => sources
    [2581] => facilitates
    [2582] => analysis
    [2587] => make
    [2588] => identification
    [2590] => private
    [2591] => individual-level
    [2592] => data
    [2593] => deducible
    [2596] => apparent
    [2597] => 28
    [2601] => data
    [2602] => mining
    [2604] => se
    [2607] => result
    [2610] => preparation
    [2612] => data
    [2617] => purposes
    [2620] => analysis
    [2622] => threat
    [2625] => individual's
    [2626] => privacy
    [2629] => play
    [2632] => data
    [2634] => compiled
    [2637] => data
    [2638] => miner
    [2643] => access
    [2646] => newly
    [2647] => compiled
    [2648] => data
    [2649] => set
    [2654] => identify
    [2655] => specific
    [2656] => individuals
    [2660] => data
    [2662] => originally
    [2663] => anonymous
    [2664] => 29
    [2665] => 30
    [2666] => 31
    [2669] => recommended
    [2672] => individual
    [2674] => made
    [2675] => aware
    [2680] => data
    [2682] => collected
    [2683] => 28
    [2685] => purpose
    [2688] => data
    [2689] => collection
    [2693] => data
    [2694] => mining
    [2695] => projects
    [2698] => data
    [2707] => mine
    [2709] => data
    [2713] => data
    [2716] => derivatives
    [2718] => status
    [2720] => security
    [2721] => surrounding
    [2722] => access
    [2725] => data
    [2727] => collected
    [2728] => data
    [2731] => updated
    [2732] => data
    [2736] => modified
    [2741] => anonymous
    [2744] => individuals
    [2747] => readily
    [2749] => identified
    [2750] => 28
    [2753] => de-identified
    [2754] => anonymized
    [2755] => data
    [2756] => sets
    [2758] => potentially
    [2761] => information
    [2764] => identification
    [2766] => individuals
    [2768] => occurred
    [2770] => journalists
    [2774] => find
    [2776] => individuals
    [2777] => based
    [2780] => set
    [2782] => search
    [2783] => histories
    [2786] => inadvertently
    [2787] => released
    [2789] => aol
    [2790] => 32
    [2792] => inadvertent
    [2793] => revelation
    [2795] => personally
    [2796] => identifiable
    [2797] => information
    [2798] => leading
    [2801] => provider
    [2802] => violates
    [2803] => fair
    [2804] => information
    [2805] => practices
    [2807] => indiscretion
    [2810] => financial
    [2811] => emotional
    [2813] => bodily
    [2814] => harm
    [2818] => individual
    [2821] => instance
    [2823] => privacy
    [2824] => violation
    [2826] => patrons
    [2828] => walgreens
    [2829] => filed
    [2831] => lawsuit
    [2834] => company
    [2836] => 2011
    [2838] => selling
    [2839] => prescription
    [2840] => information
    [2842] => data
    [2843] => mining
    [2844] => companies
    [2847] => turn
    [2848] => provided
    [2850] => data
    [2852] => pharmaceutical
    [2853] => companies
    [2854] => 33
    [2855] => situation
    [2857] => europe
    [2858] => edit
    [2859] => europe
    [2862] => strong
    [2863] => privacy
    [2864] => laws
    [2866] => efforts
    [2868] => underway
    [2871] => strengthen
    [2873] => rights
    [2876] => consumers
    [2879] => u
    [2880] => s
    [2881] => -e
    [2882] => u
    [2883] => safe
    [2884] => harbor
    [2885] => principles
    [2887] => effectively
    [2888] => expose
    [2889] => european
    [2890] => users
    [2892] => privacy
    [2893] => exploitation
    [2895] => u
    [2896] => s
    [2897] => companies
    [2900] => consequence
    [2902] => edward
    [2903] => snowden
    [2904] => 's
    [2905] => global
    [2906] => surveillance
    [2907] => disclosure
    [2911] => increased
    [2912] => discussion
    [2914] => revoke
    [2916] => agreement
    [2921] => data
    [2924] => fully
    [2925] => exposed
    [2928] => national
    [2929] => security
    [2930] => agency
    [2932] => attempts
    [2934] => reach
    [2936] => agreement
    [2938] => failed
    [2939] => citation
    [2940] => needed
    [2941] => situation
    [2944] => united
    [2945] => states
    [2946] => edit
    [2949] => united
    [2950] => states
    [2951] => privacy
    [2952] => concerns
    [2955] => addressed
    [2959] => congress
    [2962] => passage
    [2964] => regulatory
    [2965] => controls
    [2969] => health
    [2970] => insurance
    [2971] => portability
    [2973] => accountability
    [2974] => act
    [2975] => hipaa
    [2977] => hipaa
    [2978] => requires
    [2979] => individuals
    [2981] => give
    [2983] => informed
    [2984] => consent
    [2986] => information
    [2988] => provide
    [2991] => intended
    [2992] => present
    [2994] => future
    [2999] => article
    [3001] => biotech
    [3002] => business
    [3003] => week
    [3004] => '
    [3006] => n
    [3007] => practice
    [3008] => hipaa
    [3011] => offer
    [3013] => greater
    [3014] => protection
    [3017] => longstanding
    [3018] => regulations
    [3021] => research
    [3022] => arena
    [3023] => '
    [3026] => aahc
    [3028] => importantly
    [3030] => rule's
    [3031] => goal
    [3033] => protection
    [3035] => informed
    [3036] => consent
    [3038] => undermined
    [3041] => complexity
    [3043] => consent
    [3044] => forms
    [3047] => required
    [3049] => patients
    [3051] => participants
    [3053] => approach
    [3055] => level
    [3057] => incomprehensibility
    [3059] => average
    [3060] => individuals
    [3061] => 34
    [3063] => underscores
    [3065] => necessity
    [3067] => data
    [3068] => anonymity
    [3070] => data
    [3071] => aggregation
    [3073] => mining
    [3074] => practices
    [3075] => u
    [3076] => s
    [3077] => information
    [3078] => privacy
    [3079] => legislation
    [3082] => hipaa
    [3085] => family
    [3086] => educational
    [3087] => rights
    [3089] => privacy
    [3090] => act
    [3091] => ferpa
    [3092] => applies
    [3096] => specific
    [3097] => areas
    [3101] => law
    [3102] => addresses
    [3105] => data
    [3106] => mining
    [3109] => majority
    [3111] => businesses
    [3114] => u
    [3115] => s
    [3118] => controlled
    [3121] => legislation
    [3122] => copyright
    [3123] => law
    [3124] => edit
    [3125] => situation
    [3127] => europe
    [3128] => edit
    [3129] => due
    [3132] => lack
    [3134] => flexibilities
    [3136] => european
    [3137] => copyright
    [3139] => database
    [3140] => law
    [3142] => mining
    [3144] => in-copyright
    [3145] => works
    [3148] => web
    [3149] => mining
    [3152] => permission
    [3155] => copyright
    [3156] => owner
    [3159] => legal
    [3162] => database
    [3164] => pure
    [3165] => data
    [3167] => europe
    [3174] => copyright
    [3176] => database
    [3177] => rights
    [3179] => exist
    [3181] => data
    [3182] => mining
    [3184] => subject
    [3186] => regulations
    [3189] => database
    [3190] => directive
    [3193] => recommendation
    [3196] => hargreaves
    [3197] => review
    [3199] => led
    [3202] => uk
    [3203] => government
    [3205] => amend
    [3207] => copyright
    [3208] => law
    [3210] => 2014
    [3211] => 35
    [3214] => content
    [3215] => mining
    [3218] => limitation
    [3220] => exception
    [3224] => country
    [3227] => world
    [3232] => japan
    [3234] => introduced
    [3236] => exception
    [3238] => 2009
    [3240] => data
    [3241] => mining
    [3243] => due
    [3246] => restriction
    [3249] => copyright
    [3250] => directive
    [3252] => uk
    [3253] => exception
    [3256] => content
    [3257] => mining
    [3259] => non-commercial
    [3260] => purposes
    [3261] => uk
    [3262] => copyright
    [3263] => law
    [3269] => provision
    [3272] => overridden
    [3274] => contractual
    [3275] => terms
    [3277] => conditions
    [3279] => european
    [3280] => commission
    [3281] => facilitated
    [3282] => stakeholder
    [3283] => discussion
    [3285] => text
    [3287] => data
    [3288] => mining
    [3290] => 2013
    [3293] => title
    [3295] => licences
    [3297] => europe
    [3298] => 36
    [3300] => focus
    [3303] => solution
    [3306] => legal
    [3307] => issue
    [3309] => licences
    [3312] => limitations
    [3314] => exceptions
    [3315] => led
    [3317] => representatives
    [3319] => universities
    [3320] => researchers
    [3321] => libraries
    [3322] => civil
    [3323] => society
    [3324] => groups
    [3326] => open
    [3327] => access
    [3328] => publishers
    [3330] => leave
    [3332] => stakeholder
    [3333] => dialogue
    [3336] => 2013
    [3337] => 37
    [3338] => situation
    [3341] => united
    [3342] => states
    [3343] => edit
    [3345] => contrast
    [3347] => europe
    [3349] => flexible
    [3350] => nature
    [3353] => copyright
    [3354] => law
    [3358] => fair
    [3360] => means
    [3362] => content
    [3363] => mining
    [3365] => america
    [3370] => fair
    [3372] => countries
    [3375] => israel
    [3376] => taiwan
    [3378] => south
    [3379] => korea
    [3381] => viewed
    [3384] => legal
    [3386] => content
    [3387] => mining
    [3389] => transformative
    [3395] => supplant
    [3397] => original
    [3398] => work
    [3401] => viewed
    [3404] => lawful
    [3406] => fair
    [3411] => part
    [3414] => google
    [3415] => book
    [3416] => settlement
    [3418] => presiding
    [3419] => judge
    [3422] => case
    [3423] => ruled
    [3425] => google's
    [3426] => digitisation
    [3427] => project
    [3429] => in-copyright
    [3430] => books
    [3432] => lawful
    [3434] => part
    [3438] => transformative
    [3442] => digitisation
    [3443] => project
    [3444] => displayed
    [3448] => text
    [3450] => data
    [3451] => mining
    [3452] => 38
    [3453] => software
    [3454] => edit
    [3457] => category
    [3458] => data
    [3459] => mining
    [3461] => machine
    [3462] => learning
    [3463] => software
    [3464] => free
    [3465] => open-source
    [3466] => data
    [3467] => mining
    [3468] => software
    [3470] => applications
    [3471] => edit
    [3474] => applications
    [3478] => free
    [3479] => open
    [3480] => source
    [3481] => licenses
    [3482] => public
    [3483] => access
    [3485] => application
    [3486] => source
    [3487] => code
    [3491] => carrot2
    [3492] => text
    [3494] => search
    [3495] => results
    [3496] => clustering
    [3497] => framework
    [3498] => chemicalize
    [3499] => org
    [3501] => chemical
    [3502] => structure
    [3503] => miner
    [3505] => web
    [3506] => search
    [3507] => engine
    [3508] => elki
    [3510] => university
    [3511] => research
    [3512] => project
    [3514] => advanced
    [3515] => cluster
    [3516] => analysis
    [3518] => outlier
    [3519] => detection
    [3520] => methods
    [3521] => written
    [3524] => java
    [3525] => language
    [3526] => gate
    [3528] => natural
    [3529] => language
    [3530] => processing
    [3532] => language
    [3533] => engineering
    [3534] => tool
    [3535] => knime
    [3537] => konstanz
    [3538] => information
    [3539] => miner
    [3541] => user
    [3542] => friendly
    [3544] => comprehensive
    [3545] => data
    [3546] => analytics
    [3547] => framework
    [3548] => massive
    [3549] => online
    [3550] => analysis
    [3551] => moa
    [3553] => real-time
    [3554] => big
    [3555] => data
    [3556] => stream
    [3557] => mining
    [3559] => concept
    [3560] => drift
    [3561] => tool
    [3564] => java
    [3565] => programming
    [3566] => language
    [3567] => mepx
    [3569] => cross
    [3570] => platform
    [3571] => tool
    [3573] => regression
    [3575] => classification
    [3576] => problems
    [3577] => based
    [3580] => genetic
    [3581] => programming
    [3582] => variant
    [3583] => ml-flex
    [3585] => software
    [3586] => package
    [3588] => enables
    [3589] => users
    [3591] => integrate
    [3593] => third-party
    [3594] => machine-learning
    [3595] => packages
    [3596] => written
    [3599] => programming
    [3600] => language
    [3601] => execute
    [3602] => classification
    [3603] => analyses
    [3605] => parallel
    [3607] => multiple
    [3608] => computing
    [3609] => nodes
    [3611] => produce
    [3612] => html
    [3613] => reports
    [3615] => classification
    [3616] => results
    [3617] => mlpack
    [3618] => library
    [3620] => collection
    [3622] => ready-to-use
    [3623] => machine
    [3624] => learning
    [3625] => algorithms
    [3626] => written
    [3629] => c
    [3630] => language
    [3631] => nltk
    [3632] => natural
    [3633] => language
    [3634] => toolkit
    [3636] => suite
    [3638] => libraries
    [3640] => programs
    [3642] => symbolic
    [3644] => statistical
    [3645] => natural
    [3646] => language
    [3647] => processing
    [3648] => nlp
    [3651] => python
    [3652] => language
    [3653] => opennn
    [3654] => open
    [3655] => neural
    [3656] => networks
    [3657] => library
    [3658] => orange
    [3660] => component-based
    [3661] => data
    [3662] => mining
    [3664] => machine
    [3665] => learning
    [3666] => software
    [3667] => suite
    [3668] => written
    [3671] => python
    [3672] => language
    [3673] => r
    [3675] => programming
    [3676] => language
    [3678] => software
    [3679] => environment
    [3681] => statistical
    [3682] => computing
    [3683] => data
    [3684] => mining
    [3686] => graphics
    [3689] => part
    [3692] => gnu
    [3693] => project
    [3694] => scikit-learn
    [3697] => open
    [3698] => source
    [3699] => machine
    [3700] => learning
    [3701] => library
    [3704] => python
    [3705] => programming
    [3706] => language
    [3707] => torch
    [3709] => open
    [3710] => source
    [3711] => deep
    [3712] => learning
    [3713] => library
    [3716] => lua
    [3717] => programming
    [3718] => language
    [3720] => scientific
    [3721] => computing
    [3722] => framework
    [3724] => wide
    [3725] => support
    [3727] => machine
    [3728] => learning
    [3729] => algorithms
    [3730] => uima
    [3732] => uima
    [3733] => unstructured
    [3734] => information
    [3735] => management
    [3736] => architecture
    [3739] => component
    [3740] => framework
    [3742] => analyzing
    [3743] => unstructured
    [3744] => content
    [3747] => text
    [3748] => audio
    [3750] => video
    [3751] => originally
    [3752] => developed
    [3754] => ibm
    [3755] => weka
    [3757] => suite
    [3759] => machine
    [3760] => learning
    [3761] => software
    [3762] => applications
    [3763] => written
    [3766] => java
    [3767] => programming
    [3768] => language
    [3769] => proprietary
    [3770] => data-mining
    [3771] => software
    [3773] => applications
    [3774] => edit
    [3777] => applications
    [3781] => proprietary
    [3782] => licenses
    [3783] => angoss
    [3784] => knowledgestudio
    [3785] => data
    [3786] => mining
    [3787] => tool
    [3788] => clarabridge
    [3789] => text
    [3790] => analytics
    [3791] => product
    [3792] => kxen
    [3793] => modeler
    [3794] => data
    [3795] => mining
    [3796] => tool
    [3797] => provided
    [3799] => kxen
    [3801] => lionsolver
    [3803] => integrated
    [3804] => software
    [3805] => application
    [3807] => data
    [3808] => mining
    [3809] => business
    [3810] => intelligence
    [3812] => modeling
    [3814] => implements
    [3816] => learning
    [3818] => intelligent
    [3819] => optimization
    [3820] => lion
    [3821] => approach
    [3822] => megaputer
    [3823] => intelligence
    [3824] => data
    [3826] => text
    [3827] => mining
    [3828] => software
    [3830] => called
    [3831] => polyanalyst
    [3832] => microsoft
    [3833] => analysis
    [3834] => services
    [3835] => data
    [3836] => mining
    [3837] => software
    [3838] => provided
    [3840] => microsoft
    [3841] => netowl
    [3842] => suite
    [3844] => multilingual
    [3845] => text
    [3847] => entity
    [3848] => analytics
    [3849] => products
    [3851] => enable
    [3852] => data
    [3853] => mining
    [3854] => opentext
    [3855] => big
    [3856] => data
    [3857] => analytics
    [3858] => visual
    [3859] => data
    [3860] => mining
    [3861] => predictive
    [3862] => analysis
    [3864] => open
    [3865] => text
    [3866] => corporation
    [3867] => oracle
    [3868] => data
    [3869] => mining
    [3870] => data
    [3871] => mining
    [3872] => software
    [3874] => oracle
    [3875] => corporation
    [3876] => pseven
    [3877] => platform
    [3879] => automation
    [3881] => engineering
    [3882] => simulation
    [3884] => analysis
    [3885] => multidisciplinary
    [3886] => optimization
    [3888] => data
    [3889] => mining
    [3890] => provided
    [3892] => datadvance
    [3893] => qlucore
    [3894] => omics
    [3895] => explorer
    [3896] => data
    [3897] => mining
    [3898] => software
    [3899] => rapidminer
    [3901] => environment
    [3903] => machine
    [3904] => learning
    [3906] => data
    [3907] => mining
    [3908] => experiments
    [3909] => sas
    [3910] => enterprise
    [3911] => miner
    [3912] => data
    [3913] => mining
    [3914] => software
    [3915] => provided
    [3918] => sas
    [3919] => institute
    [3920] => spss
    [3921] => modeler
    [3922] => data
    [3923] => mining
    [3924] => software
    [3925] => provided
    [3927] => ibm
    [3928] => statistica
    [3929] => data
    [3930] => miner
    [3931] => data
    [3932] => mining
    [3933] => software
    [3934] => provided
    [3936] => statsoft
    [3937] => tanagra
    [3938] => visualisation-oriented
    [3939] => data
    [3940] => mining
    [3941] => software
    [3944] => teaching
    [3945] => vertica
    [3946] => data
    [3947] => mining
    [3948] => software
    [3949] => provided
    [3951] => hewlett-packard
    [3952] => marketplace
    [3953] => surveys
    [3954] => edit
    [3956] => researchers
    [3958] => organizations
    [3960] => conducted
    [3961] => reviews
    [3963] => data
    [3964] => mining
    [3965] => tools
    [3967] => surveys
    [3969] => data
    [3970] => miners
    [3972] => identify
    [3976] => strengths
    [3978] => weaknesses
    [3981] => software
    [3982] => packages
    [3985] => provide
    [3987] => overview
    [3990] => behaviors
    [3991] => preferences
    [3993] => views
    [3995] => data
    [3996] => miners
    [4000] => reports
    [4001] => include
    [4002] => hurwitz
    [4003] => victory
    [4004] => index
    [4005] => report
    [4007] => advanced
    [4008] => analytics
    [4011] => market
    [4012] => research
    [4013] => assessment
    [4014] => tool
    [4016] => highlights
    [4019] => diverse
    [4022] => advanced
    [4023] => analytics
    [4024] => technology
    [4027] => vendors
    [4029] => make
    [4031] => applications
    [4033] => recent-research
    [4034] => rexer
    [4035] => analytics
    [4036] => data
    [4037] => miner
    [4038] => surveys
    [4039] => 2007
    [4040] => 2015
    [4041] => 39
    [4042] => 2011
    [4043] => wiley
    [4044] => interdisciplinary
    [4045] => reviews
    [4046] => data
    [4047] => mining
    [4049] => knowledge
    [4050] => discovery
    [4051] => 40
    [4052] => forrester
    [4053] => research
    [4054] => 2010
    [4055] => predictive
    [4056] => analytics
    [4058] => data
    [4059] => mining
    [4060] => solutions
    [4061] => report
    [4062] => 41
    [4063] => gartner
    [4064] => 2008
    [4065] => magic
    [4066] => quadrant
    [4067] => report
    [4068] => 42
    [4069] => robert
    [4071] => nisbet's
    [4072] => 2006
    [4074] => part
    [4075] => series
    [4077] => articles
    [4078] => data
    [4079] => mining
    [4080] => tools
    [4086] => crm
    [4087] => 43
    [4088] => haughton
    [4090] => al
    [4091] => 's
    [4092] => 2003
    [4093] => review
    [4095] => data
    [4096] => mining
    [4097] => software
    [4098] => packages
    [4101] => american
    [4102] => statistician
    [4103] => 44
    [4104] => goebel
    [4105] => gruenwald
    [4106] => 1999
    [4108] => survey
    [4110] => data
    [4111] => mining
    [4113] => knowledge
    [4114] => discovery
    [4115] => software
    [4116] => tools
    [4118] => sigkdd
    [4119] => explorations
    [4120] => 45
    [4123] => edit
    [4124] => methods
    [4125] => agent
    [4126] => mining
    [4127] => anomaly
    [4128] => outlier
    [4129] => change
    [4130] => detection
    [4131] => association
    [4132] => rule
    [4133] => learning
    [4134] => bayesian
    [4135] => networks
    [4136] => classification
    [4137] => cluster
    [4138] => analysis
    [4139] => decision
    [4140] => trees
    [4141] => ensemble
    [4142] => learning
    [4143] => factor
    [4144] => analysis
    [4145] => genetic
    [4146] => algorithms
    [4147] => intention
    [4148] => mining
    [4149] => learning
    [4150] => classifier
    [4151] => system
    [4152] => multilinear
    [4153] => subspace
    [4154] => learning
    [4155] => neural
    [4156] => networks
    [4157] => regression
    [4158] => analysis
    [4159] => sequence
    [4160] => mining
    [4161] => structured
    [4162] => data
    [4163] => analysis
    [4164] => support
    [4165] => vector
    [4166] => machines
    [4167] => text
    [4168] => mining
    [4169] => time
    [4170] => series
    [4171] => analysis
    [4172] => application
    [4173] => domains
    [4174] => analytics
    [4175] => behavior
    [4176] => informatics
    [4177] => big
    [4178] => data
    [4179] => bioinformatics
    [4180] => business
    [4181] => intelligence
    [4182] => data
    [4183] => analysis
    [4184] => data
    [4185] => warehouse
    [4186] => decision
    [4187] => support
    [4188] => system
    [4189] => domain
    [4190] => driven
    [4191] => data
    [4192] => mining
    [4193] => drug
    [4194] => discovery
    [4195] => exploratory
    [4196] => data
    [4197] => analysis
    [4198] => predictive
    [4199] => analytics
    [4200] => web
    [4201] => mining
    [4202] => application
    [4203] => examples
    [4204] => main
    [4205] => article
    [4206] => examples
    [4208] => data
    [4209] => mining
    [4212] => category
    [4213] => applied
    [4214] => data
    [4215] => mining
    [4216] => automatic
    [4217] => number
    [4218] => plate
    [4219] => recognition
    [4222] => united
    [4223] => kingdom
    [4224] => customer
    [4225] => analytics
    [4226] => educational
    [4227] => data
    [4228] => mining
    [4229] => national
    [4230] => security
    [4231] => agency
    [4232] => quantitative
    [4233] => structure
    [4234] => activity
    [4235] => relationship
    [4236] => surveillance
    [4237] => mass
    [4238] => surveillance
    [4239] => e
    [4240] => g
    [4241] => stellar
    [4242] => wind
    [4243] => related
    [4244] => topics
    [4245] => data
    [4246] => mining
    [4249] => analyzing
    [4250] => data
    [4252] => information
    [4254] => extracting
    [4255] => information
    [4258] => data
    [4260] => data
    [4261] => integration
    [4262] => data
    [4263] => transformation
    [4264] => electronic
    [4265] => discovery
    [4266] => information
    [4267] => extraction
    [4268] => information
    [4269] => integration
    [4270] => named-entity
    [4271] => recognition
    [4272] => profiling
    [4273] => information
    [4274] => science
    [4275] => psychometrics
    [4276] => social
    [4277] => media
    [4278] => mining
    [4279] => surveillance
    [4280] => capitalism
    [4281] => web
    [4282] => scraping
    [4284] => resources
    [4285] => international
    [4286] => journal
    [4288] => data
    [4289] => warehousing
    [4291] => mining
    [4292] => references
    [4293] => edit
    [4295] => b
    [4296] => c
    [4297] => d
    [4298] => e
    [4299] => data
    [4300] => mining
    [4301] => curriculum
    [4302] => acm
    [4303] => sigkdd
    [4304] => 2006-04-30
    [4305] => retrieved
    [4306] => 2014-01-27
    [4307] => han
    [4308] => kamber
    [4309] => pei
    [4310] => jaiwei
    [4311] => micheline
    [4312] => jian
    [4313] => june
    [4314] => 9
    [4315] => 2011
    [4316] => data
    [4317] => mining
    [4318] => concepts
    [4320] => techniques
    [4321] => 3rd
    [4322] => ed
    [4323] => morgan
    [4324] => kaufmann
    [4325] => isbn
    [4326] => 978-0-12-381479-1
    [4327] => cs1
    [4328] => maint
    [4329] => multiple
    [4330] => names
    [4331] => authors
    [4332] => list
    [4333] => link
    [4334] => clifton
    [4335] => christopher
    [4336] => 2010
    [4337] => encyclop
    [4338] => dia
    [4339] => britannica
    [4340] => definition
    [4342] => data
    [4343] => mining
    [4344] => retrieved
    [4345] => 2010-12-09
    [4346] => hastie
    [4347] => trevor
    [4348] => tibshirani
    [4349] => robert
    [4350] => friedman
    [4351] => jerome
    [4352] => 2009
    [4354] => elements
    [4356] => statistical
    [4357] => learning
    [4358] => data
    [4359] => mining
    [4360] => inference
    [4362] => prediction
    [4363] => retrieved
    [4364] => 2012-08-07
    [4366] => b
    [4367] => c
    [4368] => fayyad
    [4369] => usama
    [4370] => piatetsky-shapiro
    [4371] => gregory
    [4372] => smyth
    [4373] => padhraic
    [4374] => 1996
    [4376] => data
    [4377] => mining
    [4379] => knowledge
    [4380] => discovery
    [4382] => databases
    [4383] => pdf
    [4384] => retrieved
    [4385] => 17
    [4386] => december
    [4387] => 2008
    [4388] => han
    [4389] => jiawei
    [4390] => kamber
    [4391] => micheline
    [4392] => 2001
    [4393] => data
    [4394] => mining
    [4395] => concepts
    [4397] => techniques
    [4398] => morgan
    [4399] => kaufmann
    [4400] => p
    [4401] => 5
    [4402] => isbn
    [4403] => 978-1-55860-489-6
    [4405] => data
    [4406] => mining
    [4411] => appropriately
    [4412] => named
    [4413] => knowledge
    [4414] => mining
    [4416] => data
    [4421] => long
    [4423] => e
    [4424] => g
    [4425] => okairp
    [4426] => 2005
    [4427] => fall
    [4428] => conference
    [4429] => arizona
    [4430] => state
    [4431] => university
    [4434] => datamining
    [4435] => witten
    [4436] => ian
    [4437] => h
    [4438] => frank
    [4439] => eibe
    [4440] => hall
    [4441] => mark
    [4443] => 30
    [4444] => january
    [4445] => 2011
    [4446] => data
    [4447] => mining
    [4448] => practical
    [4449] => machine
    [4450] => learning
    [4451] => tools
    [4453] => techniques
    [4454] => 3
    [4455] => ed
    [4456] => elsevier
    [4457] => isbn
    [4458] => 978-0-12-374856-0
    [4459] => bouckaert
    [4460] => remco
    [4461] => r
    [4462] => frank
    [4463] => eibe
    [4464] => hall
    [4465] => mark
    [4467] => holmes
    [4468] => geoffrey
    [4469] => pfahringer
    [4470] => bernhard
    [4471] => reutemann
    [4472] => peter
    [4473] => witten
    [4474] => ian
    [4475] => h
    [4476] => 2010
    [4477] => weka
    [4478] => experiences
    [4481] => java
    [4482] => open-source
    [4483] => project
    [4484] => journal
    [4486] => machine
    [4487] => learning
    [4488] => research
    [4489] => 11
    [4490] => 2533
    [4491] => 2541
    [4493] => original
    [4494] => title
    [4495] => practical
    [4496] => machine
    [4497] => learning
    [4499] => changed
    [4501] => term
    [4502] => data
    [4503] => mining
    [4505] => added
    [4506] => primarily
    [4508] => marketing
    [4509] => reasons
    [4510] => mena
    [4511] => jes
    [4512] => s
    [4513] => 2011
    [4514] => machine
    [4515] => learning
    [4516] => forensics
    [4518] => law
    [4519] => enforcement
    [4520] => security
    [4522] => intelligence
    [4523] => boca
    [4524] => raton
    [4525] => fl
    [4526] => crc
    [4527] => press
    [4528] => taylor
    [4529] => francis
    [4530] => group
    [4531] => isbn
    [4532] => 978-1-4398-6069-4
    [4533] => piatetsky-shapiro
    [4534] => gregory
    [4535] => parker
    [4536] => gary
    [4537] => 2011
    [4538] => lesson
    [4539] => data
    [4540] => mining
    [4542] => knowledge
    [4543] => discovery
    [4545] => introduction
    [4546] => introduction
    [4548] => data
    [4549] => mining
    [4550] => kd
    [4551] => nuggets
    [4552] => retrieved
    [4553] => 30
    [4554] => august
    [4555] => 2012
    [4556] => fayyad
    [4557] => usama
    [4558] => 15
    [4559] => june
    [4560] => 1999
    [4562] => editorial
    [4564] => editor-in-chief
    [4565] => sigkdd
    [4566] => explorations
    [4567] => 13
    [4568] => 1
    [4569] => 102
    [4570] => doi
    [4571] => 10
    [4572] => 1145
    [4573] => 2207243
    [4574] => 2207269
    [4575] => retrieved
    [4576] => 27
    [4577] => december
    [4578] => 2010
    [4579] => kantardzic
    [4580] => mehmed
    [4581] => 2003
    [4582] => data
    [4583] => mining
    [4584] => concepts
    [4585] => models
    [4586] => methods
    [4588] => algorithms
    [4589] => john
    [4590] => wiley
    [4591] => sons
    [4592] => isbn
    [4593] => 0-471-22852-4
    [4594] => oclc
    [4595] => 50055336
    [4596] => gregory
    [4597] => piatetsky-shapiro
    [4598] => 2002
    [4599] => kdnuggets
    [4600] => methodology
    [4601] => poll
    [4602] => gregory
    [4603] => piatetsky-shapiro
    [4604] => 2004
    [4605] => kdnuggets
    [4606] => methodology
    [4607] => poll
    [4608] => gregory
    [4609] => piatetsky-shapiro
    [4610] => 2007
    [4611] => kdnuggets
    [4612] => methodology
    [4613] => poll
    [4614] => gregory
    [4615] => piatetsky-shapiro
    [4616] => 2014
    [4617] => kdnuggets
    [4618] => methodology
    [4619] => poll
    [4620] => scar
    [4621] => marb
    [4622] => n
    [4623] => gonzalo
    [4624] => mariscal
    [4626] => javier
    [4627] => segovia
    [4628] => 2009
    [4630] => data
    [4631] => mining
    [4632] => knowledge
    [4633] => discovery
    [4634] => process
    [4635] => model
    [4637] => data
    [4638] => mining
    [4640] => knowledge
    [4641] => discovery
    [4643] => real
    [4644] => life
    [4645] => applications
    [4646] => book
    [4647] => edited
    [4649] => julio
    [4650] => ponce
    [4652] => adem
    [4653] => karahoca
    [4654] => isbn
    [4655] => 978-3-902613-53-0
    [4656] => pp
    [4657] => 438
    [4658] => 453
    [4659] => february
    [4660] => 2009
    [4661] => i-tech
    [4662] => vienna
    [4663] => austria
    [4664] => lukasz
    [4665] => kurgan
    [4667] => petr
    [4668] => musilek
    [4669] => 2006
    [4671] => survey
    [4673] => knowledge
    [4674] => discovery
    [4676] => data
    [4677] => mining
    [4678] => process
    [4679] => models
    [4681] => knowledge
    [4682] => engineering
    [4683] => review
    [4684] => volume
    [4685] => 21
    [4686] => issue
    [4687] => 1
    [4688] => march
    [4689] => 2006
    [4690] => pp
    [4691] => 1
    [4692] => 24
    [4693] => cambridge
    [4694] => university
    [4695] => press
    [4697] => york
    [4698] => ny
    [4699] => usa
    [4700] => doi
    [4701] => 10
    [4702] => 1017
    [4703] => s0269888906000737
    [4704] => azevedo
    [4707] => santos
    [4708] => m
    [4709] => f
    [4710] => kdd
    [4711] => semma
    [4713] => crisp-dm
    [4715] => parallel
    [4716] => overview
    [4717] => archived
    [4718] => 2013-01-09
    [4721] => wayback
    [4722] => machine
    [4724] => proceedings
    [4727] => iadis
    [4728] => european
    [4729] => conference
    [4731] => data
    [4732] => mining
    [4733] => 2008
    [4734] => pp
    [4735] => 182
    [4736] => 185
    [4737] => hawkins
    [4738] => douglas
    [4739] => m
    [4740] => 2004
    [4742] => problem
    [4744] => overfitting
    [4745] => journal
    [4747] => chemical
    [4748] => information
    [4750] => computer
    [4751] => sciences
    [4752] => 44
    [4753] => 1
    [4754] => 1
    [4755] => 12
    [4756] => doi
    [4757] => 10
    [4758] => 1021
    [4759] => ci0342472
    [4760] => microsoft
    [4761] => academic
    [4762] => search
    [4763] => top
    [4764] => conferences
    [4766] => data
    [4767] => mining
    [4768] => microsoft
    [4769] => academic
    [4770] => search
    [4771] => google
    [4772] => scholar
    [4773] => top
    [4774] => publications
    [4776] => data
    [4777] => mining
    [4778] => analysis
    [4779] => google
    [4780] => scholar
    [4781] => proceedings
    [4782] => international
    [4783] => conferences
    [4785] => knowledge
    [4786] => discovery
    [4788] => data
    [4789] => mining
    [4790] => acm
    [4792] => york
    [4793] => sigkdd
    [4794] => explorations
    [4795] => acm
    [4797] => york
    [4798] => g
    [4799] => nnemann
    [4800] => stephan
    [4801] => kremer
    [4802] => hardy
    [4803] => seidl
    [4804] => thomas
    [4805] => 2011
    [4807] => extension
    [4810] => pmml
    [4811] => standard
    [4813] => subspace
    [4814] => clustering
    [4815] => models
    [4816] => proceedings
    [4819] => 2011
    [4820] => workshop
    [4822] => predictive
    [4823] => markup
    [4824] => language
    [4825] => modeling
    [4827] => pmml
    [4828] => '11
    [4829] => p
    [4830] => 48
    [4831] => isbn
    [4832] => 978-1-4503-0837-3
    [4833] => doi
    [4834] => 10
    [4835] => 1145
    [4836] => 2023598
    [4837] => 2023605
    [4838] => seltzer
    [4839] => william
    [4841] => promise
    [4843] => pitfalls
    [4845] => data
    [4846] => mining
    [4847] => ethical
    [4848] => issues
    [4849] => pdf
    [4850] => pitts
    [4851] => chip
    [4852] => 15
    [4853] => march
    [4854] => 2007
    [4856] => end
    [4858] => illegal
    [4859] => domestic
    [4860] => spying
    [4862] => count
    [4865] => washington
    [4866] => spectator
    [4867] => archived
    [4870] => original
    [4872] => 2007-10-29
    [4873] => taipale
    [4874] => kim
    [4876] => 15
    [4877] => december
    [4878] => 2003
    [4879] => data
    [4880] => mining
    [4882] => domestic
    [4883] => security
    [4884] => connecting
    [4886] => dots
    [4888] => make
    [4889] => sense
    [4891] => data
    [4892] => columbia
    [4893] => science
    [4895] => technology
    [4896] => law
    [4897] => review
    [4898] => 5
    [4899] => 2
    [4900] => oclc
    [4901] => 45263753
    [4902] => ssrn
    [4903] => 546782
    [4904] => resig
    [4905] => john
    [4906] => teredesai
    [4907] => ankur
    [4908] => 2004
    [4910] => framework
    [4912] => mining
    [4913] => instant
    [4914] => messaging
    [4915] => services
    [4916] => proceedings
    [4919] => 2004
    [4920] => siam
    [4921] => dm
    [4922] => conference
    [4924] => b
    [4925] => c
    [4929] => dig
    [4930] => privacy
    [4931] => implications
    [4933] => data
    [4934] => mining
    [4935] => aggregation
    [4936] => archived
    [4937] => 2008-12-17
    [4940] => wayback
    [4941] => machine
    [4942] => nascio
    [4943] => research
    [4945] => september
    [4946] => 2004
    [4947] => ohm
    [4948] => paul
    [4950] => build
    [4952] => database
    [4954] => ruin
    [4955] => harvard
    [4956] => business
    [4957] => review
    [4958] => darwin
    [4959] => bond-graham
    [4960] => iron
    [4961] => cagebook
    [4964] => logical
    [4965] => end
    [4967] => facebook's
    [4968] => patents
    [4969] => counterpunch
    [4970] => org
    [4971] => 2013
    [4972] => 12
    [4973] => 03
    [4974] => darwin
    [4975] => bond-graham
    [4976] => inside
    [4978] => tech
    [4979] => industry's
    [4980] => startup
    [4981] => conference
    [4982] => counterpunch
    [4983] => org
    [4984] => 2013
    [4985] => 09
    [4986] => 11
    [4987] => aol
    [4988] => search
    [4989] => data
    [4990] => identified
    [4991] => individuals
    [4992] => securityfocus
    [4993] => august
    [4994] => 2006
    [4995] => kshetri
    [4996] => nir
    [4997] => 2014
    [4998] => big
    [4999] => data
    [5000] => s
    [5001] => impact
    [5003] => privacy
    [5004] => security
    [5006] => consumer
    [5007] => welfare
    [5008] => telecommunications
    [5009] => policy
    [5010] => 38
    [5011] => 11
    [5012] => 1134
    [5013] => 1145
    [5014] => doi
    [5015] => 10
    [5016] => 1016
    [5017] => j
    [5018] => telpol
    [5019] => 2014
    [5020] => 10
    [5021] => 002
    [5022] => biotech
    [5023] => business
    [5024] => week
    [5025] => editors
    [5026] => june
    [5027] => 30
    [5028] => 2008
    [5029] => biomedicine
    [5030] => hipaa
    [5031] => privacy
    [5032] => rule
    [5033] => impedes
    [5034] => biomedical
    [5035] => research
    [5036] => biotech
    [5037] => business
    [5038] => week
    [5039] => retrieved
    [5040] => 17
    [5041] => november
    [5042] => 2009
    [5044] => lexisnexis
    [5045] => academic
    [5046] => uk
    [5047] => researchers
    [5049] => data
    [5050] => mining
    [5054] => uk
    [5055] => copyright
    [5056] => laws
    [5057] => archived
    [5058] => june
    [5059] => 9
    [5060] => 2014
    [5063] => wayback
    [5064] => machine
    [5065] => out-law
    [5067] => retrieved
    [5068] => 14
    [5069] => november
    [5070] => 2014
    [5071] => licences
    [5073] => europe
    [5075] => structured
    [5076] => stakeholder
    [5077] => dialogue
    [5078] => 2013
    [5079] => european
    [5080] => commission
    [5081] => retrieved
    [5082] => 14
    [5083] => november
    [5084] => 2014
    [5085] => text
    [5087] => data
    [5088] => mining
    [5090] => importance
    [5095] => change
    [5097] => europe
    [5098] => association
    [5100] => european
    [5101] => research
    [5102] => libraries
    [5103] => retrieved
    [5104] => 14
    [5105] => november
    [5106] => 2014
    [5107] => judge
    [5108] => grants
    [5109] => summary
    [5110] => judgment
    [5112] => favor
    [5114] => google
    [5115] => books
    [5117] => fair
    [5119] => victory
    [5120] => lexology
    [5122] => antonelli
    [5123] => law
    [5125] => retrieved
    [5126] => 14
    [5127] => november
    [5128] => 2014
    [5129] => karl
    [5130] => rexer
    [5131] => heather
    [5132] => allen
    [5133] => paul
    [5134] => gearan
    [5135] => 2011
    [5136] => understanding
    [5137] => data
    [5138] => miners
    [5139] => analytics
    [5140] => magazine
    [5142] => june
    [5143] => 2011
    [5144] => informs
    [5145] => institute
    [5147] => operations
    [5148] => research
    [5151] => management
    [5152] => sciences
    [5153] => mikut
    [5154] => ralf
    [5155] => reischl
    [5156] => markus
    [5157] => september
    [5158] => october
    [5159] => 2011
    [5160] => data
    [5161] => mining
    [5162] => tools
    [5163] => wiley
    [5164] => interdisciplinary
    [5165] => reviews
    [5166] => data
    [5167] => mining
    [5169] => knowledge
    [5170] => discovery
    [5171] => 1
    [5172] => 5
    [5173] => 431
    [5174] => 445
    [5175] => doi
    [5176] => 10
    [5177] => 1002
    [5178] => widm
    [5179] => 24
    [5180] => retrieved
    [5181] => october
    [5182] => 21
    [5183] => 2011
    [5184] => kobielus
    [5185] => james
    [5187] => forrester
    [5188] => wave
    [5189] => predictive
    [5190] => analytics
    [5192] => data
    [5193] => mining
    [5194] => solutions
    [5195] => q1
    [5196] => 2010
    [5197] => forrester
    [5198] => research
    [5199] => 1
    [5200] => july
    [5201] => 2008
    [5202] => herschel
    [5203] => gareth
    [5204] => magic
    [5205] => quadrant
    [5207] => customer
    [5208] => data-mining
    [5209] => applications
    [5210] => gartner
    [5212] => 1
    [5213] => july
    [5214] => 2008
    [5215] => nisbet
    [5216] => robert
    [5218] => 2006
    [5219] => data
    [5220] => mining
    [5221] => tools
    [5227] => crm
    [5228] => part
    [5229] => 1
    [5230] => information
    [5231] => management
    [5232] => special
    [5233] => reports
    [5234] => january
    [5235] => 2006
    [5236] => haughton
    [5237] => dominique
    [5238] => deichmann
    [5239] => joel
    [5240] => eshghi
    [5241] => abdolreza
    [5242] => sayek
    [5243] => selin
    [5244] => teebagy
    [5245] => nicholas
    [5247] => topi
    [5248] => heikki
    [5249] => 2003
    [5251] => review
    [5253] => software
    [5254] => packages
    [5256] => data
    [5257] => mining
    [5259] => american
    [5260] => statistician
    [5261] => vol
    [5262] => 57
    [5264] => 4
    [5265] => pp
    [5266] => 290
    [5267] => 309
    [5268] => goebel
    [5269] => michael
    [5270] => gruenwald
    [5271] => le
    [5272] => 1999
    [5274] => survey
    [5276] => data
    [5277] => mining
    [5279] => knowledge
    [5280] => discovery
    [5281] => software
    [5282] => tools
    [5283] => sigkdd
    [5284] => explorations
    [5285] => vol
    [5286] => 1
    [5287] => issue
    [5288] => 1
    [5289] => pp
    [5290] => 20
    [5291] => 33
    [5293] => reading
    [5294] => edit
    [5295] => cabena
    [5296] => peter
    [5297] => hadjnian
    [5298] => pablo
    [5299] => stadler
    [5300] => rolf
    [5301] => verhees
    [5302] => jaap
    [5303] => zanasi
    [5304] => alessandro
    [5305] => 1997
    [5306] => discovering
    [5307] => data
    [5308] => mining
    [5310] => concept
    [5312] => implementation
    [5313] => prentice
    [5314] => hall
    [5315] => isbn
    [5316] => 0-13-743980-6
    [5317] => m
    [5318] => s
    [5319] => chen
    [5320] => j
    [5321] => han
    [5322] => p
    [5323] => s
    [5324] => yu
    [5325] => 1996
    [5326] => data
    [5327] => mining
    [5329] => overview
    [5332] => database
    [5333] => perspective
    [5334] => knowledge
    [5336] => data
    [5337] => engineering
    [5338] => ieee
    [5339] => transactions
    [5341] => 8
    [5342] => 6
    [5343] => 866
    [5344] => 883
    [5345] => feldman
    [5346] => ronen
    [5347] => sanger
    [5348] => james
    [5349] => 2007
    [5351] => text
    [5352] => mining
    [5353] => handbook
    [5354] => cambridge
    [5355] => university
    [5356] => press
    [5357] => isbn
    [5358] => 978-0-521-83657-9
    [5359] => guo
    [5360] => yike
    [5362] => grossman
    [5363] => robert
    [5364] => editors
    [5365] => 1999
    [5366] => high
    [5367] => performance
    [5368] => data
    [5369] => mining
    [5370] => scaling
    [5371] => algorithms
    [5372] => applications
    [5374] => systems
    [5375] => kluwer
    [5376] => academic
    [5377] => publishers
    [5378] => han
    [5379] => jiawei
    [5380] => micheline
    [5381] => kamber
    [5383] => jian
    [5384] => pei
    [5385] => data
    [5386] => mining
    [5387] => concepts
    [5389] => techniques
    [5390] => morgan
    [5391] => kaufmann
    [5392] => 2006
    [5393] => hastie
    [5394] => trevor
    [5395] => tibshirani
    [5396] => robert
    [5398] => friedman
    [5399] => jerome
    [5400] => 2001
    [5402] => elements
    [5404] => statistical
    [5405] => learning
    [5406] => data
    [5407] => mining
    [5408] => inference
    [5410] => prediction
    [5411] => springer
    [5412] => isbn
    [5413] => 0-387-95284-5
    [5414] => liu
    [5415] => bing
    [5416] => 2007
    [5417] => web
    [5418] => data
    [5419] => mining
    [5420] => exploring
    [5421] => hyperlinks
    [5422] => contents
    [5424] => usage
    [5425] => data
    [5426] => springer
    [5427] => isbn
    [5428] => 3-540-37881-2
    [5429] => murphy
    [5430] => chris
    [5431] => 16
    [5433] => 2011
    [5435] => data
    [5436] => mining
    [5437] => free
    [5438] => speech
    [5439] => informationweek
    [5440] => umb
    [5441] => 12
    [5442] => nisbet
    [5443] => robert
    [5444] => elder
    [5445] => john
    [5446] => miner
    [5447] => gary
    [5448] => 2009
    [5449] => handbook
    [5451] => statistical
    [5452] => analysis
    [5453] => data
    [5454] => mining
    [5455] => applications
    [5456] => academic
    [5457] => press
    [5458] => elsevier
    [5459] => isbn
    [5460] => 978-0-12-374765-5
    [5461] => poncelet
    [5462] => pascal
    [5463] => masseglia
    [5464] => florent
    [5466] => teisseire
    [5467] => maguelonne
    [5468] => editors
    [5469] => october
    [5470] => 2007
    [5471] => data
    [5472] => mining
    [5473] => patterns
    [5475] => methods
    [5477] => applications
    [5478] => information
    [5479] => science
    [5480] => reference
    [5481] => isbn
    [5482] => 978-1-59904-162-9
    [5483] => tan
    [5484] => pang-ning
    [5485] => steinbach
    [5486] => michael
    [5488] => kumar
    [5489] => vipin
    [5490] => 2005
    [5491] => introduction
    [5493] => data
    [5494] => mining
    [5495] => isbn
    [5496] => 0-321-32136-7
    [5497] => theodoridis
    [5498] => sergios
    [5500] => koutroumbas
    [5501] => konstantinos
    [5502] => 2009
    [5503] => pattern
    [5504] => recognition
    [5505] => 4th
    [5506] => edition
    [5507] => academic
    [5508] => press
    [5509] => isbn
    [5510] => 978-1-59749-272-0
    [5511] => weiss
    [5512] => sholom
    [5513] => m
    [5515] => indurkhya
    [5516] => nitin
    [5517] => 1998
    [5518] => predictive
    [5519] => data
    [5520] => mining
    [5521] => morgan
    [5522] => kaufmann
    [5523] => witten
    [5524] => ian
    [5525] => h
    [5526] => frank
    [5527] => eibe
    [5528] => hall
    [5529] => mark
    [5531] => 30
    [5532] => january
    [5533] => 2011
    [5534] => data
    [5535] => mining
    [5536] => practical
    [5537] => machine
    [5538] => learning
    [5539] => tools
    [5541] => techniques
    [5542] => 3
    [5543] => ed
    [5544] => elsevier
    [5545] => isbn
    [5546] => 978-0-12-374856-0
    [5549] => free
    [5550] => weka
    [5551] => software
    [5552] => ye
    [5553] => nong
    [5554] => 2003
    [5556] => handbook
    [5558] => data
    [5559] => mining
    [5560] => mahwah
    [5561] => nj
    [5562] => lawrence
    [5563] => erlbaum
    [5564] => external
    [5565] => links
    [5566] => edit
    [5567] => wikimedia
    [5568] => commons
    [5570] => media
    [5571] => related
    [5573] => data
    [5574] => mining
    [5575] => knowledge
    [5576] => discovery
    [5577] => software
    [5579] => dmoz
    [5580] => data
    [5581] => mining
    [5582] => tool
    [5583] => vendors
    [5585] => dmoz
    [5586] => v
    [5587] => t
    [5588] => e
    [5589] => data
    [5590] => storage
    [5591] => analysis
    [5592] => cleansing
    [5593] => compression
    [5594] => corruption
    [5595] => curation
    [5596] => editing
    [5597] => farming
    [5598] => fusion
    [5599] => integration
    [5600] => integrity
    [5601] => loss
    [5602] => mining
    [5603] => pre-processing
    [5604] => quality
    [5605] => reduction
    [5606] => scraping
    [5607] => scrubbing
    [5608] => security
    [5609] => validation
    [5610] => warehouse
    [5611] => wrangling
    [5612] => munging
    [5613] => protection
    [5614] => privacy
    [5615] => v
    [5616] => t
    [5617] => e
    [5618] => data
    [5619] => warehouse
    [5620] => creating
    [5622] => data
    [5623] => warehouse
    [5624] => concepts
    [5625] => database
    [5626] => dimension
    [5627] => dimensional
    [5628] => modeling
    [5629] => fact
    [5630] => olap
    [5631] => star
    [5632] => schema
    [5633] => aggregate
    [5634] => variants
    [5635] => anchor
    [5636] => modeling
    [5637] => column-oriented
    [5638] => dbms
    [5639] => data
    [5640] => vault
    [5641] => modeling
    [5642] => holap
    [5643] => molap
    [5644] => rolap
    [5645] => operational
    [5646] => data
    [5647] => store
    [5648] => elements
    [5649] => data
    [5650] => dictionary
    [5651] => metadata
    [5652] => data
    [5653] => mart
    [5654] => sixth
    [5655] => normal
    [5656] => form
    [5657] => surrogate
    [5658] => key
    [5659] => fact
    [5660] => fact
    [5661] => table
    [5662] => early-arriving
    [5663] => fact
    [5664] => measure
    [5665] => dimension
    [5666] => dimension
    [5667] => table
    [5668] => degenerate
    [5669] => slowly
    [5670] => changing
    [5671] => filling
    [5672] => extract-transform-load
    [5673] => etl
    [5674] => extract
    [5675] => transform
    [5676] => load
    [5679] => data
    [5680] => warehouse
    [5681] => concepts
    [5682] => business
    [5683] => intelligence
    [5684] => dashboard
    [5685] => data
    [5686] => mining
    [5687] => decision
    [5688] => support
    [5689] => system
    [5690] => dss
    [5691] => olap
    [5692] => cube
    [5693] => data
    [5694] => warehouse
    [5695] => automation
    [5696] => languages
    [5697] => data
    [5698] => mining
    [5699] => extensions
    [5700] => dmx
    [5701] => multidimensional
    [5702] => expressions
    [5703] => mdx
    [5704] => xml
    [5706] => analysis
    [5707] => xmla
    [5708] => tools
    [5709] => business
    [5710] => intelligence
    [5711] => software
    [5712] => reporting
    [5713] => software
    [5714] => spreadsheet
    [5715] => related
    [5716] => people
    [5717] => bill
    [5718] => inmon
    [5719] => ralph
    [5720] => kimball
    [5721] => products
    [5722] => comparison
    [5724] => olap
    [5725] => servers
    [5726] => data
    [5727] => warehousing
    [5728] => products
    [5731] => producers
    [5732] => v
    [5733] => t
    [5734] => e
    [5735] => major
    [5736] => fields
    [5738] => computer
    [5739] => science
    [5740] => note
    [5742] => template
    [5743] => roughly
    [5746] => 2012
    [5747] => acm
    [5748] => computing
    [5749] => classification
    [5750] => system
    [5751] => hardware
    [5752] => printed
    [5753] => circuit
    [5754] => board
    [5755] => peripheral
    [5756] => integrated
    [5757] => circuit
    [5758] => very-large-scale
    [5759] => integration
    [5760] => energy
    [5761] => consumption
    [5762] => electronic
    [5763] => design
    [5764] => automation
    [5765] => computer
    [5766] => systems
    [5767] => organization
    [5768] => computer
    [5769] => architecture
    [5770] => embedded
    [5771] => system
    [5772] => real-time
    [5773] => computing
    [5774] => dependability
    [5775] => networks
    [5776] => network
    [5777] => architecture
    [5778] => network
    [5779] => protocol
    [5780] => network
    [5781] => components
    [5782] => network
    [5783] => scheduler
    [5784] => network
    [5785] => performance
    [5786] => evaluation
    [5787] => network
    [5788] => service
    [5789] => software
    [5790] => organization
    [5791] => interpreter
    [5792] => middleware
    [5793] => virtual
    [5794] => machine
    [5795] => operating
    [5796] => system
    [5797] => software
    [5798] => quality
    [5799] => software
    [5800] => notations
    [5802] => tools
    [5803] => programming
    [5804] => paradigm
    [5805] => programming
    [5806] => language
    [5807] => compiler
    [5808] => domain-specific
    [5809] => language
    [5810] => modeling
    [5811] => language
    [5812] => software
    [5813] => framework
    [5814] => integrated
    [5815] => development
    [5816] => environment
    [5817] => software
    [5818] => configuration
    [5819] => management
    [5820] => software
    [5821] => library
    [5822] => software
    [5823] => repository
    [5824] => software
    [5825] => development
    [5826] => software
    [5827] => development
    [5828] => process
    [5829] => requirements
    [5830] => analysis
    [5831] => software
    [5832] => design
    [5833] => software
    [5834] => construction
    [5835] => software
    [5836] => deployment
    [5837] => software
    [5838] => maintenance
    [5839] => programming
    [5840] => team
    [5841] => open-source
    [5842] => model
    [5843] => theory
    [5845] => computation
    [5846] => model
    [5848] => computation
    [5849] => formal
    [5850] => language
    [5851] => automata
    [5852] => theory
    [5853] => computational
    [5854] => complexity
    [5855] => theory
    [5856] => logic
    [5857] => semantics
    [5858] => algorithms
    [5859] => algorithm
    [5860] => design
    [5861] => analysis
    [5863] => algorithms
    [5864] => randomized
    [5865] => algorithm
    [5866] => computational
    [5867] => geometry
    [5868] => mathematics
    [5870] => computing
    [5871] => discrete
    [5872] => mathematics
    [5873] => probability
    [5874] => statistics
    [5875] => mathematical
    [5876] => software
    [5877] => information
    [5878] => theory
    [5879] => mathematical
    [5880] => analysis
    [5881] => numerical
    [5882] => analysis
    [5883] => information
    [5884] => systems
    [5885] => database
    [5886] => management
    [5887] => system
    [5888] => information
    [5889] => storage
    [5890] => systems
    [5891] => enterprise
    [5892] => information
    [5893] => system
    [5894] => social
    [5895] => information
    [5896] => systems
    [5897] => geographic
    [5898] => information
    [5899] => system
    [5900] => decision
    [5901] => support
    [5902] => system
    [5903] => process
    [5904] => control
    [5905] => system
    [5906] => multimedia
    [5907] => information
    [5908] => system
    [5909] => data
    [5910] => mining
    [5911] => digital
    [5912] => library
    [5913] => computing
    [5914] => platform
    [5915] => digital
    [5916] => marketing
    [5917] => world
    [5918] => wide
    [5919] => web
    [5920] => information
    [5921] => retrieval
    [5922] => security
    [5923] => cryptography
    [5924] => formal
    [5925] => methods
    [5926] => security
    [5927] => services
    [5928] => intrusion
    [5929] => detection
    [5930] => system
    [5931] => hardware
    [5932] => security
    [5933] => network
    [5934] => security
    [5935] => information
    [5936] => security
    [5937] => application
    [5938] => security
    [5939] => human
    [5940] => computer
    [5941] => interaction
    [5942] => interaction
    [5943] => design
    [5944] => social
    [5945] => computing
    [5946] => ubiquitous
    [5947] => computing
    [5948] => visualization
    [5949] => accessibility
    [5950] => concurrency
    [5951] => concurrent
    [5952] => computing
    [5953] => parallel
    [5954] => computing
    [5955] => distributed
    [5956] => computing
    [5957] => multithreading
    [5958] => multiprocessing
    [5959] => artificial
    [5960] => intelligence
    [5961] => natural
    [5962] => language
    [5963] => processing
    [5964] => knowledge
    [5965] => representation
    [5967] => reasoning
    [5968] => computer
    [5969] => vision
    [5970] => automated
    [5971] => planning
    [5973] => scheduling
    [5974] => search
    [5975] => methodology
    [5976] => control
    [5977] => method
    [5978] => philosophy
    [5980] => artificial
    [5981] => intelligence
    [5982] => distributed
    [5983] => artificial
    [5984] => intelligence
    [5985] => machine
    [5986] => learning
    [5987] => supervised
    [5988] => learning
    [5989] => unsupervised
    [5990] => learning
    [5991] => reinforcement
    [5992] => learning
    [5993] => multi-task
    [5994] => learning
    [5995] => cross-validation
    [5996] => graphics
    [5997] => animation
    [5998] => rendering
    [5999] => image
    [6000] => manipulation
    [6001] => graphics
    [6002] => processing
    [6003] => unit
    [6004] => mixed
    [6005] => reality
    [6006] => virtual
    [6007] => reality
    [6008] => image
    [6009] => compression
    [6010] => solid
    [6011] => modeling
    [6012] => applied
    [6013] => computing
    [6014] => e-commerce
    [6015] => enterprise
    [6016] => software
    [6017] => computational
    [6018] => mathematics
    [6019] => computational
    [6020] => physics
    [6021] => computational
    [6022] => chemistry
    [6023] => computational
    [6024] => biology
    [6025] => computational
    [6026] => social
    [6027] => science
    [6028] => computational
    [6029] => engineering
    [6030] => computational
    [6031] => healthcare
    [6032] => digital
    [6033] => art
    [6034] => electronic
    [6035] => publishing
    [6036] => cyberwarfare
    [6037] => electronic
    [6038] => voting
    [6039] => video
    [6040] => game
    [6041] => word
    [6042] => processing
    [6043] => operations
    [6044] => research
    [6045] => educational
    [6046] => technology
    [6047] => document
    [6048] => management
    [6049] => book
    [6050] => category
    [6051] => portal
    [6052] => wikiproject
    [6053] => commons
    [6054] => authority
    [6055] => control
    [6056] => gnd
    [6057] => 4428654-5
    [6058] => ndl
    [6059] => 00948240
    [6060] => retrieved
    [6062] => https
    [6064] => wikipedia
    [6065] => org
    [6066] => w
    [6067] => index
    [6068] => php
    [6069] => title
    [6070] => data
    [6071] => mining
    [6072] => oldid
    [6073] => 804484174
    [6074] => categories
    [6075] => data
    [6076] => mining
    [6077] => formal
    [6078] => sciences
    [6079] => hidden
    [6080] => categories
    [6081] => cs1
    [6082] => maint
    [6083] => multiple
    [6084] => names
    [6085] => authors
    [6086] => list
    [6087] => webarchive
    [6088] => template
    [6089] => wayback
    [6090] => links
    [6091] => articles
    [6094] => expanded
    [6096] => september
    [6097] => 2011
    [6099] => articles
    [6101] => unsourced
    [6102] => statements
    [6103] => articles
    [6105] => unsourced
    [6106] => statements
    [6108] => april
    [6109] => 2014
    [6110] => articles
    [6112] => dmoz
    [6113] => links
    [6114] => wikipedia
    [6115] => articles
    [6117] => gnd
    [6118] => identifiers
    [6119] => navigation
    [6120] => menu
    [6121] => personal
    [6122] => tools
    [6124] => logged
    [6126] => talk
    [6127] => contributions
    [6128] => create
    [6129] => account
    [6130] => log
    [6132] => namespaces
    [6133] => article
    [6134] => talk
    [6135] => variants
    [6136] => views
    [6137] => read
    [6138] => edit
    [6139] => view
    [6140] => history
    [6142] => search
    [6143] => navigation
    [6144] => main
    [6145] => page
    [6146] => contents
    [6147] => featured
    [6148] => content
    [6149] => current
    [6150] => events
    [6151] => random
    [6152] => article
    [6153] => donate
    [6155] => wikipedia
    [6156] => wikipedia
    [6157] => store
    [6158] => interaction
    [6161] => wikipedia
    [6162] => community
    [6163] => portal
    [6164] => recent
    [6166] => contact
    [6167] => page
    [6168] => tools
    [6170] => links
    [6172] => related
    [6174] => upload
    [6175] => file
    [6176] => special
    [6177] => pages
    [6178] => permanent
    [6179] => link
    [6180] => page
    [6181] => information
    [6182] => wikidata
    [6183] => item
    [6184] => cite
    [6186] => page
    [6187] => print
    [6188] => export
    [6189] => create
    [6191] => book
    [6192] => download
    [6194] => pdf
    [6195] => printable
    [6196] => version
    [6199] => projects
    [6200] => wikimedia
    [6201] => commons
    [6202] => languages
    [6203] => az
    [6204] => rbaycanca
    [6205] => catal
    [6206] => e
    [6207] => tina
    [6208] => dansk
    [6209] => deutsch
    [6210] => eesti
    [6211] => espa
    [6212] => ol
    [6213] => euskara
    [6214] => fran
    [6215] => ais
    [6216] => hrvatski
    [6217] => bahasa
    [6218] => indonesia
    [6219] => italiano
    [6220] => latvie
    [6221] => u
    [6222] => magyar
    [6223] => nederlands
    [6224] => norsk
    [6225] => polski
    [6226] => portugu
    [6227] => s
    [6228] => rom
    [6229] => n
    [6230] => shqip
    [6231] => simple
    [6232] => english
    [6233] => sloven
    [6234] => ina
    [6235] => sloven
    [6236] => ina
    [6237] => srpski
    [6238] => srpskohrvatski
    [6239] => basa
    [6240] => sunda
    [6241] => suomi
    [6242] => svenska
    [6243] => t
    [6244] => rk
    [6245] => e
    [6246] => ti
    [6247] => ng
    [6248] => vi
    [6249] => t
    [6250] => edit
    [6251] => links
    [6253] => page
    [6256] => edited
    [6258] => 9
    [6259] => october
    [6260] => 2017
    [6262] => 09
    [6263] => 10
    [6264] => text
    [6269] => creative
    [6270] => commons
    [6271] => attribution-sharealike
    [6272] => license
    [6273] => additional
    [6274] => terms
    [6276] => apply
    [6280] => site
    [6282] => agree
    [6285] => terms
    [6289] => privacy
    [6290] => policy
    [6291] => wikipedia
    [6294] => registered
    [6295] => trademark
    [6298] => wikimedia
    [6299] => foundation
    [6302] => non-profit
    [6303] => organization
    [6304] => privacy
    [6305] => policy
    [6307] => wikipedia
    [6308] => disclaimers
    [6309] => contact
    [6310] => wikipedia
    [6311] => developers
    [6312] => cookie
    [6313] => statement
    [6314] => mobile
    [6315] => view
)
======================
Text: data mining - wikipedia data mining from wikipedia the free encyclop...
Total Keywords: 4440
======================

Demo2.php

<?php

// Demo 2: dump every keyword extracted from one document as an array,
// then output the miner's summary.

// Register the Wikipedia "Data mining" article as the input and run the miner.
$tm = new TextMiner();
$tm->addFile("http://en.wikipedia.org/wiki/Data_mining");
$tm->process();

// Print the full keyword array exactly as getKeywords() returns it.
printa($tm->getKeywords());

// Output the summary block.
// NOTE(review): if printSummary() already prints by itself, this echo is
// redundant (it would echo the method's return value) -- confirm against TextMiner.
echo $tm->printSummary();

?>