Demo 0 | Demo 1 | Demo 2 | Demo 3 | Demo 4 | Demo 5 | Code | Matt Smith

Demo 2

Array
(
    [1] => data
    [2] => mining
    [4] => wikipedia
    [5] => data
    [6] => mining
    [8] => wikipedia
    [10] => free
    [11] => encyclopedia
    [12] => jump
    [14] => navigation
    [15] => search
    [19] => confused
    [21] => analytics
    [22] => information
    [23] => extraction
    [25] => data
    [26] => analysis
    [27] => machine
    [28] => learning
    [30] => data
    [31] => mining
    [32] => problems
    [33] => classification
    [34] => clustering
    [35] => regression
    [36] => anomaly
    [37] => detection
    [38] => association
    [39] => rules
    [40] => reinforcement
    [41] => learning
    [42] => structured
    [43] => prediction
    [44] => feature
    [45] => engineering
    [46] => feature
    [47] => learning
    [48] => online
    [49] => learning
    [50] => semi-supervised
    [51] => learning
    [52] => unsupervised
    [53] => learning
    [54] => learning
    [56] => rank
    [57] => grammar
    [58] => induction
    [59] => supervised
    [60] => learning
    [61] => classification
    [62] => regression
    [63] => decision
    [64] => trees
    [65] => ensembles
    [66] => bagging
    [67] => boosting
    [68] => random
    [69] => forest
    [70] => k
    [71] => -nn
    [72] => linear
    [73] => regression
    [74] => naive
    [75] => bayes
    [76] => neural
    [77] => networks
    [78] => logistic
    [79] => regression
    [80] => perceptron
    [81] => relevance
    [82] => vector
    [83] => machine
    [84] => rvm
    [85] => support
    [86] => vector
    [87] => machine
    [88] => svm
    [89] => clustering
    [90] => birch
    [91] => hierarchical
    [92] => k
    [93] => -means
    [94] => expectation-maximization
    [95] => em
    [96] => dbscan
    [97] => optics
    [98] => mean-shift
    [99] => dimensionality
    [100] => reduction
    [101] => factor
    [102] => analysis
    [103] => cca
    [104] => ica
    [105] => lda
    [106] => nmf
    [107] => pca
    [108] => t-sne
    [109] => structured
    [110] => prediction
    [111] => graphical
    [112] => models
    [113] => bayes
    [114] => net
    [115] => crf
    [116] => hmm
    [117] => anomaly
    [118] => detection
    [119] => k
    [120] => -nn
    [121] => local
    [122] => outlier
    [123] => factor
    [124] => neural
    [125] => nets
    [126] => autoencoder
    [127] => deep
    [128] => learning
    [129] => multilayer
    [130] => perceptron
    [131] => rnn
    [132] => restricted
    [133] => boltzmann
    [134] => machine
    [135] => som
    [136] => convolutional
    [137] => neural
    [138] => network
    [139] => reinforcement
    [140] => learning
    [141] => q-learning
    [142] => sarsa
    [143] => temporal
    [144] => difference
    [145] => td
    [146] => theory
    [147] => bias-variance
    [148] => dilemma
    [149] => computational
    [150] => learning
    [151] => theory
    [152] => empirical
    [153] => risk
    [154] => minimization
    [155] => occam
    [156] => learning
    [157] => pac
    [158] => learning
    [159] => statistical
    [160] => learning
    [161] => vc
    [162] => theory
    [163] => machine
    [164] => learning
    [165] => venues
    [166] => nips
    [167] => icml
    [168] => ml
    [169] => jmlr
    [170] => arxiv
    [171] => cs
    [172] => lg
    [173] => related
    [174] => articles
    [175] => list
    [177] => datasets
    [179] => machine
    [180] => learning
    [181] => research
    [182] => outline
    [184] => machine
    [185] => learning
    [186] => machine
    [187] => learning
    [188] => portal
    [189] => v
    [190] => t
    [191] => e
    [192] => data
    [193] => mining
    [196] => computing
    [197] => process
    [199] => discovering
    [200] => patterns
    [202] => large
    [203] => data
    [204] => sets
    [205] => involving
    [206] => methods
    [209] => intersection
    [211] => machine
    [212] => learning
    [213] => statistics
    [215] => database
    [216] => systems
    [217] => 1
    [221] => interdisciplinary
    [222] => subfield
    [224] => computer
    [225] => science
    [226] => 1
    [227] => 2
    [228] => 3
    [231] => goal
    [234] => data
    [235] => mining
    [236] => process
    [239] => extract
    [240] => information
    [243] => data
    [244] => set
    [246] => transform
    [250] => understandable
    [251] => structure
    [255] => 1
    [259] => raw
    [260] => analysis
    [261] => step
    [263] => involves
    [264] => database
    [266] => data
    [267] => management
    [268] => aspects
    [269] => data
    [270] => pre-processing
    [271] => model
    [273] => inference
    [274] => considerations
    [275] => interestingness
    [276] => metrics
    [277] => complexity
    [278] => considerations
    [279] => post-processing
    [281] => discovered
    [282] => structures
    [283] => visualization
    [285] => online
    [286] => updating
    [287] => 1
    [288] => data
    [289] => mining
    [292] => analysis
    [293] => step
    [296] => knowledge
    [297] => discovery
    [299] => databases
    [300] => process
    [302] => kdd
    [303] => 4
    [305] => term
    [308] => misnomer
    [311] => goal
    [314] => extraction
    [316] => patterns
    [318] => knowledge
    [320] => large
    [321] => amounts
    [323] => data
    [326] => extraction
    [327] => mining
    [329] => data
    [331] => 5
    [336] => buzzword
    [337] => 6
    [340] => frequently
    [341] => applied
    [344] => form
    [346] => large-scale
    [347] => data
    [349] => information
    [350] => processing
    [351] => collection
    [352] => extraction
    [353] => warehousing
    [354] => analysis
    [356] => statistics
    [361] => application
    [363] => computer
    [364] => decision
    [365] => support
    [366] => system
    [367] => including
    [368] => artificial
    [369] => intelligence
    [370] => machine
    [371] => learning
    [373] => business
    [374] => intelligence
    [376] => book
    [377] => data
    [378] => mining
    [379] => practical
    [380] => machine
    [381] => learning
    [382] => tools
    [384] => techniques
    [386] => java
    [387] => 7
    [389] => covers
    [391] => machine
    [392] => learning
    [393] => material
    [395] => originally
    [398] => named
    [400] => practical
    [401] => machine
    [402] => learning
    [405] => term
    [406] => data
    [407] => mining
    [410] => added
    [412] => marketing
    [413] => reasons
    [414] => 8
    [418] => general
    [419] => terms
    [420] => large
    [421] => scale
    [422] => data
    [423] => analysis
    [425] => analytics
    [428] => referring
    [430] => actual
    [431] => methods
    [432] => artificial
    [433] => intelligence
    [435] => machine
    [436] => learning
    [441] => actual
    [442] => data
    [443] => mining
    [444] => task
    [447] => semi-automatic
    [449] => automatic
    [450] => analysis
    [452] => large
    [453] => quantities
    [455] => data
    [457] => extract
    [458] => previously
    [459] => unknown
    [460] => interesting
    [461] => patterns
    [464] => groups
    [466] => data
    [467] => records
    [468] => cluster
    [469] => analysis
    [470] => unusual
    [471] => records
    [472] => anomaly
    [473] => detection
    [475] => dependencies
    [476] => association
    [477] => rule
    [478] => mining
    [479] => sequential
    [480] => pattern
    [481] => mining
    [484] => involves
    [486] => database
    [487] => techniques
    [490] => spatial
    [491] => indices
    [493] => patterns
    [500] => kind
    [502] => summary
    [505] => input
    [506] => data
    [513] => analysis
    [518] => machine
    [519] => learning
    [521] => predictive
    [522] => analytics
    [526] => data
    [527] => mining
    [528] => step
    [530] => identify
    [531] => multiple
    [532] => groups
    [535] => data
    [542] => obtain
    [544] => accurate
    [545] => prediction
    [546] => results
    [549] => decision
    [550] => support
    [551] => system
    [554] => data
    [555] => collection
    [556] => data
    [557] => preparation
    [559] => result
    [560] => interpretation
    [562] => reporting
    [564] => part
    [567] => data
    [568] => mining
    [569] => step
    [572] => belong
    [576] => kdd
    [577] => process
    [579] => additional
    [580] => steps
    [582] => related
    [583] => terms
    [584] => data
    [585] => dredging
    [586] => data
    [587] => fishing
    [589] => data
    [590] => snooping
    [591] => refer
    [596] => data
    [597] => mining
    [598] => methods
    [600] => sample
    [601] => parts
    [604] => larger
    [605] => population
    [606] => data
    [607] => set
    [614] => small
    [616] => reliable
    [617] => statistical
    [618] => inferences
    [621] => made
    [624] => validity
    [627] => patterns
    [628] => discovered
    [630] => methods
    [636] => creating
    [638] => hypotheses
    [640] => test
    [643] => larger
    [644] => data
    [645] => populations
    [646] => contents
    [647] => 1
    [648] => etymology
    [649] => 2
    [650] => background
    [651] => 3
    [652] => process
    [653] => 3
    [654] => 1
    [655] => pre-processing
    [656] => 3
    [657] => 2
    [658] => data
    [659] => mining
    [660] => 3
    [661] => 3
    [662] => results
    [663] => validation
    [664] => 4
    [665] => research
    [666] => 5
    [667] => standards
    [668] => 6
    [669] => notable
    [671] => 7
    [672] => privacy
    [673] => concerns
    [675] => ethics
    [676] => 7
    [677] => 1
    [678] => situation
    [680] => europe
    [681] => 7
    [682] => 2
    [683] => situation
    [686] => united
    [687] => states
    [688] => 8
    [689] => copyright
    [690] => law
    [691] => 8
    [692] => 1
    [693] => situation
    [695] => europe
    [696] => 8
    [697] => 2
    [698] => situation
    [701] => united
    [702] => states
    [703] => 9
    [704] => software
    [705] => 9
    [706] => 1
    [707] => free
    [708] => open-source
    [709] => data
    [710] => mining
    [711] => software
    [713] => applications
    [714] => 9
    [715] => 2
    [716] => proprietary
    [717] => data-mining
    [718] => software
    [720] => applications
    [721] => 9
    [722] => 3
    [723] => marketplace
    [724] => surveys
    [725] => 10
    [728] => 11
    [729] => references
    [730] => 12
    [732] => reading
    [733] => 13
    [734] => external
    [735] => links
    [736] => etymology
    [737] => edit
    [740] => 1960s
    [741] => statisticians
    [743] => terms
    [745] => data
    [746] => fishing
    [748] => data
    [749] => dredging
    [751] => refer
    [755] => considered
    [757] => bad
    [758] => practice
    [760] => analyzing
    [761] => data
    [764] => a-priori
    [765] => hypothesis
    [767] => term
    [768] => data
    [769] => mining
    [770] => appeared
    [772] => 1990
    [775] => database
    [776] => community
    [779] => short
    [780] => time
    [782] => 1980s
    [784] => phrase
    [785] => database
    [786] => mining
    [793] => trademarked
    [795] => hnc
    [797] => san
    [798] => diego-based
    [799] => company
    [801] => pitch
    [803] => database
    [804] => mining
    [805] => workstation
    [806] => 9
    [807] => researchers
    [809] => turned
    [811] => data
    [812] => mining
    [814] => terms
    [816] => include
    [817] => data
    [818] => archaeology
    [819] => information
    [820] => harvesting
    [821] => information
    [822] => discovery
    [823] => knowledge
    [824] => extraction
    [826] => gregory
    [827] => piatetsky-shapiro
    [828] => coined
    [830] => term
    [831] => knowledge
    [832] => discovery
    [834] => databases
    [838] => workshop
    [842] => topic
    [843] => kdd-1989
    [846] => term
    [849] => popular
    [851] => ai
    [853] => machine
    [854] => learning
    [855] => community
    [858] => term
    [859] => data
    [860] => mining
    [863] => popular
    [866] => business
    [868] => press
    [869] => communities
    [870] => 10
    [873] => terms
    [874] => data
    [875] => mining
    [877] => knowledge
    [878] => discovery
    [881] => interchangeably
    [884] => academic
    [885] => community
    [887] => major
    [888] => forums
    [890] => research
    [891] => started
    [893] => 1995
    [897] => international
    [898] => conference
    [900] => data
    [901] => mining
    [903] => knowledge
    [904] => discovery
    [905] => kdd-95
    [907] => started
    [909] => montreal
    [911] => aaai
    [912] => sponsorship
    [915] => co-chaired
    [917] => usama
    [918] => fayyad
    [920] => ramasamy
    [921] => uthurusamy
    [923] => year
    [926] => 1996
    [927] => usama
    [928] => fayyad
    [929] => launched
    [931] => journal
    [933] => kluwer
    [934] => called
    [935] => data
    [936] => mining
    [938] => knowledge
    [939] => discovery
    [942] => founding
    [943] => editor-in-chief
    [946] => started
    [948] => sigkddd
    [949] => newsletter
    [950] => sigkdd
    [951] => explorations
    [952] => 11
    [954] => kdd
    [955] => international
    [956] => conference
    [959] => primary
    [960] => highest
    [961] => quality
    [962] => conference
    [964] => data
    [965] => mining
    [968] => acceptance
    [969] => rate
    [971] => research
    [972] => paper
    [973] => submissions
    [975] => 18
    [977] => journal
    [978] => data
    [979] => mining
    [981] => knowledge
    [982] => discovery
    [985] => primary
    [986] => research
    [987] => journal
    [990] => field
    [991] => background
    [992] => edit
    [994] => manual
    [995] => extraction
    [997] => patterns
    [999] => data
    [1001] => occurred
    [1003] => centuries
    [1004] => early
    [1005] => methods
    [1007] => identifying
    [1008] => patterns
    [1010] => data
    [1011] => include
    [1012] => bayes'
    [1013] => theorem
    [1014] => 1700s
    [1016] => regression
    [1017] => analysis
    [1018] => 1800s
    [1020] => proliferation
    [1021] => ubiquity
    [1023] => increasing
    [1024] => power
    [1026] => computer
    [1027] => technology
    [1029] => dramatically
    [1030] => increased
    [1031] => data
    [1032] => collection
    [1033] => storage
    [1035] => manipulation
    [1036] => ability
    [1038] => data
    [1039] => sets
    [1041] => grown
    [1043] => size
    [1045] => complexity
    [1046] => direct
    [1047] => hands-on
    [1048] => data
    [1049] => analysis
    [1051] => increasingly
    [1053] => augmented
    [1055] => indirect
    [1056] => automated
    [1057] => data
    [1058] => processing
    [1059] => aided
    [1062] => discoveries
    [1064] => computer
    [1065] => science
    [1068] => neural
    [1069] => networks
    [1070] => cluster
    [1071] => analysis
    [1072] => genetic
    [1073] => algorithms
    [1074] => 1950s
    [1075] => decision
    [1076] => trees
    [1078] => decision
    [1079] => rules
    [1080] => 1960s
    [1082] => support
    [1083] => vector
    [1084] => machines
    [1085] => 1990s
    [1086] => data
    [1087] => mining
    [1090] => process
    [1092] => applying
    [1094] => methods
    [1097] => intention
    [1099] => uncovering
    [1100] => hidden
    [1101] => patterns
    [1102] => 12
    [1104] => large
    [1105] => data
    [1106] => sets
    [1108] => bridges
    [1110] => gap
    [1112] => applied
    [1113] => statistics
    [1115] => artificial
    [1116] => intelligence
    [1119] => provide
    [1121] => mathematical
    [1122] => background
    [1124] => database
    [1125] => management
    [1127] => exploiting
    [1130] => data
    [1132] => stored
    [1134] => indexed
    [1136] => databases
    [1138] => execute
    [1140] => actual
    [1141] => learning
    [1143] => discovery
    [1144] => algorithms
    [1146] => efficiently
    [1147] => allowing
    [1149] => methods
    [1152] => applied
    [1155] => larger
    [1156] => data
    [1157] => sets
    [1158] => process
    [1159] => edit
    [1161] => knowledge
    [1162] => discovery
    [1164] => databases
    [1165] => kdd
    [1166] => process
    [1168] => commonly
    [1169] => defined
    [1172] => stages
    [1173] => 1
    [1174] => selection
    [1175] => 2
    [1176] => pre-processing
    [1177] => 3
    [1178] => transformation
    [1179] => 4
    [1180] => data
    [1181] => mining
    [1182] => 5
    [1183] => interpretation
    [1184] => evaluation
    [1185] => 4
    [1187] => exists
    [1191] => variations
    [1194] => theme
    [1198] => cross
    [1199] => industry
    [1200] => standard
    [1201] => process
    [1203] => data
    [1204] => mining
    [1205] => crisp-dm
    [1207] => defines
    [1209] => phases
    [1210] => 1
    [1211] => business
    [1212] => understanding
    [1213] => 2
    [1214] => data
    [1215] => understanding
    [1216] => 3
    [1217] => data
    [1218] => preparation
    [1219] => 4
    [1220] => modeling
    [1221] => 5
    [1222] => evaluation
    [1223] => 6
    [1224] => deployment
    [1227] => simplified
    [1228] => process
    [1231] => 1
    [1232] => pre-processing
    [1233] => 2
    [1234] => data
    [1235] => mining
    [1237] => 3
    [1238] => results
    [1239] => validation
    [1240] => polls
    [1241] => conducted
    [1243] => 2002
    [1244] => 2004
    [1245] => 2007
    [1247] => 2014
    [1248] => show
    [1251] => crisp-dm
    [1252] => methodology
    [1255] => leading
    [1256] => methodology
    [1259] => data
    [1260] => miners
    [1261] => 13
    [1265] => data
    [1266] => mining
    [1267] => standard
    [1268] => named
    [1271] => polls
    [1273] => semma
    [1275] => 3
    [1276] => 4
    [1277] => times
    [1280] => people
    [1281] => reported
    [1283] => crisp-dm
    [1285] => teams
    [1287] => researchers
    [1289] => published
    [1290] => reviews
    [1292] => data
    [1293] => mining
    [1294] => process
    [1295] => models
    [1296] => 14
    [1297] => 15
    [1299] => azevedo
    [1301] => santos
    [1302] => conducted
    [1304] => comparison
    [1306] => crisp-dm
    [1308] => semma
    [1310] => 2008
    [1311] => 16
    [1312] => pre-processing
    [1313] => edit
    [1315] => data
    [1316] => mining
    [1317] => algorithms
    [1322] => target
    [1323] => data
    [1324] => set
    [1327] => assembled
    [1329] => data
    [1330] => mining
    [1333] => uncover
    [1334] => patterns
    [1336] => present
    [1339] => data
    [1341] => target
    [1342] => data
    [1343] => set
    [1346] => large
    [1351] => patterns
    [1353] => remaining
    [1354] => concise
    [1358] => mined
    [1361] => acceptable
    [1362] => time
    [1363] => limit
    [1365] => common
    [1366] => source
    [1368] => data
    [1371] => data
    [1372] => mart
    [1374] => data
    [1375] => warehouse
    [1376] => pre-processing
    [1378] => essential
    [1380] => analyze
    [1382] => multivariate
    [1383] => data
    [1384] => sets
    [1386] => data
    [1387] => mining
    [1389] => target
    [1390] => set
    [1393] => cleaned
    [1394] => data
    [1395] => cleaning
    [1396] => removes
    [1398] => observations
    [1400] => noise
    [1404] => missing
    [1405] => data
    [1406] => data
    [1407] => mining
    [1408] => edit
    [1409] => data
    [1410] => mining
    [1411] => involves
    [1413] => common
    [1414] => classes
    [1416] => tasks
    [1417] => 4
    [1418] => anomaly
    [1419] => detection
    [1420] => outlier
    [1421] => change
    [1422] => deviation
    [1423] => detection
    [1425] => identification
    [1427] => unusual
    [1428] => data
    [1429] => records
    [1433] => interesting
    [1435] => data
    [1436] => errors
    [1438] => require
    [1440] => investigation
    [1441] => association
    [1442] => rule
    [1443] => learning
    [1444] => dependency
    [1445] => modelling
    [1446] => searches
    [1448] => relationships
    [1450] => variables
    [1454] => supermarket
    [1456] => gather
    [1457] => data
    [1459] => customer
    [1460] => purchasing
    [1461] => habits
    [1463] => association
    [1464] => rule
    [1465] => learning
    [1467] => supermarket
    [1469] => determine
    [1471] => products
    [1473] => frequently
    [1474] => bought
    [1479] => information
    [1481] => marketing
    [1482] => purposes
    [1486] => referred
    [1489] => market
    [1490] => basket
    [1491] => analysis
    [1492] => clustering
    [1495] => task
    [1497] => discovering
    [1498] => groups
    [1500] => structures
    [1503] => data
    [1511] => similar
    [1515] => structures
    [1518] => data
    [1519] => classification
    [1522] => task
    [1524] => generalizing
    [1526] => structure
    [1528] => apply
    [1531] => data
    [1535] => e-mail
    [1536] => program
    [1538] => attempt
    [1540] => classify
    [1542] => e-mail
    [1544] => legitimate
    [1547] => spam
    [1548] => regression
    [1549] => attempts
    [1551] => find
    [1553] => function
    [1555] => models
    [1557] => data
    [1561] => error
    [1565] => estimating
    [1567] => relationships
    [1569] => data
    [1571] => datasets
    [1572] => summarization
    [1573] => providing
    [1576] => compact
    [1577] => representation
    [1580] => data
    [1581] => set
    [1582] => including
    [1583] => visualization
    [1585] => report
    [1586] => generation
    [1587] => results
    [1588] => validation
    [1589] => edit
    [1593] => data
    [1594] => produced
    [1596] => data
    [1597] => dredging
    [1600] => bot
    [1601] => operated
    [1603] => statistician
    [1604] => tyler
    [1605] => vigen
    [1606] => apparently
    [1607] => showing
    [1609] => close
    [1610] => link
    [1614] => word
    [1615] => winning
    [1617] => spelling
    [1618] => bee
    [1619] => competition
    [1622] => number
    [1624] => people
    [1627] => united
    [1628] => states
    [1629] => killed
    [1631] => venomous
    [1632] => spiders
    [1634] => similarity
    [1636] => trends
    [1640] => coincidence
    [1641] => data
    [1642] => mining
    [1644] => unintentionally
    [1646] => misused
    [1650] => produce
    [1651] => results
    [1656] => significant
    [1662] => predict
    [1663] => future
    [1664] => behaviour
    [1668] => reproduced
    [1672] => sample
    [1674] => data
    [1676] => bear
    [1681] => results
    [1683] => investigating
    [1686] => hypotheses
    [1689] => performing
    [1690] => proper
    [1691] => statistical
    [1692] => hypothesis
    [1693] => testing
    [1695] => simple
    [1696] => version
    [1699] => problem
    [1701] => machine
    [1702] => learning
    [1706] => overfitting
    [1710] => problem
    [1712] => arise
    [1715] => phases
    [1718] => process
    [1722] => train
    [1723] => test
    [1724] => split
    [1727] => applicable
    [1734] => sufficient
    [1736] => prevent
    [1739] => happening
    [1740] => 17
    [1742] => section
    [1744] => missing
    [1745] => information
    [1747] => non-classification
    [1748] => tasks
    [1750] => data
    [1751] => mining
    [1754] => covers
    [1755] => machine
    [1756] => learning
    [1758] => expand
    [1760] => section
    [1762] => include
    [1764] => information
    [1766] => details
    [1768] => exist
    [1771] => talk
    [1772] => page
    [1773] => september
    [1774] => 2011
    [1776] => final
    [1777] => step
    [1779] => knowledge
    [1780] => discovery
    [1782] => data
    [1785] => verify
    [1788] => patterns
    [1789] => produced
    [1792] => data
    [1793] => mining
    [1794] => algorithms
    [1795] => occur
    [1798] => wider
    [1799] => data
    [1800] => set
    [1803] => patterns
    [1804] => found
    [1807] => data
    [1808] => mining
    [1809] => algorithms
    [1811] => necessarily
    [1812] => valid
    [1815] => common
    [1818] => data
    [1819] => mining
    [1820] => algorithms
    [1822] => find
    [1823] => patterns
    [1826] => training
    [1827] => set
    [1831] => present
    [1834] => general
    [1835] => data
    [1836] => set
    [1839] => called
    [1840] => overfitting
    [1842] => overcome
    [1845] => evaluation
    [1848] => test
    [1849] => set
    [1851] => data
    [1855] => data
    [1856] => mining
    [1857] => algorithm
    [1860] => trained
    [1862] => learned
    [1863] => patterns
    [1865] => applied
    [1868] => test
    [1869] => set
    [1872] => resulting
    [1873] => output
    [1875] => compared
    [1878] => desired
    [1879] => output
    [1883] => data
    [1884] => mining
    [1885] => algorithm
    [1888] => distinguish
    [1889] => spam
    [1891] => legitimate
    [1892] => emails
    [1895] => trained
    [1898] => training
    [1899] => set
    [1901] => sample
    [1902] => e-mails
    [1904] => trained
    [1906] => learned
    [1907] => patterns
    [1910] => applied
    [1913] => test
    [1914] => set
    [1916] => e-mails
    [1923] => trained
    [1925] => accuracy
    [1928] => patterns
    [1932] => measured
    [1936] => e-mails
    [1938] => correctly
    [1939] => classify
    [1941] => number
    [1943] => statistical
    [1944] => methods
    [1949] => evaluate
    [1951] => algorithm
    [1954] => roc
    [1955] => curves
    [1958] => learned
    [1959] => patterns
    [1962] => meet
    [1964] => desired
    [1965] => standards
    [1966] => subsequently
    [1971] => re-evaluate
    [1973] => change
    [1975] => pre-processing
    [1977] => data
    [1978] => mining
    [1979] => steps
    [1982] => learned
    [1983] => patterns
    [1985] => meet
    [1987] => desired
    [1988] => standards
    [1991] => final
    [1992] => step
    [1995] => interpret
    [1997] => learned
    [1998] => patterns
    [2000] => turn
    [2003] => knowledge
    [2004] => research
    [2005] => edit
    [2007] => premier
    [2008] => professional
    [2009] => body
    [2012] => field
    [2015] => association
    [2017] => computing
    [2018] => machinery
    [2019] => 's
    [2020] => acm
    [2021] => special
    [2022] => interest
    [2023] => group
    [2024] => sig
    [2026] => knowledge
    [2027] => discovery
    [2029] => data
    [2030] => mining
    [2031] => sigkdd
    [2032] => 18
    [2033] => 19
    [2035] => 1989
    [2037] => acm
    [2038] => sig
    [2040] => hosted
    [2042] => annual
    [2043] => international
    [2044] => conference
    [2046] => published
    [2048] => proceedings
    [2049] => 20
    [2052] => 1999
    [2055] => published
    [2057] => biannual
    [2058] => academic
    [2059] => journal
    [2060] => titled
    [2061] => sigkdd
    [2062] => explorations
    [2063] => 21
    [2064] => computer
    [2065] => science
    [2066] => conferences
    [2068] => data
    [2069] => mining
    [2070] => include
    [2071] => cikm
    [2072] => conference
    [2073] => acm
    [2074] => conference
    [2076] => information
    [2078] => knowledge
    [2079] => management
    [2080] => dmin
    [2081] => conference
    [2082] => international
    [2083] => conference
    [2085] => data
    [2086] => mining
    [2087] => dmkd
    [2088] => conference
    [2089] => research
    [2090] => issues
    [2092] => data
    [2093] => mining
    [2095] => knowledge
    [2096] => discovery
    [2097] => dsaa
    [2098] => conference
    [2099] => ieee
    [2100] => international
    [2101] => conference
    [2103] => data
    [2104] => science
    [2106] => advanced
    [2107] => analytics
    [2108] => ecdm
    [2109] => conference
    [2110] => european
    [2111] => conference
    [2113] => data
    [2114] => mining
    [2115] => ecml-pkdd
    [2116] => conference
    [2117] => european
    [2118] => conference
    [2120] => machine
    [2121] => learning
    [2123] => principles
    [2125] => practice
    [2127] => knowledge
    [2128] => discovery
    [2130] => databases
    [2131] => edm
    [2132] => conference
    [2133] => international
    [2134] => conference
    [2136] => educational
    [2137] => data
    [2138] => mining
    [2139] => infocom
    [2140] => conference
    [2141] => ieee
    [2142] => infocom
    [2143] => icdm
    [2144] => conference
    [2145] => ieee
    [2146] => international
    [2147] => conference
    [2149] => data
    [2150] => mining
    [2151] => kdd
    [2152] => conference
    [2153] => acm
    [2154] => sigkdd
    [2155] => conference
    [2157] => knowledge
    [2158] => discovery
    [2160] => data
    [2161] => mining
    [2162] => mldm
    [2163] => conference
    [2164] => machine
    [2165] => learning
    [2167] => data
    [2168] => mining
    [2170] => pattern
    [2171] => recognition
    [2172] => pakdd
    [2173] => conference
    [2175] => annual
    [2176] => pacific-asia
    [2177] => conference
    [2179] => knowledge
    [2180] => discovery
    [2182] => data
    [2183] => mining
    [2184] => paw
    [2185] => conference
    [2186] => predictive
    [2187] => analytics
    [2188] => world
    [2189] => sdm
    [2190] => conference
    [2191] => siam
    [2192] => international
    [2193] => conference
    [2195] => data
    [2196] => mining
    [2197] => siam
    [2198] => sstd
    [2199] => symposium
    [2200] => symposium
    [2202] => spatial
    [2204] => temporal
    [2205] => databases
    [2206] => wsdm
    [2207] => conference
    [2208] => acm
    [2209] => conference
    [2211] => web
    [2212] => search
    [2214] => data
    [2215] => mining
    [2216] => data
    [2217] => mining
    [2218] => topics
    [2221] => present
    [2224] => data
    [2225] => management
    [2226] => database
    [2227] => conferences
    [2231] => icde
    [2232] => conference
    [2233] => sigmod
    [2234] => conference
    [2236] => international
    [2237] => conference
    [2240] => large
    [2241] => data
    [2242] => bases
    [2243] => standards
    [2244] => edit
    [2249] => efforts
    [2251] => define
    [2252] => standards
    [2255] => data
    [2256] => mining
    [2257] => process
    [2261] => 1999
    [2262] => european
    [2263] => cross
    [2264] => industry
    [2265] => standard
    [2266] => process
    [2268] => data
    [2269] => mining
    [2270] => crisp-dm
    [2271] => 1
    [2272] => 0
    [2275] => 2004
    [2276] => java
    [2277] => data
    [2278] => mining
    [2279] => standard
    [2280] => jdm
    [2281] => 1
    [2282] => 0
    [2283] => development
    [2285] => successors
    [2288] => processes
    [2289] => crisp-dm
    [2290] => 2
    [2291] => 0
    [2293] => jdm
    [2294] => 2
    [2295] => 0
    [2297] => active
    [2299] => 2006
    [2302] => stalled
    [2304] => jdm
    [2305] => 2
    [2306] => 0
    [2308] => withdrawn
    [2310] => reaching
    [2312] => final
    [2313] => draft
    [2315] => exchanging
    [2317] => extracted
    [2318] => models
    [2324] => predictive
    [2325] => analytics
    [2327] => key
    [2328] => standard
    [2331] => predictive
    [2332] => model
    [2333] => markup
    [2334] => language
    [2335] => pmml
    [2339] => xml
    [2340] => -based
    [2341] => language
    [2342] => developed
    [2345] => data
    [2346] => mining
    [2347] => group
    [2348] => dmg
    [2350] => supported
    [2352] => exchange
    [2353] => format
    [2356] => data
    [2357] => mining
    [2358] => applications
    [2362] => suggests
    [2365] => covers
    [2366] => prediction
    [2367] => models
    [2370] => data
    [2371] => mining
    [2372] => task
    [2374] => high
    [2375] => importance
    [2377] => business
    [2378] => applications
    [2380] => extensions
    [2382] => cover
    [2385] => subspace
    [2386] => clustering
    [2389] => proposed
    [2390] => independently
    [2393] => dmg
    [2394] => 22
    [2395] => notable
    [2397] => edit
    [2398] => main
    [2399] => article
    [2400] => examples
    [2402] => data
    [2403] => mining
    [2406] => category
    [2407] => applied
    [2408] => data
    [2409] => mining
    [2410] => data
    [2411] => mining
    [2417] => digital
    [2418] => data
    [2420] => today
    [2421] => notable
    [2422] => examples
    [2424] => data
    [2425] => mining
    [2428] => found
    [2430] => business
    [2431] => medicine
    [2432] => science
    [2434] => surveillance
    [2435] => privacy
    [2436] => concerns
    [2438] => ethics
    [2439] => edit
    [2442] => term
    [2443] => data
    [2444] => mining
    [2449] => ethical
    [2450] => implications
    [2457] => mining
    [2459] => information
    [2461] => relation
    [2463] => peoples'
    [2464] => behavior
    [2465] => ethical
    [2468] => 23
    [2470] => ways
    [2473] => data
    [2474] => mining
    [2481] => cases
    [2483] => contexts
    [2484] => raise
    [2485] => questions
    [2487] => privacy
    [2488] => legality
    [2490] => ethics
    [2491] => 24
    [2494] => data
    [2495] => mining
    [2496] => government
    [2498] => commercial
    [2499] => data
    [2500] => sets
    [2502] => national
    [2503] => security
    [2505] => law
    [2506] => enforcement
    [2507] => purposes
    [2512] => total
    [2513] => information
    [2514] => awareness
    [2515] => program
    [2518] => advise
    [2520] => raised
    [2521] => privacy
    [2522] => concerns
    [2523] => 25
    [2524] => 26
    [2525] => data
    [2526] => mining
    [2527] => requires
    [2528] => data
    [2529] => preparation
    [2532] => uncover
    [2533] => information
    [2535] => patterns
    [2538] => compromise
    [2539] => confidentiality
    [2541] => privacy
    [2542] => obligations
    [2544] => common
    [2549] => occur
    [2552] => data
    [2553] => aggregation
    [2554] => data
    [2555] => aggregation
    [2556] => involves
    [2557] => combining
    [2558] => data
    [2560] => possibly
    [2563] => sources
    [2568] => facilitates
    [2569] => analysis
    [2574] => make
    [2575] => identification
    [2577] => private
    [2578] => individual-level
    [2579] => data
    [2580] => deducible
    [2583] => apparent
    [2584] => 27
    [2588] => data
    [2589] => mining
    [2591] => se
    [2594] => result
    [2597] => preparation
    [2599] => data
    [2604] => purposes
    [2607] => analysis
    [2609] => threat
    [2612] => individual's
    [2613] => privacy
    [2616] => play
    [2619] => data
    [2621] => compiled
    [2624] => data
    [2625] => miner
    [2630] => access
    [2633] => newly
    [2634] => compiled
    [2635] => data
    [2636] => set
    [2641] => identify
    [2642] => specific
    [2643] => individuals
    [2647] => data
    [2649] => originally
    [2650] => anonymous
    [2651] => 28
    [2652] => 29
    [2653] => 30
    [2656] => recommended
    [2659] => individual
    [2661] => made
    [2662] => aware
    [2667] => data
    [2669] => collected
    [2670] => 27
    [2672] => purpose
    [2675] => data
    [2676] => collection
    [2680] => data
    [2681] => mining
    [2682] => projects
    [2685] => data
    [2694] => mine
    [2696] => data
    [2700] => data
    [2703] => derivatives
    [2705] => status
    [2707] => security
    [2708] => surrounding
    [2709] => access
    [2712] => data
    [2714] => collected
    [2715] => data
    [2718] => updated
    [2719] => data
    [2723] => modified
    [2728] => anonymous
    [2731] => individuals
    [2734] => readily
    [2736] => identified
    [2737] => 27
    [2740] => de-identified
    [2741] => anonymized
    [2742] => data
    [2743] => sets
    [2745] => potentially
    [2748] => information
    [2751] => identification
    [2753] => individuals
    [2755] => occurred
    [2757] => journalists
    [2761] => find
    [2763] => individuals
    [2764] => based
    [2767] => set
    [2769] => search
    [2770] => histories
    [2773] => inadvertently
    [2774] => released
    [2776] => aol
    [2777] => 31
    [2779] => inadvertent
    [2780] => revelation
    [2782] => personally
    [2783] => identifiable
    [2784] => information
    [2785] => leading
    [2788] => provider
    [2789] => violates
    [2790] => fair
    [2791] => information
    [2792] => practices
    [2794] => indiscretion
    [2797] => financial
    [2798] => emotional
    [2800] => bodily
    [2801] => harm
    [2805] => individual
    [2808] => instance
    [2810] => privacy
    [2811] => violation
    [2813] => patrons
    [2815] => walgreens
    [2816] => filed
    [2818] => lawsuit
    [2821] => company
    [2823] => 2011
    [2825] => selling
    [2826] => prescription
    [2827] => information
    [2829] => data
    [2830] => mining
    [2831] => companies
    [2834] => turn
    [2835] => provided
    [2837] => data
    [2839] => pharmaceutical
    [2840] => companies
    [2841] => 32
    [2842] => situation
    [2844] => europe
    [2845] => edit
    [2846] => europe
    [2849] => strong
    [2850] => privacy
    [2851] => laws
    [2853] => efforts
    [2855] => underway
    [2858] => strengthen
    [2860] => rights
    [2863] => consumers
    [2866] => u
    [2867] => s
    [2868] => -e
    [2869] => u
    [2870] => safe
    [2871] => harbor
    [2872] => principles
    [2874] => effectively
    [2875] => expose
    [2876] => european
    [2877] => users
    [2879] => privacy
    [2880] => exploitation
    [2882] => u
    [2883] => s
    [2884] => companies
    [2887] => consequence
    [2889] => edward
    [2890] => snowden
    [2891] => 's
    [2892] => global
    [2893] => surveillance
    [2894] => disclosure
    [2898] => increased
    [2899] => discussion
    [2901] => revoke
    [2903] => agreement
    [2908] => data
    [2911] => fully
    [2912] => exposed
    [2915] => national
    [2916] => security
    [2917] => agency
    [2919] => attempts
    [2921] => reach
    [2923] => agreement
    [2925] => failed
    [2926] => citation
    [2927] => needed
    [2928] => situation
    [2931] => united
    [2932] => states
    [2933] => edit
    [2936] => united
    [2937] => states
    [2938] => privacy
    [2939] => concerns
    [2942] => addressed
    [2946] => congress
    [2949] => passage
    [2951] => regulatory
    [2952] => controls
    [2956] => health
    [2957] => insurance
    [2958] => portability
    [2960] => accountability
    [2961] => act
    [2962] => hipaa
    [2964] => hipaa
    [2965] => requires
    [2966] => individuals
    [2968] => give
    [2970] => informed
    [2971] => consent
    [2973] => information
    [2975] => provide
    [2978] => intended
    [2979] => present
    [2981] => future
    [2986] => article
    [2988] => biotech
    [2989] => business
    [2990] => week
    [2991] => '
    [2993] => n
    [2994] => practice
    [2995] => hipaa
    [2998] => offer
    [3000] => greater
    [3001] => protection
    [3004] => longstanding
    [3005] => regulations
    [3008] => research
    [3009] => arena
    [3010] => '
    [3013] => aahc
    [3015] => importantly
    [3017] => rule's
    [3018] => goal
    [3020] => protection
    [3022] => informed
    [3023] => consent
    [3025] => undermined
    [3028] => complexity
    [3030] => consent
    [3031] => forms
    [3034] => required
    [3036] => patients
    [3038] => participants
    [3040] => approach
    [3042] => level
    [3044] => incomprehensibility
    [3046] => average
    [3047] => individuals
    [3048] => 33
    [3050] => underscores
    [3052] => necessity
    [3054] => data
    [3055] => anonymity
    [3057] => data
    [3058] => aggregation
    [3060] => mining
    [3061] => practices
    [3062] => u
    [3063] => s
    [3064] => information
    [3065] => privacy
    [3066] => legislation
    [3069] => hipaa
    [3072] => family
    [3073] => educational
    [3074] => rights
    [3076] => privacy
    [3077] => act
    [3078] => ferpa
    [3079] => applies
    [3083] => specific
    [3084] => areas
    [3088] => law
    [3089] => addresses
    [3092] => data
    [3093] => mining
    [3096] => majority
    [3098] => businesses
    [3101] => u
    [3102] => s
    [3105] => controlled
    [3108] => legislation
    [3109] => copyright
    [3110] => law
    [3111] => edit
    [3112] => situation
    [3114] => europe
    [3115] => edit
    [3116] => due
    [3119] => lack
    [3121] => flexibilities
    [3123] => european
    [3124] => copyright
    [3126] => database
    [3127] => law
    [3129] => mining
    [3131] => in-copyright
    [3132] => works
    [3135] => web
    [3136] => mining
    [3139] => permission
    [3142] => copyright
    [3143] => owner
    [3146] => legal
    [3149] => database
    [3151] => pure
    [3152] => data
    [3154] => europe
    [3161] => copyright
    [3163] => database
    [3164] => rights
    [3166] => exist
    [3168] => data
    [3169] => mining
    [3171] => subject
    [3173] => regulations
    [3176] => database
    [3177] => directive
    [3180] => recommendation
    [3183] => hargreaves
    [3184] => review
    [3186] => led
    [3189] => uk
    [3190] => government
    [3192] => amend
    [3194] => copyright
    [3195] => law
    [3197] => 2014
    [3198] => 34
    [3201] => content
    [3202] => mining
    [3205] => limitation
    [3207] => exception
    [3211] => country
    [3214] => world
    [3219] => japan
    [3221] => introduced
    [3223] => exception
    [3225] => 2009
    [3227] => data
    [3228] => mining
    [3230] => due
    [3233] => restriction
    [3236] => copyright
    [3237] => directive
    [3239] => uk
    [3240] => exception
    [3243] => content
    [3244] => mining
    [3246] => non-commercial
    [3247] => purposes
    [3248] => uk
    [3249] => copyright
    [3250] => law
    [3256] => provision
    [3259] => overridden
    [3261] => contractual
    [3262] => terms
    [3264] => conditions
    [3266] => european
    [3267] => commission
    [3268] => facilitated
    [3269] => stakeholder
    [3270] => discussion
    [3272] => text
    [3274] => data
    [3275] => mining
    [3277] => 2013
    [3280] => title
    [3282] => licences
    [3284] => europe
    [3285] => 35
    [3287] => focus
    [3290] => solution
    [3293] => legal
    [3294] => issue
    [3296] => licences
    [3299] => limitations
    [3301] => exceptions
    [3302] => led
    [3304] => representatives
    [3306] => universities
    [3307] => researchers
    [3308] => libraries
    [3309] => civil
    [3310] => society
    [3311] => groups
    [3313] => open
    [3314] => access
    [3315] => publishers
    [3317] => leave
    [3319] => stakeholder
    [3320] => dialogue
    [3323] => 2013
    [3324] => 36
    [3325] => situation
    [3328] => united
    [3329] => states
    [3330] => edit
    [3332] => contrast
    [3334] => europe
    [3336] => flexible
    [3337] => nature
    [3340] => copyright
    [3341] => law
    [3345] => fair
    [3347] => means
    [3349] => content
    [3350] => mining
    [3352] => america
    [3357] => fair
    [3359] => countries
    [3362] => israel
    [3363] => taiwan
    [3365] => south
    [3366] => korea
    [3368] => viewed
    [3371] => legal
    [3373] => content
    [3374] => mining
    [3376] => transformative
    [3382] => supplant
    [3384] => original
    [3385] => work
    [3388] => viewed
    [3391] => lawful
    [3393] => fair
    [3398] => part
    [3401] => google
    [3402] => book
    [3403] => settlement
    [3405] => presiding
    [3406] => judge
    [3409] => case
    [3410] => ruled
    [3412] => google's
    [3413] => digitisation
    [3414] => project
    [3416] => in-copyright
    [3417] => books
    [3419] => lawful
    [3421] => part
    [3425] => transformative
    [3429] => digitisation
    [3430] => project
    [3431] => displayed
    [3435] => text
    [3437] => data
    [3438] => mining
    [3439] => 37
    [3440] => software
    [3441] => edit
    [3444] => category
    [3445] => data
    [3446] => mining
    [3448] => machine
    [3449] => learning
    [3450] => software
    [3451] => free
    [3452] => open-source
    [3453] => data
    [3454] => mining
    [3455] => software
    [3457] => applications
    [3458] => edit
    [3461] => applications
    [3465] => free
    [3466] => open
    [3467] => source
    [3468] => licenses
    [3469] => public
    [3470] => access
    [3472] => application
    [3473] => source
    [3474] => code
    [3478] => carrot2
    [3479] => text
    [3481] => search
    [3482] => results
    [3483] => clustering
    [3484] => framework
    [3485] => chemicalize
    [3486] => org
    [3488] => chemical
    [3489] => structure
    [3490] => miner
    [3492] => web
    [3493] => search
    [3494] => engine
    [3495] => elki
    [3497] => university
    [3498] => research
    [3499] => project
    [3501] => advanced
    [3502] => cluster
    [3503] => analysis
    [3505] => outlier
    [3506] => detection
    [3507] => methods
    [3508] => written
    [3511] => java
    [3512] => language
    [3513] => gate
    [3515] => natural
    [3516] => language
    [3517] => processing
    [3519] => language
    [3520] => engineering
    [3521] => tool
    [3522] => knime
    [3524] => konstanz
    [3525] => information
    [3526] => miner
    [3528] => user
    [3529] => friendly
    [3531] => comprehensive
    [3532] => data
    [3533] => analytics
    [3534] => framework
    [3535] => massive
    [3536] => online
    [3537] => analysis
    [3538] => moa
    [3540] => real-time
    [3541] => big
    [3542] => data
    [3543] => stream
    [3544] => mining
    [3546] => concept
    [3547] => drift
    [3548] => tool
    [3551] => java
    [3552] => programming
    [3553] => language
    [3554] => ml-flex
    [3556] => software
    [3557] => package
    [3559] => enables
    [3560] => users
    [3562] => integrate
    [3564] => third-party
    [3565] => machine-learning
    [3566] => packages
    [3567] => written
    [3570] => programming
    [3571] => language
    [3572] => execute
    [3573] => classification
    [3574] => analyses
    [3576] => parallel
    [3578] => multiple
    [3579] => computing
    [3580] => nodes
    [3582] => produce
    [3583] => html
    [3584] => reports
    [3586] => classification
    [3587] => results
    [3588] => mlpack
    [3589] => library
    [3591] => collection
    [3593] => ready-to-use
    [3594] => machine
    [3595] => learning
    [3596] => algorithms
    [3597] => written
    [3600] => c
    [3601] => language
    [3602] => mepx
    [3604] => cross
    [3605] => platform
    [3606] => tool
    [3608] => regression
    [3610] => classification
    [3611] => problems
    [3612] => based
    [3615] => genetic
    [3616] => programming
    [3617] => variant
    [3618] => nltk
    [3619] => natural
    [3620] => language
    [3621] => toolkit
    [3623] => suite
    [3625] => libraries
    [3627] => programs
    [3629] => symbolic
    [3631] => statistical
    [3632] => natural
    [3633] => language
    [3634] => processing
    [3635] => nlp
    [3638] => python
    [3639] => language
    [3640] => opennn
    [3641] => open
    [3642] => neural
    [3643] => networks
    [3644] => library
    [3645] => orange
    [3647] => component-based
    [3648] => data
    [3649] => mining
    [3651] => machine
    [3652] => learning
    [3653] => software
    [3654] => suite
    [3655] => written
    [3658] => python
    [3659] => language
    [3660] => r
    [3662] => programming
    [3663] => language
    [3665] => software
    [3666] => environment
    [3668] => statistical
    [3669] => computing
    [3670] => data
    [3671] => mining
    [3673] => graphics
    [3676] => part
    [3679] => gnu
    [3680] => project
    [3681] => scikit-learn
    [3684] => open
    [3685] => source
    [3686] => machine
    [3687] => learning
    [3688] => library
    [3691] => python
    [3692] => programming
    [3693] => language
    [3694] => torch
    [3696] => open
    [3697] => source
    [3698] => deep
    [3699] => learning
    [3700] => library
    [3703] => lua
    [3704] => programming
    [3705] => language
    [3707] => scientific
    [3708] => computing
    [3709] => framework
    [3711] => wide
    [3712] => support
    [3714] => machine
    [3715] => learning
    [3716] => algorithms
    [3717] => uima
    [3719] => uima
    [3720] => unstructured
    [3721] => information
    [3722] => management
    [3723] => architecture
    [3726] => component
    [3727] => framework
    [3729] => analyzing
    [3730] => unstructured
    [3731] => content
    [3734] => text
    [3735] => audio
    [3737] => video
    [3738] => originally
    [3739] => developed
    [3741] => ibm
    [3742] => weka
    [3744] => suite
    [3746] => machine
    [3747] => learning
    [3748] => software
    [3749] => applications
    [3750] => written
    [3753] => java
    [3754] => programming
    [3755] => language
    [3756] => proprietary
    [3757] => data-mining
    [3758] => software
    [3760] => applications
    [3761] => edit
    [3764] => applications
    [3768] => proprietary
    [3769] => licenses
    [3770] => angoss
    [3771] => knowledgestudio
    [3772] => data
    [3773] => mining
    [3774] => tool
    [3775] => clarabridge
    [3776] => text
    [3777] => analytics
    [3778] => product
    [3779] => vertica
    [3780] => data
    [3781] => mining
    [3782] => software
    [3783] => provided
    [3785] => hewlett-packard
    [3786] => spss
    [3787] => modeler
    [3788] => data
    [3789] => mining
    [3790] => software
    [3791] => provided
    [3793] => ibm
    [3794] => kxen
    [3795] => modeler
    [3796] => data
    [3797] => mining
    [3798] => tool
    [3799] => provided
    [3801] => kxen
    [3803] => lionsolver
    [3805] => integrated
    [3806] => software
    [3807] => application
    [3809] => data
    [3810] => mining
    [3811] => business
    [3812] => intelligence
    [3814] => modeling
    [3816] => implements
    [3818] => learning
    [3820] => intelligent
    [3821] => optimization
    [3822] => lion
    [3823] => approach
    [3824] => megaputer
    [3825] => intelligence
    [3826] => data
    [3828] => text
    [3829] => mining
    [3830] => software
    [3832] => called
    [3833] => polyanalyst
    [3834] => microsoft
    [3835] => analysis
    [3836] => services
    [3837] => data
    [3838] => mining
    [3839] => software
    [3840] => provided
    [3842] => microsoft
    [3843] => netowl
    [3844] => suite
    [3846] => multilingual
    [3847] => text
    [3849] => entity
    [3850] => analytics
    [3851] => products
    [3853] => enable
    [3854] => data
    [3855] => mining
    [3856] => opentext
    [3857] => big
    [3858] => data
    [3859] => analytics
    [3860] => visual
    [3861] => data
    [3862] => mining
    [3863] => predictive
    [3864] => analysis
    [3866] => open
    [3867] => text
    [3868] => corporation
    [3869] => oracle
    [3870] => data
    [3871] => mining
    [3872] => data
    [3873] => mining
    [3874] => software
    [3876] => oracle
    [3877] => corporation
    [3878] => pseven
    [3879] => platform
    [3881] => automation
    [3883] => engineering
    [3884] => simulation
    [3886] => analysis
    [3887] => multidisciplinary
    [3888] => optimization
    [3890] => data
    [3891] => mining
    [3892] => provided
    [3894] => datadvance
    [3895] => qlucore
    [3896] => omics
    [3897] => explorer
    [3898] => data
    [3899] => mining
    [3900] => software
    [3901] => rapidminer
    [3903] => environment
    [3905] => machine
    [3906] => learning
    [3908] => data
    [3909] => mining
    [3910] => experiments
    [3911] => sas
    [3912] => enterprise
    [3913] => miner
    [3914] => data
    [3915] => mining
    [3916] => software
    [3917] => provided
    [3920] => sas
    [3921] => institute
    [3922] => statistica
    [3923] => data
    [3924] => miner
    [3925] => data
    [3926] => mining
    [3927] => software
    [3928] => provided
    [3930] => statsoft
    [3931] => tanagra
    [3932] => visualisation-oriented
    [3933] => data
    [3934] => mining
    [3935] => software
    [3938] => teaching
    [3939] => marketplace
    [3940] => surveys
    [3941] => edit
    [3943] => researchers
    [3945] => organizations
    [3947] => conducted
    [3948] => reviews
    [3950] => data
    [3951] => mining
    [3952] => tools
    [3954] => surveys
    [3956] => data
    [3957] => miners
    [3959] => identify
    [3963] => strengths
    [3965] => weaknesses
    [3968] => software
    [3969] => packages
    [3972] => provide
    [3974] => overview
    [3977] => behaviors
    [3978] => preferences
    [3980] => views
    [3982] => data
    [3983] => miners
    [3987] => reports
    [3988] => include
    [3989] => hurwitz
    [3990] => victory
    [3991] => index
    [3992] => report
    [3994] => advanced
    [3995] => analytics
    [3998] => market
    [3999] => research
    [4000] => assessment
    [4001] => tool
    [4003] => highlights
    [4006] => diverse
    [4009] => advanced
    [4010] => analytics
    [4011] => technology
    [4014] => vendors
    [4016] => make
    [4018] => applications
    [4020] => recent-research
    [4021] => 2011
    [4022] => wiley
    [4023] => interdisciplinary
    [4024] => reviews
    [4025] => data
    [4026] => mining
    [4028] => knowledge
    [4029] => discovery
    [4030] => 38
    [4031] => rexer
    [4032] => analytics
    [4033] => data
    [4034] => miner
    [4035] => surveys
    [4036] => 2007
    [4037] => 2015
    [4038] => 39
    [4039] => forrester
    [4040] => research
    [4041] => 2010
    [4042] => predictive
    [4043] => analytics
    [4045] => data
    [4046] => mining
    [4047] => solutions
    [4048] => report
    [4049] => 40
    [4050] => gartner
    [4051] => 2008
    [4052] => magic
    [4053] => quadrant
    [4054] => report
    [4055] => 41
    [4056] => robert
    [4058] => nisbet's
    [4059] => 2006
    [4061] => part
    [4062] => series
    [4064] => articles
    [4065] => data
    [4066] => mining
    [4067] => tools
    [4073] => crm
    [4074] => 42
    [4075] => haughton
    [4077] => al
    [4078] => 's
    [4079] => 2003
    [4080] => review
    [4082] => data
    [4083] => mining
    [4084] => software
    [4085] => packages
    [4088] => american
    [4089] => statistician
    [4090] => 43
    [4091] => goebel
    [4092] => gruenwald
    [4093] => 1999
    [4095] => survey
    [4097] => data
    [4098] => mining
    [4100] => knowledge
    [4101] => discovery
    [4102] => software
    [4103] => tools
    [4105] => sigkdd
    [4106] => explorations
    [4107] => 44
    [4110] => edit
    [4111] => methods
    [4112] => agent
    [4113] => mining
    [4114] => anomaly
    [4115] => outlier
    [4116] => change
    [4117] => detection
    [4118] => association
    [4119] => rule
    [4120] => learning
    [4121] => bayesian
    [4122] => networks
    [4123] => classification
    [4124] => cluster
    [4125] => analysis
    [4126] => decision
    [4127] => trees
    [4128] => ensemble
    [4129] => learning
    [4130] => factor
    [4131] => analysis
    [4132] => genetic
    [4133] => algorithms
    [4134] => intention
    [4135] => mining
    [4136] => learning
    [4137] => classifier
    [4138] => system
    [4139] => multilinear
    [4140] => subspace
    [4141] => learning
    [4142] => neural
    [4143] => networks
    [4144] => regression
    [4145] => analysis
    [4146] => sequence
    [4147] => mining
    [4148] => structured
    [4149] => data
    [4150] => analysis
    [4151] => support
    [4152] => vector
    [4153] => machines
    [4154] => text
    [4155] => mining
    [4156] => time
    [4157] => series
    [4158] => analysis
    [4159] => application
    [4160] => domains
    [4161] => analytics
    [4162] => behavior
    [4163] => informatics
    [4164] => big
    [4165] => data
    [4166] => bioinformatics
    [4167] => business
    [4168] => intelligence
    [4169] => data
    [4170] => analysis
    [4171] => data
    [4172] => warehouse
    [4173] => decision
    [4174] => support
    [4175] => system
    [4176] => domain
    [4177] => driven
    [4178] => data
    [4179] => mining
    [4180] => drug
    [4181] => discovery
    [4182] => exploratory
    [4183] => data
    [4184] => analysis
    [4185] => predictive
    [4186] => analytics
    [4187] => web
    [4188] => mining
    [4189] => application
    [4190] => examples
    [4191] => main
    [4192] => article
    [4193] => examples
    [4195] => data
    [4196] => mining
    [4199] => category
    [4200] => applied
    [4201] => data
    [4202] => mining
    [4203] => customer
    [4204] => analytics
    [4205] => educational
    [4206] => data
    [4207] => mining
    [4208] => national
    [4209] => security
    [4210] => agency
    [4211] => automatic
    [4212] => number
    [4213] => plate
    [4214] => recognition
    [4217] => united
    [4218] => kingdom
    [4219] => quantitative
    [4220] => structure
    [4221] => activity
    [4222] => relationship
    [4223] => surveillance
    [4224] => mass
    [4225] => surveillance
    [4226] => e
    [4227] => g
    [4228] => stellar
    [4229] => wind
    [4230] => related
    [4231] => topics
    [4232] => data
    [4233] => mining
    [4236] => analyzing
    [4237] => data
    [4239] => information
    [4241] => extracting
    [4242] => information
    [4245] => data
    [4247] => data
    [4248] => integration
    [4249] => data
    [4250] => transformation
    [4251] => electronic
    [4252] => discovery
    [4253] => information
    [4254] => extraction
    [4255] => information
    [4256] => integration
    [4257] => named-entity
    [4258] => recognition
    [4259] => profiling
    [4260] => information
    [4261] => science
    [4262] => psychometrics
    [4263] => social
    [4264] => media
    [4265] => mining
    [4266] => surveillance
    [4267] => capitalism
    [4268] => web
    [4269] => scraping
    [4271] => resources
    [4272] => international
    [4273] => journal
    [4275] => data
    [4276] => warehousing
    [4278] => mining
    [4279] => references
    [4280] => edit
    [4282] => b
    [4283] => c
    [4284] => d
    [4285] => data
    [4286] => mining
    [4287] => curriculum
    [4288] => acm
    [4289] => sigkdd
    [4290] => 2006-04-30
    [4291] => retrieved
    [4292] => 2014-01-27
    [4293] => clifton
    [4294] => christopher
    [4295] => 2010
    [4296] => encyclop
    [4297] => dia
    [4298] => britannica
    [4299] => definition
    [4301] => data
    [4302] => mining
    [4303] => retrieved
    [4304] => 2010-12-09
    [4305] => hastie
    [4306] => trevor
    [4307] => tibshirani
    [4308] => robert
    [4309] => friedman
    [4310] => jerome
    [4311] => 2009
    [4313] => elements
    [4315] => statistical
    [4316] => learning
    [4317] => data
    [4318] => mining
    [4319] => inference
    [4321] => prediction
    [4322] => retrieved
    [4323] => 2012-08-07
    [4325] => b
    [4326] => c
    [4327] => fayyad
    [4328] => usama
    [4329] => piatetsky-shapiro
    [4330] => gregory
    [4331] => smyth
    [4332] => padhraic
    [4333] => 1996
    [4335] => data
    [4336] => mining
    [4338] => knowledge
    [4339] => discovery
    [4341] => databases
    [4342] => pdf
    [4343] => retrieved
    [4344] => 17
    [4345] => december
    [4346] => 2008
    [4347] => han
    [4348] => jiawei
    [4349] => kamber
    [4350] => micheline
    [4351] => 2001
    [4352] => data
    [4353] => mining
    [4354] => concepts
    [4356] => techniques
    [4357] => morgan
    [4358] => kaufmann
    [4359] => p
    [4360] => 5
    [4361] => isbn
    [4362] => 978-1-55860-489-6
    [4364] => data
    [4365] => mining
    [4370] => appropriately
    [4371] => named
    [4372] => knowledge
    [4373] => mining
    [4375] => data
    [4380] => long
    [4382] => e
    [4383] => g
    [4384] => okairp
    [4385] => 2005
    [4386] => fall
    [4387] => conference
    [4388] => arizona
    [4389] => state
    [4390] => university
    [4393] => datamining
    [4394] => witten
    [4395] => ian
    [4396] => h
    [4397] => frank
    [4398] => eibe
    [4399] => hall
    [4400] => mark
    [4402] => 30
    [4403] => january
    [4404] => 2011
    [4405] => data
    [4406] => mining
    [4407] => practical
    [4408] => machine
    [4409] => learning
    [4410] => tools
    [4412] => techniques
    [4413] => 3
    [4414] => ed
    [4415] => elsevier
    [4416] => isbn
    [4417] => 978-0-12-374856-0
    [4418] => bouckaert
    [4419] => remco
    [4420] => r
    [4421] => frank
    [4422] => eibe
    [4423] => hall
    [4424] => mark
    [4426] => holmes
    [4427] => geoffrey
    [4428] => pfahringer
    [4429] => bernhard
    [4430] => reutemann
    [4431] => peter
    [4432] => witten
    [4433] => ian
    [4434] => h
    [4435] => 2010
    [4436] => weka
    [4437] => experiences
    [4440] => java
    [4441] => open-source
    [4442] => project
    [4443] => journal
    [4445] => machine
    [4446] => learning
    [4447] => research
    [4448] => 11
    [4449] => 2533
    [4450] => 2541
    [4452] => original
    [4453] => title
    [4454] => practical
    [4455] => machine
    [4456] => learning
    [4458] => changed
    [4460] => term
    [4461] => data
    [4462] => mining
    [4464] => added
    [4465] => primarily
    [4467] => marketing
    [4468] => reasons
    [4469] => mena
    [4470] => jes
    [4471] => s
    [4472] => 2011
    [4473] => machine
    [4474] => learning
    [4475] => forensics
    [4477] => law
    [4478] => enforcement
    [4479] => security
    [4481] => intelligence
    [4482] => boca
    [4483] => raton
    [4484] => fl
    [4485] => crc
    [4486] => press
    [4487] => taylor
    [4488] => francis
    [4489] => group
    [4490] => isbn
    [4491] => 978-1-4398-6069-4
    [4492] => piatetsky-shapiro
    [4493] => gregory
    [4494] => parker
    [4495] => gary
    [4496] => 2011
    [4497] => lesson
    [4498] => data
    [4499] => mining
    [4501] => knowledge
    [4502] => discovery
    [4504] => introduction
    [4505] => introduction
    [4507] => data
    [4508] => mining
    [4509] => kd
    [4510] => nuggets
    [4511] => retrieved
    [4512] => 30
    [4513] => august
    [4514] => 2012
    [4515] => fayyad
    [4516] => usama
    [4517] => 15
    [4518] => june
    [4519] => 1999
    [4521] => editorial
    [4523] => editor-in-chief
    [4524] => sigkdd
    [4525] => explorations
    [4526] => 13
    [4527] => 1
    [4528] => 102
    [4529] => doi
    [4530] => 10
    [4531] => 1145
    [4532] => 2207243
    [4533] => 2207269
    [4534] => retrieved
    [4535] => 27
    [4536] => december
    [4537] => 2010
    [4538] => kantardzic
    [4539] => mehmed
    [4540] => 2003
    [4541] => data
    [4542] => mining
    [4543] => concepts
    [4544] => models
    [4545] => methods
    [4547] => algorithms
    [4548] => john
    [4549] => wiley
    [4550] => sons
    [4551] => isbn
    [4552] => 0-471-22852-4
    [4553] => oclc
    [4554] => 50055336
    [4555] => gregory
    [4556] => piatetsky-shapiro
    [4557] => 2002
    [4558] => kdnuggets
    [4559] => methodology
    [4560] => poll
    [4561] => gregory
    [4562] => piatetsky-shapiro
    [4563] => 2004
    [4564] => kdnuggets
    [4565] => methodology
    [4566] => poll
    [4567] => gregory
    [4568] => piatetsky-shapiro
    [4569] => 2007
    [4570] => kdnuggets
    [4571] => methodology
    [4572] => poll
    [4573] => gregory
    [4574] => piatetsky-shapiro
    [4575] => 2014
    [4576] => kdnuggets
    [4577] => methodology
    [4578] => poll
    [4579] => scar
    [4580] => marb
    [4581] => n
    [4582] => gonzalo
    [4583] => mariscal
    [4585] => javier
    [4586] => segovia
    [4587] => 2009
    [4589] => data
    [4590] => mining
    [4591] => knowledge
    [4592] => discovery
    [4593] => process
    [4594] => model
    [4596] => data
    [4597] => mining
    [4599] => knowledge
    [4600] => discovery
    [4602] => real
    [4603] => life
    [4604] => applications
    [4605] => book
    [4606] => edited
    [4608] => julio
    [4609] => ponce
    [4611] => adem
    [4612] => karahoca
    [4613] => isbn
    [4614] => 978-3-902613-53-0
    [4615] => pp
    [4616] => 438
    [4617] => 453
    [4618] => february
    [4619] => 2009
    [4620] => i-tech
    [4621] => vienna
    [4622] => austria
    [4623] => lukasz
    [4624] => kurgan
    [4626] => petr
    [4627] => musilek
    [4628] => 2006
    [4630] => survey
    [4632] => knowledge
    [4633] => discovery
    [4635] => data
    [4636] => mining
    [4637] => process
    [4638] => models
    [4640] => knowledge
    [4641] => engineering
    [4642] => review
    [4643] => volume
    [4644] => 21
    [4645] => issue
    [4646] => 1
    [4647] => march
    [4648] => 2006
    [4649] => pp
    [4650] => 1
    [4651] => 24
    [4652] => cambridge
    [4653] => university
    [4654] => press
    [4656] => york
    [4657] => ny
    [4658] => usa
    [4659] => doi
    [4660] => 10
    [4661] => 1017
    [4662] => s0269888906000737
    [4663] => azevedo
    [4666] => santos
    [4667] => m
    [4668] => f
    [4669] => kdd
    [4670] => semma
    [4672] => crisp-dm
    [4674] => parallel
    [4675] => overview
    [4677] => proceedings
    [4680] => iadis
    [4681] => european
    [4682] => conference
    [4684] => data
    [4685] => mining
    [4686] => 2008
    [4687] => pp
    [4688] => 182
    [4689] => 185
    [4690] => hawkins
    [4691] => douglas
    [4692] => m
    [4693] => 2004
    [4695] => problem
    [4697] => overfitting
    [4698] => journal
    [4700] => chemical
    [4701] => information
    [4703] => computer
    [4704] => sciences
    [4705] => 44
    [4706] => 1
    [4707] => 1
    [4708] => 12
    [4709] => doi
    [4710] => 10
    [4711] => 1021
    [4712] => ci0342472
    [4713] => microsoft
    [4714] => academic
    [4715] => search
    [4716] => top
    [4717] => conferences
    [4719] => data
    [4720] => mining
    [4721] => microsoft
    [4722] => academic
    [4723] => search
    [4724] => google
    [4725] => scholar
    [4726] => top
    [4727] => publications
    [4729] => data
    [4730] => mining
    [4731] => analysis
    [4732] => google
    [4733] => scholar
    [4734] => proceedings
    [4735] => international
    [4736] => conferences
    [4738] => knowledge
    [4739] => discovery
    [4741] => data
    [4742] => mining
    [4743] => acm
    [4745] => york
    [4746] => sigkdd
    [4747] => explorations
    [4748] => acm
    [4750] => york
    [4751] => g
    [4752] => nnemann
    [4753] => stephan
    [4754] => kremer
    [4755] => hardy
    [4756] => seidl
    [4757] => thomas
    [4758] => 2011
    [4760] => extension
    [4763] => pmml
    [4764] => standard
    [4766] => subspace
    [4767] => clustering
    [4768] => models
    [4769] => proceedings
    [4772] => 2011
    [4773] => workshop
    [4775] => predictive
    [4776] => markup
    [4777] => language
    [4778] => modeling
    [4780] => pmml
    [4781] => '11
    [4782] => p
    [4783] => 48
    [4784] => isbn
    [4785] => 978-1-4503-0837-3
    [4786] => doi
    [4787] => 10
    [4788] => 1145
    [4789] => 2023598
    [4790] => 2023605
    [4791] => seltzer
    [4792] => william
    [4794] => promise
    [4796] => pitfalls
    [4798] => data
    [4799] => mining
    [4800] => ethical
    [4801] => issues
    [4802] => pdf
    [4803] => pitts
    [4804] => chip
    [4805] => 15
    [4806] => march
    [4807] => 2007
    [4809] => end
    [4811] => illegal
    [4812] => domestic
    [4813] => spying
    [4815] => count
    [4818] => washington
    [4819] => spectator
    [4820] => archived
    [4823] => original
    [4825] => 2007-10-29
    [4826] => taipale
    [4827] => kim
    [4829] => 15
    [4830] => december
    [4831] => 2003
    [4832] => data
    [4833] => mining
    [4835] => domestic
    [4836] => security
    [4837] => connecting
    [4839] => dots
    [4841] => make
    [4842] => sense
    [4844] => data
    [4845] => columbia
    [4846] => science
    [4848] => technology
    [4849] => law
    [4850] => review
    [4851] => 5
    [4852] => 2
    [4853] => oclc
    [4854] => 45263753
    [4855] => ssrn
    [4856] => 546782
    [4857] => resig
    [4858] => john
    [4859] => teredesai
    [4860] => ankur
    [4861] => 2004
    [4863] => framework
    [4865] => mining
    [4866] => instant
    [4867] => messaging
    [4868] => services
    [4869] => proceedings
    [4872] => 2004
    [4873] => siam
    [4874] => dm
    [4875] => conference
    [4877] => b
    [4878] => c
    [4882] => dig
    [4883] => privacy
    [4884] => implications
    [4886] => data
    [4887] => mining
    [4888] => aggregation
    [4889] => nascio
    [4890] => research
    [4892] => september
    [4893] => 2004
    [4894] => ohm
    [4895] => paul
    [4897] => build
    [4899] => database
    [4901] => ruin
    [4902] => harvard
    [4903] => business
    [4904] => review
    [4905] => darwin
    [4906] => bond-graham
    [4907] => iron
    [4908] => cagebook
    [4911] => logical
    [4912] => end
    [4914] => facebook's
    [4915] => patents
    [4916] => counterpunch
    [4917] => org
    [4918] => 2013
    [4919] => 12
    [4920] => 03
    [4921] => darwin
    [4922] => bond-graham
    [4923] => inside
    [4925] => tech
    [4926] => industry's
    [4927] => startup
    [4928] => conference
    [4929] => counterpunch
    [4930] => org
    [4931] => 2013
    [4932] => 09
    [4933] => 11
    [4934] => aol
    [4935] => search
    [4936] => data
    [4937] => identified
    [4938] => individuals
    [4939] => securityfocus
    [4940] => august
    [4941] => 2006
    [4942] => kshetri
    [4943] => nir
    [4944] => 2014
    [4945] => big
    [4946] => data
    [4947] => s
    [4948] => impact
    [4950] => privacy
    [4951] => security
    [4953] => consumer
    [4954] => welfare
    [4955] => telecommunications
    [4956] => policy
    [4957] => 38
    [4958] => 11
    [4959] => 1134
    [4960] => 1145
    [4961] => doi
    [4962] => 10
    [4963] => 1016
    [4964] => j
    [4965] => telpol
    [4966] => 2014
    [4967] => 10
    [4968] => 002
    [4969] => biotech
    [4970] => business
    [4971] => week
    [4972] => editors
    [4973] => june
    [4974] => 30
    [4975] => 2008
    [4976] => biomedicine
    [4977] => hipaa
    [4978] => privacy
    [4979] => rule
    [4980] => impedes
    [4981] => biomedical
    [4982] => research
    [4983] => biotech
    [4984] => business
    [4985] => week
    [4986] => retrieved
    [4987] => 17
    [4988] => november
    [4989] => 2009
    [4991] => lexisnexis
    [4992] => academic
    [4993] => uk
    [4994] => researchers
    [4996] => data
    [4997] => mining
    [5001] => uk
    [5002] => copyright
    [5003] => laws
    [5004] => archived
    [5005] => june
    [5006] => 9
    [5007] => 2014
    [5010] => wayback
    [5011] => machine
    [5012] => out-law
    [5014] => retrieved
    [5015] => 14
    [5016] => november
    [5017] => 2014
    [5018] => licences
    [5020] => europe
    [5022] => structured
    [5023] => stakeholder
    [5024] => dialogue
    [5025] => 2013
    [5026] => european
    [5027] => commission
    [5028] => retrieved
    [5029] => 14
    [5030] => november
    [5031] => 2014
    [5032] => text
    [5034] => data
    [5035] => mining
    [5037] => importance
    [5042] => change
    [5044] => europe
    [5045] => association
    [5047] => european
    [5048] => research
    [5049] => libraries
    [5050] => retrieved
    [5051] => 14
    [5052] => november
    [5053] => 2014
    [5054] => judge
    [5055] => grants
    [5056] => summary
    [5057] => judgment
    [5059] => favor
    [5061] => google
    [5062] => books
    [5064] => fair
    [5066] => victory
    [5067] => lexology
    [5069] => antonelli
    [5070] => law
    [5072] => retrieved
    [5073] => 14
    [5074] => november
    [5075] => 2014
    [5076] => mikut
    [5077] => ralf
    [5078] => reischl
    [5079] => markus
    [5080] => september
    [5081] => october
    [5082] => 2011
    [5083] => data
    [5084] => mining
    [5085] => tools
    [5086] => wiley
    [5087] => interdisciplinary
    [5088] => reviews
    [5089] => data
    [5090] => mining
    [5092] => knowledge
    [5093] => discovery
    [5094] => 1
    [5095] => 5
    [5096] => 431
    [5097] => 445
    [5098] => doi
    [5099] => 10
    [5100] => 1002
    [5101] => widm
    [5102] => 24
    [5103] => retrieved
    [5104] => october
    [5105] => 21
    [5106] => 2011
    [5107] => karl
    [5108] => rexer
    [5109] => heather
    [5110] => allen
    [5111] => paul
    [5112] => gearan
    [5113] => 2011
    [5114] => understanding
    [5115] => data
    [5116] => miners
    [5117] => analytics
    [5118] => magazine
    [5120] => june
    [5121] => 2011
    [5122] => informs
    [5123] => institute
    [5125] => operations
    [5126] => research
    [5129] => management
    [5130] => sciences
    [5131] => kobielus
    [5132] => james
    [5134] => forrester
    [5135] => wave
    [5136] => predictive
    [5137] => analytics
    [5139] => data
    [5140] => mining
    [5141] => solutions
    [5142] => q1
    [5143] => 2010
    [5144] => forrester
    [5145] => research
    [5146] => 1
    [5147] => july
    [5148] => 2008
    [5149] => herschel
    [5150] => gareth
    [5151] => magic
    [5152] => quadrant
    [5154] => customer
    [5155] => data-mining
    [5156] => applications
    [5157] => gartner
    [5159] => 1
    [5160] => july
    [5161] => 2008
    [5162] => nisbet
    [5163] => robert
    [5165] => 2006
    [5166] => data
    [5167] => mining
    [5168] => tools
    [5174] => crm
    [5175] => part
    [5176] => 1
    [5177] => information
    [5178] => management
    [5179] => special
    [5180] => reports
    [5181] => january
    [5182] => 2006
    [5183] => haughton
    [5184] => dominique
    [5185] => deichmann
    [5186] => joel
    [5187] => eshghi
    [5188] => abdolreza
    [5189] => sayek
    [5190] => selin
    [5191] => teebagy
    [5192] => nicholas
    [5194] => topi
    [5195] => heikki
    [5196] => 2003
    [5198] => review
    [5200] => software
    [5201] => packages
    [5203] => data
    [5204] => mining
    [5206] => american
    [5207] => statistician
    [5208] => vol
    [5209] => 57
    [5211] => 4
    [5212] => pp
    [5213] => 290
    [5214] => 309
    [5215] => goebel
    [5216] => michael
    [5217] => gruenwald
    [5218] => le
    [5219] => 1999
    [5221] => survey
    [5223] => data
    [5224] => mining
    [5226] => knowledge
    [5227] => discovery
    [5228] => software
    [5229] => tools
    [5230] => sigkdd
    [5231] => explorations
    [5232] => vol
    [5233] => 1
    [5234] => issue
    [5235] => 1
    [5236] => pp
    [5237] => 20
    [5238] => 33
    [5240] => reading
    [5241] => edit
    [5242] => cabena
    [5243] => peter
    [5244] => hadjnian
    [5245] => pablo
    [5246] => stadler
    [5247] => rolf
    [5248] => verhees
    [5249] => jaap
    [5250] => zanasi
    [5251] => alessandro
    [5252] => 1997
    [5253] => discovering
    [5254] => data
    [5255] => mining
    [5257] => concept
    [5259] => implementation
    [5260] => prentice
    [5261] => hall
    [5262] => isbn
    [5263] => 0-13-743980-6
    [5264] => m
    [5265] => s
    [5266] => chen
    [5267] => j
    [5268] => han
    [5269] => p
    [5270] => s
    [5271] => yu
    [5272] => 1996
    [5273] => data
    [5274] => mining
    [5276] => overview
    [5279] => database
    [5280] => perspective
    [5281] => knowledge
    [5283] => data
    [5284] => engineering
    [5285] => ieee
    [5286] => transactions
    [5288] => 8
    [5289] => 6
    [5290] => 866
    [5291] => 883
    [5292] => feldman
    [5293] => ronen
    [5294] => sanger
    [5295] => james
    [5296] => 2007
    [5298] => text
    [5299] => mining
    [5300] => handbook
    [5301] => cambridge
    [5302] => university
    [5303] => press
    [5304] => isbn
    [5305] => 978-0-521-83657-9
    [5306] => guo
    [5307] => yike
    [5309] => grossman
    [5310] => robert
    [5311] => editors
    [5312] => 1999
    [5313] => high
    [5314] => performance
    [5315] => data
    [5316] => mining
    [5317] => scaling
    [5318] => algorithms
    [5319] => applications
    [5321] => systems
    [5322] => kluwer
    [5323] => academic
    [5324] => publishers
    [5325] => han
    [5326] => jiawei
    [5327] => micheline
    [5328] => kamber
    [5330] => jian
    [5331] => pei
    [5332] => data
    [5333] => mining
    [5334] => concepts
    [5336] => techniques
    [5337] => morgan
    [5338] => kaufmann
    [5339] => 2006
    [5340] => hastie
    [5341] => trevor
    [5342] => tibshirani
    [5343] => robert
    [5345] => friedman
    [5346] => jerome
    [5347] => 2001
    [5349] => elements
    [5351] => statistical
    [5352] => learning
    [5353] => data
    [5354] => mining
    [5355] => inference
    [5357] => prediction
    [5358] => springer
    [5359] => isbn
    [5360] => 0-387-95284-5
    [5361] => liu
    [5362] => bing
    [5363] => 2007
    [5364] => web
    [5365] => data
    [5366] => mining
    [5367] => exploring
    [5368] => hyperlinks
    [5369] => contents
    [5371] => usage
    [5372] => data
    [5373] => springer
    [5374] => isbn
    [5375] => 3-540-37881-2
    [5376] => murphy
    [5377] => chris
    [5378] => 16
    [5380] => 2011
    [5382] => data
    [5383] => mining
    [5384] => free
    [5385] => speech
    [5386] => informationweek
    [5387] => umb
    [5388] => 12
    [5389] => nisbet
    [5390] => robert
    [5391] => elder
    [5392] => john
    [5393] => miner
    [5394] => gary
    [5395] => 2009
    [5396] => handbook
    [5398] => statistical
    [5399] => analysis
    [5400] => data
    [5401] => mining
    [5402] => applications
    [5403] => academic
    [5404] => press
    [5405] => elsevier
    [5406] => isbn
    [5407] => 978-0-12-374765-5
    [5408] => poncelet
    [5409] => pascal
    [5410] => masseglia
    [5411] => florent
    [5413] => teisseire
    [5414] => maguelonne
    [5415] => editors
    [5416] => october
    [5417] => 2007
    [5418] => data
    [5419] => mining
    [5420] => patterns
    [5422] => methods
    [5424] => applications
    [5425] => information
    [5426] => science
    [5427] => reference
    [5428] => isbn
    [5429] => 978-1-59904-162-9
    [5430] => tan
    [5431] => pang-ning
    [5432] => steinbach
    [5433] => michael
    [5435] => kumar
    [5436] => vipin
    [5437] => 2005
    [5438] => introduction
    [5440] => data
    [5441] => mining
    [5442] => isbn
    [5443] => 0-321-32136-7
    [5444] => theodoridis
    [5445] => sergios
    [5447] => koutroumbas
    [5448] => konstantinos
    [5449] => 2009
    [5450] => pattern
    [5451] => recognition
    [5452] => 4th
    [5453] => edition
    [5454] => academic
    [5455] => press
    [5456] => isbn
    [5457] => 978-1-59749-272-0
    [5458] => weiss
    [5459] => sholom
    [5460] => m
    [5462] => indurkhya
    [5463] => nitin
    [5464] => 1998
    [5465] => predictive
    [5466] => data
    [5467] => mining
    [5468] => morgan
    [5469] => kaufmann
    [5470] => witten
    [5471] => ian
    [5472] => h
    [5473] => frank
    [5474] => eibe
    [5475] => hall
    [5476] => mark
    [5478] => 30
    [5479] => january
    [5480] => 2011
    [5481] => data
    [5482] => mining
    [5483] => practical
    [5484] => machine
    [5485] => learning
    [5486] => tools
    [5488] => techniques
    [5489] => 3
    [5490] => ed
    [5491] => elsevier
    [5492] => isbn
    [5493] => 978-0-12-374856-0
    [5496] => free
    [5497] => weka
    [5498] => software
    [5499] => ye
    [5500] => nong
    [5501] => 2003
    [5503] => handbook
    [5505] => data
    [5506] => mining
    [5507] => mahwah
    [5508] => nj
    [5509] => lawrence
    [5510] => erlbaum
    [5511] => external
    [5512] => links
    [5513] => edit
    [5514] => wikimedia
    [5515] => commons
    [5517] => media
    [5518] => related
    [5520] => data
    [5521] => mining
    [5522] => knowledge
    [5523] => discovery
    [5524] => software
    [5526] => dmoz
    [5527] => data
    [5528] => mining
    [5529] => tool
    [5530] => vendors
    [5532] => dmoz
    [5533] => v
    [5534] => t
    [5535] => e
    [5536] => data
    [5537] => storage
    [5538] => analysis
    [5539] => cleansing
    [5540] => compression
    [5541] => corruption
    [5542] => curation
    [5543] => editing
    [5544] => farming
    [5545] => fusion
    [5546] => integration
    [5547] => integrity
    [5548] => loss
    [5549] => mining
    [5550] => pre-processing
    [5551] => quality
    [5552] => reduction
    [5553] => scraping
    [5554] => scrubbing
    [5555] => security
    [5556] => validation
    [5557] => warehouse
    [5558] => wrangling
    [5559] => munging
    [5560] => protection
    [5561] => privacy
    [5562] => v
    [5563] => t
    [5564] => e
    [5565] => data
    [5566] => warehouse
    [5567] => creating
    [5569] => data
    [5570] => warehouse
    [5571] => concepts
    [5572] => database
    [5573] => dimension
    [5574] => dimensional
    [5575] => modeling
    [5576] => fact
    [5577] => olap
    [5578] => star
    [5579] => schema
    [5580] => aggregate
    [5581] => variants
    [5582] => anchor
    [5583] => modeling
    [5584] => column-oriented
    [5585] => dbms
    [5586] => data
    [5587] => vault
    [5588] => modeling
    [5589] => holap
    [5590] => molap
    [5591] => rolap
    [5592] => operational
    [5593] => data
    [5594] => store
    [5595] => elements
    [5596] => data
    [5597] => dictionary
    [5598] => metadata
    [5599] => data
    [5600] => mart
    [5601] => sixth
    [5602] => normal
    [5603] => form
    [5604] => surrogate
    [5605] => key
    [5606] => fact
    [5607] => fact
    [5608] => table
    [5609] => early-arriving
    [5610] => fact
    [5611] => measure
    [5612] => dimension
    [5613] => dimension
    [5614] => table
    [5615] => degenerate
    [5616] => slowly
    [5617] => changing
    [5618] => filling
    [5619] => extract-transform-load
    [5620] => etl
    [5621] => extract
    [5622] => transform
    [5623] => load
    [5626] => data
    [5627] => warehouse
    [5628] => concepts
    [5629] => business
    [5630] => intelligence
    [5631] => dashboard
    [5632] => data
    [5633] => mining
    [5634] => decision
    [5635] => support
    [5636] => system
    [5637] => dss
    [5638] => olap
    [5639] => cube
    [5640] => data
    [5641] => warehouse
    [5642] => automation
    [5643] => languages
    [5644] => data
    [5645] => mining
    [5646] => extensions
    [5647] => dmx
    [5648] => multidimensional
    [5649] => expressions
    [5650] => mdx
    [5651] => xml
    [5653] => analysis
    [5654] => xmla
    [5655] => tools
    [5656] => business
    [5657] => intelligence
    [5658] => software
    [5659] => reporting
    [5660] => software
    [5661] => spreadsheet
    [5662] => related
    [5663] => people
    [5664] => bill
    [5665] => inmon
    [5666] => ralph
    [5667] => kimball
    [5668] => products
    [5669] => comparison
    [5671] => olap
    [5672] => servers
    [5673] => data
    [5674] => warehousing
    [5675] => products
    [5678] => producers
    [5679] => v
    [5680] => t
    [5681] => e
    [5682] => major
    [5683] => fields
    [5685] => computer
    [5686] => science
    [5687] => note
    [5689] => template
    [5690] => roughly
    [5693] => 2012
    [5694] => acm
    [5695] => computing
    [5696] => classification
    [5697] => system
    [5698] => hardware
    [5699] => printed
    [5700] => circuit
    [5701] => board
    [5702] => peripheral
    [5703] => integrated
    [5704] => circuit
    [5705] => very-large-scale
    [5706] => integration
    [5707] => energy
    [5708] => consumption
    [5709] => electronic
    [5710] => design
    [5711] => automation
    [5712] => computer
    [5713] => systems
    [5714] => organization
    [5715] => computer
    [5716] => architecture
    [5717] => embedded
    [5718] => system
    [5719] => real-time
    [5720] => computing
    [5721] => dependability
    [5722] => networks
    [5723] => network
    [5724] => architecture
    [5725] => network
    [5726] => protocol
    [5727] => network
    [5728] => components
    [5729] => network
    [5730] => scheduler
    [5731] => network
    [5732] => performance
    [5733] => evaluation
    [5734] => network
    [5735] => service
    [5736] => software
    [5737] => organization
    [5738] => interpreter
    [5739] => middleware
    [5740] => virtual
    [5741] => machine
    [5742] => operating
    [5743] => system
    [5744] => software
    [5745] => quality
    [5746] => software
    [5747] => notations
    [5749] => tools
    [5750] => programming
    [5751] => paradigm
    [5752] => programming
    [5753] => language
    [5754] => compiler
    [5755] => domain-specific
    [5756] => language
    [5757] => modeling
    [5758] => language
    [5759] => software
    [5760] => framework
    [5761] => integrated
    [5762] => development
    [5763] => environment
    [5764] => software
    [5765] => configuration
    [5766] => management
    [5767] => software
    [5768] => library
    [5769] => software
    [5770] => repository
    [5771] => software
    [5772] => development
    [5773] => software
    [5774] => development
    [5775] => process
    [5776] => requirements
    [5777] => analysis
    [5778] => software
    [5779] => design
    [5780] => software
    [5781] => construction
    [5782] => software
    [5783] => deployment
    [5784] => software
    [5785] => maintenance
    [5786] => programming
    [5787] => team
    [5788] => open-source
    [5789] => model
    [5790] => theory
    [5792] => computation
    [5793] => model
    [5795] => computation
    [5796] => formal
    [5797] => language
    [5798] => automata
    [5799] => theory
    [5800] => computational
    [5801] => complexity
    [5802] => theory
    [5803] => logic
    [5804] => semantics
    [5805] => algorithms
    [5806] => algorithm
    [5807] => design
    [5808] => analysis
    [5810] => algorithms
    [5811] => randomized
    [5812] => algorithm
    [5813] => computational
    [5814] => geometry
    [5815] => mathematics
    [5817] => computing
    [5818] => discrete
    [5819] => mathematics
    [5820] => probability
    [5821] => statistics
    [5822] => mathematical
    [5823] => software
    [5824] => information
    [5825] => theory
    [5826] => mathematical
    [5827] => analysis
    [5828] => numerical
    [5829] => analysis
    [5830] => information
    [5831] => systems
    [5832] => database
    [5833] => management
    [5834] => system
    [5835] => information
    [5836] => storage
    [5837] => systems
    [5838] => enterprise
    [5839] => information
    [5840] => system
    [5841] => social
    [5842] => information
    [5843] => systems
    [5844] => geographic
    [5845] => information
    [5846] => system
    [5847] => decision
    [5848] => support
    [5849] => system
    [5850] => process
    [5851] => control
    [5852] => system
    [5853] => multimedia
    [5854] => information
    [5855] => system
    [5856] => data
    [5857] => mining
    [5858] => digital
    [5859] => library
    [5860] => computing
    [5861] => platform
    [5862] => digital
    [5863] => marketing
    [5864] => world
    [5865] => wide
    [5866] => web
    [5867] => information
    [5868] => retrieval
    [5869] => security
    [5870] => cryptography
    [5871] => formal
    [5872] => methods
    [5873] => security
    [5874] => services
    [5875] => intrusion
    [5876] => detection
    [5877] => system
    [5878] => hardware
    [5879] => security
    [5880] => network
    [5881] => security
    [5882] => information
    [5883] => security
    [5884] => application
    [5885] => security
    [5886] => human
    [5887] => computer
    [5888] => interaction
    [5889] => interaction
    [5890] => design
    [5891] => social
    [5892] => computing
    [5893] => ubiquitous
    [5894] => computing
    [5895] => visualization
    [5896] => accessibility
    [5897] => concurrency
    [5898] => concurrent
    [5899] => computing
    [5900] => parallel
    [5901] => computing
    [5902] => distributed
    [5903] => computing
    [5904] => multithreading
    [5905] => multiprocessing
    [5906] => artificial
    [5907] => intelligence
    [5908] => natural
    [5909] => language
    [5910] => processing
    [5911] => knowledge
    [5912] => representation
    [5914] => reasoning
    [5915] => computer
    [5916] => vision
    [5917] => automated
    [5918] => planning
    [5920] => scheduling
    [5921] => search
    [5922] => methodology
    [5923] => control
    [5924] => method
    [5925] => philosophy
    [5927] => artificial
    [5928] => intelligence
    [5929] => distributed
    [5930] => artificial
    [5931] => intelligence
    [5932] => machine
    [5933] => learning
    [5934] => supervised
    [5935] => learning
    [5936] => unsupervised
    [5937] => learning
    [5938] => reinforcement
    [5939] => learning
    [5940] => multi-task
    [5941] => learning
    [5942] => cross-validation
    [5943] => graphics
    [5944] => animation
    [5945] => rendering
    [5946] => image
    [5947] => manipulation
    [5948] => graphics
    [5949] => processing
    [5950] => unit
    [5951] => mixed
    [5952] => reality
    [5953] => virtual
    [5954] => reality
    [5955] => image
    [5956] => compression
    [5957] => solid
    [5958] => modeling
    [5959] => applied
    [5960] => computing
    [5961] => e-commerce
    [5962] => enterprise
    [5963] => software
    [5964] => computational
    [5965] => mathematics
    [5966] => computational
    [5967] => physics
    [5968] => computational
    [5969] => chemistry
    [5970] => computational
    [5971] => biology
    [5972] => computational
    [5973] => social
    [5974] => science
    [5975] => computational
    [5976] => engineering
    [5977] => computational
    [5978] => healthcare
    [5979] => digital
    [5980] => art
    [5981] => electronic
    [5982] => publishing
    [5983] => cyberwarfare
    [5984] => electronic
    [5985] => voting
    [5986] => video
    [5987] => game
    [5988] => word
    [5989] => processing
    [5990] => operations
    [5991] => research
    [5992] => educational
    [5993] => technology
    [5994] => document
    [5995] => management
    [5996] => computer
    [5997] => science
    [5998] => portal
    [5999] => authority
    [6000] => control
    [6001] => gnd
    [6002] => 4428654-5
    [6003] => ndl
    [6004] => 00948240
    [6005] => retrieved
    [6007] => https
    [6009] => wikipedia
    [6010] => org
    [6011] => w
    [6012] => index
    [6013] => php
    [6014] => title
    [6015] => data
    [6016] => mining
    [6017] => oldid
    [6018] => 794778829
    [6019] => categories
    [6020] => data
    [6021] => mining
    [6022] => formal
    [6023] => sciences
    [6024] => hidden
    [6025] => categories
    [6026] => webarchive
    [6027] => template
    [6028] => wayback
    [6029] => links
    [6030] => articles
    [6033] => expanded
    [6035] => september
    [6036] => 2011
    [6038] => articles
    [6040] => unsourced
    [6041] => statements
    [6042] => articles
    [6044] => unsourced
    [6045] => statements
    [6047] => april
    [6048] => 2014
    [6049] => articles
    [6051] => dmoz
    [6052] => links
    [6053] => wikipedia
    [6054] => articles
    [6056] => gnd
    [6057] => identifiers
    [6058] => navigation
    [6059] => menu
    [6060] => personal
    [6061] => tools
    [6063] => logged
    [6065] => talk
    [6066] => contributions
    [6067] => create
    [6068] => account
    [6069] => log
    [6071] => namespaces
    [6072] => article
    [6073] => talk
    [6074] => variants
    [6075] => views
    [6076] => read
    [6077] => edit
    [6078] => view
    [6079] => history
    [6081] => search
    [6082] => navigation
    [6083] => main
    [6084] => page
    [6085] => contents
    [6086] => featured
    [6087] => content
    [6088] => current
    [6089] => events
    [6090] => random
    [6091] => article
    [6092] => donate
    [6094] => wikipedia
    [6095] => wikipedia
    [6096] => store
    [6097] => interaction
    [6100] => wikipedia
    [6101] => community
    [6102] => portal
    [6103] => recent
    [6105] => contact
    [6106] => page
    [6107] => tools
    [6109] => links
    [6111] => related
    [6113] => upload
    [6114] => file
    [6115] => special
    [6116] => pages
    [6117] => permanent
    [6118] => link
    [6119] => page
    [6120] => information
    [6121] => wikidata
    [6122] => item
    [6123] => cite
    [6125] => page
    [6126] => print
    [6127] => export
    [6128] => create
    [6130] => book
    [6131] => download
    [6133] => pdf
    [6134] => printable
    [6135] => version
    [6136] => languages
    [6137] => az
    [6138] => rbaycanca
    [6139] => catal
    [6140] => e
    [6141] => tina
    [6142] => dansk
    [6143] => deutsch
    [6144] => eesti
    [6145] => espa
    [6146] => ol
    [6147] => euskara
    [6148] => fran
    [6149] => ais
    [6150] => hrvatski
    [6151] => bahasa
    [6152] => indonesia
    [6153] => italiano
    [6154] => latvie
    [6155] => u
    [6156] => lietuvi
    [6157] => magyar
    [6158] => nederlands
    [6159] => norsk
    [6160] => bokm
    [6161] => l
    [6162] => polski
    [6163] => portugu
    [6164] => s
    [6165] => rom
    [6166] => n
    [6167] => shqip
    [6168] => simple
    [6169] => english
    [6170] => sloven
    [6171] => ina
    [6172] => sloven
    [6173] => ina
    [6174] => srpski
    [6175] => srpskohrvatski
    [6176] => basa
    [6177] => sunda
    [6178] => suomi
    [6179] => svenska
    [6180] => t
    [6181] => rk
    [6182] => e
    [6183] => ti
    [6184] => ng
    [6185] => vi
    [6186] => t
    [6187] => edit
    [6188] => links
    [6190] => page
    [6193] => edited
    [6195] => 10
    [6196] => august
    [6197] => 2017
    [6199] => 00
    [6200] => 31
    [6201] => text
    [6206] => creative
    [6207] => commons
    [6208] => attribution-sharealike
    [6209] => license
    [6210] => additional
    [6211] => terms
    [6213] => apply
    [6217] => site
    [6219] => agree
    [6222] => terms
    [6226] => privacy
    [6227] => policy
    [6228] => wikipedia
    [6231] => registered
    [6232] => trademark
    [6235] => wikimedia
    [6236] => foundation
    [6239] => non-profit
    [6240] => organization
    [6241] => privacy
    [6242] => policy
    [6244] => wikipedia
    [6245] => disclaimers
    [6246] => contact
    [6247] => wikipedia
    [6248] => developers
    [6249] => cookie
    [6250] => statement
    [6251] => mobile
    [6252] => view
)
======================
Text: data mining - wikipedia data mining from wikipedia the free encyclopedia...
Total Keywords: 4388
======================

Demo2.php

<?php

// Demo 2: extract keywords from a Wikipedia article and dump them all as an array.
$tm = new TextMiner();

// Register the article URL as the input, then run the miner over it.
$tm->addFile('http://en.wikipedia.org/wiki/Data_mining');
$tm->process();

// Dump the complete keyword array.
printa($tm->getKeywords());

// Emit the summary. NOTE(review): printSummary() may already print on its own,
// in which case this echo only outputs its return value (if any) — confirm
// against the TextMiner class before simplifying.
echo $tm->printSummary();

?>