Demo 0 | Demo 1 | Demo 2 | Demo 3 | Demo 4 | Demo 5 | Code | Matt Smith

Demo 2

Array
(
    [1] => data
    [2] => mining
    [4] => wikipedia
    [5] => data
    [6] => mining
    [8] => wikipedia
    [10] => free
    [11] => encyclopedia
    [12] => jump
    [14] => navigation
    [15] => search
    [16] => data
    [17] => mining
    [20] => process
    [22] => discovering
    [23] => patterns
    [25] => large
    [26] => data
    [27] => sets
    [28] => involving
    [29] => methods
    [32] => intersection
    [34] => machine
    [35] => learning
    [36] => statistics
    [38] => database
    [39] => systems
    [40] => 1
    [44] => essential
    [45] => process
    [47] => intelligent
    [48] => methods
    [50] => applied
    [52] => extract
    [53] => data
    [54] => patterns
    [55] => 1
    [56] => 2
    [60] => interdisciplinary
    [61] => subfield
    [63] => computer
    [64] => science
    [65] => 1
    [66] => 3
    [67] => 4
    [70] => goal
    [73] => data
    [74] => mining
    [75] => process
    [78] => extract
    [79] => information
    [82] => data
    [83] => set
    [85] => transform
    [89] => understandable
    [90] => structure
    [94] => 1
    [98] => raw
    [99] => analysis
    [100] => step
    [102] => involves
    [103] => database
    [105] => data
    [106] => management
    [107] => aspects
    [108] => data
    [109] => pre-processing
    [110] => model
    [112] => inference
    [113] => considerations
    [114] => interestingness
    [115] => metrics
    [116] => complexity
    [117] => considerations
    [118] => post-processing
    [120] => discovered
    [121] => structures
    [122] => visualization
    [124] => online
    [125] => updating
    [126] => 1
    [127] => data
    [128] => mining
    [131] => analysis
    [132] => step
    [135] => knowledge
    [136] => discovery
    [138] => databases
    [139] => process
    [141] => kdd
    [142] => 5
    [144] => term
    [147] => misnomer
    [150] => goal
    [153] => extraction
    [155] => patterns
    [157] => knowledge
    [159] => large
    [160] => amounts
    [162] => data
    [165] => extraction
    [166] => mining
    [168] => data
    [170] => 6
    [175] => buzzword
    [176] => 7
    [179] => frequently
    [180] => applied
    [183] => form
    [185] => large-scale
    [186] => data
    [188] => information
    [189] => processing
    [190] => collection
    [191] => extraction
    [192] => warehousing
    [193] => analysis
    [195] => statistics
    [200] => application
    [202] => computer
    [203] => decision
    [204] => support
    [205] => system
    [206] => including
    [207] => artificial
    [208] => intelligence
    [209] => machine
    [210] => learning
    [212] => business
    [213] => intelligence
    [215] => book
    [216] => data
    [217] => mining
    [218] => practical
    [219] => machine
    [220] => learning
    [221] => tools
    [223] => techniques
    [225] => java
    [226] => 8
    [228] => covers
    [230] => machine
    [231] => learning
    [232] => material
    [234] => originally
    [237] => named
    [239] => practical
    [240] => machine
    [241] => learning
    [244] => term
    [245] => data
    [246] => mining
    [249] => added
    [251] => marketing
    [252] => reasons
    [253] => 9
    [257] => general
    [258] => terms
    [259] => large
    [260] => scale
    [261] => data
    [262] => analysis
    [264] => analytics
    [267] => referring
    [269] => actual
    [270] => methods
    [271] => artificial
    [272] => intelligence
    [274] => machine
    [275] => learning
    [280] => actual
    [281] => data
    [282] => mining
    [283] => task
    [286] => semi-automatic
    [288] => automatic
    [289] => analysis
    [291] => large
    [292] => quantities
    [294] => data
    [296] => extract
    [297] => previously
    [298] => unknown
    [299] => interesting
    [300] => patterns
    [303] => groups
    [305] => data
    [306] => records
    [307] => cluster
    [308] => analysis
    [309] => unusual
    [310] => records
    [311] => anomaly
    [312] => detection
    [314] => dependencies
    [315] => association
    [316] => rule
    [317] => mining
    [318] => sequential
    [319] => pattern
    [320] => mining
    [323] => involves
    [325] => database
    [326] => techniques
    [329] => spatial
    [330] => indices
    [332] => patterns
    [339] => kind
    [341] => summary
    [344] => input
    [345] => data
    [352] => analysis
    [357] => machine
    [358] => learning
    [360] => predictive
    [361] => analytics
    [365] => data
    [366] => mining
    [367] => step
    [369] => identify
    [370] => multiple
    [371] => groups
    [374] => data
    [381] => obtain
    [383] => accurate
    [384] => prediction
    [385] => results
    [388] => decision
    [389] => support
    [390] => system
    [393] => data
    [394] => collection
    [395] => data
    [396] => preparation
    [398] => result
    [399] => interpretation
    [401] => reporting
    [403] => part
    [406] => data
    [407] => mining
    [408] => step
    [411] => belong
    [415] => kdd
    [416] => process
    [418] => additional
    [419] => steps
    [421] => related
    [422] => terms
    [423] => data
    [424] => dredging
    [425] => data
    [426] => fishing
    [428] => data
    [429] => snooping
    [430] => refer
    [435] => data
    [436] => mining
    [437] => methods
    [439] => sample
    [440] => parts
    [443] => larger
    [444] => population
    [445] => data
    [446] => set
    [453] => small
    [455] => reliable
    [456] => statistical
    [457] => inferences
    [460] => made
    [463] => validity
    [466] => patterns
    [467] => discovered
    [469] => methods
    [475] => creating
    [477] => hypotheses
    [479] => test
    [482] => larger
    [483] => data
    [484] => populations
    [485] => contents
    [486] => 1
    [487] => etymology
    [488] => 2
    [489] => background
    [490] => 3
    [491] => process
    [492] => 3
    [493] => 1
    [494] => pre-processing
    [495] => 3
    [496] => 2
    [497] => data
    [498] => mining
    [499] => 3
    [500] => 3
    [501] => results
    [502] => validation
    [503] => 4
    [504] => research
    [505] => 5
    [506] => standards
    [507] => 6
    [508] => notable
    [510] => 7
    [511] => privacy
    [512] => concerns
    [514] => ethics
    [515] => 7
    [516] => 1
    [517] => situation
    [519] => europe
    [520] => 7
    [521] => 2
    [522] => situation
    [525] => united
    [526] => states
    [527] => 8
    [528] => copyright
    [529] => law
    [530] => 8
    [531] => 1
    [532] => situation
    [534] => europe
    [535] => 8
    [536] => 2
    [537] => situation
    [540] => united
    [541] => states
    [542] => 9
    [543] => software
    [544] => 9
    [545] => 1
    [546] => free
    [547] => open-source
    [548] => data
    [549] => mining
    [550] => software
    [552] => applications
    [553] => 9
    [554] => 2
    [555] => proprietary
    [556] => data-mining
    [557] => software
    [559] => applications
    [560] => 9
    [561] => 3
    [562] => marketplace
    [563] => surveys
    [564] => 10
    [567] => 11
    [568] => references
    [569] => 12
    [571] => reading
    [572] => 13
    [573] => external
    [574] => links
    [575] => etymology
    [576] => edit
    [579] => 1960s
    [580] => statisticians
    [582] => economists
    [584] => terms
    [586] => data
    [587] => fishing
    [589] => data
    [590] => dredging
    [592] => refer
    [596] => considered
    [598] => bad
    [599] => practice
    [601] => analyzing
    [602] => data
    [605] => a-priori
    [606] => hypothesis
    [608] => term
    [609] => data
    [610] => mining
    [615] => similarly
    [616] => critical
    [619] => economist
    [620] => michael
    [621] => lovell
    [624] => article
    [625] => https
    [627] => jstor
    [628] => org
    [629] => stable
    [630] => 1924403
    [631] => seq
    [632] => 1
    [633] => page
    [634] => scan
    [635] => tab
    [636] => contents
    [637] => published
    [640] => review
    [642] => economic
    [643] => studies
    [644] => 1983
    [645] => lovell
    [649] => practice
    [650] => masquerades
    [653] => variety
    [655] => aliases
    [656] => ranging
    [658] => experimentation
    [659] => positive
    [661] => fishing
    [663] => snooping
    [664] => negative
    [666] => term
    [667] => data
    [668] => mining
    [669] => appeared
    [671] => 1990
    [674] => database
    [675] => community
    [676] => generally
    [678] => positive
    [679] => connotations
    [682] => short
    [683] => time
    [685] => 1980s
    [687] => phrase
    [688] => database
    [689] => mining
    [696] => trademarked
    [698] => hnc
    [700] => san
    [701] => diego-based
    [702] => company
    [704] => pitch
    [706] => database
    [707] => mining
    [708] => workstation
    [709] => 10
    [710] => researchers
    [712] => turned
    [714] => data
    [715] => mining
    [717] => terms
    [719] => include
    [720] => data
    [721] => archaeology
    [722] => information
    [723] => harvesting
    [724] => information
    [725] => discovery
    [726] => knowledge
    [727] => extraction
    [729] => gregory
    [730] => piatetsky-shapiro
    [731] => coined
    [733] => term
    [734] => knowledge
    [735] => discovery
    [737] => databases
    [741] => workshop
    [745] => topic
    [746] => kdd-1989
    [749] => term
    [752] => popular
    [754] => ai
    [756] => machine
    [757] => learning
    [758] => community
    [761] => term
    [762] => data
    [763] => mining
    [766] => popular
    [769] => business
    [771] => press
    [772] => communities
    [773] => 11
    [776] => terms
    [777] => data
    [778] => mining
    [780] => knowledge
    [781] => discovery
    [784] => interchangeably
    [787] => academic
    [788] => community
    [790] => major
    [791] => forums
    [793] => research
    [794] => started
    [796] => 1995
    [800] => international
    [801] => conference
    [803] => data
    [804] => mining
    [806] => knowledge
    [807] => discovery
    [808] => kdd-95
    [810] => started
    [812] => montreal
    [814] => aaai
    [815] => sponsorship
    [818] => co-chaired
    [820] => usama
    [821] => fayyad
    [823] => ramasamy
    [824] => uthurusamy
    [826] => year
    [829] => 1996
    [830] => usama
    [831] => fayyad
    [832] => launched
    [834] => journal
    [836] => kluwer
    [837] => called
    [838] => data
    [839] => mining
    [841] => knowledge
    [842] => discovery
    [845] => founding
    [846] => editor-in-chief
    [849] => started
    [851] => sigkddd
    [852] => newsletter
    [853] => sigkdd
    [854] => explorations
    [855] => 12
    [857] => kdd
    [858] => international
    [859] => conference
    [862] => primary
    [863] => highest
    [864] => quality
    [865] => conference
    [867] => data
    [868] => mining
    [871] => acceptance
    [872] => rate
    [874] => research
    [875] => paper
    [876] => submissions
    [878] => 18
    [880] => journal
    [881] => data
    [882] => mining
    [884] => knowledge
    [885] => discovery
    [888] => primary
    [889] => research
    [890] => journal
    [893] => field
    [894] => background
    [895] => edit
    [897] => manual
    [898] => extraction
    [900] => patterns
    [902] => data
    [904] => occurred
    [906] => centuries
    [907] => early
    [908] => methods
    [910] => identifying
    [911] => patterns
    [913] => data
    [914] => include
    [915] => bayes'
    [916] => theorem
    [917] => 1700s
    [919] => regression
    [920] => analysis
    [921] => 1800s
    [923] => proliferation
    [924] => ubiquity
    [926] => increasing
    [927] => power
    [929] => computer
    [930] => technology
    [932] => dramatically
    [933] => increased
    [934] => data
    [935] => collection
    [936] => storage
    [938] => manipulation
    [939] => ability
    [941] => data
    [942] => sets
    [944] => grown
    [946] => size
    [948] => complexity
    [949] => direct
    [950] => hands-on
    [951] => data
    [952] => analysis
    [954] => increasingly
    [956] => augmented
    [958] => indirect
    [959] => automated
    [960] => data
    [961] => processing
    [962] => aided
    [965] => discoveries
    [967] => computer
    [968] => science
    [971] => neural
    [972] => networks
    [973] => cluster
    [974] => analysis
    [975] => genetic
    [976] => algorithms
    [977] => 1950s
    [978] => decision
    [979] => trees
    [981] => decision
    [982] => rules
    [983] => 1960s
    [985] => support
    [986] => vector
    [987] => machines
    [988] => 1990s
    [989] => data
    [990] => mining
    [993] => process
    [995] => applying
    [997] => methods
    [1000] => intention
    [1002] => uncovering
    [1003] => hidden
    [1004] => patterns
    [1005] => 13
    [1007] => large
    [1008] => data
    [1009] => sets
    [1011] => bridges
    [1013] => gap
    [1015] => applied
    [1016] => statistics
    [1018] => artificial
    [1019] => intelligence
    [1022] => provide
    [1024] => mathematical
    [1025] => background
    [1027] => database
    [1028] => management
    [1030] => exploiting
    [1033] => data
    [1035] => stored
    [1037] => indexed
    [1039] => databases
    [1041] => execute
    [1043] => actual
    [1044] => learning
    [1046] => discovery
    [1047] => algorithms
    [1049] => efficiently
    [1050] => allowing
    [1052] => methods
    [1055] => applied
    [1058] => larger
    [1059] => data
    [1060] => sets
    [1061] => process
    [1062] => edit
    [1064] => knowledge
    [1065] => discovery
    [1067] => databases
    [1068] => kdd
    [1069] => process
    [1071] => commonly
    [1072] => defined
    [1075] => stages
    [1076] => selection
    [1077] => pre-processing
    [1078] => transformation
    [1079] => data
    [1080] => mining
    [1081] => interpretation
    [1082] => evaluation
    [1083] => 5
    [1085] => exists
    [1089] => variations
    [1092] => theme
    [1096] => cross
    [1097] => industry
    [1098] => standard
    [1099] => process
    [1101] => data
    [1102] => mining
    [1103] => crisp-dm
    [1105] => defines
    [1107] => phases
    [1108] => business
    [1109] => understanding
    [1110] => data
    [1111] => understanding
    [1112] => data
    [1113] => preparation
    [1114] => modeling
    [1115] => evaluation
    [1116] => deployment
    [1119] => simplified
    [1120] => process
    [1123] => 1
    [1124] => pre-processing
    [1125] => 2
    [1126] => data
    [1127] => mining
    [1129] => 3
    [1130] => results
    [1131] => validation
    [1132] => polls
    [1133] => conducted
    [1135] => 2002
    [1136] => 2004
    [1137] => 2007
    [1139] => 2014
    [1140] => show
    [1143] => crisp-dm
    [1144] => methodology
    [1147] => leading
    [1148] => methodology
    [1151] => data
    [1152] => miners
    [1153] => 14
    [1157] => data
    [1158] => mining
    [1159] => standard
    [1160] => named
    [1163] => polls
    [1165] => semma
    [1167] => 3
    [1168] => 4
    [1169] => times
    [1172] => people
    [1173] => reported
    [1175] => crisp-dm
    [1177] => teams
    [1179] => researchers
    [1181] => published
    [1182] => reviews
    [1184] => data
    [1185] => mining
    [1186] => process
    [1187] => models
    [1188] => 15
    [1189] => 16
    [1191] => azevedo
    [1193] => santos
    [1194] => conducted
    [1196] => comparison
    [1198] => crisp-dm
    [1200] => semma
    [1202] => 2008
    [1203] => 17
    [1204] => pre-processing
    [1205] => edit
    [1207] => data
    [1208] => mining
    [1209] => algorithms
    [1214] => target
    [1215] => data
    [1216] => set
    [1219] => assembled
    [1221] => data
    [1222] => mining
    [1225] => uncover
    [1226] => patterns
    [1228] => present
    [1231] => data
    [1233] => target
    [1234] => data
    [1235] => set
    [1238] => large
    [1243] => patterns
    [1245] => remaining
    [1246] => concise
    [1250] => mined
    [1253] => acceptable
    [1254] => time
    [1255] => limit
    [1257] => common
    [1258] => source
    [1260] => data
    [1263] => data
    [1264] => mart
    [1266] => data
    [1267] => warehouse
    [1268] => pre-processing
    [1270] => essential
    [1272] => analyze
    [1274] => multivariate
    [1275] => data
    [1276] => sets
    [1278] => data
    [1279] => mining
    [1281] => target
    [1282] => set
    [1285] => cleaned
    [1286] => data
    [1287] => cleaning
    [1288] => removes
    [1290] => observations
    [1292] => noise
    [1296] => missing
    [1297] => data
    [1298] => data
    [1299] => mining
    [1300] => edit
    [1301] => data
    [1302] => mining
    [1303] => involves
    [1305] => common
    [1306] => classes
    [1308] => tasks
    [1309] => 5
    [1310] => anomaly
    [1311] => detection
    [1312] => outlier
    [1313] => change
    [1314] => deviation
    [1315] => detection
    [1317] => identification
    [1319] => unusual
    [1320] => data
    [1321] => records
    [1325] => interesting
    [1327] => data
    [1328] => errors
    [1330] => require
    [1332] => investigation
    [1333] => association
    [1334] => rule
    [1335] => learning
    [1336] => dependency
    [1337] => modelling
    [1338] => searches
    [1340] => relationships
    [1342] => variables
    [1346] => supermarket
    [1348] => gather
    [1349] => data
    [1351] => customer
    [1352] => purchasing
    [1353] => habits
    [1355] => association
    [1356] => rule
    [1357] => learning
    [1359] => supermarket
    [1361] => determine
    [1363] => products
    [1365] => frequently
    [1366] => bought
    [1371] => information
    [1373] => marketing
    [1374] => purposes
    [1378] => referred
    [1381] => market
    [1382] => basket
    [1383] => analysis
    [1384] => clustering
    [1387] => task
    [1389] => discovering
    [1390] => groups
    [1392] => structures
    [1395] => data
    [1403] => similar
    [1407] => structures
    [1410] => data
    [1411] => classification
    [1414] => task
    [1416] => generalizing
    [1418] => structure
    [1420] => apply
    [1423] => data
    [1427] => e-mail
    [1428] => program
    [1430] => attempt
    [1432] => classify
    [1434] => e-mail
    [1436] => legitimate
    [1439] => spam
    [1440] => regression
    [1441] => attempts
    [1443] => find
    [1445] => function
    [1447] => models
    [1449] => data
    [1453] => error
    [1457] => estimating
    [1459] => relationships
    [1461] => data
    [1463] => datasets
    [1464] => summarization
    [1465] => providing
    [1468] => compact
    [1469] => representation
    [1472] => data
    [1473] => set
    [1474] => including
    [1475] => visualization
    [1477] => report
    [1478] => generation
    [1479] => results
    [1480] => validation
    [1481] => edit
    [1485] => data
    [1486] => produced
    [1488] => data
    [1489] => dredging
    [1492] => bot
    [1493] => operated
    [1495] => statistician
    [1496] => tyler
    [1497] => vigen
    [1498] => apparently
    [1499] => showing
    [1501] => close
    [1502] => link
    [1506] => word
    [1507] => winning
    [1509] => spelling
    [1510] => bee
    [1511] => competition
    [1514] => number
    [1516] => people
    [1519] => united
    [1520] => states
    [1521] => killed
    [1523] => venomous
    [1524] => spiders
    [1526] => similarity
    [1528] => trends
    [1532] => coincidence
    [1533] => data
    [1534] => mining
    [1536] => unintentionally
    [1538] => misused
    [1542] => produce
    [1543] => results
    [1548] => significant
    [1554] => predict
    [1555] => future
    [1556] => behaviour
    [1560] => reproduced
    [1564] => sample
    [1566] => data
    [1568] => bear
    [1573] => results
    [1575] => investigating
    [1578] => hypotheses
    [1581] => performing
    [1582] => proper
    [1583] => statistical
    [1584] => hypothesis
    [1585] => testing
    [1587] => simple
    [1588] => version
    [1591] => problem
    [1593] => machine
    [1594] => learning
    [1598] => overfitting
    [1602] => problem
    [1604] => arise
    [1607] => phases
    [1610] => process
    [1614] => train
    [1615] => test
    [1616] => split
    [1619] => applicable
    [1626] => sufficient
    [1628] => prevent
    [1631] => happening
    [1632] => 18
    [1634] => section
    [1636] => missing
    [1637] => information
    [1639] => non-classification
    [1640] => tasks
    [1642] => data
    [1643] => mining
    [1646] => covers
    [1647] => machine
    [1648] => learning
    [1650] => expand
    [1652] => section
    [1654] => include
    [1656] => information
    [1658] => details
    [1660] => exist
    [1663] => talk
    [1664] => page
    [1665] => september
    [1666] => 2011
    [1668] => final
    [1669] => step
    [1671] => knowledge
    [1672] => discovery
    [1674] => data
    [1677] => verify
    [1680] => patterns
    [1681] => produced
    [1684] => data
    [1685] => mining
    [1686] => algorithms
    [1687] => occur
    [1690] => wider
    [1691] => data
    [1692] => set
    [1695] => patterns
    [1696] => found
    [1699] => data
    [1700] => mining
    [1701] => algorithms
    [1703] => necessarily
    [1704] => valid
    [1707] => common
    [1710] => data
    [1711] => mining
    [1712] => algorithms
    [1714] => find
    [1715] => patterns
    [1718] => training
    [1719] => set
    [1723] => present
    [1726] => general
    [1727] => data
    [1728] => set
    [1731] => called
    [1732] => overfitting
    [1734] => overcome
    [1737] => evaluation
    [1740] => test
    [1741] => set
    [1743] => data
    [1747] => data
    [1748] => mining
    [1749] => algorithm
    [1752] => trained
    [1754] => learned
    [1755] => patterns
    [1757] => applied
    [1760] => test
    [1761] => set
    [1764] => resulting
    [1765] => output
    [1767] => compared
    [1770] => desired
    [1771] => output
    [1775] => data
    [1776] => mining
    [1777] => algorithm
    [1780] => distinguish
    [1781] => spam
    [1783] => legitimate
    [1784] => emails
    [1787] => trained
    [1790] => training
    [1791] => set
    [1793] => sample
    [1794] => e-mails
    [1796] => trained
    [1798] => learned
    [1799] => patterns
    [1802] => applied
    [1805] => test
    [1806] => set
    [1808] => e-mails
    [1815] => trained
    [1817] => accuracy
    [1820] => patterns
    [1824] => measured
    [1828] => e-mails
    [1830] => correctly
    [1831] => classify
    [1833] => number
    [1835] => statistical
    [1836] => methods
    [1841] => evaluate
    [1843] => algorithm
    [1846] => roc
    [1847] => curves
    [1850] => learned
    [1851] => patterns
    [1854] => meet
    [1856] => desired
    [1857] => standards
    [1858] => subsequently
    [1863] => re-evaluate
    [1865] => change
    [1867] => pre-processing
    [1869] => data
    [1870] => mining
    [1871] => steps
    [1874] => learned
    [1875] => patterns
    [1877] => meet
    [1879] => desired
    [1880] => standards
    [1883] => final
    [1884] => step
    [1887] => interpret
    [1889] => learned
    [1890] => patterns
    [1892] => turn
    [1895] => knowledge
    [1896] => research
    [1897] => edit
    [1899] => premier
    [1900] => professional
    [1901] => body
    [1904] => field
    [1907] => association
    [1909] => computing
    [1910] => machinery
    [1911] => 's
    [1912] => acm
    [1913] => special
    [1914] => interest
    [1915] => group
    [1916] => sig
    [1918] => knowledge
    [1919] => discovery
    [1921] => data
    [1922] => mining
    [1923] => sigkdd
    [1924] => 19
    [1925] => 20
    [1927] => 1989
    [1929] => acm
    [1930] => sig
    [1932] => hosted
    [1934] => annual
    [1935] => international
    [1936] => conference
    [1938] => published
    [1940] => proceedings
    [1941] => 21
    [1944] => 1999
    [1947] => published
    [1949] => biannual
    [1950] => academic
    [1951] => journal
    [1952] => titled
    [1953] => sigkdd
    [1954] => explorations
    [1955] => 22
    [1956] => computer
    [1957] => science
    [1958] => conferences
    [1960] => data
    [1961] => mining
    [1962] => include
    [1963] => cikm
    [1964] => conference
    [1965] => acm
    [1966] => conference
    [1968] => information
    [1970] => knowledge
    [1971] => management
    [1972] => european
    [1973] => conference
    [1975] => machine
    [1976] => learning
    [1978] => principles
    [1980] => practice
    [1982] => knowledge
    [1983] => discovery
    [1985] => databases
    [1986] => kdd
    [1987] => conference
    [1988] => acm
    [1989] => sigkdd
    [1990] => conference
    [1992] => knowledge
    [1993] => discovery
    [1995] => data
    [1996] => mining
    [1997] => data
    [1998] => mining
    [1999] => topics
    [2002] => present
    [2005] => data
    [2006] => management
    [2007] => database
    [2008] => conferences
    [2012] => icde
    [2013] => conference
    [2014] => sigmod
    [2015] => conference
    [2017] => international
    [2018] => conference
    [2021] => large
    [2022] => data
    [2023] => bases
    [2024] => standards
    [2025] => edit
    [2030] => efforts
    [2032] => define
    [2033] => standards
    [2036] => data
    [2037] => mining
    [2038] => process
    [2042] => 1999
    [2043] => european
    [2044] => cross
    [2045] => industry
    [2046] => standard
    [2047] => process
    [2049] => data
    [2050] => mining
    [2051] => crisp-dm
    [2052] => 1
    [2053] => 0
    [2056] => 2004
    [2057] => java
    [2058] => data
    [2059] => mining
    [2060] => standard
    [2061] => jdm
    [2062] => 1
    [2063] => 0
    [2064] => development
    [2066] => successors
    [2069] => processes
    [2070] => crisp-dm
    [2071] => 2
    [2072] => 0
    [2074] => jdm
    [2075] => 2
    [2076] => 0
    [2078] => active
    [2080] => 2006
    [2083] => stalled
    [2085] => jdm
    [2086] => 2
    [2087] => 0
    [2089] => withdrawn
    [2091] => reaching
    [2093] => final
    [2094] => draft
    [2096] => exchanging
    [2098] => extracted
    [2099] => models
    [2105] => predictive
    [2106] => analytics
    [2108] => key
    [2109] => standard
    [2112] => predictive
    [2113] => model
    [2114] => markup
    [2115] => language
    [2116] => pmml
    [2120] => xml
    [2121] => -based
    [2122] => language
    [2123] => developed
    [2126] => data
    [2127] => mining
    [2128] => group
    [2129] => dmg
    [2131] => supported
    [2133] => exchange
    [2134] => format
    [2137] => data
    [2138] => mining
    [2139] => applications
    [2143] => suggests
    [2146] => covers
    [2147] => prediction
    [2148] => models
    [2151] => data
    [2152] => mining
    [2153] => task
    [2155] => high
    [2156] => importance
    [2158] => business
    [2159] => applications
    [2161] => extensions
    [2163] => cover
    [2166] => subspace
    [2167] => clustering
    [2170] => proposed
    [2171] => independently
    [2174] => dmg
    [2175] => 23
    [2176] => notable
    [2178] => edit
    [2179] => main
    [2180] => article
    [2181] => examples
    [2183] => data
    [2184] => mining
    [2187] => category
    [2188] => applied
    [2189] => data
    [2190] => mining
    [2191] => data
    [2192] => mining
    [2198] => digital
    [2199] => data
    [2201] => today
    [2202] => notable
    [2203] => examples
    [2205] => data
    [2206] => mining
    [2209] => found
    [2211] => business
    [2212] => medicine
    [2213] => science
    [2215] => surveillance
    [2216] => privacy
    [2217] => concerns
    [2219] => ethics
    [2220] => edit
    [2223] => term
    [2224] => data
    [2225] => mining
    [2230] => ethical
    [2231] => implications
    [2238] => mining
    [2240] => information
    [2242] => relation
    [2244] => peoples'
    [2245] => behavior
    [2246] => ethical
    [2249] => 24
    [2251] => ways
    [2254] => data
    [2255] => mining
    [2262] => cases
    [2264] => contexts
    [2265] => raise
    [2266] => questions
    [2268] => privacy
    [2269] => legality
    [2271] => ethics
    [2272] => 25
    [2275] => data
    [2276] => mining
    [2277] => government
    [2279] => commercial
    [2280] => data
    [2281] => sets
    [2283] => national
    [2284] => security
    [2286] => law
    [2287] => enforcement
    [2288] => purposes
    [2293] => total
    [2294] => information
    [2295] => awareness
    [2296] => program
    [2299] => advise
    [2301] => raised
    [2302] => privacy
    [2303] => concerns
    [2304] => 26
    [2305] => 27
    [2306] => data
    [2307] => mining
    [2308] => requires
    [2309] => data
    [2310] => preparation
    [2313] => uncover
    [2314] => information
    [2316] => patterns
    [2319] => compromise
    [2320] => confidentiality
    [2322] => privacy
    [2323] => obligations
    [2325] => common
    [2330] => occur
    [2333] => data
    [2334] => aggregation
    [2335] => data
    [2336] => aggregation
    [2337] => involves
    [2338] => combining
    [2339] => data
    [2341] => possibly
    [2344] => sources
    [2349] => facilitates
    [2350] => analysis
    [2355] => make
    [2356] => identification
    [2358] => private
    [2359] => individual-level
    [2360] => data
    [2361] => deducible
    [2364] => apparent
    [2365] => 28
    [2369] => data
    [2370] => mining
    [2372] => se
    [2375] => result
    [2378] => preparation
    [2380] => data
    [2385] => purposes
    [2388] => analysis
    [2390] => threat
    [2393] => individual's
    [2394] => privacy
    [2397] => play
    [2400] => data
    [2402] => compiled
    [2405] => data
    [2406] => miner
    [2411] => access
    [2414] => newly
    [2415] => compiled
    [2416] => data
    [2417] => set
    [2422] => identify
    [2423] => specific
    [2424] => individuals
    [2428] => data
    [2430] => originally
    [2431] => anonymous
    [2432] => 29
    [2433] => 30
    [2434] => 31
    [2437] => recommended
    [2440] => individual
    [2442] => made
    [2443] => aware
    [2448] => data
    [2450] => collected
    [2451] => 28
    [2453] => purpose
    [2456] => data
    [2457] => collection
    [2461] => data
    [2462] => mining
    [2463] => projects
    [2466] => data
    [2475] => mine
    [2477] => data
    [2481] => data
    [2484] => derivatives
    [2486] => status
    [2488] => security
    [2489] => surrounding
    [2490] => access
    [2493] => data
    [2495] => collected
    [2496] => data
    [2499] => updated
    [2500] => data
    [2504] => modified
    [2509] => anonymous
    [2512] => individuals
    [2515] => readily
    [2517] => identified
    [2518] => 28
    [2521] => de-identified
    [2522] => anonymized
    [2523] => data
    [2524] => sets
    [2526] => potentially
    [2529] => information
    [2532] => identification
    [2534] => individuals
    [2536] => occurred
    [2538] => journalists
    [2542] => find
    [2544] => individuals
    [2545] => based
    [2548] => set
    [2550] => search
    [2551] => histories
    [2554] => inadvertently
    [2555] => released
    [2557] => aol
    [2558] => 32
    [2560] => inadvertent
    [2561] => revelation
    [2563] => personally
    [2564] => identifiable
    [2565] => information
    [2566] => leading
    [2569] => provider
    [2570] => violates
    [2571] => fair
    [2572] => information
    [2573] => practices
    [2575] => indiscretion
    [2578] => financial
    [2579] => emotional
    [2581] => bodily
    [2582] => harm
    [2586] => individual
    [2589] => instance
    [2591] => privacy
    [2592] => violation
    [2594] => patrons
    [2596] => walgreens
    [2597] => filed
    [2599] => lawsuit
    [2602] => company
    [2604] => 2011
    [2606] => selling
    [2607] => prescription
    [2608] => information
    [2610] => data
    [2611] => mining
    [2612] => companies
    [2615] => turn
    [2616] => provided
    [2618] => data
    [2620] => pharmaceutical
    [2621] => companies
    [2622] => 33
    [2623] => situation
    [2625] => europe
    [2626] => edit
    [2627] => europe
    [2630] => strong
    [2631] => privacy
    [2632] => laws
    [2634] => efforts
    [2636] => underway
    [2639] => strengthen
    [2641] => rights
    [2644] => consumers
    [2647] => u
    [2648] => s
    [2649] => -e
    [2650] => u
    [2651] => safe
    [2652] => harbor
    [2653] => principles
    [2655] => effectively
    [2656] => expose
    [2657] => european
    [2658] => users
    [2660] => privacy
    [2661] => exploitation
    [2663] => u
    [2664] => s
    [2665] => companies
    [2668] => consequence
    [2670] => edward
    [2671] => snowden
    [2672] => 's
    [2673] => global
    [2674] => surveillance
    [2675] => disclosure
    [2679] => increased
    [2680] => discussion
    [2682] => revoke
    [2684] => agreement
    [2689] => data
    [2692] => fully
    [2693] => exposed
    [2696] => national
    [2697] => security
    [2698] => agency
    [2700] => attempts
    [2702] => reach
    [2704] => agreement
    [2706] => failed
    [2707] => citation
    [2708] => needed
    [2709] => situation
    [2712] => united
    [2713] => states
    [2714] => edit
    [2717] => united
    [2718] => states
    [2719] => privacy
    [2720] => concerns
    [2723] => addressed
    [2727] => congress
    [2730] => passage
    [2732] => regulatory
    [2733] => controls
    [2737] => health
    [2738] => insurance
    [2739] => portability
    [2741] => accountability
    [2742] => act
    [2743] => hipaa
    [2745] => hipaa
    [2746] => requires
    [2747] => individuals
    [2749] => give
    [2751] => informed
    [2752] => consent
    [2754] => information
    [2756] => provide
    [2759] => intended
    [2760] => present
    [2762] => future
    [2767] => article
    [2769] => biotech
    [2770] => business
    [2771] => week
    [2772] => '
    [2774] => n
    [2775] => practice
    [2776] => hipaa
    [2779] => offer
    [2781] => greater
    [2782] => protection
    [2785] => longstanding
    [2786] => regulations
    [2789] => research
    [2790] => arena
    [2791] => '
    [2794] => aahc
    [2796] => importantly
    [2798] => rule's
    [2799] => goal
    [2801] => protection
    [2803] => informed
    [2804] => consent
    [2806] => approach
    [2808] => level
    [2810] => incomprehensibility
    [2812] => average
    [2813] => individuals
    [2814] => 34
    [2816] => underscores
    [2818] => necessity
    [2820] => data
    [2821] => anonymity
    [2823] => data
    [2824] => aggregation
    [2826] => mining
    [2827] => practices
    [2828] => u
    [2829] => s
    [2830] => information
    [2831] => privacy
    [2832] => legislation
    [2835] => hipaa
    [2838] => family
    [2839] => educational
    [2840] => rights
    [2842] => privacy
    [2843] => act
    [2844] => ferpa
    [2845] => applies
    [2849] => specific
    [2850] => areas
    [2854] => law
    [2855] => addresses
    [2858] => data
    [2859] => mining
    [2862] => majority
    [2864] => businesses
    [2867] => u
    [2868] => s
    [2871] => controlled
    [2874] => legislation
    [2875] => copyright
    [2876] => law
    [2877] => edit
    [2878] => situation
    [2880] => europe
    [2881] => edit
    [2882] => due
    [2885] => lack
    [2887] => flexibilities
    [2889] => european
    [2890] => copyright
    [2892] => database
    [2893] => law
    [2895] => mining
    [2897] => in-copyright
    [2898] => works
    [2901] => web
    [2902] => mining
    [2905] => permission
    [2908] => copyright
    [2909] => owner
    [2912] => legal
    [2915] => database
    [2917] => pure
    [2918] => data
    [2920] => europe
    [2927] => copyright
    [2929] => database
    [2930] => rights
    [2932] => exist
    [2934] => data
    [2935] => mining
    [2937] => subject
    [2939] => regulations
    [2942] => database
    [2943] => directive
    [2946] => recommendation
    [2949] => hargreaves
    [2950] => review
    [2952] => led
    [2955] => uk
    [2956] => government
    [2958] => amend
    [2960] => copyright
    [2961] => law
    [2963] => 2014
    [2964] => 35
    [2967] => content
    [2968] => mining
    [2971] => limitation
    [2973] => exception
    [2977] => country
    [2980] => world
    [2985] => japan
    [2987] => introduced
    [2989] => exception
    [2991] => 2009
    [2993] => data
    [2994] => mining
    [2996] => due
    [2999] => restriction
    [3002] => copyright
    [3003] => directive
    [3005] => uk
    [3006] => exception
    [3009] => content
    [3010] => mining
    [3012] => non-commercial
    [3013] => purposes
    [3014] => uk
    [3015] => copyright
    [3016] => law
    [3022] => provision
    [3025] => overridden
    [3027] => contractual
    [3028] => terms
    [3030] => conditions
    [3032] => european
    [3033] => commission
    [3034] => facilitated
    [3035] => stakeholder
    [3036] => discussion
    [3038] => text
    [3040] => data
    [3041] => mining
    [3043] => 2013
    [3046] => title
    [3048] => licences
    [3050] => europe
    [3051] => 36
    [3053] => focus
    [3056] => solution
    [3059] => legal
    [3060] => issue
    [3062] => licences
    [3065] => limitations
    [3067] => exceptions
    [3068] => led
    [3070] => representatives
    [3072] => universities
    [3073] => researchers
    [3074] => libraries
    [3075] => civil
    [3076] => society
    [3077] => groups
    [3079] => open
    [3080] => access
    [3081] => publishers
    [3083] => leave
    [3085] => stakeholder
    [3086] => dialogue
    [3089] => 2013
    [3090] => 37
    [3091] => situation
    [3094] => united
    [3095] => states
    [3096] => edit
    [3098] => contrast
    [3100] => europe
    [3102] => flexible
    [3103] => nature
    [3106] => copyright
    [3107] => law
    [3111] => fair
    [3113] => means
    [3115] => content
    [3116] => mining
    [3118] => america
    [3123] => fair
    [3125] => countries
    [3128] => israel
    [3129] => taiwan
    [3131] => south
    [3132] => korea
    [3134] => viewed
    [3137] => legal
    [3139] => content
    [3140] => mining
    [3142] => transformative
    [3148] => supplant
    [3150] => original
    [3151] => work
    [3154] => viewed
    [3157] => lawful
    [3159] => fair
    [3164] => part
    [3167] => google
    [3168] => book
    [3169] => settlement
    [3171] => presiding
    [3172] => judge
    [3175] => case
    [3176] => ruled
    [3178] => google's
    [3179] => digitisation
    [3180] => project
    [3182] => in-copyright
    [3183] => books
    [3185] => lawful
    [3187] => part
    [3191] => transformative
    [3195] => digitisation
    [3196] => project
    [3197] => displayed
    [3201] => text
    [3203] => data
    [3204] => mining
    [3205] => 38
    [3206] => software
    [3207] => edit
    [3210] => category
    [3211] => data
    [3212] => mining
    [3214] => machine
    [3215] => learning
    [3216] => software
    [3217] => free
    [3218] => open-source
    [3219] => data
    [3220] => mining
    [3221] => software
    [3223] => applications
    [3224] => edit
    [3227] => applications
    [3231] => free
    [3232] => open
    [3233] => source
    [3234] => licenses
    [3235] => public
    [3236] => access
    [3238] => application
    [3239] => source
    [3240] => code
    [3244] => carrot2
    [3245] => text
    [3247] => search
    [3248] => results
    [3249] => clustering
    [3250] => framework
    [3251] => chemicalize
    [3252] => org
    [3254] => chemical
    [3255] => structure
    [3256] => miner
    [3258] => web
    [3259] => search
    [3260] => engine
    [3261] => elki
    [3263] => university
    [3264] => research
    [3265] => project
    [3267] => advanced
    [3268] => cluster
    [3269] => analysis
    [3271] => outlier
    [3272] => detection
    [3273] => methods
    [3274] => written
    [3277] => java
    [3278] => language
    [3279] => gate
    [3281] => natural
    [3282] => language
    [3283] => processing
    [3285] => language
    [3286] => engineering
    [3287] => tool
    [3288] => knime
    [3290] => konstanz
    [3291] => information
    [3292] => miner
    [3294] => user
    [3295] => friendly
    [3297] => comprehensive
    [3298] => data
    [3299] => analytics
    [3300] => framework
    [3301] => massive
    [3302] => online
    [3303] => analysis
    [3304] => moa
    [3306] => real-time
    [3307] => big
    [3308] => data
    [3309] => stream
    [3310] => mining
    [3312] => concept
    [3313] => drift
    [3314] => tool
    [3317] => java
    [3318] => programming
    [3319] => language
    [3320] => mepx
    [3322] => cross
    [3323] => platform
    [3324] => tool
    [3326] => regression
    [3328] => classification
    [3329] => problems
    [3330] => based
    [3333] => genetic
    [3334] => programming
    [3335] => variant
    [3336] => ml-flex
    [3338] => software
    [3339] => package
    [3341] => enables
    [3342] => users
    [3344] => integrate
    [3346] => third-party
    [3347] => machine-learning
    [3348] => packages
    [3349] => written
    [3352] => programming
    [3353] => language
    [3354] => execute
    [3355] => classification
    [3356] => analyses
    [3358] => parallel
    [3360] => multiple
    [3361] => computing
    [3362] => nodes
    [3364] => produce
    [3365] => html
    [3366] => reports
    [3368] => classification
    [3369] => results
    [3370] => mlpack
    [3371] => library
    [3373] => collection
    [3375] => ready-to-use
    [3376] => machine
    [3377] => learning
    [3378] => algorithms
    [3379] => written
    [3382] => c
    [3383] => language
    [3384] => nltk
    [3385] => natural
    [3386] => language
    [3387] => toolkit
    [3389] => suite
    [3391] => libraries
    [3393] => programs
    [3395] => symbolic
    [3397] => statistical
    [3398] => natural
    [3399] => language
    [3400] => processing
    [3401] => nlp
    [3404] => python
    [3405] => language
    [3406] => opennn
    [3407] => open
    [3408] => neural
    [3409] => networks
    [3410] => library
    [3411] => orange
    [3413] => component-based
    [3414] => data
    [3415] => mining
    [3417] => machine
    [3418] => learning
    [3419] => software
    [3420] => suite
    [3421] => written
    [3424] => python
    [3425] => language
    [3426] => r
    [3428] => programming
    [3429] => language
    [3431] => software
    [3432] => environment
    [3434] => statistical
    [3435] => computing
    [3436] => data
    [3437] => mining
    [3439] => graphics
    [3442] => part
    [3445] => gnu
    [3446] => project
    [3447] => scikit-learn
    [3450] => open
    [3451] => source
    [3452] => machine
    [3453] => learning
    [3454] => library
    [3457] => python
    [3458] => programming
    [3459] => language
    [3460] => torch
    [3462] => open
    [3463] => source
    [3464] => deep
    [3465] => learning
    [3466] => library
    [3469] => lua
    [3470] => programming
    [3471] => language
    [3473] => scientific
    [3474] => computing
    [3475] => framework
    [3477] => wide
    [3478] => support
    [3480] => machine
    [3481] => learning
    [3482] => algorithms
    [3483] => uima
    [3485] => uima
    [3486] => unstructured
    [3487] => information
    [3488] => management
    [3489] => architecture
    [3492] => component
    [3493] => framework
    [3495] => analyzing
    [3496] => unstructured
    [3497] => content
    [3500] => text
    [3501] => audio
    [3503] => video
    [3504] => originally
    [3505] => developed
    [3507] => ibm
    [3508] => weka
    [3510] => suite
    [3512] => machine
    [3513] => learning
    [3514] => software
    [3515] => applications
    [3516] => written
    [3519] => java
    [3520] => programming
    [3521] => language
    [3522] => proprietary
    [3523] => data-mining
    [3524] => software
    [3526] => applications
    [3527] => edit
    [3530] => applications
    [3534] => proprietary
    [3535] => licenses
    [3536] => angoss
    [3537] => knowledgestudio
    [3538] => data
    [3539] => mining
    [3540] => tool
    [3541] => clarabridge
    [3542] => text
    [3543] => analytics
    [3544] => product
    [3545] => kxen
    [3546] => modeler
    [3547] => data
    [3548] => mining
    [3549] => tool
    [3550] => provided
    [3552] => kxen
    [3554] => lionsolver
    [3556] => integrated
    [3557] => software
    [3558] => application
    [3560] => data
    [3561] => mining
    [3562] => business
    [3563] => intelligence
    [3565] => modeling
    [3567] => implements
    [3569] => learning
    [3571] => intelligent
    [3572] => optimization
    [3573] => lion
    [3574] => approach
    [3575] => megaputer
    [3576] => intelligence
    [3577] => data
    [3579] => text
    [3580] => mining
    [3581] => software
    [3583] => called
    [3584] => polyanalyst
    [3585] => microsoft
    [3586] => analysis
    [3587] => services
    [3588] => data
    [3589] => mining
    [3590] => software
    [3591] => provided
    [3593] => microsoft
    [3594] => netowl
    [3595] => suite
    [3597] => multilingual
    [3598] => text
    [3600] => entity
    [3601] => analytics
    [3602] => products
    [3604] => enable
    [3605] => data
    [3606] => mining
    [3607] => opentext
    [3608] => big
    [3609] => data
    [3610] => analytics
    [3611] => visual
    [3612] => data
    [3613] => mining
    [3614] => predictive
    [3615] => analysis
    [3617] => open
    [3618] => text
    [3619] => corporation
    [3620] => oracle
    [3621] => data
    [3622] => mining
    [3623] => data
    [3624] => mining
    [3625] => software
    [3627] => oracle
    [3628] => corporation
    [3629] => pseven
    [3630] => platform
    [3632] => automation
    [3634] => engineering
    [3635] => simulation
    [3637] => analysis
    [3638] => multidisciplinary
    [3639] => optimization
    [3641] => data
    [3642] => mining
    [3643] => provided
    [3645] => datadvance
    [3646] => qlucore
    [3647] => omics
    [3648] => explorer
    [3649] => data
    [3650] => mining
    [3651] => software
    [3652] => rapidminer
    [3654] => environment
    [3656] => machine
    [3657] => learning
    [3659] => data
    [3660] => mining
    [3661] => experiments
    [3662] => sas
    [3663] => enterprise
    [3664] => miner
    [3665] => data
    [3666] => mining
    [3667] => software
    [3668] => provided
    [3671] => sas
    [3672] => institute
    [3673] => spss
    [3674] => modeler
    [3675] => data
    [3676] => mining
    [3677] => software
    [3678] => provided
    [3680] => ibm
    [3681] => statistica
    [3682] => data
    [3683] => miner
    [3684] => data
    [3685] => mining
    [3686] => software
    [3687] => provided
    [3689] => statsoft
    [3690] => tanagra
    [3691] => visualisation-oriented
    [3692] => data
    [3693] => mining
    [3694] => software
    [3697] => teaching
    [3698] => vertica
    [3699] => data
    [3700] => mining
    [3701] => software
    [3702] => provided
    [3704] => hewlett-packard
    [3705] => marketplace
    [3706] => surveys
    [3707] => edit
    [3709] => researchers
    [3711] => organizations
    [3713] => conducted
    [3714] => reviews
    [3716] => data
    [3717] => mining
    [3718] => tools
    [3720] => surveys
    [3722] => data
    [3723] => miners
    [3725] => identify
    [3729] => strengths
    [3731] => weaknesses
    [3734] => software
    [3735] => packages
    [3738] => provide
    [3740] => overview
    [3743] => behaviors
    [3744] => preferences
    [3746] => views
    [3748] => data
    [3749] => miners
    [3753] => reports
    [3754] => include
    [3755] => hurwitz
    [3756] => victory
    [3757] => index
    [3758] => report
    [3760] => advanced
    [3761] => analytics
    [3764] => market
    [3765] => research
    [3766] => assessment
    [3767] => tool
    [3769] => highlights
    [3772] => diverse
    [3775] => advanced
    [3776] => analytics
    [3777] => technology
    [3780] => vendors
    [3782] => make
    [3784] => applications
    [3786] => recent-research
    [3787] => rexer
    [3788] => analytics
    [3789] => data
    [3790] => miner
    [3791] => surveys
    [3792] => 2007
    [3793] => 2015
    [3794] => 39
    [3795] => 2011
    [3796] => wiley
    [3797] => interdisciplinary
    [3798] => reviews
    [3799] => data
    [3800] => mining
    [3802] => knowledge
    [3803] => discovery
    [3804] => 40
    [3805] => forrester
    [3806] => research
    [3807] => 2010
    [3808] => predictive
    [3809] => analytics
    [3811] => data
    [3812] => mining
    [3813] => solutions
    [3814] => report
    [3815] => 41
    [3816] => gartner
    [3817] => 2008
    [3818] => magic
    [3819] => quadrant
    [3820] => report
    [3821] => 42
    [3822] => robert
    [3824] => nisbet's
    [3825] => 2006
    [3827] => part
    [3828] => series
    [3830] => articles
    [3831] => data
    [3832] => mining
    [3833] => tools
    [3839] => crm
    [3840] => 43
    [3841] => haughton
    [3843] => al
    [3844] => 's
    [3845] => 2003
    [3846] => review
    [3848] => data
    [3849] => mining
    [3850] => software
    [3851] => packages
    [3854] => american
    [3855] => statistician
    [3856] => 44
    [3857] => goebel
    [3858] => gruenwald
    [3859] => 1999
    [3861] => survey
    [3863] => data
    [3864] => mining
    [3866] => knowledge
    [3867] => discovery
    [3868] => software
    [3869] => tools
    [3871] => sigkdd
    [3872] => explorations
    [3873] => 45
    [3876] => edit
    [3877] => methods
    [3878] => agent
    [3879] => mining
    [3880] => anomaly
    [3881] => outlier
    [3882] => change
    [3883] => detection
    [3884] => association
    [3885] => rule
    [3886] => learning
    [3887] => bayesian
    [3888] => networks
    [3889] => classification
    [3890] => cluster
    [3891] => analysis
    [3892] => decision
    [3893] => trees
    [3894] => ensemble
    [3895] => learning
    [3896] => factor
    [3897] => analysis
    [3898] => genetic
    [3899] => algorithms
    [3900] => intention
    [3901] => mining
    [3902] => learning
    [3903] => classifier
    [3904] => system
    [3905] => multilinear
    [3906] => subspace
    [3907] => learning
    [3908] => neural
    [3909] => networks
    [3910] => regression
    [3911] => analysis
    [3912] => sequence
    [3913] => mining
    [3914] => structured
    [3915] => data
    [3916] => analysis
    [3917] => support
    [3918] => vector
    [3919] => machines
    [3920] => text
    [3921] => mining
    [3922] => time
    [3923] => series
    [3924] => analysis
    [3925] => application
    [3926] => domains
    [3927] => analytics
    [3928] => behavior
    [3929] => informatics
    [3930] => big
    [3931] => data
    [3932] => bioinformatics
    [3933] => business
    [3934] => intelligence
    [3935] => data
    [3936] => analysis
    [3937] => data
    [3938] => warehouse
    [3939] => decision
    [3940] => support
    [3941] => system
    [3942] => domain
    [3943] => driven
    [3944] => data
    [3945] => mining
    [3946] => drug
    [3947] => discovery
    [3948] => exploratory
    [3949] => data
    [3950] => analysis
    [3951] => predictive
    [3952] => analytics
    [3953] => web
    [3954] => mining
    [3955] => application
    [3956] => examples
    [3957] => main
    [3958] => article
    [3959] => examples
    [3961] => data
    [3962] => mining
    [3965] => category
    [3966] => applied
    [3967] => data
    [3968] => mining
    [3969] => automatic
    [3970] => number
    [3971] => plate
    [3972] => recognition
    [3975] => united
    [3976] => kingdom
    [3977] => customer
    [3978] => analytics
    [3979] => educational
    [3980] => data
    [3981] => mining
    [3982] => national
    [3983] => security
    [3984] => agency
    [3985] => quantitative
    [3986] => structure
    [3987] => activity
    [3988] => relationship
    [3989] => surveillance
    [3990] => mass
    [3991] => surveillance
    [3992] => e
    [3993] => g
    [3994] => stellar
    [3995] => wind
    [3996] => related
    [3997] => topics
    [3998] => data
    [3999] => mining
    [4002] => analyzing
    [4003] => data
    [4005] => information
    [4007] => extracting
    [4008] => information
    [4011] => data
    [4013] => data
    [4014] => integration
    [4015] => data
    [4016] => transformation
    [4017] => electronic
    [4018] => discovery
    [4019] => information
    [4020] => extraction
    [4021] => information
    [4022] => integration
    [4023] => named-entity
    [4024] => recognition
    [4025] => profiling
    [4026] => information
    [4027] => science
    [4028] => psychometrics
    [4029] => social
    [4030] => media
    [4031] => mining
    [4032] => surveillance
    [4033] => capitalism
    [4034] => web
    [4035] => scraping
    [4037] => resources
    [4038] => international
    [4039] => journal
    [4041] => data
    [4042] => warehousing
    [4044] => mining
    [4045] => references
    [4046] => edit
    [4048] => b
    [4049] => c
    [4050] => d
    [4051] => e
    [4052] => data
    [4053] => mining
    [4054] => curriculum
    [4055] => acm
    [4056] => sigkdd
    [4057] => 2006-04-30
    [4058] => retrieved
    [4059] => 2014-01-27
    [4060] => han
    [4061] => kamber
    [4062] => pei
    [4063] => jaiwei
    [4064] => micheline
    [4065] => jian
    [4066] => june
    [4067] => 9
    [4068] => 2011
    [4069] => data
    [4070] => mining
    [4071] => concepts
    [4073] => techniques
    [4074] => 3rd
    [4075] => ed
    [4076] => morgan
    [4077] => kaufmann
    [4078] => isbn
    [4079] => 978-0-12-381479-1
    [4080] => cs1
    [4081] => maint
    [4082] => multiple
    [4083] => names
    [4084] => authors
    [4085] => list
    [4086] => link
    [4087] => clifton
    [4088] => christopher
    [4089] => 2010
    [4090] => encyclop
    [4091] => dia
    [4092] => britannica
    [4093] => definition
    [4095] => data
    [4096] => mining
    [4097] => retrieved
    [4098] => 2010-12-09
    [4099] => hastie
    [4100] => trevor
    [4101] => tibshirani
    [4102] => robert
    [4103] => friedman
    [4104] => jerome
    [4105] => 2009
    [4107] => elements
    [4109] => statistical
    [4110] => learning
    [4111] => data
    [4112] => mining
    [4113] => inference
    [4115] => prediction
    [4116] => retrieved
    [4117] => 2012-08-07
    [4119] => b
    [4120] => c
    [4121] => fayyad
    [4122] => usama
    [4123] => piatetsky-shapiro
    [4124] => gregory
    [4125] => smyth
    [4126] => padhraic
    [4127] => 1996
    [4129] => data
    [4130] => mining
    [4132] => knowledge
    [4133] => discovery
    [4135] => databases
    [4136] => pdf
    [4137] => retrieved
    [4138] => 17
    [4139] => december
    [4140] => 2008
    [4141] => han
    [4142] => jiawei
    [4143] => kamber
    [4144] => micheline
    [4145] => 2001
    [4146] => data
    [4147] => mining
    [4148] => concepts
    [4150] => techniques
    [4151] => morgan
    [4152] => kaufmann
    [4153] => p
    [4154] => 5
    [4155] => isbn
    [4156] => 978-1-55860-489-6
    [4158] => data
    [4159] => mining
    [4164] => appropriately
    [4165] => named
    [4166] => knowledge
    [4167] => mining
    [4169] => data
    [4174] => long
    [4176] => e
    [4177] => g
    [4178] => okairp
    [4179] => 2005
    [4180] => fall
    [4181] => conference
    [4182] => arizona
    [4183] => state
    [4184] => university
    [4187] => datamining
    [4188] => witten
    [4189] => ian
    [4190] => h
    [4191] => frank
    [4192] => eibe
    [4193] => hall
    [4194] => mark
    [4196] => 30
    [4197] => january
    [4198] => 2011
    [4199] => data
    [4200] => mining
    [4201] => practical
    [4202] => machine
    [4203] => learning
    [4204] => tools
    [4206] => techniques
    [4207] => 3
    [4208] => ed
    [4209] => elsevier
    [4210] => isbn
    [4211] => 978-0-12-374856-0
    [4212] => bouckaert
    [4213] => remco
    [4214] => r
    [4215] => frank
    [4216] => eibe
    [4217] => hall
    [4218] => mark
    [4220] => holmes
    [4221] => geoffrey
    [4222] => pfahringer
    [4223] => bernhard
    [4224] => reutemann
    [4225] => peter
    [4226] => witten
    [4227] => ian
    [4228] => h
    [4229] => 2010
    [4230] => weka
    [4231] => experiences
    [4234] => java
    [4235] => open-source
    [4236] => project
    [4237] => journal
    [4239] => machine
    [4240] => learning
    [4241] => research
    [4242] => 11
    [4243] => 2533
    [4244] => 2541
    [4246] => original
    [4247] => title
    [4248] => practical
    [4249] => machine
    [4250] => learning
    [4252] => changed
    [4254] => term
    [4255] => data
    [4256] => mining
    [4258] => added
    [4259] => primarily
    [4261] => marketing
    [4262] => reasons
    [4263] => mena
    [4264] => jes
    [4265] => s
    [4266] => 2011
    [4267] => machine
    [4268] => learning
    [4269] => forensics
    [4271] => law
    [4272] => enforcement
    [4273] => security
    [4275] => intelligence
    [4276] => boca
    [4277] => raton
    [4278] => fl
    [4279] => crc
    [4280] => press
    [4281] => taylor
    [4282] => francis
    [4283] => group
    [4284] => isbn
    [4285] => 978-1-4398-6069-4
    [4286] => piatetsky-shapiro
    [4287] => gregory
    [4288] => parker
    [4289] => gary
    [4290] => 2011
    [4291] => lesson
    [4292] => data
    [4293] => mining
    [4295] => knowledge
    [4296] => discovery
    [4298] => introduction
    [4299] => introduction
    [4301] => data
    [4302] => mining
    [4303] => kd
    [4304] => nuggets
    [4305] => retrieved
    [4306] => 30
    [4307] => august
    [4308] => 2012
    [4309] => fayyad
    [4310] => usama
    [4311] => 15
    [4312] => june
    [4313] => 1999
    [4315] => editorial
    [4317] => editor-in-chief
    [4318] => sigkdd
    [4319] => explorations
    [4320] => 13
    [4321] => 1
    [4322] => 102
    [4323] => doi
    [4324] => 10
    [4325] => 1145
    [4326] => 2207243
    [4327] => 2207269
    [4328] => retrieved
    [4329] => 27
    [4330] => december
    [4331] => 2010
    [4332] => kantardzic
    [4333] => mehmed
    [4334] => 2003
    [4335] => data
    [4336] => mining
    [4337] => concepts
    [4338] => models
    [4339] => methods
    [4341] => algorithms
    [4342] => john
    [4343] => wiley
    [4344] => sons
    [4345] => isbn
    [4346] => 0-471-22852-4
    [4347] => oclc
    [4348] => 50055336
    [4349] => gregory
    [4350] => piatetsky-shapiro
    [4351] => 2002
    [4352] => kdnuggets
    [4353] => methodology
    [4354] => poll
    [4355] => gregory
    [4356] => piatetsky-shapiro
    [4357] => 2004
    [4358] => kdnuggets
    [4359] => methodology
    [4360] => poll
    [4361] => gregory
    [4362] => piatetsky-shapiro
    [4363] => 2007
    [4364] => kdnuggets
    [4365] => methodology
    [4366] => poll
    [4367] => gregory
    [4368] => piatetsky-shapiro
    [4369] => 2014
    [4370] => kdnuggets
    [4371] => methodology
    [4372] => poll
    [4373] => scar
    [4374] => marb
    [4375] => n
    [4376] => gonzalo
    [4377] => mariscal
    [4379] => javier
    [4380] => segovia
    [4381] => 2009
    [4383] => data
    [4384] => mining
    [4385] => knowledge
    [4386] => discovery
    [4387] => process
    [4388] => model
    [4390] => data
    [4391] => mining
    [4393] => knowledge
    [4394] => discovery
    [4396] => real
    [4397] => life
    [4398] => applications
    [4399] => book
    [4400] => edited
    [4402] => julio
    [4403] => ponce
    [4405] => adem
    [4406] => karahoca
    [4407] => isbn
    [4408] => 978-3-902613-53-0
    [4409] => pp
    [4410] => 438
    [4411] => 453
    [4412] => february
    [4413] => 2009
    [4414] => i-tech
    [4415] => vienna
    [4416] => austria
    [4417] => lukasz
    [4418] => kurgan
    [4420] => petr
    [4421] => musilek
    [4422] => 2006
    [4424] => survey
    [4426] => knowledge
    [4427] => discovery
    [4429] => data
    [4430] => mining
    [4431] => process
    [4432] => models
    [4434] => knowledge
    [4435] => engineering
    [4436] => review
    [4437] => volume
    [4438] => 21
    [4439] => issue
    [4440] => 1
    [4441] => march
    [4442] => 2006
    [4443] => pp
    [4444] => 1
    [4445] => 24
    [4446] => cambridge
    [4447] => university
    [4448] => press
    [4450] => york
    [4451] => ny
    [4452] => usa
    [4453] => doi
    [4454] => 10
    [4455] => 1017
    [4456] => s0269888906000737
    [4457] => azevedo
    [4460] => santos
    [4461] => m
    [4462] => f
    [4463] => kdd
    [4464] => semma
    [4466] => crisp-dm
    [4468] => parallel
    [4469] => overview
    [4470] => archived
    [4471] => 2013-01-09
    [4474] => wayback
    [4475] => machine
    [4477] => proceedings
    [4480] => iadis
    [4481] => european
    [4482] => conference
    [4484] => data
    [4485] => mining
    [4486] => 2008
    [4487] => pp
    [4488] => 182
    [4489] => 185
    [4490] => hawkins
    [4491] => douglas
    [4492] => m
    [4493] => 2004
    [4495] => problem
    [4497] => overfitting
    [4498] => journal
    [4500] => chemical
    [4501] => information
    [4503] => computer
    [4504] => sciences
    [4505] => 44
    [4506] => 1
    [4507] => 1
    [4508] => 12
    [4509] => doi
    [4510] => 10
    [4511] => 1021
    [4512] => ci0342472
    [4513] => microsoft
    [4514] => academic
    [4515] => search
    [4516] => top
    [4517] => conferences
    [4519] => data
    [4520] => mining
    [4521] => microsoft
    [4522] => academic
    [4523] => search
    [4524] => google
    [4525] => scholar
    [4526] => top
    [4527] => publications
    [4529] => data
    [4530] => mining
    [4531] => analysis
    [4532] => google
    [4533] => scholar
    [4534] => proceedings
    [4535] => international
    [4536] => conferences
    [4538] => knowledge
    [4539] => discovery
    [4541] => data
    [4542] => mining
    [4543] => acm
    [4545] => york
    [4546] => sigkdd
    [4547] => explorations
    [4548] => acm
    [4550] => york
    [4551] => g
    [4552] => nnemann
    [4553] => stephan
    [4554] => kremer
    [4555] => hardy
    [4556] => seidl
    [4557] => thomas
    [4558] => 2011
    [4560] => extension
    [4563] => pmml
    [4564] => standard
    [4566] => subspace
    [4567] => clustering
    [4568] => models
    [4569] => proceedings
    [4572] => 2011
    [4573] => workshop
    [4575] => predictive
    [4576] => markup
    [4577] => language
    [4578] => modeling
    [4580] => pmml
    [4581] => '11
    [4582] => p
    [4583] => 48
    [4584] => doi
    [4585] => 10
    [4586] => 1145
    [4587] => 2023598
    [4588] => 2023605
    [4589] => isbn
    [4590] => 978-1-4503-0837-3
    [4591] => seltzer
    [4592] => william
    [4594] => promise
    [4596] => pitfalls
    [4598] => data
    [4599] => mining
    [4600] => ethical
    [4601] => issues
    [4602] => pdf
    [4603] => pitts
    [4604] => chip
    [4605] => 15
    [4606] => march
    [4607] => 2007
    [4609] => end
    [4611] => illegal
    [4612] => domestic
    [4613] => spying
    [4615] => count
    [4618] => washington
    [4619] => spectator
    [4620] => archived
    [4623] => original
    [4625] => 2007-10-29
    [4626] => taipale
    [4627] => kim
    [4629] => 15
    [4630] => december
    [4631] => 2003
    [4632] => data
    [4633] => mining
    [4635] => domestic
    [4636] => security
    [4637] => connecting
    [4639] => dots
    [4641] => make
    [4642] => sense
    [4644] => data
    [4645] => columbia
    [4646] => science
    [4648] => technology
    [4649] => law
    [4650] => review
    [4651] => 5
    [4652] => 2
    [4653] => oclc
    [4654] => 45263753
    [4655] => ssrn
    [4656] => 546782
    [4657] => resig
    [4658] => john
    [4659] => teredesai
    [4660] => ankur
    [4661] => 2004
    [4663] => framework
    [4665] => mining
    [4666] => instant
    [4667] => messaging
    [4668] => services
    [4669] => proceedings
    [4672] => 2004
    [4673] => siam
    [4674] => dm
    [4675] => conference
    [4677] => b
    [4678] => c
    [4682] => dig
    [4683] => privacy
    [4684] => implications
    [4686] => data
    [4687] => mining
    [4688] => aggregation
    [4689] => archived
    [4690] => 2008-12-17
    [4693] => wayback
    [4694] => machine
    [4695] => nascio
    [4696] => research
    [4698] => september
    [4699] => 2004
    [4700] => ohm
    [4701] => paul
    [4703] => build
    [4705] => database
    [4707] => ruin
    [4708] => harvard
    [4709] => business
    [4710] => review
    [4711] => darwin
    [4712] => bond-graham
    [4713] => iron
    [4714] => cagebook
    [4717] => logical
    [4718] => end
    [4720] => facebook's
    [4721] => patents
    [4722] => counterpunch
    [4723] => org
    [4724] => 2013
    [4725] => 12
    [4726] => 03
    [4727] => darwin
    [4728] => bond-graham
    [4729] => inside
    [4731] => tech
    [4732] => industry's
    [4733] => startup
    [4734] => conference
    [4735] => counterpunch
    [4736] => org
    [4737] => 2013
    [4738] => 09
    [4739] => 11
    [4740] => aol
    [4741] => search
    [4742] => data
    [4743] => identified
    [4744] => individuals
    [4745] => securityfocus
    [4746] => august
    [4747] => 2006
    [4748] => kshetri
    [4749] => nir
    [4750] => 2014
    [4751] => big
    [4752] => data
    [4753] => s
    [4754] => impact
    [4756] => privacy
    [4757] => security
    [4759] => consumer
    [4760] => welfare
    [4761] => telecommunications
    [4762] => policy
    [4763] => 38
    [4764] => 11
    [4765] => 1134
    [4766] => 1145
    [4767] => doi
    [4768] => 10
    [4769] => 1016
    [4770] => j
    [4771] => telpol
    [4772] => 2014
    [4773] => 10
    [4774] => 002
    [4775] => biotech
    [4776] => business
    [4777] => week
    [4778] => editors
    [4779] => june
    [4780] => 30
    [4781] => 2008
    [4782] => biomedicine
    [4783] => hipaa
    [4784] => privacy
    [4785] => rule
    [4786] => impedes
    [4787] => biomedical
    [4788] => research
    [4789] => biotech
    [4790] => business
    [4791] => week
    [4792] => retrieved
    [4793] => 17
    [4794] => november
    [4795] => 2009
    [4797] => lexisnexis
    [4798] => academic
    [4799] => uk
    [4800] => researchers
    [4802] => data
    [4803] => mining
    [4807] => uk
    [4808] => copyright
    [4809] => laws
    [4810] => archived
    [4811] => june
    [4812] => 9
    [4813] => 2014
    [4816] => wayback
    [4817] => machine
    [4818] => out-law
    [4820] => retrieved
    [4821] => 14
    [4822] => november
    [4823] => 2014
    [4824] => licences
    [4826] => europe
    [4828] => structured
    [4829] => stakeholder
    [4830] => dialogue
    [4831] => 2013
    [4832] => european
    [4833] => commission
    [4834] => retrieved
    [4835] => 14
    [4836] => november
    [4837] => 2014
    [4838] => text
    [4840] => data
    [4841] => mining
    [4843] => importance
    [4848] => change
    [4850] => europe
    [4851] => association
    [4853] => european
    [4854] => research
    [4855] => libraries
    [4856] => retrieved
    [4857] => 14
    [4858] => november
    [4859] => 2014
    [4860] => judge
    [4861] => grants
    [4862] => summary
    [4863] => judgment
    [4865] => favor
    [4867] => google
    [4868] => books
    [4870] => fair
    [4872] => victory
    [4873] => lexology
    [4875] => antonelli
    [4876] => law
    [4878] => retrieved
    [4879] => 14
    [4880] => november
    [4881] => 2014
    [4882] => karl
    [4883] => rexer
    [4884] => heather
    [4885] => allen
    [4886] => paul
    [4887] => gearan
    [4888] => 2011
    [4889] => understanding
    [4890] => data
    [4891] => miners
    [4892] => analytics
    [4893] => magazine
    [4895] => june
    [4896] => 2011
    [4897] => informs
    [4898] => institute
    [4900] => operations
    [4901] => research
    [4904] => management
    [4905] => sciences
    [4906] => mikut
    [4907] => ralf
    [4908] => reischl
    [4909] => markus
    [4910] => september
    [4911] => october
    [4912] => 2011
    [4913] => data
    [4914] => mining
    [4915] => tools
    [4916] => wiley
    [4917] => interdisciplinary
    [4918] => reviews
    [4919] => data
    [4920] => mining
    [4922] => knowledge
    [4923] => discovery
    [4924] => 1
    [4925] => 5
    [4926] => 431
    [4927] => 445
    [4928] => doi
    [4929] => 10
    [4930] => 1002
    [4931] => widm
    [4932] => 24
    [4933] => retrieved
    [4934] => october
    [4935] => 21
    [4936] => 2011
    [4937] => kobielus
    [4938] => james
    [4940] => forrester
    [4941] => wave
    [4942] => predictive
    [4943] => analytics
    [4945] => data
    [4946] => mining
    [4947] => solutions
    [4948] => q1
    [4949] => 2010
    [4950] => forrester
    [4951] => research
    [4952] => 1
    [4953] => july
    [4954] => 2008
    [4955] => herschel
    [4956] => gareth
    [4957] => magic
    [4958] => quadrant
    [4960] => customer
    [4961] => data-mining
    [4962] => applications
    [4963] => gartner
    [4965] => 1
    [4966] => july
    [4967] => 2008
    [4968] => nisbet
    [4969] => robert
    [4971] => 2006
    [4972] => data
    [4973] => mining
    [4974] => tools
    [4980] => crm
    [4981] => part
    [4982] => 1
    [4983] => information
    [4984] => management
    [4985] => special
    [4986] => reports
    [4987] => january
    [4988] => 2006
    [4989] => haughton
    [4990] => dominique
    [4991] => deichmann
    [4992] => joel
    [4993] => eshghi
    [4994] => abdolreza
    [4995] => sayek
    [4996] => selin
    [4997] => teebagy
    [4998] => nicholas
    [5000] => topi
    [5001] => heikki
    [5002] => 2003
    [5004] => review
    [5006] => software
    [5007] => packages
    [5009] => data
    [5010] => mining
    [5012] => american
    [5013] => statistician
    [5014] => vol
    [5015] => 57
    [5017] => 4
    [5018] => pp
    [5019] => 290
    [5020] => 309
    [5021] => goebel
    [5022] => michael
    [5023] => gruenwald
    [5024] => le
    [5025] => 1999
    [5027] => survey
    [5029] => data
    [5030] => mining
    [5032] => knowledge
    [5033] => discovery
    [5034] => software
    [5035] => tools
    [5036] => sigkdd
    [5037] => explorations
    [5038] => vol
    [5039] => 1
    [5040] => issue
    [5041] => 1
    [5042] => pp
    [5043] => 20
    [5044] => 33
    [5046] => reading
    [5047] => edit
    [5048] => cabena
    [5049] => peter
    [5050] => hadjnian
    [5051] => pablo
    [5052] => stadler
    [5053] => rolf
    [5054] => verhees
    [5055] => jaap
    [5056] => zanasi
    [5057] => alessandro
    [5058] => 1997
    [5059] => discovering
    [5060] => data
    [5061] => mining
    [5063] => concept
    [5065] => implementation
    [5066] => prentice
    [5067] => hall
    [5068] => isbn
    [5069] => 0-13-743980-6
    [5070] => m
    [5071] => s
    [5072] => chen
    [5073] => j
    [5074] => han
    [5075] => p
    [5076] => s
    [5077] => yu
    [5078] => 1996
    [5079] => data
    [5080] => mining
    [5082] => overview
    [5085] => database
    [5086] => perspective
    [5087] => knowledge
    [5089] => data
    [5090] => engineering
    [5091] => ieee
    [5092] => transactions
    [5094] => 8
    [5095] => 6
    [5096] => 866
    [5097] => 883
    [5098] => feldman
    [5099] => ronen
    [5100] => sanger
    [5101] => james
    [5102] => 2007
    [5104] => text
    [5105] => mining
    [5106] => handbook
    [5107] => cambridge
    [5108] => university
    [5109] => press
    [5110] => isbn
    [5111] => 978-0-521-83657-9
    [5112] => guo
    [5113] => yike
    [5115] => grossman
    [5116] => robert
    [5117] => editors
    [5118] => 1999
    [5119] => high
    [5120] => performance
    [5121] => data
    [5122] => mining
    [5123] => scaling
    [5124] => algorithms
    [5125] => applications
    [5127] => systems
    [5128] => kluwer
    [5129] => academic
    [5130] => publishers
    [5131] => han
    [5132] => jiawei
    [5133] => micheline
    [5134] => kamber
    [5136] => jian
    [5137] => pei
    [5138] => data
    [5139] => mining
    [5140] => concepts
    [5142] => techniques
    [5143] => morgan
    [5144] => kaufmann
    [5145] => 2006
    [5146] => hastie
    [5147] => trevor
    [5148] => tibshirani
    [5149] => robert
    [5151] => friedman
    [5152] => jerome
    [5153] => 2001
    [5155] => elements
    [5157] => statistical
    [5158] => learning
    [5159] => data
    [5160] => mining
    [5161] => inference
    [5163] => prediction
    [5164] => springer
    [5165] => isbn
    [5166] => 0-387-95284-5
    [5167] => liu
    [5168] => bing
    [5169] => 2007
    [5170] => web
    [5171] => data
    [5172] => mining
    [5173] => exploring
    [5174] => hyperlinks
    [5175] => contents
    [5177] => usage
    [5178] => data
    [5179] => springer
    [5180] => isbn
    [5181] => 3-540-37881-2
    [5182] => murphy
    [5183] => chris
    [5184] => 16
    [5186] => 2011
    [5188] => data
    [5189] => mining
    [5190] => free
    [5191] => speech
    [5192] => informationweek
    [5193] => umb
    [5194] => 12
    [5195] => nisbet
    [5196] => robert
    [5197] => elder
    [5198] => john
    [5199] => miner
    [5200] => gary
    [5201] => 2009
    [5202] => handbook
    [5204] => statistical
    [5205] => analysis
    [5206] => data
    [5207] => mining
    [5208] => applications
    [5209] => academic
    [5210] => press
    [5211] => elsevier
    [5212] => isbn
    [5213] => 978-0-12-374765-5
    [5214] => poncelet
    [5215] => pascal
    [5216] => masseglia
    [5217] => florent
    [5219] => teisseire
    [5220] => maguelonne
    [5221] => editors
    [5222] => october
    [5223] => 2007
    [5224] => data
    [5225] => mining
    [5226] => patterns
    [5228] => methods
    [5230] => applications
    [5231] => information
    [5232] => science
    [5233] => reference
    [5234] => isbn
    [5235] => 978-1-59904-162-9
    [5236] => tan
    [5237] => pang-ning
    [5238] => steinbach
    [5239] => michael
    [5241] => kumar
    [5242] => vipin
    [5243] => 2005
    [5244] => introduction
    [5246] => data
    [5247] => mining
    [5248] => isbn
    [5249] => 0-321-32136-7
    [5250] => theodoridis
    [5251] => sergios
    [5253] => koutroumbas
    [5254] => konstantinos
    [5255] => 2009
    [5256] => pattern
    [5257] => recognition
    [5258] => 4th
    [5259] => edition
    [5260] => academic
    [5261] => press
    [5262] => isbn
    [5263] => 978-1-59749-272-0
    [5264] => weiss
    [5265] => sholom
    [5266] => m
    [5268] => indurkhya
    [5269] => nitin
    [5270] => 1998
    [5271] => predictive
    [5272] => data
    [5273] => mining
    [5274] => morgan
    [5275] => kaufmann
    [5276] => witten
    [5277] => ian
    [5278] => h
    [5279] => frank
    [5280] => eibe
    [5281] => hall
    [5282] => mark
    [5284] => 30
    [5285] => january
    [5286] => 2011
    [5287] => data
    [5288] => mining
    [5289] => practical
    [5290] => machine
    [5291] => learning
    [5292] => tools
    [5294] => techniques
    [5295] => 3
    [5296] => ed
    [5297] => elsevier
    [5298] => isbn
    [5299] => 978-0-12-374856-0
    [5302] => free
    [5303] => weka
    [5304] => software
    [5305] => ye
    [5306] => nong
    [5307] => 2003
    [5309] => handbook
    [5311] => data
    [5312] => mining
    [5313] => mahwah
    [5314] => nj
    [5315] => lawrence
    [5316] => erlbaum
    [5317] => external
    [5318] => links
    [5319] => edit
    [5320] => wikimedia
    [5321] => commons
    [5323] => media
    [5324] => related
    [5326] => data
    [5327] => mining
    [5328] => knowledge
    [5329] => discovery
    [5330] => software
    [5332] => curlie
    [5333] => based
    [5335] => dmoz
    [5336] => data
    [5337] => mining
    [5338] => tool
    [5339] => vendors
    [5341] => curlie
    [5342] => based
    [5344] => dmoz
    [5345] => v
    [5346] => t
    [5347] => e
    [5348] => data
    [5349] => analysis
    [5350] => cleansing
    [5351] => compression
    [5352] => corruption
    [5353] => curation
    [5354] => editing
    [5355] => farming
    [5356] => fusion
    [5357] => integration
    [5358] => integrity
    [5359] => loss
    [5360] => mining
    [5361] => pre-processing
    [5362] => quality
    [5363] => reduction
    [5364] => scraping
    [5365] => scrubbing
    [5366] => security
    [5367] => storage
    [5368] => validation
    [5369] => warehouse
    [5370] => wrangling
    [5371] => munging
    [5372] => protection
    [5373] => privacy
    [5374] => v
    [5375] => t
    [5376] => e
    [5377] => data
    [5378] => warehouse
    [5379] => creating
    [5381] => data
    [5382] => warehouse
    [5383] => concepts
    [5384] => database
    [5385] => dimension
    [5386] => dimensional
    [5387] => modeling
    [5388] => fact
    [5389] => olap
    [5390] => star
    [5391] => schema
    [5392] => aggregate
    [5393] => variants
    [5394] => anchor
    [5395] => modeling
    [5396] => column-oriented
    [5397] => dbms
    [5398] => data
    [5399] => vault
    [5400] => modeling
    [5401] => holap
    [5402] => molap
    [5403] => rolap
    [5404] => operational
    [5405] => data
    [5406] => store
    [5407] => elements
    [5408] => data
    [5409] => dictionary
    [5410] => metadata
    [5411] => data
    [5412] => mart
    [5413] => sixth
    [5414] => normal
    [5415] => form
    [5416] => surrogate
    [5417] => key
    [5418] => fact
    [5419] => fact
    [5420] => table
    [5421] => early-arriving
    [5422] => fact
    [5423] => measure
    [5424] => dimension
    [5425] => dimension
    [5426] => table
    [5427] => degenerate
    [5428] => slowly
    [5429] => changing
    [5430] => filling
    [5431] => extract-transform-load
    [5432] => etl
    [5433] => extract
    [5434] => transform
    [5435] => load
    [5438] => data
    [5439] => warehouse
    [5440] => concepts
    [5441] => business
    [5442] => intelligence
    [5443] => dashboard
    [5444] => data
    [5445] => mining
    [5446] => decision
    [5447] => support
    [5448] => system
    [5449] => dss
    [5450] => olap
    [5451] => cube
    [5452] => data
    [5453] => warehouse
    [5454] => automation
    [5455] => languages
    [5456] => data
    [5457] => mining
    [5458] => extensions
    [5459] => dmx
    [5460] => multidimensional
    [5461] => expressions
    [5462] => mdx
    [5463] => xml
    [5465] => analysis
    [5466] => xmla
    [5467] => tools
    [5468] => business
    [5469] => intelligence
    [5470] => software
    [5471] => reporting
    [5472] => software
    [5473] => spreadsheet
    [5474] => related
    [5475] => people
    [5476] => bill
    [5477] => inmon
    [5478] => ralph
    [5479] => kimball
    [5480] => products
    [5481] => comparison
    [5483] => olap
    [5484] => servers
    [5485] => data
    [5486] => warehousing
    [5487] => products
    [5490] => producers
    [5491] => v
    [5492] => t
    [5493] => e
    [5494] => major
    [5495] => fields
    [5497] => computer
    [5498] => science
    [5499] => note
    [5501] => template
    [5502] => roughly
    [5505] => 2012
    [5506] => acm
    [5507] => computing
    [5508] => classification
    [5509] => system
    [5510] => hardware
    [5511] => printed
    [5512] => circuit
    [5513] => board
    [5514] => peripheral
    [5515] => integrated
    [5516] => circuit
    [5517] => very-large-scale
    [5518] => integration
    [5519] => energy
    [5520] => consumption
    [5521] => electronic
    [5522] => design
    [5523] => automation
    [5524] => computer
    [5525] => systems
    [5526] => organization
    [5527] => computer
    [5528] => architecture
    [5529] => embedded
    [5530] => system
    [5531] => real-time
    [5532] => computing
    [5533] => dependability
    [5534] => networks
    [5535] => network
    [5536] => architecture
    [5537] => network
    [5538] => protocol
    [5539] => network
    [5540] => components
    [5541] => network
    [5542] => scheduler
    [5543] => network
    [5544] => performance
    [5545] => evaluation
    [5546] => network
    [5547] => service
    [5548] => software
    [5549] => organization
    [5550] => interpreter
    [5551] => middleware
    [5552] => virtual
    [5553] => machine
    [5554] => operating
    [5555] => system
    [5556] => software
    [5557] => quality
    [5558] => software
    [5559] => notations
    [5561] => tools
    [5562] => programming
    [5563] => paradigm
    [5564] => programming
    [5565] => language
    [5566] => compiler
    [5567] => domain-specific
    [5568] => language
    [5569] => modeling
    [5570] => language
    [5571] => software
    [5572] => framework
    [5573] => integrated
    [5574] => development
    [5575] => environment
    [5576] => software
    [5577] => configuration
    [5578] => management
    [5579] => software
    [5580] => library
    [5581] => software
    [5582] => repository
    [5583] => software
    [5584] => development
    [5585] => software
    [5586] => development
    [5587] => process
    [5588] => requirements
    [5589] => analysis
    [5590] => software
    [5591] => design
    [5592] => software
    [5593] => construction
    [5594] => software
    [5595] => deployment
    [5596] => software
    [5597] => maintenance
    [5598] => programming
    [5599] => team
    [5600] => open-source
    [5601] => model
    [5602] => theory
    [5604] => computation
    [5605] => model
    [5607] => computation
    [5608] => formal
    [5609] => language
    [5610] => automata
    [5611] => theory
    [5612] => computational
    [5613] => complexity
    [5614] => theory
    [5615] => logic
    [5616] => semantics
    [5617] => algorithms
    [5618] => algorithm
    [5619] => design
    [5620] => analysis
    [5622] => algorithms
    [5623] => randomized
    [5624] => algorithm
    [5625] => computational
    [5626] => geometry
    [5627] => mathematics
    [5629] => computing
    [5630] => discrete
    [5631] => mathematics
    [5632] => probability
    [5633] => statistics
    [5634] => mathematical
    [5635] => software
    [5636] => information
    [5637] => theory
    [5638] => mathematical
    [5639] => analysis
    [5640] => numerical
    [5641] => analysis
    [5642] => information
    [5643] => systems
    [5644] => database
    [5645] => management
    [5646] => system
    [5647] => information
    [5648] => storage
    [5649] => systems
    [5650] => enterprise
    [5651] => information
    [5652] => system
    [5653] => social
    [5654] => information
    [5655] => systems
    [5656] => geographic
    [5657] => information
    [5658] => system
    [5659] => decision
    [5660] => support
    [5661] => system
    [5662] => process
    [5663] => control
    [5664] => system
    [5665] => multimedia
    [5666] => information
    [5667] => system
    [5668] => data
    [5669] => mining
    [5670] => digital
    [5671] => library
    [5672] => computing
    [5673] => platform
    [5674] => digital
    [5675] => marketing
    [5676] => world
    [5677] => wide
    [5678] => web
    [5679] => information
    [5680] => retrieval
    [5681] => security
    [5682] => cryptography
    [5683] => formal
    [5684] => methods
    [5685] => security
    [5686] => services
    [5687] => intrusion
    [5688] => detection
    [5689] => system
    [5690] => hardware
    [5691] => security
    [5692] => network
    [5693] => security
    [5694] => information
    [5695] => security
    [5696] => application
    [5697] => security
    [5698] => human
    [5699] => computer
    [5700] => interaction
    [5701] => interaction
    [5702] => design
    [5703] => social
    [5704] => computing
    [5705] => ubiquitous
    [5706] => computing
    [5707] => visualization
    [5708] => accessibility
    [5709] => concurrency
    [5710] => concurrent
    [5711] => computing
    [5712] => parallel
    [5713] => computing
    [5714] => distributed
    [5715] => computing
    [5716] => multithreading
    [5717] => multiprocessing
    [5718] => artificial
    [5719] => intelligence
    [5720] => natural
    [5721] => language
    [5722] => processing
    [5723] => knowledge
    [5724] => representation
    [5726] => reasoning
    [5727] => computer
    [5728] => vision
    [5729] => automated
    [5730] => planning
    [5732] => scheduling
    [5733] => search
    [5734] => methodology
    [5735] => control
    [5736] => method
    [5737] => philosophy
    [5739] => artificial
    [5740] => intelligence
    [5741] => distributed
    [5742] => artificial
    [5743] => intelligence
    [5744] => machine
    [5745] => learning
    [5746] => supervised
    [5747] => learning
    [5748] => unsupervised
    [5749] => learning
    [5750] => reinforcement
    [5751] => learning
    [5752] => multi-task
    [5753] => learning
    [5754] => cross-validation
    [5755] => graphics
    [5756] => animation
    [5757] => rendering
    [5758] => image
    [5759] => manipulation
    [5760] => graphics
    [5761] => processing
    [5762] => unit
    [5763] => mixed
    [5764] => reality
    [5765] => virtual
    [5766] => reality
    [5767] => image
    [5768] => compression
    [5769] => solid
    [5770] => modeling
    [5771] => applied
    [5772] => computing
    [5773] => e-commerce
    [5774] => enterprise
    [5775] => software
    [5776] => computational
    [5777] => mathematics
    [5778] => computational
    [5779] => physics
    [5780] => computational
    [5781] => chemistry
    [5782] => computational
    [5783] => biology
    [5784] => computational
    [5785] => social
    [5786] => science
    [5787] => computational
    [5788] => engineering
    [5789] => computational
    [5790] => healthcare
    [5791] => digital
    [5792] => art
    [5793] => electronic
    [5794] => publishing
    [5795] => cyberwarfare
    [5796] => electronic
    [5797] => voting
    [5798] => video
    [5799] => game
    [5800] => word
    [5801] => processing
    [5802] => operations
    [5803] => research
    [5804] => educational
    [5805] => technology
    [5806] => document
    [5807] => management
    [5808] => book
    [5809] => category
    [5810] => portal
    [5811] => wikiproject
    [5812] => commons
    [5813] => authority
    [5814] => control
    [5815] => gnd
    [5816] => 4428654-5
    [5817] => ndl
    [5818] => 00948240
    [5819] => retrieved
    [5821] => https
    [5823] => wikipedia
    [5824] => org
    [5825] => w
    [5826] => index
    [5827] => php
    [5828] => title
    [5829] => data
    [5830] => mining
    [5831] => oldid
    [5832] => 826460924
    [5833] => categories
    [5834] => data
    [5835] => mining
    [5836] => formal
    [5837] => sciences
    [5838] => hidden
    [5839] => categories
    [5840] => cs1
    [5841] => maint
    [5842] => multiple
    [5843] => names
    [5844] => authors
    [5845] => list
    [5846] => webarchive
    [5847] => template
    [5848] => wayback
    [5849] => links
    [5850] => articles
    [5853] => expanded
    [5855] => september
    [5856] => 2011
    [5858] => articles
    [5860] => unsourced
    [5861] => statements
    [5862] => articles
    [5864] => unsourced
    [5865] => statements
    [5867] => april
    [5868] => 2014
    [5869] => pages
    [5871] => div
    [5872] => col
    [5874] => cols
    [5876] => colwidth
    [5877] => parameters
    [5878] => pages
    [5880] => columns-list
    [5882] => deprecated
    [5883] => parameters
    [5884] => articles
    [5886] => curlie
    [5887] => links
    [5888] => wikipedia
    [5889] => articles
    [5891] => gnd
    [5892] => identifiers
    [5893] => navigation
    [5894] => menu
    [5895] => personal
    [5896] => tools
    [5898] => logged
    [5900] => talk
    [5901] => contributions
    [5902] => create
    [5903] => account
    [5904] => log
    [5906] => namespaces
    [5907] => article
    [5908] => talk
    [5909] => variants
    [5910] => views
    [5911] => read
    [5912] => edit
    [5913] => view
    [5914] => history
    [5916] => search
    [5917] => navigation
    [5918] => main
    [5919] => page
    [5920] => contents
    [5921] => featured
    [5922] => content
    [5923] => current
    [5924] => events
    [5925] => random
    [5926] => article
    [5927] => donate
    [5929] => wikipedia
    [5930] => wikipedia
    [5931] => store
    [5932] => interaction
    [5935] => wikipedia
    [5936] => community
    [5937] => portal
    [5938] => recent
    [5940] => contact
    [5941] => page
    [5942] => tools
    [5944] => links
    [5946] => related
    [5948] => upload
    [5949] => file
    [5950] => special
    [5951] => pages
    [5952] => permanent
    [5953] => link
    [5954] => page
    [5955] => information
    [5956] => wikidata
    [5957] => item
    [5958] => cite
    [5960] => page
    [5961] => print
    [5962] => export
    [5963] => create
    [5965] => book
    [5966] => download
    [5968] => pdf
    [5969] => printable
    [5970] => version
    [5973] => projects
    [5974] => wikimedia
    [5975] => commons
    [5976] => languages
    [5977] => az
    [5978] => rbaycanca
    [5979] => catal
    [5980] => e
    [5981] => tina
    [5982] => dansk
    [5983] => deutsch
    [5984] => eesti
    [5985] => espa
    [5986] => ol
    [5987] => euskara
    [5988] => fran
    [5989] => ais
    [5990] => hrvatski
    [5991] => bahasa
    [5992] => indonesia
    [5993] => italiano
    [5994] => latvie
    [5995] => u
    [5996] => magyar
    [5997] => nederlands
    [5998] => norsk
    [5999] => polski
    [6000] => portugu
    [6001] => s
    [6002] => rom
    [6003] => n
    [6004] => scots
    [6005] => shqip
    [6006] => simple
    [6007] => english
    [6008] => sloven
    [6009] => ina
    [6010] => sloven
    [6011] => ina
    [6012] => srpski
    [6013] => srpskohrvatski
    [6014] => basa
    [6015] => sunda
    [6016] => suomi
    [6017] => svenska
    [6018] => t
    [6019] => rk
    [6020] => e
    [6021] => ti
    [6022] => ng
    [6023] => vi
    [6024] => t
    [6025] => edit
    [6026] => links
    [6028] => page
    [6031] => edited
    [6033] => 19
    [6034] => february
    [6035] => 2018
    [6037] => 06
    [6038] => 52
    [6039] => text
    [6044] => creative
    [6045] => commons
    [6046] => attribution-sharealike
    [6047] => license
    [6048] => additional
    [6049] => terms
    [6051] => apply
    [6055] => site
    [6057] => agree
    [6060] => terms
    [6064] => privacy
    [6065] => policy
    [6066] => wikipedia
    [6069] => registered
    [6070] => trademark
    [6073] => wikimedia
    [6074] => foundation
    [6077] => non-profit
    [6078] => organization
    [6079] => privacy
    [6080] => policy
    [6082] => wikipedia
    [6083] => disclaimers
    [6084] => contact
    [6085] => wikipedia
    [6086] => developers
    [6087] => cookie
    [6088] => statement
    [6089] => mobile
    [6090] => view
)
======================
Text: data mining - wikipedia data mining from wikipedia the free encyclopedia...
Total Keywords: 4218
======================

Demo2.php

<?php

// Demo 2: list every keyword the text miner extracted, as an array,
// followed by the miner's summary.
$miner = new TextMiner();

// Hand the miner the "Data mining" Wikipedia article URL as its input,
// then run the processing step before reading any results.
$miner->addFile("http://en.wikipedia.org/wiki/Data_mining");
$miner->process();

// printa() is a helper defined elsewhere; presumably it pretty-prints
// an array (print_r style) -- confirm against its definition.
printa($miner->getKeywords());

// Echo whatever printSummary() returns.
// NOTE(review): if printSummary() already prints the summary itself and
// returns nothing, this echo is redundant -- verify in TextMiner.
echo $miner->printSummary();

?>