{"id":809,"date":"2025-07-25T18:34:59","date_gmt":"2025-07-25T18:34:59","guid":{"rendered":"https:\/\/ccds.ai\/?p=809"},"modified":"2025-08-10T18:15:34","modified_gmt":"2025-08-10T18:15:34","slug":"cse417-data-mining-and-data-warehouse","status":"publish","type":"post","link":"https:\/\/ccds.ai\/?p=809","title":{"rendered":"CSE417: Data mining and Data warehouse"},"content":{"rendered":"\n<h2 class=\"wp-block-heading\">Course Description<\/h2>\n\n\n\n<p>We will learn theory, concepts, and applications on how to extract useful information from huge amounts of data.<\/p>\n\n\n\n<h3 class=\"wp-block-heading\">Course Information<\/h3>\n\n\n\n<p><a href=\"https:\/\/docs.google.com\/document\/d\/14s3vStvPZ-_fYjfPdnzL2dL6OPxdOWhE\/\" target=\"_blank\" rel=\"noopener\">Syllabus<\/a><\/p>\n\n\n\n<figure class=\"wp-block-table\"><table class=\"has-fixed-layout\"><thead><tr><th>Week<\/th><th>Session<\/th><th>Topics<\/th><th>Resources<\/th><th>Assignments<\/th><\/tr><\/thead><tbody><tr><td>Week-1<\/td><td>Session-1<\/td><td>Data Matrix, Attributes, Vector Recap, Basic Statistics, Distributions, PDF, CDF<\/td><td><a href=\"https:\/\/dataminingbook.info\/resources\/\" target=\"_blank\" rel=\"noopener\">https:\/\/dataminingbook.info\/resources\/<\/a><br>Book: DMML, Chapter 1 and Chapter 2<\/td><td>Assignment-1<\/td><\/tr><tr><td>Week-2<\/td><td>Session-2<\/td><td>Multivariate Gaussian, Covariance Matrix, Geometry of the multivariate normal, Diagonalization of Covariance Matrix<\/td><td><a href=\"https:\/\/dataminingbook.info\/resources\/\" target=\"_blank\" rel=\"noopener\">https:\/\/dataminingbook.info\/resources\/<\/a><br>Book: DMML, Chapter 1 and Chapter 2<\/td><td><\/td><\/tr><tr><td>Week-3<\/td><td>Session-3<\/td><td>Frequent Itemset Mining, The Market-Basket Model, Mining Association Rules, Finding Frequent Pairs, A-Priori Algorithm, FP Growth, *Eclat algorithm<\/td><td><a href=\"http:\/\/www.mmds.org\/#book\" target=\"_blank\" 
rel=\"noopener\">http:\/\/www.mmds.org\/#book<\/a><br>Book: MMDS, Chapter 6<\/td><td>Assignment-2<\/td><\/tr><tr><td>Week-4<\/td><td>Session-4<\/td><td>Mining Data Streams, General Stream Processing Model, Sampling from a Data Stream, *Queries over a (long) Sliding Window<\/td><td><a href=\"http:\/\/www.mmds.org\/#book\" target=\"_blank\" rel=\"noopener\">http:\/\/www.mmds.org\/#book<\/a><br>Book: MMDS, Chapter 4<\/td><td><\/td><\/tr><tr><td>Week-5<\/td><td>Session-5<\/td><td>Analysis of Large Graphs: Link Analysis, PageRank, Topic Specific Page rank, *Sim Rank<\/td><td><a href=\"http:\/\/www.mmds.org\/#book\" target=\"_blank\" rel=\"noopener\">http:\/\/www.mmds.org\/#book<\/a><br>Book: MMDS, Chapter 5<\/td><td>Assignment-3<\/td><\/tr><tr><td>Week-6<\/td><td>Session-6<\/td><td>Recommender Systems, Content-based Systems, Collaborative Filtering<\/td><td><a href=\"http:\/\/www.mmds.org\/#book\" target=\"_blank\" rel=\"noopener\">http:\/\/www.mmds.org\/#book<\/a><br>Book: MMDS, Chapter 9<\/td><td><\/td><\/tr><tr><td>Week-7<\/td><td>Session-7<\/td><td>Recommender Systems, Latent Factor Models, SVD<\/td><td><a href=\"http:\/\/www.mmds.org\/#book\" target=\"_blank\" rel=\"noopener\">http:\/\/www.mmds.org\/#book<\/a><br>Book: MMDS, Chapter 9, 11<\/td><td>Assignment-4<\/td><\/tr><tr><td>Week-8<\/td><td>Session-8<\/td><td>Application of SVD in recommender system, *SVD for dimension reduction<\/td><td><a href=\"http:\/\/www.mmds.org\/#book\" target=\"_blank\" rel=\"noopener\">http:\/\/www.mmds.org\/#book<\/a><br>Book: MMDS, Chapter 9, 11<\/td><td><\/td><\/tr><tr><td>Week-9<\/td><td>Session-9<\/td><td>Analysis of Large Graphs: Community Detection, Betweenness, Modularity, Graph Partitioning, *Graph Cut, Spectral Partitioning<\/td><td><a href=\"http:\/\/www.mmds.org\/#book\" target=\"_blank\" rel=\"noopener\">http:\/\/www.mmds.org\/#book<\/a><br>Book: MMDS, Chapter 10<\/td><td>Assignment-5<\/td><\/tr><tr><td>Week-10<\/td><td>Session-10<\/td><td>Map-Reduce and the New 
Software Stack<\/td><td><a href=\"http:\/\/www.mmds.org\/#book\" target=\"_blank\" rel=\"noopener\">http:\/\/www.mmds.org\/#book<\/a><br>Book: MMDS, Chapter 2<\/td><td>Assignment-6<\/td><\/tr><tr><td>Week-11<\/td><td>Session-11<\/td><td>*Finding Similar Items: Locality Sensitive Hashing, *Distance Measure, *MinHashing<\/td><td><a href=\"http:\/\/www.mmds.org\/#book\" target=\"_blank\" rel=\"noopener\">http:\/\/www.mmds.org\/#book<\/a><br>Book: MMDS, Chapter 3<\/td><td><\/td><\/tr><tr><td>Week-12<\/td><td>Session-12<\/td><td><\/td><td>TBA<\/td><td>TBA<\/td><\/tr><\/tbody><\/table><\/figure>\n\n\n\n<p><\/p>\n","protected":false},"excerpt":{"rendered":"<p>Course Description We will learn theory, concepts, and applications on how to extract useful information from huge amounts of data. Course Information Syllabus Week Session Topics Resources Assignments Week-1 Session-1 [&hellip;]<\/p>\n","protected":false},"author":2,"featured_media":0,"comment_status":"closed","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"_acf_changed":false,"_jetpack_memberships_contains_paid_content":false,"footnotes":""},"categories":[13],"tags":[],"class_list":["post-809","post","type-post","status-publish","format-standard","hentry","category-courses"],"acf":[],"jetpack_featured_media_url":"","jetpack_sharing_enabled":true,"_links":{"self":[{"href":"https:\/\/ccds.ai\/index.php?rest_route=\/wp\/v2\/posts\/809","targetHints":{"allow":["GET"]}}],"collection":[{"href":"https:\/\/ccds.ai\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"https:\/\/ccds.ai\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"https:\/\/ccds.ai\/index.php?rest_route=\/wp\/v2\/users\/2"}],"replies":[{"embeddable":true,"href":"https:\/\/ccds.ai\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=809"}],"version-history":[{"count":3,"href":"https:\/\/ccds.ai\/index.php?rest_route=\/wp\/v2\/posts\/809\/revisions"}],"predecessor-version":[{"id":827,"href"
:"https:\/\/ccds.ai\/index.php?rest_route=\/wp\/v2\/posts\/809\/revisions\/827"}],"wp:attachment":[{"href":"https:\/\/ccds.ai\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=809"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"https:\/\/ccds.ai\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=809"},{"taxonomy":"post_tag","embeddable":true,"href":"https:\/\/ccds.ai\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=809"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}