generated from BU-DiSC/CS561-Spring2024
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathproject.html
executable file
·363 lines (328 loc) · 21.3 KB
/
project.html
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
<!DOCTYPE html>
<html lang="en">
<head>
  <meta charset="utf-8">
  <meta http-equiv="X-UA-Compatible" content="IE=edge">
  <meta name="viewport" content="width=device-width, initial-scale=1">
  <!-- Summary text for search engines and link previews (was empty). -->
  <meta name="description" content="Project deadlines, system projects, and research project topics for CAS CS561 Data Systems Architectures at Boston University.">
  <meta name="author" content="DiSC Lab, Boston University">
  <!-- The favicon file is a PNG, so it is declared as image/png (it was labeled image/x-icon). -->
  <link href="img/disc-favicon.png" rel="shortcut icon" type="image/png">
  <title>CAS CS561 - Project - Data Systems Architectures @ Boston University</title>
  <!-- Bootstrap Core CSS -->
  <link href="vendor/bootstrap/css/bootstrap.min.css" rel="stylesheet">
  <!-- Theme CSS -->
  <link href="css/clean-blog.min.css" rel="stylesheet">
  <!-- Custom CSS: loaded after the theme so its rules can override it -->
  <link href="css/main.css" rel="stylesheet">
  <!-- Custom Fonts -->
  <link href="vendor/font-awesome/css/font-awesome.min.css" rel="stylesheet">
  <link href="https://fonts.googleapis.com/css?family=Lora:400,700,400italic,700italic" rel="stylesheet">
  <link href="https://fonts.googleapis.com/css?family=Open+Sans:300italic,400italic,600italic,700italic,800italic,400,300,600,700,800" rel="stylesheet">
  <!-- HTML5 Shim and Respond.js IE8 support of HTML5 elements and media queries -->
  <!-- WARNING: Respond.js doesn't work if you view the page via file:// -->
  <!--[if lt IE 9]>
  <script src="https://oss.maxcdn.com/libs/html5shiv/3.7.0/html5shiv.js"></script>
  <script src="https://oss.maxcdn.com/libs/respond.js/1.4.2/respond.min.js"></script>
  <![endif]-->
</head>
<body>
<!-- Navigation: brand link, "Menu" toggle button, and the list of course links -->
<nav class="navbar navbar-default navbar-custom navbar-fixed-top">
  <div class="container-fluid">
    <!-- Brand and toggle get grouped for better mobile display -->
    <div class="navbar-header page-scroll">
      <button type="button" class="navbar-toggle" data-toggle="collapse" data-target="#bs-example-navbar-collapse-1">
        <span class="sr-only">Toggle navigation</span>
        <!-- The icon is decorative; the visible "Menu" text and the sr-only label name the button -->
        Menu <i class="fa fa-bars" aria-hidden="true"></i>
      </button>
      <a class="navbar-brand" href="index.html">CS 561</a>
    </div>
    <!-- Nav links; this is the element the toggle button's data-target points at -->
    <div class="collapse navbar-collapse" id="bs-example-navbar-collapse-1">
      <ul class="nav navbar-nav navbar-right">
        <li>
          <a href="index.html">Home</a>
        </li>
        <li>
          <!-- aria-current marks this page's own entry for assistive technology -->
          <a href="project.html" aria-current="page">Project</a>
          <!-- <a class="inactiveLink">Project</a> -->
        </li>
        <li>
          <a href="labs.html">Labs</a>
        </li>
        <li>
          <!-- External links that open a new tab carry rel="noopener" so the target page gets no handle on this window -->
          <a href="https://tinyurl.com/S25-CS561-presentations" target="_blank" rel="noopener">Presentations</a>
          <!-- <a class="inactiveLink">Project</a> -->
        </li>
        <!-- <li>
          <a href="syllabus.html">Syllabus</a>
        </li> -->
        <!-- <li>
          <a href="http://tinyurl.com/" target="_blank">Notes</a>
        </li> -->
        <li>
          <a href="https://www.gradescope.com/courses/918719" target="_blank" rel="noopener">Gradescope</a>
          <!-- <a href="https://tinyurl.com/CS591A1-blackboard" target="_blank">Blackboard</a> -->
        </li>
        <li>
          <a href="https://piazza.com/bu/spring2025/cs561/" target="_blank" rel="noopener">Piazza</a>
        </li>
        <li>
          <a href="https://disc.bu.edu/" target="_blank" rel="noopener">DiSC lab</a>
        </li>
        <!-- <li>
          <a href="contact.html">Contact</a>
        </li>
        -->
        <!-- <li>
          <a href="#first">1st</a>
        </li>
        <li>
          <a href="#second">2nd</a>
        </li> -->
      </ul>
    </div>
    <!-- /.navbar-collapse -->
  </div>
  <!-- /.container -->
</nav>
<!-- Page header banner: title, divider, and tagline -->
<!-- The background image is chosen by the inline style on the header element below. -->
<header class="intro-header" style="background-image: url('img/project-bg.jpg')">
  <div class="container">
    <div class="row">
      <div class="col-lg-8 col-lg-offset-2 col-md-10 col-md-offset-1">
        <div class="page-heading">
          <h1>Project</h1>
          <hr class="small">
          <span class="subheading">Getting hands-on experience with state-of-the-art data systems!</span>
          <!-- Placeholder paragraph for jump buttons; both buttons are currently disabled. -->
          <p class="text-center">
            <!-- <a class="btn btn-xl" style="color: #fff;" href="#project0">Project 0</a> -->
            <!-- <a class="btn btn-xl" style="color: #fff;" href="#project">Class Project</a> -->
          </p>
        </div>
      </div>
    </div>
  </div>
</header>
<!-- Notice banner. Keeping it as a template for future notes. -->
<!-- The row is wrapped in its own container: a Bootstrap row has negative side
     margins and is meant to sit inside a container, otherwise the page can
     overflow horizontally. -->
<div class="container">
  <div class="row">
    <div class="col-lg-8 col-lg-offset-2">
      <div class="alert alert-danger" role="alert">
        <p><strong>Note:</strong> The material on this website is currently being updated. Please visit periodically to monitor updates as the beginning of the semester approaches.</p>
      </div>
    </div>
  </div>
</div>
<!-- Main Content -->
<div class="container">
<!-- <div class="row">
<div class="col-md-12 text-center">
<h4>Update 04/08/20</h4>
<p>
We have uploaded a
<a target="_blank" style="text-decoration: underline;" href="resources/final_report_template.zip">final project report template</a>
for reference.
</p>
</div>
</div> -->
<div class="row">
  <div class="col-md-12">
    <div class="text-center">
      <h1>Project Deadlines</h1>
      <!-- <h3>(Tentative dates)</h3> -->
      <br>
      <!--
        Deadline schedule. Every row carries three cells (Title, Due Date,
        Material); rows without material keep an empty third cell so the
        columns line up with the header row.
        Titles that have no submission URL are plain text instead of links
        with an empty or "#" href, which only reopened this page in a new tab.
        NOTE(review): the assignment links below point at Gradescope course
        693490, while the navbar links to course 918719. Confirm which is current.
      -->
      <table style="margin-left:auto;margin-right:auto; border:0pt;">
        <thead>
          <tr>
            <th scope="col" style="text-align:left">Title</th>
            <!-- <th scope="col" style="text-align:left">Release Date</th> -->
            <th scope="col" style="text-align:left">Due Date</th>
            <th scope="col" style="text-align:left">Material</th>
          </tr>
        </thead>
        <tbody>
          <tr>
            <td style="text-align:left"><a href="https://www.gradescope.com/courses/693490/assignments/3859930" target="_blank" rel="noopener" style="text-decoration: underline;">Project 0</a></td>
            <!-- <td style="text-align:left">01/28</td> -->
            <td style="text-align:left">02/02</td>
            <td style="text-align:left"><a href="projects/CS561-S24-Proj0-Zonemaps.pdf" target="_blank" style="text-decoration: underline;">Project 0 Doc</a></td>
          </tr>
          <tr>
            <td style="text-align:left"><a href="https://www.gradescope.com/courses/693490/assignments/3988336" target="_blank" rel="noopener" style="text-decoration: underline;">Project 1</a></td>
            <!-- <td style="text-align:left">01/28</td> -->
            <td style="text-align:left">02/16</td>
            <td style="text-align:left"><a href="projects/CS561-S24-Proj1-RocksDB.pdf" target="_blank" style="text-decoration: underline;">Project 1 Doc</a></td>
          </tr>
          <tr>
            <!-- <td style="text-align:left"><a href="https://www.gradescope.com/courses/470999/assignments/2693017" target="_blank" style="text-decoration: underline;">Project Proposal</a></td> -->
            <!-- TODO: wrap the title in a link once a submission URL exists. -->
            <td style="text-align:left">Project Proposal</td>
            <td style="text-align:left">02/23</td>
            <!-- <td style="text-align:left"> 03/01 </td> -->
            <!-- <td style="text-align:left">SimpleDB part 2 </td> -->
            <td style="text-align:left"></td>
          </tr>
          <tr>
            <td style="text-align:left"><a href="https://www.gradescope.com/courses/693490/assignments/4251488/" target="_blank" rel="noopener" style="text-decoration: underline;">Mid-semester Report</a></td>
            <td style="text-align:left">03/29</td>
            <!-- <td style="text-align:left"> <font color="red">03/31</font </td> -->
            <td style="text-align:left"><a href="https://www.overleaf.com/read/ryckhctxswvk" target="_blank" rel="noopener" style="text-decoration: underline;">Report Template</a></td>
            <!-- <td style="text-align:left">SimpleDB part 3</td> -->
          </tr>
          <tr>
            <!-- TODO: wrap the title in a link once a submission URL exists. -->
            <td style="text-align:left">Preliminary Project Report</td>
            <td style="text-align:left">04/22</td>
            <!-- <td style="text-align:left"> 04/27 </td> -->
            <!-- <td style="text-align:left"> 04/26 </td> -->
            <td style="text-align:left"></td>
          </tr>
          <tr>
            <!-- TODO: wrap the title in a link once a submission URL exists. -->
            <td style="text-align:left">Final Project Report</td>
            <td style="text-align:left">04/26</td>
            <!-- <td style="text-align:left"> 05/06 </td> -->
            <!-- <td style="text-align:left">Query optimization</td> -->
            <td style="text-align:left"></td>
          </tr>
          <!-- <tr>
            <td style="text-align:left"><font color="red">NEW (BONUS): </font><a href="./projects/PA3.pdf">PA3</a></td>
            <td style="text-align:left"><strike>11/26 </strike> 12/1</td>
            <td style="text-align:left;"><strike>12/8</strike> <font color="red">12/11 </font></td>
            <td style="text-align:left">NoSQL systems</td>
          </tr> -->
        </tbody>
      </table>
    </div>
  </div>
</div>
<!-- Project 0: one-line summary; the longer zone-map description is kept disabled inside the paragraph -->
<div class="row">
  <div class="col-md-12">
    <h4 style="margin-bottom: 5px">Project 0</h4>
    <p style="margin-top: 0px">
      A quick dev. project to sharpen C++ skills and to prepare for the upcoming research/dev project.
      <!-- For project 0, you are tasked to implement a simple zone map data structure. A zone map maintains min/max value ranges of
      one or more columns over contiguous sets of data blocks. The objective of the project is to implement and evaluate the performance
      of zonemaps with varying workloads. More information about the project can be found <a href="./projects/Proj0.pdf" target="_blank"
      style="text-decoration: underline;">here</a>. -->
    </p>
  </div>
</div>
<!-- Project 1: one-line summary; an alternative heading and description are kept disabled below -->
<div class="row">
  <div class="col-md-12">
    <h4 style="margin-bottom: 5px">Project 1</h4>
    <!-- <h4 style="margin-bottom: 5px">Project 1: Row-store vs. Col-store</h4> -->
    <p style="margin-top: 0px">
      A small benchmarking project on RocksDB.
      <!-- A project that will expose you to the two fundamental relational data system architectures
      (row-stores and column-stores). The objective is to deploy and experiment with a row-store system (PostgreSQL) and
      a column-store system (MonetDB) and compare them for different queries in order to showcase when each system should
      be used. More information about the project can be found <a href="./projects/Proj1.pdf" target="_blank"
      style="text-decoration: underline;">here</a>. -->
    </p>
  </div>
</div>
<!-- Class project overview followed by a list of reference material -->
<div class="row">
  <div class="col-md-12">
    <h4 style="margin-bottom: 5px">Class Project</h4>
    <p style="margin-top: 0px">
      Every student should complete a semester-long class project. The students can decide between a systems project and a research project.
    </p>
    <h4>Useful links:</h4>
    <!-- Every link in this list opens in a new tab; links to other sites also carry rel="noopener". -->
    <ul>
      <li>
        <a target="_blank" style="text-decoration: underline;" href="resources/short-intro-storage-hierarchy.pdf">Introduction to Storage and Memory Hierarchy</a>
        and some
        <a target="_blank" rel="noopener" style="text-decoration: underline;" href="https://github.com/manathan1984/CacheTests">example code</a>
      </li>
      <li><a target="_blank" style="text-decoration: underline;" href="resources/DevTools.pdf">Introduction to debugging and performance tools [material developed at Harvard]</a></li>
      <li><a target="_blank" style="text-decoration: underline;" href="resources/PerfTools.pdf">Performance monitoring [material developed at Harvard]</a></li>
      <li><a target="_blank" style="text-decoration: underline;" href="resources/tpc-h-tool.zip">TPCH Data and Query generator tool</a></li>
      <li>
        <!-- The separating space sits outside the anchor so it is not underlined. -->
        <a target="_blank" rel="noopener" style="text-decoration: underline;" href="https://dl.acm.org/citation.cfm?doid=2588555.2588892">A short summary of how to efficiently code multi-cores</a>
        (for a more detailed version drop by my office)
      </li>
      <li><a target="_blank" style="text-decoration: underline;" href="resources/final_report_template.zip">Final project report template</a></li>
    </ul>
  </div>
</div>
<!-- Two equal-width columns: system projects on the left, research projects on the right -->
<div class="row">
  <!-- Left column: system projects -->
  <div class="col-md-6 text-center">
    <h1> System Projects</h1>
    <p>
      A system project sharpens your systems skills and provides background on
      state-of-the-art systems, data structures and algorithms. For a successful
      systems project you will design and implement a systems component in C or
      C++, and you will deal with low-level system implementation details like
      memory allocation and management, cache-aware processing, parallel and
      concurrent processing and a deeper understanding of read/write performance
      trade-offs, and performance scalability.
      <b>Systems projects can be carried out by one student or a group of two students.</b>
    </p>
    <p>This year we will have two topics for a systems project.</p>
    <h2>Project </h2>
    <!-- One paragraph per project handout (PDF, opens in a new tab) -->
    <p>
      <a href="./projects/system/CS561-S24-SysProj-LSM-trees.pdf" target="_blank" style="text-decoration: underline;">Implementation of LSM-Trees</a>
    </p>
    <p>
      <a href="./projects/system/CS561-S24-SysProj-Bufferpool.pdf" target="_blank" style="text-decoration: underline;">Implementation of a Bufferpool</a>
    </p>
  </div>
  <!-- Right column: research projects -->
  <div class="col-md-6 text-center">
    <h1> Research Projects</h1>
    <p>
      A research project, on the other hand, aims at challenging the
      state-of-the-art. The goal is (i) either to better understand an open
      research problem through analysis and benchmarking, or (ii) to solve open
      problems through new designs and proof-of-concept implementations. The
      ultimate goal of a research project is to give a taste of research to
      students, and ideally lead to publications. When working on a research
      project, the student will interact with the instructor and the teaching
      assistants closely.
      <b>Students will work in groups of three students.</b>
    </p>
    <p>
      We have a number of possible research topics below. The students can also
      propose their own project (subject to instructor's approval).
    </p>
    <h2>Subjects</h2>
    <!-- One paragraph per topic handout (PDF, opens in a new tab) -->
    <p>
      <a href="./projects/research/CS561-S24-Research-Skew-Optimization-Postgres.pdf" target="_blank" style="text-decoration: underline;">Boosting Join Implementation for Skew Correlation in Postgres</a>
    </p>
    <p>
      <a href="./projects/research/CS561-S24-Research-Optimal-Index-Granularity-in-LSM.pdf" target="_blank" style="text-decoration: underline;">Finding the Optimal Granularity of Index</a>
    </p>
    <p>
      <a href="./projects/research/CS561-S24-Quantifying_WA_LSM_SSD.pdf" target="_blank" style="text-decoration: underline;">Quantifying Write Amplification in LSM-based Key-Value Stores on SSDs</a>
    </p>
    <p>
      <a href="./projects/research/CS561-S24-Research-Graph-Benchmarking.pdf" target="_blank" style="text-decoration: underline;">Benchmark Large Graph Processing Systems</a>
    </p>
    <p>
      <a href="./projects/research/CS561-S24-Research-Query-Selectivity.pdf" target="_blank" style="text-decoration: underline;">Q-QUEST: Are Questionable QUEry Selectivity Tolerable?</a>
    </p>
    <p>
      <a href="./projects/research/CS561-S24-Spatial-Index-Ingestion.pdf" target="_blank" style="text-decoration: underline;">Robust Ingestion for Spatial Indexes</a>
    </p>
    <p>
      <a href="./projects/research/CS561-S24-Research-compression-sortedness.pdf" target="_blank" style="text-decoration: underline;">Compression Algorithms Under Varying Data Sortedness</a>
    </p>
    <!-- <p> <a href="./projects/research/CS561-S23-Research-RangeDeletesLSM.pdf" target="_blank" style="text-decoration: underline;">Range Deletes in LSM-Trees</a> </p>
    <p> <a href="./projects/research/CS561-S23-Research-Query-driven-LSM-Compaction.pdf" target="_blank" style="text-decoration: underline;">Query-driven compaction in LSM-trees</a> </p>
    <p> <a href="./projects/research/CS561-S23-Research-Sorting_Algorithms.pdf" target="_blank" style="text-decoration: underline;">Evaluating Sorting Algorithms with Varying Data Sortedness</a> </p>
    <p> <a href="./projects/research/CS561-S23-Research-RobustnessMeasures.pdf" target="_blank" style="text-decoration: underline;">Measuring the Robustness of Modern Key-Value Stores</a> </p>
    <p> <a href="./projects/research/CS561-S23-Research-Graph-Benchmarking.pdf" target="_blank" style="text-decoration: underline;">Benchmarking Large Graph Processing Systems</a> </p>
    <p> <a href="./projects/research/CS561-S23-Research-Benchmark-Compression-With-Near-Sortedness.pdf" target="_blank" style="text-decoration: underline;">Benchmark Compression With Near Sortedness</a> </p> -->
  </div>
</div>
</div>
<!-- Divider between the main content and the footer. An unmatched closing div
     tag that used to precede it was removed: the main container is already
     closed on the line above. -->
<hr>
<!-- Page footer: copyright line only; the social icon list is kept disabled -->
<footer>
  <div class="container">
    <div class="row">
      <div class="col-lg-8 col-lg-offset-2 col-md-10 col-md-offset-1">
        <!-- <ul class="list-inline text-center">
          <li>
            <a href="#">
              <span class="fa-stack fa-lg">
                <i class="fa fa-circle fa-stack-2x"></i>
                <i class="fa fa-twitter fa-stack-1x fa-inverse"></i>
              </span>
            </a>
          </li>
          <li>
            <a href="#">
              <span class="fa-stack fa-lg">
                <i class="fa fa-circle fa-stack-2x"></i>
                <i class="fa fa-facebook fa-stack-1x fa-inverse"></i>
              </span>
            </a>
          </li>
          <li>
            <a href="#">
              <span class="fa-stack fa-lg">
                <i class="fa fa-circle fa-stack-2x"></i>
                <i class="fa fa-github fa-stack-1x fa-inverse"></i>
              </span>
            </a>
          </li>
        </ul> -->
        <p class="copyright text-muted">Copyright © DiSC Lab</p>
      </div>
    </div>
  </div>
</footer>
<!-- Scripts are loaded at the end of the body, in the order listed. -->
<!-- jQuery: loaded first; the scripts below presumably depend on it, so keep this order. -->
<script src="vendor/jquery/jquery.min.js"></script>
<!-- Bootstrap Core JavaScript -->
<script src="vendor/bootstrap/js/bootstrap.min.js"></script>
<!-- Contact Form JavaScript -->
<!-- NOTE(review): no contact form markup is visible on this page; confirm whether these two scripts are needed here. -->
<script src="js/jqBootstrapValidation.js"></script>
<script src="js/contact_me.js"></script>
<!-- Theme JavaScript -->
<script src="js/clean-blog.min.js"></script>
</body>
</html>