-
-
Notifications
You must be signed in to change notification settings - Fork 0
/
index.html
160 lines (129 loc) · 3.91 KB
/
index.html
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
<!doctype html>
<html lang="en">
<head>
  <meta charset="utf-8">
  <!--
    Viewport: zoom restrictions (maximum-scale / user-scalable=no) are
    intentionally NOT set so that viewers can pinch-zoom the slides.
  -->
  <meta name="viewport" content="width=device-width, initial-scale=1.0">
  <title>Mwmbl: how to build a search engine with (almost) no money</title>

  <!-- Stylesheets loaded in order: CSS reset, reveal.js core, then the "black" theme. -->
  <link rel="stylesheet" href="dist/reset.css">
  <link rel="stylesheet" href="dist/reveal.css">
  <link rel="stylesheet" href="dist/theme/black.css">

  <!-- Theme used for syntax highlighted code -->
  <link rel="stylesheet" href="plugin/highlight/monokai.css">
</head>
<body>
<div class="reveal">
  <!--
    Slide deck. Per the reveal.js markup docs, each <section> directly inside
    .slides is one slide. Sections carrying data-background-* attributes are
    full-bleed background slides with no foreground content.

    NOTE(review): the alt text on the <img> elements below is derived from the
    image file names; confirm it matches what each image actually shows.
  -->
  <div class="slides">
    <!-- <section>Slide 1</section> -->
    <!-- <section>Slide 2</section> -->

    <!-- Title slide: talk title, speaker, event and date. -->
    <section>
      <h1>How to build a search engine with (almost) no money</h1>
      <br>
      <h3>Daoud Clarke</h3>
      <br>
      OSSym24 - 10th October 2024
    </section>

    <section>
      <h3>A confession</h3>
    </section>

    <section>
      <h3>December 2020</h3>
    </section>

    <!-- <section> -->
    <!-- <h3>Indexing and searching</h3> -->
    <!-- </section> -->

    <!-- <section> -->
    <!-- <img class="stretch" src="img/latency-1.png"> -->
    <!-- </section> -->

    <!-- <section> -->
    <!-- <img class="stretch" src="img/latency-2.png"> -->
    <!-- </section> -->

    <!-- <section> -->
    <!-- <img class="stretch" src="img/latency-3.png"> -->
    <!-- </section> -->

    <!-- <section> -->
    <!-- <img class="stretch" src="img/latency-4.png"> -->
    <!-- </section> -->

    <!-- <section> -->
    <!-- <h3>A traditional inverted index is costly</h3> -->
    <!-- </section> -->

    <section>
      <img class="stretch" src="img/inverted-index.png" alt="Inverted index">
    </section>

    <section>
      <h3>We need a new architecture</h3>
    </section>

    <!-- Background-only slide: image scaled to fit ("contain") on a white backdrop. -->
    <section data-background-size="contain" data-background-image="img/tiny-storage.svg" data-background-color="white"></section>

    <section>
      <h3>Crawling</h3>
    </section>

    <!-- Background-only slide: image scaled to fit ("contain") on a white backdrop. -->
    <section data-background-size="contain" data-background-image="img/crawler-script.png" data-background-color="white"></section>

    <section>
      <img class="stretch" src="img/firefox-plugin.png" alt="Firefox plugin">
    </section>

    <!-- <section> -->
    <!-- <ul> -->
    <!-- <li> We fit around 23 results in one page of 4096 bytes -->
    <!-- <li> Google indexes around 100 billion pages per locale -->
    <!-- <li> We would need an index of around 16TB -->
    <!-- </ul> -->
    <!-- </section> -->

    <!-- Index statistics. -->
    <section>
      <ul>
        <li>500 million pages indexed</li>
        <li>4TB index size</li>
      </ul>
    </section>

    <!-- Background-only slide: image scaled to fit ("contain"). -->
    <section data-background-image="img/stats0.png" data-background-size="contain"> </section>

    <section>
      <h3>Technology is not enough</h3>
    </section>

    <section>
      <img class="stretch" src="img/finances.png" alt="Finances">
    </section>

    <!-- <section> -->
    <!-- <img class="stretch" src="img/contributions.png"> -->
    <!-- </section> -->

    <section>
      <img class="stretch" src="img/curations.png" alt="Curations">
    </section>

    <!-- Community statistics. -->
    <section>
      <ul>
        <li>Over 4,000 registered users</li>
        <li>Over 33,000 user curations</li>
      </ul>
    </section>

    <section>
      <img class="stretch" src="img/contributors.png" alt="Contributors">
    </section>

    <section>
      <img class="stretch" src="img/contributors-front-end.png" alt="Front-end contributors">
    </section>

    <section>
      <h3>Daniel</h3>
    </section>

    <section>
      <h3>xyny &amp; Realmy</h3>
    </section>

    <!--
      Closing slide: background image with a "Demo" link to the alpha site.
      The leading <br> elements push the heading down the slide.
    -->
    <section data-background-size="contain" data-background-image="img/alpha-mwmbl.png" data-background-color="white">
      <a href="https://alpha.mwmbl.org">
        <h3><br><br><br><br><br>Demo</h3>
      </a>
    </section>
  </div>
</div>
<!-- reveal.js core, followed by the plugin bundles referenced in the init call below. -->
<script src="dist/reveal.js"></script>
<script src="plugin/notes/notes.js"></script>
<script src="plugin/markdown/markdown.js"></script>
<script src="plugin/highlight/highlight.js"></script>
<script>
  // Start the deck.
  // Reference documentation:
  //   initialization - https://revealjs.com/initialization/
  //   config options - https://revealjs.com/config/
  //   plugins        - https://revealjs.com/plugins/
  Reveal.initialize({
    // Plugins registered with this deck.
    plugins: [RevealMarkdown, RevealHighlight, RevealNotes],
    // Per the reveal.js config docs, this reflects the current slide in the URL hash.
    hash: true
  });
</script>
</body>
</html>