forked from materials-data-facility/llm-hackathon
-
Notifications
You must be signed in to change notification settings - Fork 62
/
main.tex
328 lines (236 loc) · 13.1 KB
/
main.tex
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
\PassOptionsToPackage{hyphens}{url}
\documentclass[superscriptaddress, nofootinbib, amsmath, amssymb, twocolumn]{revtex4-2}
\usepackage[margin=1.5cm]{geometry}
\usepackage[english]{babel}
\usepackage[utf8]{inputenc}
\usepackage[]{graphicx}
\usepackage{xspace}
\usepackage{siunitx}
\usepackage{mhchem}
\DeclareSIUnit\angstrom{\text {Å}}
\usepackage{orcidlink}
\usepackage{hyperref}
\usepackage{fontawesome5}
\usepackage{natmove}
\usepackage{placeins}
\usepackage{xparse}
\usepackage{hyperref}
\usepackage[a-1b]{pdfx}
% \githublink{<owner>}{<repo>}: GitHub icon followed by the text "owner/repo",
% linked to https://github.com/<owner>/<repo>.
% The % at each line end stops the line breaks inside the definition from
% being typeset as stray spaces before and after the link.
\newcommand{\githublink}[2]{%
  \href{https://github.com/#1/#2}{\faGithub\ \url{#1/#2}}%
}
% \twitterlink{<url>}: Twitter icon linked to the given URL.
% The % at each line end stops the line breaks inside the definition from
% being typeset as stray spaces before and after the icon.
\newcommand{\twitterlink}[1]{%
  \href{#1}{\faTwitter}%
}
% \zenodolink{<doi>}: archive icon followed by the DOI text, linked to
% https://doi.org/<doi>.
% The % at each line end stops the line breaks inside the definition from
% being typeset as stray spaces before and after the link.
\newcommand{\zenodolink}[1]{%
  \href{https://doi.org/#1}{\faArchive\ \url{#1}}%
}
%https://twitter.com/SamCox822/status/1641484192566460416?s=20
% \hflogo: inline Hugging Face logo with height .9em, followed by one
% inter-word space. The space is written explicitly as \space because the
% callers in this file use `\hflogo \url{...}`, where TeX discards the source
% space after the control word; the space here is what separates the logo
% from the link text.
% NOTE(review): the other graphics in this file are read from latex/figures/;
% confirm that figures/huggingface.png is the intended path.
\newcommand{\hflogo}{\includegraphics[height=.9em]{figures/huggingface.png}\space}
% \huggingfacelink{<user>}{<space>}: Hugging Face logo followed by the text
% "user/space", linked to https://huggingface.co/spaces/<user>/<space>.
% The % at each line end stops the line breaks inside the definition from
% being typeset as stray spaces before and after the link.
\newcommand{\huggingfacelink}[2]{%
  \href{https://huggingface.co/spaces/#1/#2}{\hflogo \url{#1/#2}}%
}
% \huggingfacehublink{<owner>}{<name>}: Hugging Face logo followed by the text
% "owner/name", linked to https://huggingface.co/<owner>/<name>.
% The % at each line end stops the line breaks inside the definition from
% being typeset as stray spaces before and after the link.
\newcommand{\huggingfacehublink}[2]{%
  \href{https://huggingface.co/#1/#2}{\hflogo \url{#1/#2}}%
}
% Adjusted Hyperref Setup for Automatically Colored Text Links
% Link appearance and PDF metadata.
\hypersetup{
  colorlinks=true, % Colour the link text instead of drawing boxes around it
  breaklinks=true, % Allow links to break across lines
  urlcolor=blue, % Sets the color of URL links
  linkcolor=blue, % Sets the color of internal links
  citecolor=blue, % Sets the color of citation links
  filecolor=blue, % Sets the color of file links
  allcolors=blue, % Ensures all link types are blue by default
  pdftitle={Bayesian Optimization Hackathon for Chemistry and Materials}, % Same text as \title
  pdfauthor={Author} % TODO: still a placeholder; fill in once the author list is enabled
}
% cleveref has to be loaded after hyperref; see
% https://tex.stackexchange.com/questions/396728/my-equations-referencing-not-working
\usepackage[nameinlink,capitalise]{cleveref}
% Reference names; these must come after both hyperref and cleveref.
\Crefname{figure}{Figure}{Figures}
\crefname{appsec}{Appendix}{Appendices}
% Join the two ends of a reference range with an en dash.
\newcommand{\crefrangeconjunction}{--}
% =====================================================
% packages for creating code listings
% listings typesets the code; xcolor supplies the colours.
\usepackage{listings}
\usepackage{xcolor}
% Palette used by the listing style below.
\definecolor{backcolour}{HTML}{fefdf5}
\definecolor{tqblue}{HTML}{08293d}
\definecolor{codegreen}{rgb}{0,0.6,0}
\definecolor{codegray}{rgb}{0.5,0.5,0.5}
\definecolor{codepurple}{rgb}{0.58,0,0.82}
\lstdefinestyle{pythonstyle}{
  % colours and fonts
  backgroundcolor=\color{backcolour},
  basicstyle=\ttfamily\footnotesize\color{tqblue},
  commentstyle=\color{codegreen},
  keywordstyle=\color{magenta},
  stringstyle=\color{codepurple},
  numberstyle=\tiny\color{codegray},
  % line numbers
  numbers=left,
  numbersep=5pt,
  % line breaking; continuation lines start with a hooked arrow
  breaklines=true,
  breakatwhitespace=false,
  postbreak=\mbox{\textcolor{magenta}{$\hookrightarrow$}\space},
  % whitespace handling
  keepspaces=true,
  showspaces=false,
  showstringspaces=false,
  showtabs=false,
  tabsize=2,
  % caption below the listing
  captionpos=b
}
% Make pythonstyle the default for every listing.
\lstset{style=pythonstyle}
% Only report underfull/loose \hbox lines whose badness exceeds this threshold.
\hbadness=99999
% C: centred column whose cells are typeset in inline math mode.
\newcolumntype{C}{>{$}c<{$}}
% Assign the table-rule lengths at \begin{document}. The length names are the
% ones used by booktabs, which is loaded further down in this preamble.
% NOTE(review): the values look like the defaults documented by booktabs --
% confirm whether this block is still needed.
\AtBeginDocument{%
\heavyrulewidth=.08em
\lightrulewidth=.05em
\cmidrulewidth=.03em
\belowrulesep=.65ex
\belowbottomsep=0pt
\aboverulesep=.4ex
\abovetopsep=0pt
\cmidrulesep=\doublerulesep
\cmidrulekern=.5em
\defaultaddspace=.5em
}
\usepackage[most]{tcolorbox}
% Shared look for the boxes defined from this style; the style argument is the
% box title.
\tcbset{
  base/.style={
    % title bar
    title={#1},
    fonttitle=\bfseries,
    coltitle=black,
    colbacktitle=black!10!white,
    toptitle=0.75mm,
    bottomtitle=0.5mm,
    % frame: boxrule is kept ahead of leftrule so the left rule stays visible
    arc=0mm,
    boxrule=0mm,
    leftrule=1mm,
    % inner padding and overall width
    left=2.5mm,
    right=8.5mm,
    width=\textwidth,
    % let the box split when it does not fit
    breakable
  }
}
% Frame colours for the titled boxes.
\definecolor{brandblue}{rgb}{0, 0.27843137254902, 0.466666666666667}
\definecolor{brandbred}{rgb}{0.63921568627451, 0, 0}
% Titled boxes built on the `base` style; the single argument is the title and
% the three environments differ only in frame colour.
\newtcolorbox{agentinteraction}[1]{colframe=brandblue, base={#1}}
\newtcolorbox{agentinteraction2}[1]{colframe=brandbred, base={#1}}
\newtcolorbox{subbox}[1]{colframe=black!30!white, base={#1}}
\usepackage [autostyle, english = american]{csquotes}
\usepackage[acronym, nonumberlist]{glossaries}
\makeglossaries
\input{latex/glossary}
\usepackage{tabularx} % For flexible tables with adjustable column widths
\usepackage{booktabs} % For better table lines (\toprule, \midrule, \bottomrule)
\usepackage{cleveref}
% Put a non-breaking space in front of every citation and drop any ordinary
% space already typed before it. The wrapper takes no arguments of its own, so
% optional arguments and starred forms (\cite[p.~3]{key}, \cite*{key}) are
% parsed by the original command instead of `[` or `*` being grabbed as the key.
\let\originalcite\cite
\renewcommand{\cite}{\unskip~\originalcite}
\usepackage{setspace}
% \clubpenalty=10000
% \widowpenalty=10000
% \displaywidowpenalty=10000
% Subsection headings: 0pt left offset, 9pt before and 6pt after the title.
\usepackage{titlesec}
\titlespacing{\subsection}{0pt}{9pt}{6pt}
\usepackage{array}
\usepackage{ragged2e}
\usepackage{nicefrac}
\usepackage[caption=false]{subfig}
% P{<width>}: ragged-right paragraph column of the given width;
% \arraybackslash restores \\ as the row terminator after \raggedright.
\newcolumntype{P}[1]{>{\raggedright\arraybackslash}p{#1}}
\begin{document}
\title{Bayesian Optimization Hackathon for Chemistry and Materials}
% \input{latex/authors}
\begin{abstract}
The Acceleration Consortium and Merck KGaA hosted a 2-day virtual hackathon on March 27--28, 2024, bringing together scientists to explore, collaborate, and innovate in the field of Bayesian optimization for the physical sciences. Participants were encouraged to select or develop Bayesian optimization algorithms, apply them to benchmarking tasks, design new benchmarks, create instructional tutorials, and describe real-world applications. With over 100 participants across 60 academic, industry, and government organizations located in 38 cities, 14 countries, and 4 continents, this was a global event. % https://chatgpt.com/share/f6cd733f-1126-4151-86c5-d4b59d158dc3
The outputs from this event, including developed algorithms, benchmarks, and tutorials, will serve as valuable resources for the research community, in addition to the new skills learned and connections formed. Released projects and general information are available at \url{https://ac-bo-hackathon.github.io/} and other locations linked from individual project pages. This event demonstrated the potential of community-driven research efforts to accelerate advances in Bayesian optimization in chemistry and materials science.
\end{abstract}
\maketitle
% ToDo:
% emphasize tooling/constrained prompting/guidance
\section{Introduction}
Bayesian optimization (BO) has emerged as a powerful tool for optimizing complex and expensive-to-evaluate functions, often outperforming traditional search methods in a variety of scientific domains such as optimizing composition and processing parameters to maximize alloy yield strength or identifying synthesis pathways that maximize efficacy of HIV drugs (\cref{fig:intro-bo}). Hackathons help people to connect, gain skills, and flesh out new ideas. In the words of Michelle Duke, the \enquote{Hackathon Queen}:
\begin{quote}
A hackathon is a short competition where people work together in teams to solve problems and challenges by coming up with solutions and ideas.
\end{quote}
\begin{figure}
\centering
\includegraphics[width=1\linewidth]{latex/figures/intro-bo.png}
\caption{Optimization traces for traditional design of experiment (DoE) methods compared with Bayesian optimization (BO), which typically outperforms them. BO uses a smart model to predict where to look next in an experiment to find the best results with few experiments.}
\label{fig:intro-bo}
\end{figure}
The goal of the AC BO Hackathon was to leverage the expertise of a diverse, global community to advance the development and application of BO techniques for solving critical challenges in the physical sciences. The hackathon also aimed to foster collaboration and knowledge sharing among participants from different backgrounds, including academia, national laboratories, government agencies, and private industry. The event attracted 120 active participants from 44 teams, representing 41 academic institutions, 12 national labs, and 9 companies. Likewise, the participants were located in 38 cities, 14 countries, and 4 continents (\cref{fig:map}). A full list of projects, including links to the corresponding GitHub repositories, submission videos, and social media posts, is provided in \cref{tab:projects}.
\begin{figure}[h!]
\centering
% \captionsetup{justification=centering}
\includegraphics[width=1\linewidth]{latex/figures/world_map.png}
\caption{Demographic distributions of the participating teams and their affiliations. \label{fig:map}}
\end{figure}
\begin{table*}[]
\caption{List of projects and project types, with links to corresponding website project pages, repositories, videos, and social media posts.}
\label{tab:projects}
\setlength{\extrarowheight}{0.4em}
\begin{tabularx}{\textwidth}{>{\centering\arraybackslash}p{1cm} X >{\centering\arraybackslash}X}
\toprule
\# & Project Name & Links \\ \midrule
\href{https://example.com}{\#1} & Project A &
\href{https://github.com/example}{\faGithub} \,
\href{https://youtube.com}{\faVideo} \,
\href{https://twitter.com}{\faTwitter} \tabularnewline
\href{https://example.com}{\#2} & Project B &
\href{https://github.com/example}{\faGithub} \,
\href{https://youtube.com}{\faVideo} \,
\href{https://linkedin.com}{\faLinkedin} \tabularnewline
\href{https://example.com}{\#3} & Project C &
\href{https://github.com/example}{\faGithub} \,
\href{https://youtube.com}{\faVideo} \,
\href{https://twitter.com}{\faTwitter} \tabularnewline
\bottomrule
\end{tabularx}
\end{table*}
Participants were provided with various resources to prepare for the hackathon---this included GitHub classroom assignments with automated feedback, application- and theory-focused videos and tutorials, Python refresher materials, and a list of tools to consider using during the hackathon (\cref{fig:preparation}).
\begin{figure}
\centering
\includegraphics[width=1\linewidth]{latex/figures/preparation.png}
\caption{A snapshot of \href{https://ac-bo-hackathon.github.io/resources/}{resources listed on the hackathon webpage} such as hackathon orientation, intro to BO, and Python refreshers.}
\label{fig:preparation}
\end{figure}
One of the unique aspects of this event is that it was hosted in Gather Town, a sort of union between traditional video conferencing software and retro arcade-style avatars and virtual spaces (\cref{fig:gathertown}). Participants create a custom avatar and maneuver in a two-dimensional space. The video and audio of other participants appear and become audible when they are nearby, and fade out when they are far away, simulating an in-person experience. At the beginning of the hackathon, all participants gathered to listen to keynotes in real time, which were broadcast via YouTube Live and embedded into the Gather Town space. The videos were then \href{https://ac-bo-hackathon.github.io/videos-slides/}{made available on the hackathon website}. After 2 months, the videos collectively had approximately 1600 views. After the keynotes, teams were assigned tables in breakout rooms, each with a whiteboard. Individual tables were designated as \enquote{private spaces}, which isolated the shared audio and video within each space. This had a number of advantages for collaboration within and across teams.
\begin{figure}
\centering
\includegraphics[width=1\linewidth]{latex/figures/gathertown.png}
\caption{Gather Town \href{https://ac-bo-hackathon.github.io/videos-slides/}{keynote} room (left), custom avatars (top-right), and an example of a breakout room for teams (bottom-right). Keynotes were broadcast in real time to participants via an embedded YouTube livestream. Use of Gather Town leveled the playing field for teams who were in physically separate locations and made it easier for facilitators and other teams to have more natural \enquote{check-ins} with other projects.}
\label{fig:gathertown}
\end{figure}
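The hackathon concluded with a project showcase accompanied by crowdsourced judging within a \enquote{poster room} (\cref{fig:poster}).
% TODO(review): no \label{fig:poster} is visible in this file, so the reference above may print as ?? -- confirm the figure exists or add it.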
% Preparation for the hackathon - 111 GitHub Classroom assignments accepted
% The hackathon was designed with tips, trick, and resources from various sources, such as https://github.com/github/hackathons.
% Hosts: Acceleration Consortium, Merck KGaA
\begin{table*}[]
\caption{Project Topics for the Hackathon. See \href{https://ac-bo-hackathon.github.io/submission/}{the submission page} for more details.}
\label{tab:project_topics}
\setlength{\extrarowheight}{0.4em}
\begin{tabularx}{\textwidth}{>{\centering\arraybackslash}p{0.5cm} p{4.5cm} X}
\toprule
& \textbf{Topic} & \textbf{Description} \\ \midrule
1 & \textbf{Apply Algorithms} & Choose a package or algorithm and apply it to one of \href{https://huggingface.co/collections/AccelerationConsortium/optimization-benchmarks-66a44daf10de1a0335f28826}{the benchmark tasks prepackaged for the hackathon}. \\
2 & \textbf{Develop Benchmarks} & Develop a new benchmark and add it to the suite of benchmarks from above. \\
3 & \textbf{Create Tutorials} & Create \enquote{gentle introduction} tutorials for \href{https://ac-microcourses.readthedocs.io/en/latest/courses/data-science/overview.html}{advanced optimization topics}. \\
4 & \textbf{Propose Tasks} & Propose materials tasks that \textit{can} and \textit{should} be tackled with BO. \\
5 & \textbf{General} & Other projects that are related to Bayesian optimization for the physical sciences. \\
\bottomrule
\end{tabularx}
\end{table*}
\section*{Acknowledgements}
%\printglossaries
% \bibliographystyle{achemso}
\bibliography{latex/ac-bo-hackathon}
\end{document}