Skip to content

Commit 9d4914e

Browse files
Update bibliography (#40)
1 parent 2536107 commit 9d4914e

File tree

2 files changed

+128
-67
lines changed

2 files changed

+128
-67
lines changed

LJMiranda_CV.tex

Lines changed: 80 additions & 33 deletions
Original file line numberDiff line numberDiff line change
@@ -14,16 +14,20 @@
1414
\usepackage[usenames,dvipsnames]{color}
1515
\usepackage{verbatim}
1616
\usepackage{enumitem}
17-
\usepackage{natbib}
17+
% \usepackage[numbers,sort&compress]{natbib}
18+
\usepackage[sorting=ydnt,backend=biber,style=numeric,defernumbers=true,minbibnames=7,maxbibnames=99]{biblatex}
1819
\usepackage[colorlinks=true,urlcolor=darkblue]{hyperref}
1920
\usepackage{fancyhdr}
2021
\usepackage[english]{babel}
2122
\usepackage{tabularx}
2223
\usepackage{xcolor}
2324
\input{glyphtounicode}
2425
\definecolor{darkblue}{rgb}{0.0, 0.0, 0.5}
25-
26-
26+
\hypersetup{
27+
colorlinks=true,
28+
citecolor=darkblue
29+
}
30+
\addbibresource{publications.bib}
2731
%----------FONT OPTIONS----------
2832
% sans-serif
2933
% \usepackage[sfdefault]{FiraSans}
@@ -102,12 +106,12 @@
102106
\newcommand{\resumeItemListStart}{\begin{itemize}}
103107
\newcommand{\resumeItemListEnd}{\end{itemize}\vspace{-5pt}}
104108

105-
\renewcommand{\bibpreamble}{
106-
You can also check my \href{https://scholar.google.com/citations?user=2RtnNKEAAAAJ&hl=en}{Google Scholar profile}
107-
(Scholar ID: \texttt{2RtnNKEAAAAJ})
108-
for an updated list of my publications.
109-
Note: an asterisk (*) denotes equal or major contributions.
110-
}
109+
% \renewcommand{\bibpreamble}{
110+
% You can also check my \href{https://scholar.google.com/citations?user=2RtnNKEAAAAJ&hl=en}{Google Scholar profile}
111+
% (Scholar ID: \texttt{2RtnNKEAAAAJ})
112+
% for an updated list of my publications.
113+
% Note: an asterisk (*) denotes equal or major contributions.
114+
% }
111115

112116
%-------------------------------------------
113117
%%%%%% RESUME STARTS HERE %%%%%%%%%%%%%%%%%%%%%%%%%%%%
@@ -138,33 +142,34 @@ \section{Experience}
138142
{Allen Institute for AI}{2023 -- Present}
139143
{Predoctoral Young Investigator}{Seattle, WA}
140144
\resumeItemListStart
141-
\resumeItem{Conducts research broadly in LLM post-training and alignment, such as preference annotation (\textsc{MultiPref}), reward model evaluation (\textsc{RewardBench}), and fully open-source post-training recipes (\textsc{T\"ulu 3}, \textsc{OLMo 2}).}
142-
% \resumeItem{Mentors: Pradeep Dasigi, Yanai Elazar, Yizhong Wang}
145+
\resumeItem{Conducts research in language model post-training and alignment \cite{lambert2024tulu,lambert-etal-2025-rewardbench,miranda2025hybrid}.}
146+
\resumeItem{Mentors: Pradeep Dasigi, Yizhong Wang, Yanai Elazar}
143147
\resumeItemListEnd
144148

145149
\resumeSubheading
146150
{Explosion GmbH}{2021 -- 2023}
147151
{Machine Learning Engineer, spaCy Team}{Berlin, DE}
148152
\resumeItemListStart
149-
\resumeItem{Authored a technical paper on benchmarking spaCy's hash-embedding trick on span categorization and NER.}
150-
\resumeItem{Developed human-in-the-loop and LLM annotation workflows for Prodigy, our data annotation product.}
151-
\resumeItem{Built several open-source NLP tools such as \href{https://github.com/explosion/spacy-llm}{spacy-llm} (production LLM pipelines), \href{https://github.com/explosion/vscode-prodigy}{vscode-prodigy} (VSCode extension for data annotation), and \href{https://github.com/explosion/projects}{spaCy projects} (end-to-end NLP workflows for production).}
153+
\resumeItem{Software developer and researcher for the \href{https://spacy.io}{spaCy} NLP library and the \href{https://prodigy.ai}{Prodigy} annotation tool.}
154+
\resumeItem{Wrote a technical report on benchmarking spaCy's embeddings on span categorization tasks \cite{miranda2022multihash}.}
155+
% \resumeItem{Developed human-in-the-loop and LLM annotation workflows for Prodigy, our data annotation product.}
156+
% \resumeItem{Built several open-source NLP tools such as \href{https://github.com/explosion/spacy-llm}{spacy-llm} (production LLM pipelines), \href{https://github.com/explosion/vscode-prodigy}{vscode-prodigy} (VSCode extension for data annotation), and \href{https://github.com/explosion/projects}{spaCy projects} (end-to-end NLP workflows for production).}
152157
\resumeItemListEnd
153158

154159
\resumeSubheading
155160
{Thinking Machines Data Science}{2018 -- 2021}
156161
{Machine Learning Researcher}{Metro Manila, PH}
157162
\resumeItemListStart
158-
\resumeItem{Developed several production-grade NLP applications for a sovereign wealth fund in Singapore.}
159-
\resumeItem{Led a team in a large-scale digitization project of government financial statements for The World Bank.}
160-
\resumeItem{Led an internal team of six in document processing initiatives to improve our Document AI product.}
163+
\resumeItem{Developed NLP products for clients in the financial and the utilities sector.}
164+
\resumeItem{Managed an internal research team for document processing.}
161165
\resumeItemListEnd
162166

163167
\resumeSubheading
164168
{Preferred Networks}{2018}
165169
{Research Intern}{Tokyo, JP}
166170
\resumeItemListStart
167-
\resumeItem{Project: Implementing a parallelization feature for ChainerRL to support efficient batch Proximal Policy Optimization (PPO) and Advantage Actor Critic (A2C) for reinforcement learning.}
171+
\resumeItem{Developed a parallelized Advantage Actor Critic (A2C) algorithm for the \href{https://github.com/chainer/chainerrl}{ChainerRL} library.}
172+
\resumeItem{Mentors: Yasuhiro Fujita, Toshiki Kataoka}
168173
\resumeItemListEnd
169174

170175
\resumeSubHeadingListEnd
@@ -176,19 +181,35 @@ \section{Education}
176181
{Waseda University}{2016 -- 2018}
177182
{M.Eng. Information Architecture, Neurocomputing Systems Laboratory}{Fukuoka, JP}
178183
\resumeItemListStart
179-
\resumeItem{Thesis: Autoencoder-based Feature Extraction Techniques for Protein Function Prediction}
180-
\resumeItem{Awards: Monbukagakusho (MEXT) Japanese Government Scholarship}
184+
\resumeItem{Thesis: Autoencoder-based Feature Extraction Techniques for Protein Function Prediction \cite{miranda2018deep,miranda2018feature}}
185+
\resumeItem{Supervisor: Jinglu Hu}
186+
% \resumeItem{Awards: Monbukagakusho (MEXT) Japanese Government Scholarship}
181187
\resumeItemListEnd
182188

183189
\resumeSubheading
184190
{Ateneo de Manila University}{2011 -- 2016}
185191
{B.S. Electronics and Communications Engineering, Minor in Philosophy (Cum Laude)}{Metro Manila, PH}
186192
\resumeItemListStart
187-
\resumeItem{Thesis: Appliance Recognition using Hall-Effect Current Sensors for Power Management Systems}
188-
\resumeItem{Awards: DOST-SEI Merit Scholarship, Ateneo College Scholarship}
193+
\resumeItem{Thesis: Appliance Recognition using Hall-Effect Current Sensors for Power Management Systems \cite{miranda2016appliance}}
194+
\resumeItem{Supervisors: Rosula S.J. Reyes, Matthew Dumlao}
195+
% \resumeItem{Awards: DOST-SEI Merit Scholarship, Ateneo College Scholarship}
189196
\resumeItemListEnd
190197
\resumeSubHeadingListEnd
191198

199+
%-----------AWARDS-----------
200+
\section{Awards \& Fellowships}
201+
\resumeSubHeadingListStart
202+
\resumeProjectHeading
203+
{\textbf{Cohere Labs Aya Expedition Silver Prize} (for M-RewardBench \cite{gureja2025mrewardbench}) $|$ \emph{Cohere Labs}}{2024}
204+
\resumeProjectHeading
205+
{\textbf{Monbukagakusho (MEXT) Japanese Government Scholarship} $|$ \emph{Waseda University}}{2016}
206+
\resumeProjectHeading
207+
{\textbf{PhilFrance French Embassy Scholarship} $|$ \emph{Institut Catholique d'Arts et Métiers}}{2015}
208+
\resumeProjectHeading
209+
{\textbf{DOST-SEI Merit Scholarship} $|$ \emph{Ateneo de Manila University}}{2011}
210+
\resumeProjectHeading
211+
{\textbf{Ateneo College Scholarship} $|$ \emph{Ateneo de Manila University}}{2011}
212+
\resumeSubHeadingListEnd
192213

193214
%-----------PROJECTS-----------
194215
\section{Open-source Projects}
@@ -197,38 +218,64 @@ \section{Open-source Projects}
197218
{\textbf{calamanCy} $|$ \url{https://github.com/ljvmiranda921/calamanCy}}{2023}
198219
\resumeItemListStart
199220
\resumeItem{Natural language processing toolkit for building Tagalog pipelines based on spaCy.}
200-
\resumeItem{Software paper was published in the NLP-OSS workshop at EMNLP `23.}
201-
\resumeItem{Associated NER dataset was published in the SEALP workshop at IJCNLP-AACL `23.}
221+
\resumeItem{Presented at several NLP workshops \cite{miranda2023calamancy,miranda2023developing}.}
202222
\resumeItemListEnd
203223
\resumeProjectHeading
204224
{\textbf{PySwarms} $|$ \url{https://github.com/ljvmiranda921/pyswarms}}{2018}
205225
\resumeItemListStart
206-
\resumeItem{Python-based framework for implementing swarm optimization algorithms.}
207-
\resumeItem{Software paper was published in the Journal of Open Source Software (JOSS).}
208-
\resumeItem{Has over 1k+ GitHub stars and used by over 300 repositories and packages.}
226+
\resumeItem{Python-based framework for implementing swarm optimization algorithms (1k+ GitHub stars).}
227+
\resumeItem{Published in the Journal of Open Source Software \cite{miranda2018pyswarms}.}
209228
\resumeItemListEnd
210229
\resumeSubHeadingListEnd
211230

231+
%-----------INVITED TALKS-----------
212232
\section{Invited Talks}
213233
\resumeSubHeadingListStart
214234
\resumeProjectHeading
215-
{\textbf{Artisanal Filipino Resources in the Age of LLMs} $|$ \emph{De la Salle University - Manila}}{2024}
235+
{\textbf{Artisanal Filipino Resources in the Age of LLMs} (host: Charibeth Cheng) $|$ \emph{DLSU - Manila}}{2024}
216236
\resumeProjectHeading
217-
{\textbf{Labeling with LLMs} $|$ \emph{University of North Carolina - Charlotte}}{2024}
237+
{\textbf{Labeling with LLMs} (hosts: Ryan Wesslen \& Chang Hsin Lee) $|$ \emph{University of North Carolina - Charlotte}}{2024}
218238
\resumeProjectHeading
219-
{\textbf{Geospatial Data at Scale with Geomancer} $|$ \emph{Databeers Manila, Google Developer Group Conference}}{2019}
239+
{\textbf{Geospatial Data at Scale with Geomancer} (host: Erika Legara) $|$ \emph{Databeers Manila}}{2019}
220240
\resumeSubHeadingListEnd
221241

242+
% %-----------SERVICE-----------
243+
% \section{Professional \& Community Service}
244+
% \resumeSubHeadingListStart
245+
% \resumeProjectHeading
246+
% {\textbf{Reviewer}}{2024--Present}
247+
% \resumeItemListStart
248+
% \resumeItem{Venues: ICLR '25, COLM '25.}
249+
% \resumeItem{Published in several NLP workshops \cite{miranda2023calamancy,miranda2023developing}}
250+
% \resumeItemListEnd
251+
% \resumeSubHeadingListEnd
222252

223-
% BIBLIOGRAPHY ---------------------------------------------------------
224253
\newpage
254+
You can also check my \href{https://scholar.google.com/citations?user=2RtnNKEAAAAJ&hl=en}{Google Scholar profile}
255+
(Scholar ID: \texttt{2RtnNKEAAAAJ})
256+
for an updated list of my publications.
257+
Note: an asterisk (*) denotes equal or major contributions.
225258
\nocite{*}
226259
{
227260
\small
228-
\bibliographystyle{unsrt}
229-
\bibliography{publications}
261+
\newrefcontext[labelprefix=J]
262+
\printbibliography[keyword=journal,title=Journal Publications]
263+
\newrefcontext[labelprefix=C]
264+
\printbibliography[keyword=conference,title=Conference Papers]
265+
\newrefcontext[labelprefix=W]
266+
\printbibliography[keyword=workshop,title=Peer-Reviewed Workshop Papers]
267+
\newrefcontext[labelprefix=P]
268+
\printbibliography[keyword=preprint,title=Preprints \& Technical Reports]
230269
}
231270

271+
% BIBLIOGRAPHY ---------------------------------------------------------
272+
% \newpage
273+
% \nocite{*}
274+
% {
275+
% \bibliographystyle{plain}
276+
% \bibliography{publications}
277+
% }
278+
232279

233280
%-------------------------------------------
234281
\end{document}

publications.bib

Lines changed: 48 additions & 34 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@ @inproceedings{miranda2025hybrid
55
month = jul,
66
year = {2025},
77
address = {Vienna, Austria},
8+
keywords = {conference},
89
publisher = {Association for Computational Linguistics}
910
}
1011

@@ -15,6 +16,7 @@ @inproceedings{gureja2025mrewardbench
1516
month = jul,
1617
year = {2025},
1718
address = {Vienna, Austria},
19+
keywords = {conference},
1820
publisher = {Association for Computational Linguistics}
1921
}
2022

@@ -25,19 +27,21 @@ @inproceedings{aquino2025ud
2527
month = jul,
2628
year = {2025},
2729
address = {Vienna, Austria},
30+
keywords = {conference},
2831
publisher = {Association for Computational Linguistics}
2932
}
3033

3134
@article{lambert2024tulu,
32-
title = {{T\"ulu 3: Pushing Frontiers in Open Language Model Post-Training}},
33-
author = {Nathan Lambert* and Jacob Morrison* and Valentina Pyatkin* and Shengyi Huang* and Hamish Ivison* and Faeze Brahman* and
34-
\textbf{Lester James V. Miranda}* and Alisa Liu and Nouha Dziri and Xinxi Lyu and
35-
Yuling Gu and Saumya Malik and Victoria Graf and Jena D. Hwang and
36-
Jiangjiang Yang and Ronan Le Bras and Oyvind Tafjord and Chris Wilhelm and
37-
Luca Soldaini and Noah A. Smith and Yizhong Wang and Pradeep Dasigi and Hannaneh Hajishirzi},
38-
journal = {Preprint},
39-
year = {2024},
40-
month = nov
35+
title = {{T\"ulu 3: Pushing Frontiers in Open Language Model Post-Training}},
36+
author = {Nathan Lambert* and Jacob Morrison* and Valentina Pyatkin* and Shengyi Huang* and Hamish Ivison* and Faeze Brahman* and
37+
\textbf{Lester James V. Miranda}* and Alisa Liu and Nouha Dziri and Xinxi Lyu and
38+
Yuling Gu and Saumya Malik and Victoria Graf and Jena D. Hwang and
39+
Jiangjiang Yang and Ronan Le Bras and Oyvind Tafjord and Chris Wilhelm and
40+
Luca Soldaini and Noah A. Smith and Yizhong Wang and Pradeep Dasigi and Hannaneh Hajishirzi},
41+
journal = {arXiv preprint arXiv:2411.15124},
42+
year = {2024},
43+
keywords = {preprint},
44+
month = nov
4145
}
4246

4347

@@ -49,6 +53,7 @@ @inproceedings{lovenia2024seacrowd
4953
year = {2024},
5054
month = nov,
5155
address = {Miami, Florida},
56+
keywords = {conference},
5257
publisher = {Empirical Methods in Natural Language Processing}
5358
}
5459

@@ -73,6 +78,7 @@ @inproceedings{lambert-etal-2025-rewardbench
7378
publisher = {Association for Computational Linguistics},
7479
url = {https://aclanthology.org/2025.findings-naacl.96/},
7580
pages = {1755--1797},
81+
keywords = {conference},
7682
isbn = {979-8-89176-195-7}
7783
}
7884

@@ -84,6 +90,7 @@ @inproceedings{miranda2024allen
8490
year = {2024},
8591
address = {St Julian's, Malta},
8692
pages = {151--159},
93+
keywords = {workshop},
8794
publisher = {Association for Computational Linguistics}
8895
}
8996

@@ -98,6 +105,7 @@ @inproceedings{miranda2023calamancy
98105
publisher = {Empirical Methods in Natural Language Processing},
99106
url = {https://aclanthology.org/2023.nlposs-1.1},
100107
pages = {1--7},
108+
keywords = {workshop},
101109
abstract = {We introduce calamanCy, an open-source toolkit for constructing natural language processing (NLP) pipelines for Tagalog. It is built on top of spaCy, enabling easy experimentation and integration with other frameworks. calamanCy addresses the development gap by providing a consistent API for building NLP applications and offering general-purpose multitask models with out-of-the-box support for dependency parsing, parts-of-speech (POS) tagging, and named entity recognition (NER). calamanCy aims to accelerate the progress of Tagalog NLP by consolidating disjointed resources in a unified framework.The calamanCy toolkit is available on GitHub: https://github.com/ljvmiranda921/calamanCy.}
102110
}
103111

@@ -109,6 +117,7 @@ @inproceedings{miranda2023developing
109117
year = {2023},
110118
address = {Nusa Dua, Bali, Indonesia},
111119
publisher = {Association for Computational Linguistics},
120+
keywords = {workshop},
112121
url = {https://aclanthology.org/2023.sealp-1.2},
113122
pages = {13--20}
114123
}
@@ -121,58 +130,63 @@ @inproceedings{mayhew2023universal
121130
month = jun,
122131
address = {Mexico City, Mexico},
123132
publisher = {Association for Computational Linguistics},
133+
keywords = {conference},
124134
url = {https://aclanthology.org/2024.naacl-long.243},
125135
pages = {4322--4337}
126136
}
127137

128138
@article{miranda2022multihash,
129-
title = {{Multi hash embeddings in spaCy}},
130-
author = {\textbf{Lester James V. Miranda}* and \'Akos K\'ad\'ar* and Adriane Boyd and Sofie Van Landeghem and Anders S{\o}gaard and Matthew Honnibal},
131-
journal = {{arXiv}},
132-
year = {2022},
133-
month = dec,
134-
volume = {abs/2212.09255}
139+
title = {{Multi hash embeddings in spaCy}},
140+
author = {\textbf{Lester James V. Miranda}* and \'Akos K\'ad\'ar* and Adriane Boyd and Sofie Van Landeghem and Anders S{\o}gaard and Matthew Honnibal},
141+
journal = {arXiv preprint arXiv:2212.09255},
142+
year = {2022},
143+
keywords = {preprint},
144+
month = dec
135145
}
136146

137-
inproceedings{miranda2018feature,
138-
author = {\underline{Lester James V. Miranda} and Jinglu Hu},
147+
@inproceedings{miranda2018feature,
148+
author = {\textbf{Lester James V. Miranda} and Jinglu Hu},
139149
title = {{Feature Extraction using a Mutually-Competitive Autoencoder for Protein Function Prediction}},
140150
booktitle = {Proceedings of the IEEE International Conference on Systems, Man, and Cybernetics (SMC)},
141151
publisher = {IEEE},
142152
note = {doi: \url{10.1109/SMC.2018.00234}},
143-
month = {October},
153+
keywords = {conference},
154+
month = oct,
144155
year = {2018}
145156
}
146157

147-
inproceedings{miranda2018deep,
148-
author = {\underline{Lester James V. Miranda} and Jinglu Hu},
158+
@inproceedings{miranda2018deep,
159+
author = {\textbf{Lester James V. Miranda} and Jinglu Hu},
149160
title = {{A Deep Learning Approach based on Stacked Denoising Autoencoders for Protein Function Prediction}},
150161
booktitle = {Proceedings of the 42nd IEEE Computer Society Signature Conference on Computers, Software, and Applications (COMPSAC)},
151162
publisher = {IEEE},
152-
month = {July},
163+
month = jul,
164+
keywords = {conference},
153165
note = {doi: \url{10.1109/COMPSAC.2018.00074}},
154166
year = {2018}
155167
}
156168

157-
article{miranda2018pyswarms,
158-
author = {\underline{Lester James V. Miranda}},
159-
title = {{PySwarms, a research-toolkit for Particle Swarm Optimization in Python}},
160-
journal = {Journal of Open Source Software (JOSS)},
161-
year = {2018},
162-
volume = {3},
163-
issue = {21},
164-
number = {433},
165-
note = {doi: \url{10.21105/joss.00433}},
166-
url = {https://doi.org/10.21105/joss.00433}
169+
@article{miranda2018pyswarms,
170+
author = {\textbf{Lester James V. Miranda}},
171+
title = {{PySwarms, a research-toolkit for Particle Swarm Optimization in Python}},
172+
journal = {Journal of Open Source Software (JOSS)},
173+
year = {2018},
174+
volume = {3},
175+
issue = {21},
176+
number = {433},
177+
keywords = {journal},
178+
note = {doi: \url{10.21105/joss.00433}},
179+
url = {https://doi.org/10.21105/joss.00433}
167180
}
168181

169182

170-
inproceedings{miranda2016appliance,
171-
author = {\underline{Lester James V. Miranda}* and Marian Joice Gutierrez* and Samuel Matthew Dumlao and Rosula Reyes},
183+
@inproceedings{miranda2016appliance,
184+
author = {\textbf{Lester James V. Miranda}* and Marian Joice Gutierrez* and Samuel Matthew Dumlao and Rosula Reyes},
172185
title = {{Appliance Recognition using Hall-Effect Sensors and k-Nearest Neighbors for Power Management Systems}},
173186
booktitle = {Proceedings of the 2016 IEEE Region 10 Conference (TENCON)},
174187
publisher = {IEEE},
175-
month = {November},
188+
month = nov,
189+
keywords = {conference},
176190
note = {doi: \url{10.1109/TENCON.2016.7847947}},
177191
year = {2016}
178192
}

0 commit comments

Comments
 (0)