You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
You can also check my \href{https://scholar.google.com/citations?user=2RtnNKEAAAAJ&hl=en}{Google Scholar profile}
107
-
(Scholar ID: \texttt{2RtnNKEAAAAJ})
108
-
for an updated list of my publications.
109
-
Note: an asterisk (*) denotes equal or major contributions.
110
-
}
109
+
%\renewcommand{\bibpreamble}{
110
+
% You can also check my \href{https://scholar.google.com/citations?user=2RtnNKEAAAAJ&hl=en}{Google Scholar profile}
111
+
% (Scholar ID: \texttt{2RtnNKEAAAAJ})
112
+
% for an updated list of my publications.
113
+
% Note: an asterisk (*) denotes equal or major contributions.
114
+
%}
111
115
112
116
%-------------------------------------------
113
117
%%%%%% RESUME STARTS HERE %%%%%%%%%%%%%%%%%%%%%%%%%%%%
@@ -138,33 +142,34 @@ \section{Experience}
138
142
{Allen Institute for AI}{2023 -- Present}
139
143
{Predoctoral Young Investigator}{Seattle, WA}
140
144
\resumeItemListStart
141
-
\resumeItem{Conducts research broadly in LLM post-training and alignment, such as preference annotation (\textsc{MultiPref}), reward model evaluation (\textsc{RewardBench}), and fully open-source post-training recipes (\textsc{T\"ulu 3}, \textsc{OLMo 2}).}
\resumeItem{Authored a technical paper on benchmarking spaCy's hash-embedding trick on span categorization and NER.}
150
-
\resumeItem{Developed human-in-the-loop and LLM annotation workflows for Prodigy, our data annotation product.}
151
-
\resumeItem{Built several open-source NLP tools such as \href{https://github.com/explosion/spacy-llm}{spacy-llm} (production LLM pipelines), \href{https://github.com/explosion/vscode-prodigy}{vscode-prodigy} (VSCode extension for data annotation), and \href{https://github.com/explosion/projects}{spaCy projects} (end-to-end NLP workflows for production).}
153
+
\resumeItem{Software developer and researcher for the \href{https://spacy.io}{spaCy} NLP library and the \href{https://prodigy.ai}{Prodigy} annotation tool.}
154
+
\resumeItem{Wrote a technical report on benchmarking spaCy's embeddings on span categorization tasks \cite{miranda2022multihash}.}
155
+
% \resumeItem{Developed human-in-the-loop and LLM annotation workflows for Prodigy, our data annotation product.}
156
+
% \resumeItem{Built several open-source NLP tools such as \href{https://github.com/explosion/spacy-llm}{spacy-llm} (production LLM pipelines), \href{https://github.com/explosion/vscode-prodigy}{vscode-prodigy} (VSCode extension for data annotation), and \href{https://github.com/explosion/projects}{spaCy projects} (end-to-end NLP workflows for production).}
152
157
\resumeItemListEnd
153
158
154
159
\resumeSubheading
155
160
{Thinking Machines Data Science}{2018 -- 2021}
156
161
{Machine Learning Researcher}{Metro Manila, PH}
157
162
\resumeItemListStart
158
-
\resumeItem{Developed several production-grade NLP applications for a sovereign wealth fund in Singapore.}
159
-
\resumeItem{Led a team in a large-scale digitization project of government financial statements for The World Bank.}
160
-
\resumeItem{Led an internal team of six in document processing initiatives to improve our Document AI product.}
163
+
\resumeItem{Developed NLP products for clients in the financial and utilities sectors.}
164
+
\resumeItem{Managed an internal research team for document processing.}
161
165
\resumeItemListEnd
162
166
163
167
\resumeSubheading
164
168
{Preferred Networks}{2018}
165
169
{Research Intern}{Tokyo, JP}
166
170
\resumeItemListStart
167
-
\resumeItem{Project: Implementing a parallelization feature for ChainerRL to support efficient batch Proximal Policy Optimization (PPO) and Advantage Actor Critic (A2C) for reinforcement learning.}
171
+
\resumeItem{Developed a parallelized Advantage Actor Critic (A2C) algorithm for the \href{https://github.com/chainer/chainerrl}{ChainerRL} library.}
publisher = {Empirical Methods in Natural Language Processing},
99
106
url = {https://aclanthology.org/2023.nlposs-1.1},
100
107
pages = {1--7},
108
+
keywords = {workshop},
101
109
abstract = {We introduce calamanCy, an open-source toolkit for constructing natural language processing (NLP) pipelines for Tagalog. It is built on top of spaCy, enabling easy experimentation and integration with other frameworks. calamanCy addresses the development gap by providing a consistent API for building NLP applications and offering general-purpose multitask models with out-of-the-box support for dependency parsing, parts-of-speech (POS) tagging, and named entity recognition (NER). calamanCy aims to accelerate the progress of Tagalog NLP by consolidating disjointed resources in a unified framework. The calamanCy toolkit is available on GitHub: https://github.com/ljvmiranda921/calamanCy.}
author = {\textbf{Lester James V. Miranda}* and \'Akos K\'ad\'ar* and Adriane Boyd and Sofie Van Landeghem and Anders S{\o}gaard and Matthew Honnibal},
131
-
journal = {{arXiv}},
132
-
year = {2022},
133
-
month = dec,
134
-
volume = {abs/2212.09255}
139
+
title= {{Multi hash embeddings in spaCy}},
140
+
author= {\textbf{Lester James V. Miranda}* and \'Akos K\'ad\'ar* and Adriane Boyd and Sofie Van Landeghem and Anders S{\o}gaard and Matthew Honnibal},
141
+
journal= {arXiv preprint arXiv:2212.09255},
142
+
year= {2022},
143
+
keywords = {preprint},
144
+
month = dec
135
145
}
136
146
137
-
inproceedings{miranda2018feature,
138
-
author = {\underline{Lester James V. Miranda} and Jinglu Hu},
147
+
@inproceedings{miranda2018feature,
148
+
author = {\textbf{Lester James V. Miranda} and Jinglu Hu},
139
149
title = {{Feature Extraction using a Mutually-Competitive Autoencoder for Protein Function Prediction}},
140
150
booktitle = {Proceedings of the IEEE International Conference on Systems, Man, and Cybernetics (SMC)},
141
151
publisher = {IEEE},
142
152
note = {doi: \url{10.1109/SMC.2018.00234}},
143
-
month = {October},
153
+
keywords = {conference},
154
+
month = oct,
144
155
year = {2018}
145
156
}
146
157
147
-
inproceedings{miranda2018deep,
148
-
author = {\underline{Lester James V. Miranda} and Jinglu Hu},
158
+
@inproceedings{miranda2018deep,
159
+
author = {\textbf{Lester James V. Miranda} and Jinglu Hu},
149
160
title = {{A Deep Learning Approach based on Stacked Denoising Autoencoders for Protein Function Prediction}},
150
161
booktitle = {Proceedings of the 42nd IEEE Computer Society Signature Conference on Computers, Software, and Applications (COMPSAC)},
151
162
publisher = {IEEE},
152
-
month = {July},
163
+
month = jul,
164
+
keywords = {conference},
153
165
note = {doi: \url{10.1109/COMPSAC.2018.00074}},
154
166
year = {2018}
155
167
}
156
168
157
-
article{miranda2018pyswarms,
158
-
author = {\underline{Lester James V. Miranda}},
159
-
title = {{PySwarms, a research-toolkit for Particle Swarm Optimization in Python}},
160
-
journal = {Journal of Open Source Software (JOSS)},
161
-
year = {2018},
162
-
volume = {3},
163
-
issue = {21},
164
-
number = {433},
165
-
note = {doi: \url{10.21105/joss.00433}},
166
-
url = {https://doi.org/10.21105/joss.00433}
169
+
@article{miranda2018pyswarms,
170
+
author = {\textbf{Lester James V. Miranda}},
171
+
title = {{PySwarms, a research-toolkit for Particle Swarm Optimization in Python}},
172
+
journal = {Journal of Open Source Software (JOSS)},
173
+
year = {2018},
174
+
volume = {3},
175
+
issue = {21},
176
+
number = {433},
177
+
keywords = {journal},
178
+
note = {doi: \url{10.21105/joss.00433}},
179
+
url = {https://doi.org/10.21105/joss.00433}
167
180
}
168
181
169
182
170
-
inproceedings{miranda2016appliance,
171
-
author = {\underline{Lester James V. Miranda}* and Marian Joice Gutierrez* and Samuel Matthew Dumlao and Rosula Reyes},
183
+
@inproceedings{miranda2016appliance,
184
+
author = {\textbf{Lester James V. Miranda}* and Marian Joice Gutierrez* and Samuel Matthew Dumlao and Rosula Reyes},
172
185
title = {{Appliance Recognition using Hall-Effect Sensors and k-Nearest Neighbors for Power Management Systems}},
173
186
booktitle = {Proceedings of the 2016 IEEE Region 10 Conference (TENCON)},
0 commit comments