Skip to content

Commit 7f1edb4

Browse files
committed
emnlp update
1 parent b213e06 commit 7f1edb4

File tree

5 files changed

+68
-33
lines changed

5 files changed

+68
-33
lines changed

_bibliography/pubs.bib

Lines changed: 57 additions & 25 deletions
Original file line numberDiff line numberDiff line change
@@ -1,33 +1,65 @@
11
%% This BibTeX bibliography file was created using BibDesk.
22
%% http://bibdesk.sourceforge.net/
33
4-
%% Created for j at 2021-09-10 10:36:49 -0400
5-
6-
7-
%% Saved with string encoding Unicode (UTF-8)
4+
%% Created for j at 2021-09-10 10:36:49 -0400
85
96
7+
%% Saved with string encoding Unicode (UTF-8)
108
119
@inproceedings{hoover.j:2020,
12-
abstract = {Icelandic dative-nominative constructions exhibit a syntactic hierarchy effect known as the Person Restriction: only third person nominatives may control agreement. In these constructions, there is variation between speakers in the extent to which the verb agrees with the nominative for number. Sigurðsson & Holmberg (2008) explain this variation as arising due to differences between varieties in the timing of subject raising, using a split phi-probe. This paper revises their approach, using the feature gluttony mechanism for Agree developed in Coon & Keine (2020), and a split phi-probe in which person probing precedes number probing. Within this framework, the observed variation can be captured by allowing variability two independent parameters: the timing of EPP subject raising, and the visibility of a number feature on dative DPs. The proposed mechanism describes the variation, including predicting the observed optional agreement in certain cases that previous literature had struggled to account for, and makes additional predictions about the differences between varieties in cases of syncretism within the verbal paradigm. An investigation into these predictions should allow this already well-studied area of Icelandic grammar to continue to be a useful test-case for crosslinguistic assumptions about the mechanism of Agree, and the status of dative arguments.},
13-
address = {Somerville, Mass., USA},
14-
author = {Jacob Louis Hoover},
15-
booktitle = {Proceedings of the 38th West Coast Conference on Formal Linguistics},
16-
editor = {Daniel Reisinger and Rachel Soo},
17-
handout = {http://doi.org/10.14288/1.0389856},
18-
pdf = {wccfl2020-icelandic_gluttony-proceedings.pdf},
19-
publisher = {Cascadilla Proceedings Project},
20-
pubstate = {forthcoming},
21-
title = {Accounting for variation in number agreement in Icelandic dative--nominative constructions},
22-
year = {2020}}
10+
abstract = {Icelandic dative-nominative constructions exhibit a syntactic
11+
hierarchy effect known as the Person Restriction: only third
12+
person nominatives may control agreement. In these constructions,
13+
there is variation between speakers in the extent to which the
14+
verb agrees with the nominative for number. <a
15+
href="https://ling.auf.net/lingbuzz/000371">Sigurðsson & Holmberg
16+
(2008)</a> explain this variation as arising due to differences
17+
between varieties in the timing of subject raising, using a split
18+
phi-probe. This paper revises their approach, using the feature
19+
gluttony mechanism for Agree developed in <a
20+
href="https://ling.auf.net/lingbuzz/004224">Coon & Keine
21+
(2020)</a>, and a split phi-probe in which person probing precedes
22+
number probing. Within this framework, the observed variation
23+
can be captured by allowing variability two independent
24+
parameters: the timing of EPP subject raising, and the visibility
25+
of a number feature on dative DPs. The proposed mechanism
26+
describes the variation, including predicting the observed
27+
optional agreement in certain cases that previous literature had
28+
struggled to account for, and makes additional predictions about
29+
the differences between varieties in cases of syncretism within
30+
the verbal paradigm. An investigation into these predictions
31+
should allow this already well-studied area of Icelandic grammar
32+
to continue to be a useful test-case for crosslinguistic
33+
assumptions about the mechanism of Agree, and the status of dative
34+
arguments.},
35+
address = {Somerville, Mass., USA},
36+
author = {Jacob Louis Hoover},
37+
booktitle = {Proceedings of the 38th West Coast Conference on Formal
38+
Linguistics},
39+
editor = {Daniel Reisinger and Rachel Soo},
40+
handout = {http://doi.org/10.14288/1.0389856},
41+
pdf = {wccfl2020-icelandic_gluttony-proceedings.pdf},
42+
publisher = {Cascadilla Proceedings Project},
43+
pubstate = {forthcoming},
44+
title = {Accounting for variation in number agreement in Icelandic
45+
dative--nominative constructions},
46+
year = {2020}}
2347

24-
@misc{hoover.j:2021,
25-
abstract = {Are pairs of words that tend to occur together also likely to stand in a linguistic dependency? This empirical question is motivated by a long history of literature in cognitive science, psycholinguistics, and NLP. In this work we contribute an extensive analysis of the relationship between linguistic dependencies and statistical dependence between words. Improving on previous work, we introduce the use of large pretrained language models to compute contextualized estimates of the pointwise mutual information between words (CPMI). For multiple models and languages, we extract dependency trees which maximize CPMI, and compare to gold standard linguistic dependencies. Overall, we find that CPMI dependencies achieve an unlabelled undirected attachment score of at most $\approx 0.5$. While far above chance, and consistently above a non-contextualized PMI baseline, this score is generally comparable to a simple baseline formed by connecting adjacent words. We analyze which kinds of linguistic dependencies are best captured in CPMI dependencies, and also find marked differences between the estimates of the large pretrained language models, illustrating how their different training schemes affect the type of dependencies they capture.},
26-
archiveprefix = {arXiv},
27-
author = {Jacob Louis Hoover and Alessandro Sordoni and Wenyu Du and Timothy J. O'Donnell},
28-
date-modified = {2021-09-10 10:36:49 -0400},
29-
eprint = {2104.08685},
30-
note = {Accepted to EMNLP2021},
31-
primaryclass = {cs.CL},
32-
title = {Linguistic Dependencies and Statistical Dependence},
33-
year = {2021}}
48+
@inproceedings{hoover-etal-2021-linguistic,
49+
title = "Linguistic Dependencies and Statistical Dependence",
50+
author = "Hoover, Jacob Louis and
51+
Du, Wenyu and
52+
Sordoni, Alessandro and
53+
O{'}Donnell, Timothy J.",
54+
booktitle = "Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing",
55+
month = nov,
56+
year = "2021",
57+
address = "Online and Punta Cana, Dominican Republic",
58+
publisher = "Association for Computational Linguistics",
59+
url = "https://aclanthology.org/2021.emnlp-main.234",
60+
pages = "2941--2963",
61+
abstract = "Are pairs of words that tend to occur together also likely to stand in a linguistic dependency? This empirical question is motivated by a long history of literature in cognitive science, psycholinguistics, and NLP. In this work we contribute an extensive analysis of the relationship between linguistic dependencies and statistical dependence between words. Improving on previous work, we introduce the use of large pretrained language models to compute contextualized estimates of the pointwise mutual information between words (CPMI). For multiple models and languages, we extract dependency trees which maximize CPMI, and compare to gold standard linguistic dependencies. Overall, we find that CPMI dependencies achieve an unlabelled undirected attachment score of at most $\approx 0.5$. While far above chance, and consistently above a non-contextualized PMI baseline, this score is generally comparable to a simple baseline formed by connecting adjacent words. We analyze which kinds of linguistic dependencies are best captured in CPMI dependencies, and also find marked differences between the estimates of the large pretrained language models, illustrating how their different training schemes affect the type of dependencies they capture.",
62+
poster = {2021.10.11.EMNLP.poster.pdf},
63+
code = {https://github.com/mcqll/cpmi-dependencies},
64+
slides = {2021.10.11.EMNLP.talk-slides.pdf},
65+
}

assets/CV/jlh-academic_cv.pdf

825 Bytes
Binary file not shown.

assets/CV/jlh-academic_cv.tex

Lines changed: 11 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -179,21 +179,21 @@ \section{Education}
179179
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
180180
\begin{longtable}{p{1.7cm}|p{15cm}}
181181
\textsc{Fall 2021}&%
182-
Guest lecture for \textbf{McGill} COMP 445 \emph{Computational Linguistics}\\
182+
Guest lecture for McGill COMP 445 \emph{Computational Linguistics}\\
183183
&
184-
TA for \textbf{McGill} COMP 445 \emph{Computational Linguistics}
184+
TA for McGill COMP 445 \emph{Computational Linguistics}
185185
(Prof.\ Timothy O'Donnell)\\
186186
\textsc{Winter 2021}&%
187-
TA for \textbf{McGill} COMP 596 \emph{Probabilistic Programming}
187+
TA for McGill COMP 596 \emph{Probabilistic Programming}
188188
(Prof.\ Timothy O'Donnell)\\
189189
\textsc{Fall 2020}&%
190-
TA for \textbf{McGill} COMP 445 \emph{Computational Linguistics}
190+
TA for McGill COMP 445 \emph{Computational Linguistics}
191191
(Prof.\ Timothy O'Donnell)\\
192192
\textsc{Winter 2020}&%
193-
TA for \textbf{McGill} LING 201 \emph{Introduction to Linguistics}
193+
TA for McGill LING 201 \emph{Introduction to Linguistics}
194194
(Prof.\ Francisco Torreira, Mathieu Paillé)\\
195195
\textsc{Fall 2019}&%
196-
TA for \textbf{McGill} LING 201 \emph{Introduction to Linguistics}
196+
TA for McGill LING 201 \emph{Introduction to Linguistics}
197197
(Prof.\ Francisco Torreira, Prof\. Junko Shimoyama)\\
198198
\end{longtable}
199199

@@ -252,7 +252,7 @@ \section{Education}
252252

253253
% Print bibliography, manual order
254254
\vspace{5pt}
255-
\nocite{hoover.j:2021,hoover.j:2020}
255+
\nocite{hoover.j:2021,hoover.j:2020,hoover.j:2020wccflhandout}
256256
\AtNextBibliography{\small}
257257
\printbibliography[heading=none]{}
258258
\vspace{5pt}
@@ -282,10 +282,13 @@ \section{Education}
282282
&%
283283
Intermediate (2½ years living and working in Estonia:
284284
\textasciitilde\ CEF level B2)\\
285+
French
286+
&%
287+
Intermediate (\textasciitilde\ B1)\\
285288
Japanese
286289
&%
287290
Novice (two years' university study, at this point rather atrophied)\\
288-
Russian, Spanish, French%
291+
Russian, Spanish%
289292
&%
290293
Basic knowledge\\
291294
\multicolumn{2}{c}{}\\
924 KB
Binary file not shown.
2.69 MB
Binary file not shown.

0 commit comments

Comments
 (0)