
Commit 59b3618

add dissertation to bib page
1 parent 4047721 commit 59b3618

File tree

3 files changed: +29 -60 lines changed


2024-10-29/2024-10-29-coglunch.pdf

2.11 MB
Binary file not shown.

2024-10-29/index.html

Lines changed: 15 additions & 0 deletions
@@ -0,0 +1,15 @@
+<!DOCTYPE HTML>
+<html lang="en-US">
+<head>
+<meta charset="UTF-8">
+<meta http-equiv="refresh" content="0; url=./2024-10-29-coglunch.pdf">
+<script type="text/javascript">
+window.location.href = "./2024-10-29-coglunch.pdf"
+</script>
+<title>Page Redirection</title>
+</head>
+<body>
+If you are not redirected automatically, follow this <a
+href='./2024-10-29-coglunch.pdf'>link</a>.
+</body>
+</html>

_bibliography/pubs.bib

Lines changed: 14 additions & 60 deletions
@@ -23,23 +23,7 @@ @article{hoover-etal-2023-plausibility
 doi = {10.1162/opmi_a_00086},
 url = {https://www.ncbi.nlm.nih.gov/pmc/articles/PMC10449406/},
 urldate = {2023-07-21},
-abstract = {Words that are more surprising given context take longer to
-process. However, no incremental parsing algorithm has been shown to directly
-predict this phenomenon. In this work, we focus on a class of algorithms whose
-runtime does naturally scale in surprisal\textemdash those that involve
-repeatedly sampling from the prior. Our first contribution is to show that
-simple examples of such algorithms predict runtime to increase superlinearly
-with surprisal, and also predict variance in runtime to increase. These two
-predictions stand in contrast with literature on surprisal theory (<a
-href="https://www.aclweb.org/anthology/N01-1021">Hale, 2001</a>; <a
-href="https://doi.org/10.1016/j.cognition.2007.05.006">Levy, 2008</a>) which
-assumes that the expected processing cost increases linearly with surprisal,
-and makes no prediction about variance. In the second part of this paper, we
-conduct an empirical study of the relationship between surprisal and reading
-time, using a collection of modern language models to estimate surprisal. We
-find that with better language models, reading time increases superlinearly in
-surprisal, and also that variance increases. These results are consistent with
-the predictions of sampling-based algorithms.},
+abstract = {Words that are more surprising given context take longer to process. However, no incremental parsing algorithm has been shown to directly predict this phenomenon. In this work, we focus on a class of algorithms whose runtime does naturally scale in surprisal\textemdash those that involve repeatedly sampling from the prior. Our first contribution is to show that simple examples of such algorithms predict runtime to increase superlinearly with surprisal, and also predict variance in runtime to increase. These two predictions stand in contrast with literature on surprisal theory (<a href="https://www.aclweb.org/anthology/N01-1021">Hale, 2001</a>; <a href="https://doi.org/10.1016/j.cognition.2007.05.006">Levy, 2008</a>) which assumes that the expected processing cost increases linearly with surprisal, and makes no prediction about variance. In the second part of this paper, we conduct an empirical study of the relationship between surprisal and reading time, using a collection of modern language models to estimate surprisal. We find that with better language models, reading time increases superlinearly in surprisal, and also that variance increases. These results are consistent with the predictions of sampling-based algorithms.},
 copyright = {All rights reserved},
 openaccess = {true},
 pmcid = {PMC10449406},
@@ -51,31 +35,7 @@ @article{hoover-etal-2023-plausibility
 
 
 @inproceedings{hoover-2020-icelandic,
-abstract = {Icelandic dative-nominative constructions exhibit a syntactic
-hierarchy effect known as the Person Restriction: only third
-person nominatives may control agreement. In these constructions,
-there is variation between speakers in the extent to which the
-verb agrees with the nominative for number. <a
-href="https://ling.auf.net/lingbuzz/000371">Sigurðsson & Holmberg
-(2008)</a> explain this variation as arising due to differences
-between varieties in the timing of subject raising, using a split
-phi-probe. This paper revises their approach, using the feature
-gluttony mechanism for Agree developed in <a
-href="https://ling.auf.net/lingbuzz/004224">Coon & Keine
-(2020)</a>, and a split phi-probe in which person probing precedes
-number probing. Within this framework, the observed variation
-can be captured by allowing variability two independent
-parameters: the timing of EPP subject raising, and the visibility
-of a number feature on dative DPs. The proposed mechanism
-describes the variation, including predicting the observed
-optional agreement in certain cases that previous literature had
-struggled to account for, and makes additional predictions about
-the differences between varieties in cases of syncretism within
-the verbal paradigm. An investigation into these predictions
-should allow this already well-studied area of Icelandic grammar
-to continue to be a useful test-case for crosslinguistic
-assumptions about the mechanism of Agree, and the status of dative
-arguments.},
+abstract = {Icelandic dative-nominative constructions exhibit a syntactic hierarchy effect known as the Person Restriction: only third person nominatives may control agreement. In these constructions, there is variation between speakers in the extent to which the verb agrees with the nominative for number. <a href="https://ling.auf.net/lingbuzz/000371">Sigurðsson & Holmberg (2008)</a> explain this variation as arising due to differences between varieties in the timing of subject raising, using a split phi-probe. This paper revises their approach, using the feature gluttony mechanism for Agree developed in <a href="https://ling.auf.net/lingbuzz/004224">Coon & Keine (2020)</a>, and a split phi-probe in which person probing precedes number probing. Within this framework, the observed variation can be captured by allowing variability two independent parameters: the timing of EPP subject raising, and the visibility of a number feature on dative DPs. The proposed mechanism describes the variation, including predicting the observed optional agreement in certain cases that previous literature had struggled to account for, and makes additional predictions about the differences between varieties in cases of syncretism within the verbal paradigm. An investigation into these predictions should allow this already well-studied area of Icelandic grammar to continue to be a useful test-case for crosslinguistic assumptions about the mechanism of Agree, and the status of dative arguments.},
 address = {Somerville, Mass., USA},
 author = {Jacob Louis Hoover},
 booktitle = {Proceedings of the 38th West Coast Conference on Formal Linguistics},
@@ -92,23 +52,7 @@ @inproceedings{hoover-2020-icelandic
 }
 
 @inproceedings{hoover-etal-2021-emnlp,
-abstract = {Are pairs of words that tend to occur together also likely to
-stand in a linguistic dependency? This empirical question is motivated by a
-long history of literature in cognitive science, psycholinguistics, and NLP.
-In this work we contribute an extensive analysis of the relationship between
-linguistic dependencies and statistical dependence between words. Improving on
-previous work, we introduce the use of large pretrained language models to
-compute contextualized estimates of the pointwise mutual information between
-words (CPMI). For multiple models and languages, we extract dependency trees
-which maximize CPMI, and compare to gold standard linguistic dependencies.
-Overall, we find that CPMI dependencies achieve an unlabelled undirected
-attachment score of at most $\approx 0.5$. While far above chance, and
-consistently above a non-contextualized PMI baseline, this score is generally
-comparable to a simple baseline formed by connecting adjacent words. We
-analyze which kinds of linguistic dependencies are best captured in CPMI
-dependencies, and also find marked differences between the estimates of the
-large pretrained language models, illustrating how their different training
-schemes affect the type of dependencies they capture.},
+abstract = {Are pairs of words that tend to occur together also likely to stand in a linguistic dependency? This empirical question is motivated by a long history of literature in cognitive science, psycholinguistics, and NLP. In this work we contribute an extensive analysis of the relationship between linguistic dependencies and statistical dependence between words. Improving on previous work, we introduce the use of large pretrained language models to compute contextualized estimates of the pointwise mutual information between words (CPMI). For multiple models and languages, we extract dependency trees which maximize CPMI, and compare to gold standard linguistic dependencies. Overall, we find that CPMI dependencies achieve an unlabelled undirected attachment score of at most $\approx 0.5$. While far above chance, and consistently above a non-contextualized PMI baseline, this score is generally comparable to a simple baseline formed by connecting adjacent words. We analyze which kinds of linguistic dependencies are best captured in CPMI dependencies, and also find marked differences between the estimates of the large pretrained language models, illustrating how their different training schemes affect the type of dependencies they capture.},
 address = {Online and Punta Cana, Dominican Republic},
 author = {Hoover, Jacob Louis and Du, Wenyu and Sordoni, Alessandro and O{'}Donnell, Timothy J.},
 booktitle = {Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing},
@@ -123,4 +67,14 @@ @inproceedings{hoover-etal-2021-emnlp
 year = {2021}
 }
 
-
+@thesis{hoover.j:2024phd,
+title = {The Cost of Information: Looking beyond Predictability in Language Processing},
+author = {Hoover, Jacob Louis},
+type = {PhD},
+year = {2024},
+month = aug,
+note = {PhD Thesis, McGill University, Linguistics Department},
+school = {McGill University},
+langid = {english},
+url = {https://jahoo.github.io/assets/dissertation.pdf}
+}
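
For reference, a minimal sketch of how the new entry could be cited from a LaTeX document, assuming a standard biblatex + biber setup (the test document below is hypothetical and not part of this commit; the site itself may render pubs.bib differently, e.g. via a Jekyll bibliography plugin):

% Hypothetical test document (assumption: biblatex with biber backend).
\documentclass{article}
\usepackage[style=authoryear]{biblatex}
% Load the bibliography file touched by this commit.
\addbibresource{_bibliography/pubs.bib}
\begin{document}
The dissertation \autocite{hoover.j:2024phd} is now listed.
\printbibliography
\end{document}

In biblatex, @thesis is a standard entry type whose type field (here {PhD}) is printed as the kind of thesis, and school is accepted as an alias for institution, so the entry as committed should compile under this setup.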
