-
Notifications
You must be signed in to change notification settings - Fork 1
/
3_exp.qmd
1486 lines (1278 loc) · 83.3 KB
/
3_exp.qmd
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
---
title: "Experiment 3"
subtitle: "**Effects of Including Pronouns on Nametags and in Introductions on Spoken Production**"
toc-title: "Experiment 3: Effects of Including Pronouns on Nametags and in Introductions on Spoken Production"
---
```{r}
#| label: exp3-setup
#| include: false
library(tidyverse) # data wrangling
library(magrittr)
library(sjmisc)
options(dplyr.group.inform = FALSE, dplyr.summarise.inform = FALSE)
library(lme4) # stats
library(lmerTest)
library(buildmer)
library(simr) # power analysis
library(brms) # reliability
library(insight) # model results
library(broom.mixed)
library(flextable) # tables
library(sjPlot)
library(patchwork) # plots
library(RColorBrewer)
library(ggtext)
library(Hmisc) # correlations
library(ggcorrplot)
library(rstatix)
rainbow <- read.csv("resources/formatting/rainbow.csv") # colors
rainbow_primary <- rainbow %>%
filter(Spectral != "") %>%
select(-Score) %>%
column_to_rownames("Spectral")
source("resources/data-functions/exp3_load_data.R") # setting up data
source("resources/formatting/printing.R") # model results in text
source("resources/formatting/aesthetics.R") # plot and table themes
source("resources/data-functions/demographics.R") # demographics tables
```
[![](resources/icons/preregistered.svg){title="Preregistration" width="30"}](https://osf.io/bt7yn) [![](resources/icons/open-materials.svg){title="Materials" width="30"}](https://github.com/bethanyhgardner/dissertation/blob/main/materials/exp3) [![](resources/icons/open-data.svg){title="Data" width="30"}](https://github.com/bethanyhgardner/dissertation/blob/main/data) [![](resources/icons/file-code-fill.svg){title="Analysis Code" width="30"}](https://github.com/bethanyhgardner/dissertation/blob/main/3_exp.qmd)
<br>
```{r}
#| label: exp3-load-data
# demographics counts
exp3_d_demographics <- read.csv(
"data/exp3_demographics.csv",
stringsAsFactors = TRUE
)
# all survey responses
exp3_d_survey <- read.csv("data/exp3_survey.csv", stringsAsFactors = TRUE)
# accuracy data only has trials with pronouns
exp3_d_acc <- exp3_load_data_acc()
contrasts(exp3_d_acc$Pronoun) # check contrast coding added
contrasts(exp3_d_acc$Nametag)
contrasts(exp3_d_acc$Intro)
# distribution data has all trials
exp3_d_full <- exp3_load_data_dist()
```
## Motivation
Encouraging people to include their pronouns when introducing themselves and providing space for people to indicate their pronouns in display names, email signatures, and nametags are common recommendations for making environments inclusive of [TGD](0_introduction.qmd#def-TGD "trans and gender diverse") people [@richards2013]. Options to specify your pronouns are currently included in many social media platforms such as Instagram and LinkedIn, in institutional platforms such as Brightspace and Slack, and in tools such as Zoom and Github. Ideally, group norms of indicating pronouns makes disclosure less marked, which supports the individuals who need to explicitly state their pronouns in order to avoid being [misgendered](0_introduction.qmd#def-misgendering)---which is the majority of people who use they/them pronouns, in the majority of contexts.
Some recent research has investigated the effects of pronoun-sharing practices. Both TGD and other LGBQ+ people evaluated a potential workplace more positively when a biography of a staff member included that she used she/her pronouns, when she/her would have been assumed [@johnson2021]. This suggests that other people indicating their pronouns can act as an identity-safety cue when TGD and LGBQ+ people are forming initial appraisals of an environment, so they may be more likely to choose that environment and be more comfortable being out.[^exp3-1] Additionally, directly explaining that a character used they/them supported people's ability to correctly comprehend *they* as singular, not plural [@arnold2021] (see [Section 0.4.4](#names)).
[^exp3-1]: However, see @mcgonagill2023, discussed in [Section 0.7](#misgendering), for data about how nonbinary people felt that being out would negatively affect their job search and how this was borne out in experiments with resume response rates and hiring manager surveys. When an otherwise-identical resume included they/them pronouns, the applicant received less interest and was rated as less qualified.
An unanswered question, however, is whether pronoun-sharing practices affect people's language *production*---specifically, if they reduce the frequency of misgendering and support accurate use of singular *they*. While creating an environment where TGD people feel safe asking for the correct gendered language and where others understand the usage of singular *they* are both good outcomes, EDI practices need to affect allies' concrete behavior [e.g., @kattari2018], beyond their knowledge and attitudes.
In the first two experiments, I have argued for a model where learning to use they/them pronouns requires retrieving information about a person's pronouns from episodic memory, instead of inferring pronouns from morphosyntactic features of their name or from an inference about their gender. Experiment 1 demonstrated that when a character's pronouns cannot be inferred from their name, people can learn to associate pronouns with the character and use that information in language production, and Experiment 2 demonstrated that accurately producing they/them pronouns can be supported by providing participants with information about why paying attention to a person's pronouns is important. Experiment 3 moves from testing an intervention that may influence how participants pay attention to and attempt to recall information about a person's pronouns to comparing different ways of presenting information about pronouns. The current experiment investigates two practices for providing explicit information about what pronouns a person uses: stating pronouns when introducing someone, which makes this information highly salient at the beginning of the conversation, and including pronouns on someone's nametag/display name, which keeps this information accessible throughout the conversation. Ideally, pronoun-sharing practices will support production of singular *they*. However, pronoun-sharing practices may not consistently impact pronoun production---at all, or at least not to a degree that has real-world applicability. The frequency of seemingly-counterintuitive errors like "she uses they/them" shows that speakers may have information about a person's pronouns available, but still produce the incorrect pronoun.
## Methods
The design and analysis plan were [preregistered](https://osf.io/bt7yn "Experiment 3 Preregistration") on the Open Science Framework. Sources and attributions for the images are included with the [materials](https://github.com/bethanyhgardner/dissertation/tree/main/materials/exp3 "Experiment 3 Materials"), and the edited images are available upon request. The de-identified [data](https://github.com/bethanyhgardner/dissertation/blob/main/data "Experiment 3 Data") and [analysis code](https://github.com/bethanyhgardner/dissertation/blob/main/exp3.qmd "Source Code") are available at this dissertation's [Github repository](https://github.com/bethanyhgardner/dissertation "Github repository").
### Participants
```{r}
#| label: exp3-power-parameters
# get Pronoun * PSA interaction from Exp2 production model
load("r_data/exp2.RData")
exp2_r_effect_size <- exp2_m_prod@model %>%
tidy() %>%
filter(term == "Pronoun=They_HeShe:PSA=GenLang") %>%
pull(estimate) %>%
round(2)
exp2_r_effect_size # log-odds
exp(exp2_r_effect_size) # odds ratio
```
```{r}
#| label: exp3-power-data-struct
# start with 108 participants each doing 30 trials
exp3_pw_data_struct <- data.frame(
Participant = rep(as.factor(1:108),
each = 30
),
Trial = rep(
as.factor(1:30),
108
)
)
# Trials are split between 3 Pronoun Pair conditions, which are contrast-coded
# to compare:
# (1) They|HeShe vs HeShe|They + HeShe|SheHe
# (2) HeShe|They vs HeShe\|SheHe
exp3_pw_data_struct %<>% bind_cols(
"Pronoun" =
rep(
rep(
factor(c("He", "She", "They")),
each = 10
),
108
)
)
contrasts(exp3_pw_data_struct$Pronoun) <- cbind(
"_T vs HS" = c(.33, .33, -.66),
"_H vs S" = c(-.5, .5, 0)
)
# Nametag and Introduction conditions vary in a 2x2 between-P design, and both
# are mean-centered effects coded.
exp3_pw_data_struct %<>% bind_cols(
"Nametag" = rep(
rep(
factor(c(0, 0, 1, 1)),
each = 30
),
108 / 4
),
"Intro" = rep(
rep(
factor(c(0, 1, 0, 1)),
each = 30
),
108 / 4
)
)
contrasts(exp3_pw_data_struct$Nametag) <- cbind(
"_No_Yes" = c(-.5, .5)
)
contrasts(exp3_pw_data_struct$Intro) <- cbind(
"_No_Yes" = c(-.5, .5)
)
# Item is defined as each unique image-name-pronoun combination. There are 6
# sets of characters, and each list sees 3, making 18 unique characters.
exp3_pw_data_struct %<>% bind_cols(
"Character" =
rep(
as.factor(1:18),
each = 30 / 3,
108 / 6
)
)
str(exp3_pw_data_struct)
exp3_pw_data_struct %>%
group_by(Nametag, Intro) %>%
summarise(n_distinct(Participant))
```
```{r}
#| label: exp3-power-fixed
# The closest thing to existing data is the Exp2 (written) production task.
# Since interpreting effect sizes is apparently more complicated for logistic
# regression, let's go with the Exp2 results as a baseline. That's a rough
# estimate of how much harder they/them is to produce than he/him and she/her.
# And let's set the hypothetical Nametag and Introduction effects to be about
# the same size as the PSA. Hopefully that's small enough to be kind of
# conservative with the power analysis, but not aiming for effects too small to
# be practically relevant.
exp2_m_prod_fixed <- exp2_m_prod@model %>%
tidy() %>%
filter(effect == "fixed") %>%
select(term, estimate)
exp2_m_prod_fixed
# Predictions for Exp3 based on ranges from Exp2:
exp3_pw_fixed <- c(
+0.75, # Intercept Medium
+3.00, # Pronoun: T vs HS Largest
-0.10, # Pronoun: H vs S NS, maybe small
+0.10, # Nametag NS, maybe small
+0.10, # Introduction NS, maybe small
-2.00, # Pronoun: T vs HS * Nametag Same size as PSA interaction
-0.10, # Pronoun: H vs S * Nametag NS, maybe small
-2.00, # Pronoun: T vs HS * Intro Same size as PSA interaction
-0.10, # Pronoun: H vs S * Intro NS, maybe small
+0.25, # Nametag * Intro Maybe small
-2.00, # 3 way T vs HS Same size as PSA interaction
-0.10 # 3 way H vs S NS, maybe small
)
```
```{r}
#| label: exp3-power-random
# The model for the Exp2 production task only converged with random intercepts
# by item, and no random effects by participant.
exp2_m_prod_random <- VarCorr(exp2_m_prod@model)
exp2_m_prod_random
# The model for the Exp1 production task only converged with random intercepts
# and slopes by participant, and no random effects by item.
load("r_data/exp1.RData")
exp1_m_prod_random <- VarCorr(exp1a_m_prod@model)
exp1_m_prod_random
# So, I'll combine those two as a starting place to estimate the random effects.
# It's possible the actual data won't converge with the maximal random effects
# structure, but for now let's assume it will.
exp3_pw_random <- exp1_m_prod_random
exp3_pw_random[["Item"]] <- exp2_m_prod_random[["Name"]]
exp3_pw_random
```
```{r}
#| label: exp3-power-sim-model-data
#| cache: true
# Create model with this data structure, fixed effects, and random effects
exp3_pw_m_108 <- makeGlmer(
formula = SimAcc ~ Pronoun * Nametag * Intro +
(Pronoun | Participant) + (1 | Character),
family = binomial,
fixef = exp3_pw_fixed,
VarCorr = exp3_pw_random,
data = exp3_pw_data_struct
)
summary(exp3_pw_m_108)
# Simulate data
exp3_pw_sim_data <- doSim(exp3_pw_m_108)
exp3_pw_data_struct %<>% bind_cols("SimAcc" = exp3_pw_sim_data)
summary(exp3_pw_data_struct)
```
```{r}
#| label: exp3-power-simulated
#| eval: false
# Code to run simulation:
powerSim(
exp3_pw_m_108,
nsim = 1000,
test = fixed("Pronoun_T vs HS:Nametag_No_Yes", "z")
)
# Then extend model to larger N
exp3_pw_m_132 <- extend(exp3_pw_m_108,
along = "Participant", n = 132
)
```
```{r}
#| label: exp3-power-results
exp3_pw_results <- bind_rows(
.id = "sim",
"2_108" = readRDS("r_data/exp3_power_2way_N108.RDA") %>% summary(),
"2_132" = readRDS("r_data/exp3_power_2way_N132.RDA") %>% summary(),
"2_156" = readRDS("r_data/exp3_power_2way_N156.RDA") %>% summary(),
"2_180" = readRDS("r_data/exp3_power_2way_N180.RDA") %>% summary(),
"3_132" = readRDS("r_data/exp3_power_3way_N132.RDA") %>% summary(),
"3_156" = readRDS("r_data/exp3_power_3way_N156.RDA") %>% summary()
) %>%
mutate(
n_participants = str_sub(sim, 3),
effect = case_when(
str_sub(sim, 0, 1) == "2" ~ "Pronoun * Nametag/Intro",
str_sub(sim, 0, 1) == "3" ~ "Pronoun * Nametag * Intro"
)
) %>%
column_to_rownames(var = "sim")
```
A simulation-based power analysis using the *simr* package in R [@green2016] estimated the number of participants required to detect a 2-way interaction between the condition manipulation and pronoun type with the same effect size (`r exp2_r_prod['Pronoun=They_HeShe:PSA=GenLang', 'Beta']`, OR = `r round(exp(exp2_r_effect_size), 2)`) as the production task in Experiment 2. This indicated that 156 participants, each completing 30 trials, would have `r round(exp3_pw_results['2_156', 'mean'], 2)` \[`r round(exp3_pw_results['2_156', 'lower'], 2)`, `r round(exp3_pw_results['2_156', 'upper'], 2)`\] power at α = .05 to detect the interaction.
Participants were recruited from Prolific [@peer2022] and required to be over the age of 18, be native or advanced speakers of English, and have a device with a microphone to record audio. The task took approximately 20 minutes. `r n_distinct(exp3_d_survey$Participant)` participants are included in the analysis, with an additional 11 participants excluded for stopping the study before completing 25 test trials, having technical errors saving data, or having \>5 test trial recordings that did not include a response to the task. Participant demographics are described in @tbl-exp3-demographics1.
### Materials
#### Characters
Participants were introduced to 3 characters, each of whom was associated with a set of pronouns (1 he/him, 1 she/her, 1 they/them), a name, an image, a pictured brother character, and a pictured sister character. The character images were selected from *The Gender Spectrum Collection*, a stock photo library created to provide a diverse range of images of transgender and nonbinary people [@drucker2019]. The sibling [images](https://github.com/bethanyhgardner/dissertation/blob/main/materials/exp3/images.md "Experiment 3 Images") were selected from a free-use stock photo database. Each image was edited to show 1 person from the shoulders up with a white background. Nametags were shown in white text on a black bar along the bottom of the image, resembling display names in the Zoom interface. For characters, the nametags showed the first name and, depending on the condition, their pronouns. For siblings, the nametags showed *\[character name\]'s \[brother/sister\]*, in order to limit the number of names participants needed to learn and to elicit possessive pronouns referring to the character.
```{r}
#| label: exp3-norming-data
exp3_d_norming <- read.csv(
"data/exp3_image-norming.csv",
stringsAsFactors = TRUE
)
str(exp3_d_norming)
exp3_r_norming <- exp3_d_norming %>%
count(Pronoun) %>%
mutate(
mean = n / length(exp3_d_norming$Response),
percent = round(mean * 100, 0)
) %>%
column_to_rownames("Pronoun")
exp3_r_norming
```
Across the lists, there were 6 [images](https://github.com/bethanyhgardner/dissertation/blob/main/materials/exp3/images.md "Experiment 3 Images") for the main characters. These were selected by conducting a norming study on 12 images. Participants (N = `r n_distinct(exp3_d_norming$ParticipantID)`) on Prolific saw each image paired with a sentence completion prompt, which referred to the pictured person as "this person" and did not include a name (e.g., *This person made a mug of tea. Before it cooled...*). No information about pronouns was included, either in the instructions or in the prompts. Participants wrote a completion to each prompt, in order to measure which pronouns, if any, were chosen to refer to the character (@tbl-norming). Unlike in the first two studies, participants produced they/them frequently (`r exp3_r_norming['they/them', 'percent']`% of responses). This is potentially due to prompts not including names, as well as a different participant population on Prolific compared to MTurk. From the results of this norming study, 3 images where people did not produce she/her pronouns and 3 images where people did not produce he/him pronouns were selected. The goal was to create stimuli where we can expect that participants are primarily choosing between he/him and they/them or between she/her and they/them, not between all three, which may involve a different mechanism. This design allows us to test if including pronouns on nametags and in introductions increases accuracy for they/them, as compared to the pronouns that speakers would typically have defaulted to. This is the situation in which many people who use they/them find themselves, where they want people to stop using he/him or she/her pronouns. Additionally, the decision between he/him and she/her involves additional social dynamics that are outside the scope of the current study.
Participants were randomly assigned to 1 of 6 lists, in order to counterbalance the images and names associated with the character who uses they/them. Out of the 6 images, 3 appeared twice with he/him and once with they/them across lists, and 3 appeared twice with she/her and once with they/them across lists. There were 6 names, all gender-neutral: Alex, Casey, Jaime, Jordan, Sam, Taylor [@flowers2015]. While people who use they/them pronouns use a variety of names, this experiment uses gender-neutral names because counterbalancing the gender associations of the names within lists was not feasible. Critically, across lists they/them appears once with each image and once with each name, in order to avoid confounding interpretations about which aspects of a person's name or appearance may make it easier for someone to learn that they use they/them pronouns.
#### Pronoun Elicitation Task
Following a task established by @pozzan2017, each trial showed 2 characters in the center of the screen, with their siblings in the 4 corners (@fig-exp3-trial). An animation showed an object moving from a character to one of their siblings, and participants verbally described what happened. This was designed to elicit possessive pronouns about the target character, e.g., *Jaime gave the apple to their brother*. It also allowed participants to produce subject pronouns referring to the character, e.g., *They gave the apple to their brother*, or to avoid pronouns entirely, e.g., *Jaime gave the apple to Jaime's brother*. Trials manipulated which pronouns the two pictured characters used [\[Pronoun Pair\]]{.fw-semibold}: they/them targets with he/him or she/her distractors [\[They\|HeShe\]]{.fw-semibold}, he/him and she/her targets with they/them distractors [\[HeShe\|They\]]{.fw-semibold}, and he/him and she/her targets with she/her or he/him distractors [\[HeShe\|SheHe\]]{.fw-semibold}. Trials also counterbalanced whether the object was passed to the brother or the sister and the locations of the characters. These trial frames were identical for each of the 6 character lists. Unlike @pozzan2017, no filler trials were included, as it was not possible to conceal that the study was targeting pronoun production.
![Experiment 3: Example Trial in the +⁠Nametag condition, which preferentially <br>elicited "Jaime gave the apple to their brother."](materials/exp3/figures/stimuli.png){#fig-exp3-trial width="650"}
### Procedure
#### Introductions to Characters
Participants were randomly assigned to 1 of 4 between-participants conditions, manipulating what information about pronouns was given [\[+⁠Nametag vs --⁠Nametag; +⁠Introduction vs --⁠Introduction\]]{.fw-semibold}, then to 1 of 6 lists within each condition, counterbalancing the images and names of the characters. First, participants read introductions to 3 characters (1 he/him, 1 she/her, 1 they/them) (@fig-exp3-procedure). The characters were introduced by name, and in the +⁠Introduction condition, their pronouns were explicitly stated (e.g., *This is Jaime, who uses they/them pronouns*). The images associated with each character included their name, resembling a display name in Zoom; in the +⁠Nametag conditions, the images also included the character's pronouns in parentheses after their name. Each character had a brother and a sister, whose nametags indicated their relationship to the character. In all conditions, the facts about the character and the introductions to their siblings included 3 instances of the character's pronouns, with the character facts preceding the sibling introductions to reduce the ambiguity of singular *they* (i.e., not plural referring to the character and the sibling introduced next).
![Experiment 3: Stimuli and Procedure. \[A\] Example stimuli for the introductions to the characters, shown for the +⁠Nametag +⁠Introduction and --⁠Nametag --⁠Introduction conditions. \[B\] Experiment procedure.](materials/exp3/figures/procedure.png){#fig-exp3-procedure width="80%"}
#### Speech Production
Participants saw 1 example trial for each character, which demonstrated the frame *\[Name\] gave the \[object\] to \[their/his/her\] \[brother/sister\]* and included another instance of the character's pronouns. Participants then completed 1 practice trial for each character, to learn the timing of the task. Each scene, with the object moving from beside a character to beside their brother or sister, took a total of 5 seconds. Then the microphone recorded for 8 seconds, with the images remaining on the screen. After each practice trial, participants read feedback in the frame *Did you say something like, "\[Name\] gave the \[object\] to \[their/his/her\] \[brother/sister\]?"* At this point in the experiment, participants in the condition where the characters' pronouns were not directly indicated (--⁠Nametag --⁠Introduction) had observed 5 examples of each characters' pronouns. Participants then completed 30 test trials, which did not include feedback. The order of all trials was randomized. Trials were divided evenly between 3 within-subjects conditions, which varied the pronouns of both the target character and the other pictured character \[Pronoun Pair: They\|HeShe; HeShe\|They; HeShe\|SheHe\].
#### Survey
After the speech production task, participants completed a [survey](https://github.com/bethanyhgardner/dissertation/blob/main/materials/exp3/survey.md "Experiment 3 Survey") measuring their prior beliefs about singular *they* and [TGD](0_introduction.qmd#def-TGD "trans and gender diverse") identities. First, they judged 6 sentences using singular *they*: coreferring with [generic](0_introduction.qmd#def-generic "generic singular they") [antecedents](0_introduction.qmd#def-antecedent "antecedent") (e.g., *the ideal barista*), quantified antecedents (e.g., *each dog owner*, *every music fan*), and proper names (masculine, feminine, and gender-neutral). Items were drawn from @conrod2019, and participants rated them on a Likert scale with 1 being "very unnatural" and 7 being "very natural." Second, participants were asked about their prior familiarity with using they/them and pronoun-sharing practices. They could choose one or more options: use they/them for themself, close to someone who uses they/them, have met someone who uses they/them, have heard about using they/them but have not met anyone who does, and have not heard anything about using they/them. For including pronouns in introduction and in places like nametags or signatures, participants indicated frequency in the groups they were a part of (all, most, some, a few, none) and for themselves (always, usually, sometimes, rarely, never because prefer not to, never because had not heard of it). Third, participants completed Nagoshi et al.'s Transphobia Scale, which measures endorsement of gender essentialism and the gender binary, and discomfort with people who violate these expectations [@nagoshi2008; see also @tebbe2012]; this is referred to as the Gender Beliefs measure from here forward.
Finally, participants completed [demographic questions](https://github.com/bethanyhgardner/dissertation/blob/main/materials/exp3/demographics.md "Experiment 3 Demographic Questions"). They were asked about their age, gender, and sexuality, as prior work indicates that being younger and part of the LGBTQ+ community correlates with higher acceptability ratings for singular *they* [@camilliere2021; @conrod2019; @hekanaho2020; @hernandez2020]. The question about gender was two steps: a free-response box, then options to indicate whether their gender was the same or different than the sex indicated on their original birth certificate. This follows recommendations for identifying the broadest set of TGD people: anyone whose gender does not match their sex assigned at birth, of whom not all call themselves transgender. This format also accounts for the fact that terms for gender vary widely, allowing participants to choose the language that best describes them, but avoiding relying on terms that many participants may not be familiar with [@ansara2014; @cameron2019; NASEM, -@nasem2022; @zimman2017]. In addition to or instead of the options for sex assigned at birth, participants could indicate whether they considered themselves cisgender, transgender, or neither. Although these factors do not relate directly to the current research questions, participants were also asked about their race, ethnicity, and education level, in order to characterize the participant sample [@buchanan2021]. All demographic questions included the option to not respond. The experiment was coded and hosted using PCIbex [@zehr2018].
## Predictions
Like in the first two experiments, we expect to observe lower accuracy for they/them characters compared to he/him and she/her characters, but recall that the characters in Experiment 3 differ in several ways. First, instead of masculine or feminine names, where two thirds of the characters used the expected he/him or she/her and one third used they/them, all of the names here are gender-neutral. If participants rely on lexical knowledge about the gender associations of the name to select a pronoun, responses would be split between he/him or she/her, instead of being strongly biased to one or the other. Second, the characters now include images, which provide additional information that participants may be using to make an inference about the character's gender and then to select pronouns. Third---while still brief---the introductions to the characters here contain more repetitions of the character's pronouns. While the introductions to the characters in Experiments 1 & 2 stated their pronouns directly but did not use pronouns to refer to the character (e.g., *This is Emily, who uses they/them pronouns. Emily...*), participants in all four Experiment 3 conditions see each character's pronouns used three times in the introductions, once in the example trials, and once in the practice trials. Putting aside potential differences between spoken and written production for the moment, this means that we may see higher accuracy for they/them in the --⁠Nametag --⁠Introduction condition than in Experiments 1 & 2, since information about the characters' pronouns is presented multiple times.
The primary hypotheses concern whether the Nametag and Introduction conditions attenuate the lower accuracy of singular *they*. Including pronouns in introductions makes the information about pronouns salient at the beginning. If speakers use this information in production---presumably by retrieving it from episodic memory---we would expect to see a smaller penalty for they/them in the two +⁠Introduction conditions. Alternatively, if speakers do not remember the information about the character's pronouns from the beginning of the experiment, or if this information is not used when selecting the pronoun to produce, we would see no differences between the +⁠Introduction and --⁠Introduction conditions.
Including pronouns on the characters' nametags keeps the information accessible throughout the experiment, and compared to the Introduction manipulation, does not require speakers to retrieve information from episodic memory. If speakers use the nametag information when selecting the pronoun to produce, we would expect to see a smaller penalty for they/them in the two +⁠Nametag conditions. If speakers do not use the nametag information, instead relying on their lexical knowledge of the name or an inference about the character's gender based on their appearance, we would see no differences between the +⁠Nametag and --⁠Nametag conditions.
If the introductions and nametags do reduce the relative difficulty of singular *they*, the combination of the two may be more effective than just one, resulting in the higher accuracy for the +⁠Nametag +⁠Introduction condition compared to the +⁠Nametag --⁠Introduction and the --⁠Nametag +⁠Introduction conditions. This could result if including pronouns in introductions directs people to pay attention to the nametags, and if the nametags serve as a cue to retrieve the a memory of the introduction information.
## Results
### Participant Backgrounds
```{r}
#| label: exp3-demographic-counts
# Age
exp3_r_age <- exp3_d_survey %>%
filter(Category == "Age") %>%
select(ParticipantID, Response_Num) %>%
summarise(
min = min(Response_Num, na.rm = TRUE),
med = median(Response_Num, na.rm = TRUE),
max = max(Response_Num, na.rm = TRUE)
) %>%
pivot_longer(
cols = c("min", "med", "max"),
values_to = "stat"
) %>%
column_to_rownames("name")
# Gender
exp3_r_gender <- exp3_d_demographics %>%
filter(Category == "Gender" & Group != "Total") %>%
select(Group, Total) %>%
column_to_rownames("Group")
# TGD
exp3_r_TGD <- exp3_d_survey %>%
filter(Category == "Transgender & Gender-Diverse" &
(str_detect(Item, "My gender is different") |
str_detect(Item, "consider myself transgender")) &
Response_Bool == TRUE) %>%
pull(ParticipantID) %>%
n_distinct()
# LGBQ+
exp3_r_LGBQ <- exp3_d_survey %>%
filter(Category == "Sexuality" &
str_detect(Item, "Asexual|Bi|Gay|Queer") &
Response_Bool == TRUE) %>%
pull(ParticipantID) %>%
n_distinct()
```
```{r}
#| label: exp3-survey-ratings-means
# Subset data
exp3_d_ratings <- exp3_d_survey %>%
filter(Category == "Sentence Naturalness Ratings" &
!is.na(Response_Num)) %>%
select(ParticipantID, Item, Response_Num) %>%
mutate(Type = ifelse(str_detect(Item, "Name"), "Name", "Indefinite"))
# Means
exp3_r_rating_means <- exp3_d_ratings %>%
group_by(Type) %>%
summarise(
mean = mean(Response_Num, na.rm = TRUE),
SD = sd(Response_Num, na.rm = TRUE)
) %>%
column_to_rownames("Type") %>%
round(2)
exp3_r_rating_means
```
```{r}
#| label: exp3-survey-ratings-model
# Mean-center according to scale
exp3_d_ratings %<>% mutate(Response_Centered = Response_Num - 4)
# Compare names to indefinites
exp3_d_ratings$Type %<>% as.factor()
contrasts(exp3_d_ratings$Type) <- cbind("=Name_Indefinite" = c(+.5, -.5))
contrasts(exp3_d_ratings$Type)
exp3_m_ratings <- lmer(
formula = Response_Centered ~ Type + (1 | Item) + (Type | ParticipantID),
data = exp3_d_ratings
)
summary(exp3_m_ratings)
exp3_r_ratings <- exp3_m_ratings %>%
tidy_model_results() %>%
mutate(Text = str_replace(Text, "z", "t"))
```
```{r}
#| label: exp3-survey-gender-beliefs
# Subset & scale data
exp3_d_gender_beliefs <- exp3_d_survey %>%
filter(Category == "Transphobia Scale" & !is.na(Response_Num)) %>%
mutate(Response_Scaled = Response_Num - 1) %>%
group_by(ParticipantID) %>%
summarise(Total = sum(Response_Scaled))
# Summary stats
exp3_r_gender_beliefs <- exp3_d_gender_beliefs %>%
summarise(
min = min(Total),
max = max(Total),
mean = mean(Total) %>% round(2),
SD = sd(Total) %>% round(2),
)
exp3_r_gender_beliefs
```
Participants were older than the typical college student sample (range = `r exp3_r_age['min','stat']`--`r exp3_r_age['max','stat']`, Mdn = `r exp3_r_age['med','stat']`). Around half the participants were women, and 6 were under the nonbinary umbrella. `r exp3_r_TGD` participants said that their gender was different than their sex assigned at birth and/or that they considered themselves transgender, and `r exp3_r_LGBQ` were LGBQ+ (@tbl-exp3-demographics1). These rates are somewhat higher than the U.S. average, but in line with previous data about the Prolific participant population [@douglas2023]. Overall, just about all participants were at least somewhat familiar with singular *they* before the experiment: a third had heard about people using they/them pronouns but had not met anyone who does, a third had met but were not close to anyone who uses they/them, and a third were close to someone who uses they/them and/or used they/them themselves ([Figure @fig-exp3-survey]D). Similarly, most participants were familiar with including pronouns when introducing yourself and on nametags/display names, but didn't consider it a part of their or their social circles' norms. When describing their own habits, about half said they never do either because they prefer not to, about a quarter said they do rarely or sometimes, and about a tenth said they do usually or always ([Figure @fig-exp3-survey]B). When describing what people around them do, about a third were never around people who share pronouns, about half were rarely or sometimes around people who share pronouns, and about a fifth were usually or always around people who share pronouns ([Figure @fig-exp3-survey]C). Including pronouns on nametags was somewhat more common than including pronouns in introductions, which is unsurprising given that the former can be less marked. When rating the naturalness of singular *they* coreferring with different types of referents ([Figure @fig-exp3-survey]A), acceptance of indefinite forms was generally high (*M* = `r exp3_r_rating_means['Indefinite', 'mean']`, *SD* = `r exp3_r_rating_means['Indefinite', 'SD']`), and acceptance of proper names was more variable (*M* = `r exp3_r_rating_means['Name', 'mean']`, *SD* = `r exp3_r_rating_means['Name', 'SD']`) and was significantly lower (`r exp3_r_ratings['Type=Name_Indefinite', 'Text']`) (@tbl-exp3-ratings). For gender beliefs [@nagoshi2008], responses on a 1--7 Likert scale were scaled to the 0--6 range, giving a total range of 0--54, with higher scores indicating higher endorsement of the gender binary and gender essentialism and thus less favorable attitudes about trans and gender-nonconforming people ([Figure @fig-exp3-survey]E). Participant totals spanned the entire scale (range = `r exp3_r_gender_beliefs$min`--`r exp3_r_gender_beliefs$max`), but were skewed towards the lower end, with a mean response that was moderately favorable towards trans and gender-nonconforming people (*M* = `r exp3_r_gender_beliefs$mean`, *SD* = `r exp3_r_gender_beliefs$SD`; see @tbl-exp3-gender-beliefs for item text and means). While this experiment did not include direct measures of political affiliation, other studies show that the Prolific population skews left, with 35% identifying as a strong Democrat, and only 20% identifying as a strong, weak, or independent Republican [@douglas2023].
| |
|-----|
| |
: Experiment 3: Participant Demographics. The trans & gender diverse and sexuality categories have variable totals, as participants could select multiple options. Participant education, English experience, and race/ethnicity are included in the appendix (@tbl-exp3-demographics2). {#tbl-exp3-demographics1 .borderless}
```{r ft.align="left"}
#| output: true
demographics_table(
exp3_d_demographics,
categories = c("Age", "Gender", "Transgender & Gender-Diverse", "Sexuality"),
title = "Experiment 3: Participant Demographics"
)
```
```{r}
#| label: fig-exp3-survey
#| fig-cap: "[A] Naturalness ratings (1 = very unnatural, 7 = very natural) for singular *they* coreferring with indefinites and proper names. [B] Frequency that participants include their pronouns when introducing themselves and in places like nametags. [C] Frequency that the participants’ social circles include pronouns in introductions and on nametags. [D] Experience with using they/them. [E] Gender binary and essentialism beliefs [@nagoshi2008], with higher scores indicating higher endorsement and thus more negative attitudes about trans and gender non-conforming people. The black line is the mean response."
#| fig-asp: 1.25
#| output: true
#| cache: true
# Ratings----
exp3_p_ratings <- exp3_d_survey %>%
filter(Category == "Sentence Naturalness Ratings") %>%
filter(!is.na(Response_Num)) %>% # missing data
mutate(
Response_Num = Response_Num %>%
as.factor() %>%
fct_rev() %>%
recode("7" = "7 Very Natural"),
Item = Item %>%
as.factor() %>%
droplevels() %>%
str_replace("\n", " ") %>%
fct_relevel("Generic", after = 0) %>%
fct_relevel("Every", after = 1) %>%
fct_relevel("Neutral Name", after = 3) %>%
fct_relevel("Fem Name", after = 5)
) %>%
ggplot(aes(y = fct_rev(Item), fill = Response_Num)) +
geom_bar(position = "fill") +
scale_x_continuous(expand = c(0, 0)) +
scale_y_discrete(expand = c(0, 0)) +
scale_fill_brewer(
palette = "Spectral", direction = -1,
guide = guide_legend(
title = "Very Unnatural",
byrow = TRUE, nrow = 1,
direction = "horizontal", reverse = TRUE,
keywidth = .8, keyheight = .8
)
) +
theme_classic() +
survey_theme +
labs(
title = "Singular <i>They</i> Naturalness Ratings",
x = element_blank(), y = element_blank()
)
# Pronoun sharing: self----
exp3_p_sharing_self <- exp3_d_survey %>%
filter(
str_detect(Category, "Sharing") &
str_detect(Item, "Self") & !is.na(Response_Cat)
) %>%
select(ParticipantID, Item, Response_Cat) %>%
group_by(Item, Response_Cat) %>%
summarise(n = n_distinct(ParticipantID)) %>%
mutate(
Item = Item %>%
droplevels() %>%
recode_factor("Intros: Self" = "Intros", "Nametags: Self" = "Nametags"),
Response_Cat = Response_Cat %>%
droplevels() %>%
recode_factor(
"Never, because I had not heard of this before" = "Not Heard About",
"Never, because I prefer not to" = "Prefer Not"
) %>%
factor(
ordered = TRUE,
levels = c(
"Always", "Usually", "Sometimes", "Rarely", "Prefer Not",
"Not Heard About"
))
) %>%
ggplot(aes(x = n, y = Item, fill = Response_Cat)) +
geom_bar(position = "fill", stat = "identity") +
scale_fill_manual(values = c(
rainbow_primary["purple", "Color"],
rainbow_primary["blue", "Color"],
rainbow_primary["green", "Color"],
rainbow_primary["yellow", "Color"],
rainbow_primary["orange", "Color"],
rainbow_primary["red", "Color"]
)) +
scale_x_continuous(expand = c(0, 0)) +
scale_y_discrete(expand = c(0, 0)) +
theme_classic() +
survey_theme +
labs(
title = "Familiarity With Pronoun-Sharing Practices: Self",
x = element_blank(), y = element_blank()
) +
guides(fill = guide_legend(
title = NULL,
byrow = TRUE, nrow = 2, ncol = 6,
reverse = TRUE,
direction = "horizontal",
keywidth = .8, keyheight = .8
))
# Pronoun sharing: others----
exp3_p_sharing_others <- exp3_d_survey %>%
filter(
str_detect(Category, "Sharing") &
str_detect(Item, "Others") & !is.na(Response_Cat)
) %>%
select(ParticipantID, Item, Response_Cat) %>%
group_by(Item, Response_Cat) %>%
summarise(n = n_distinct(ParticipantID)) %>%
mutate(
Item = Item %>%
droplevels() %>%
recode_factor(
"Intros: Others" = "Intros",
"Nametags: Others" = "Nametags"
),
Response_Cat = Response_Cat %>%
droplevels() %>%
recode_factor("A few" = "A Few") %>%
factor(
levels = c("All", "Most", "Some", "A Few", "None"),
ordered = TRUE
)
) %>%
ggplot(aes(x = n, y = Item, fill = Response_Cat)) +
geom_bar(position = "fill", stat = "identity") +
scale_fill_manual(values = c(
rainbow_primary["blue", "Color"],
rainbow_primary["green", "Color"],
rainbow_primary["yellow", "Color"],
rainbow_primary["orange", "Color"],
rainbow_primary["red", "Color"]
)) +
scale_x_continuous(expand = c(0, 0)) +
scale_y_discrete(expand = c(0, 0), ) +
theme_classic() +
survey_theme +
labs(
title = "Familiarity With Pronoun-Sharing Practices: Others",
x = element_blank(), y = element_blank()
) +
guides(fill = guide_legend(
title = NULL,
byrow = TRUE, nrow = 2, ncol = 6,
reverse = TRUE,
direction = "horizontal",
keywidth = .8, keyheight = .8
))
# Experience using they/them----
exp3_p_familiarity <- exp3_d_survey %>%
filter(str_detect(Category, "They/Them")) %>%
filter(Item != "Aggregate" & Response_Bool == TRUE) %>%
select(ParticipantID, Item, Response_Bool) %>%
pivot_wider(
names_from = Item,
values_from = Response_Bool
) %>%
mutate(`Myself + Close To` = ifelse(
Myself == TRUE & `Close To` == TRUE, TRUE, NA
)) %>%
mutate(.keep = c("unused"), HighestFamiliarity = case_when(
`Myself + Close To` == TRUE ~ "Myself +\nClose To",
`Myself` == TRUE ~ "Myself",
`Close To` == TRUE ~ "Close To",
`Have Met` == TRUE ~ "Have Met",
`Heard About` == TRUE ~ "Heard About",
`Not Heard About` == TRUE ~ "Not Heard\nAbout"
)) %>%
group_by(HighestFamiliarity) %>%
summarise(n = n_distinct(ParticipantID)) %>%
mutate(
Label = "Highest\nFamiliarity",
HighestFamiliarity %<>% factor(
levels = c(
"Myself +\nClose To", "Myself", "Close To",
"Have Met", "Heard About", "Not Heard\nAbout"
),
ordered = TRUE
)
) %>%
ggplot(aes(y = Label, x = n, fill = HighestFamiliarity)) +
geom_bar(position = "fill", stat = "identity") +
scale_fill_brewer(
palette = "Spectral", direction = -1,
guide = guide_legend(
title = NULL, ncol = 6,
direction = "horizontal", reverse = TRUE,
keywidth = .8, keyheight = .8
)
) +
scale_x_continuous(expand = c(0, 0)) +
scale_y_discrete(expand = c(0, 0)) +
theme_classic() +
survey_theme +
labs(
title = "Experience Using They/Them Pronouns",
x = element_blank(),
y = element_blank(),
fill = element_blank()
) +
guides(fill = guide_legend(
title = NULL,
ncol = 6,
reverse = TRUE,
direction = "horizontal",
keywidth = .8, keyheight = .8
))
# Gender beliefs----
exp3_p_gender_beliefs <- exp3_d_gender_beliefs %>%
ggplot(aes(x = Total, fill = as.factor(Total))) +
geom_histogram(binwidth = 1, show.legend = FALSE) +
geom_vline(aes(xintercept = mean(Total))) +
coord_cartesian(xlim = c(54, 0), expand = 0, clip = "off") +
scale_y_continuous(breaks = c(1, 5, 10)) +
scale_fill_manual(
values = rainbow %>%
filter(Score %in% exp3_d_gender_beliefs$Total) %>%
pull(Color)
) +
theme_classic() +
survey_theme +
theme(axis.title.y = element_text(
angle = 0, margin = margin(r = -0.9, unit = "in")
)) +
labs(
title = "Gender Binary & Gender Essentialism Beliefs",
x = "More Endorsement – Less Endorsement",
y = "N\nParticipants"
)
# Combine----
(exp3_p_ratings / exp3_p_sharing_self / exp3_p_sharing_others /
exp3_p_familiarity / exp3_p_gender_beliefs) +
plot_layout(heights = c(2.5, 1, 1, 0.75, 1.5)) +
plot_annotation(
tag_levels = "A",
title = "Experiment 3: Prior Familiarity & Attitudes",
theme = patchwork_theme
) +
plot_annotation(theme = theme(
plot.margin = margin(t = 5, b = 0, l = 5, r = 5)
))
```
### Distribution of Pronouns Produced
```{r}
#| label: exp3-counts
# N trials
exp3_n_subj <- n_distinct(exp3_d_full$ParticipantID)
exp3_n_trials_max <- exp3_n_subj * 30 # trials expected
exp3_n_trials_total <- length(exp3_d_full$ParticipantID) # total trials in data
# % trials not recorded/not completing task
exp3_prop_trials_excluded <- exp3_n_trials_total / exp3_n_trials_max
exp3_prop_trials_excluded <- round((1 - exp3_prop_trials_excluded) * 100, 2)
# number of subject pronouns (vs possessive)
exp3_n_subject_pro <- exp3_d_full %>%
select(He, She, They) %>%
summarise(
He = sum(He),
She = sum(She),
They = sum(They)
) %>%
rotate_df() %>%
rename("n" = "V1")
exp3_n_subject_pro
# number of multiple pronouns/corrections
exp3_n_multiple <- exp3_d_full %>%
filter(MultiplePronouns == 1) %>%
count(T_Pronoun, PronounProduced, His, Her, Their) %>% # count combinations
mutate(CorrectPronoun = case_when( # get correct possessive form
T_Pronoun == "he/him" ~ "his",
T_Pronoun == "she/her" ~ "her",
T_Pronoun == "they/them" ~ "their"
)) %>% # pronoun produced is final pronoun, so figure out first pronoun
mutate(FirstPronoun = case_when(
His == 1 & PronounProduced != "his" ~ "his",
Her == 1 & PronounProduced != "her" ~ "her",
Their == 1 & PronounProduced != "their" ~ "their"
)) %>%
mutate(PronounCombo = str_c(FirstPronoun, PronounProduced, sep = " ")) %>%
group_by(PronounCombo) %>% # sum pairs of pronouns
summarise(n = sum(n)) %>% # which collapses over accuracy of final pronoun
column_to_rownames("PronounCombo")
exp3_n_multiple
exp3_prop_multiple <- (
(sum(exp3_n_multiple$n) / exp3_n_trials_total) * 100
) %>%
format(digits = 2, nsmall = 2)
# number of trials with no pronouns
exp3_n_none <- exp3_d_full %>%
filter(None == 1) %>%
group_by(T_Pronoun) %>%
summarise(n = n()) %>%
column_to_rownames("T_Pronoun")
exp3_n_none
exp3_prop_none <- ((sum(exp3_n_none$n) / exp3_n_trials_total) * 100) %>%
round(2)
```
```{r}
#| label: exp3-test-no-pronouns
exp3_t_none <- t.test(
exp3_d_full %>% filter(T_Pronoun != "they/them") %>% pull(None),
exp3_d_full %>% filter(T_Pronoun == "they/them") %>% pull(None)
)
exp3_t_none
exp3_r_none <- exp3_t_none %>% tidy_t_results()
```
Trials were automatically transcribed using *whisper* [@radford2022], then checked to include disfluencies. After excluding trials that were inaudible or did not include a response to the task (`r exp3_prop_trials_excluded`% of data), `r exp3_n_trials_total` trials were included in the analysis. Each trial was coded for pronoun(s) referring to the target character, which occurred in nearly all trials (`r 100 - exp3_prop_none`%). Because subject pronouns were infrequent (`r exp3_n_subject_pro['He', 'n']` *he*, `r exp3_n_subject_pro['She', 'n']` *she*, `r exp3_n_subject_pro['They', 'n']` *they*) and did not occur in trials without a corresponding possessive pronoun, the analyses only include possessive pronouns. There were no outliers between the 6 lists varying the name-image-pronoun combinations (@fig-exp3-by-character).
[Figure @fig-exp3-dist]A shows the distribution of final pronouns produced by target character and condition. Trials with one pronoun are shown in darker colors; trials with multiple pronouns (e.g., *Jaime gave the apple to her bro---to their brother*, `r exp3_prop_multiple`%) show the final pronoun in lighter colors. Participants were numerically more likely to not use pronouns for they/them characters (N = `r exp3_n_none['they/them', 'n']`) than for he/him (N = `r exp3_n_none['he/him', 'n']`) and she/her characters (N = `r exp3_n_none['she/her', 'n']`), but the comparison between the mean rates of no-pronoun responses for they/them and he/him + she/her was not statistically significant, *t*(`r exp3_r_none$df`) = `r exp3_r_none$t`, `r exp3_r_none$p`. Rather, participants who only used names (e.g., *Jaime gave the apple to Jaime's brother*) tended to do so for all 3 characters. In trials where participants produced multiple pronouns, self-corrections from *his* to *their* (N = `r exp3_n_multiple['his their', 'n']`) and *her* to *their* (N = `r exp3_n_multiple['her their', 'n']`) were more common than self-corrections from *their* to *his* (N = `r exp3_n_multiple['their his', 'n']`) or *her* (N = `r exp3_n_multiple['their her', 'n']`), or between *his* and *her* (N = `r exp3_n_multiple['his her', 'n']`, N = `r exp3_n_multiple['her his', 'n']`). Unexpectedly, *their* responses for each participant were typically at floor or near ceiling ([Figure @fig-exp3-dist]B), with the Nametag and Introduction conditions affecting whether a participant produced *their* at all, more than affecting accuracy within participants who produced *their* in some trials.
```{r}
#| label: fig-exp3-dist
#| fig-cap: "Experiment 3: Distribution of Responses.[A] Final pronoun produced. Trials where participants used multiple pronouns to refer to the character (e.g., *Jaime gave the apple to her bro---to their brother*) are grouped based on the final pronoun and shown in lighter colors. [B] Number of *their* responses per participant."
#| fig-asp: 1
#| output: true
#| cache: true
# Distribution----
exp3_p_dist <- exp3_load_data_dist() %>%
group_by(CondLabels, T_Pronoun, PronounProduced, Order) %>%
summarise(n = n()) %>%
ggplot(aes(
x = T_Pronoun, y = n,
fill = PronounProduced, alpha = Order
)) +
geom_bar(stat = "identity", position = "fill") +
facet_wrap(~CondLabels) +
scale_alpha_discrete(range = c(.5, 1)) +
scale_fill_manual(values = c("#1B9E77", "#D95F02", "#7570B3", "gray50")) +
scale_x_discrete(expand = c(0, 0)) +
scale_y_continuous(expand = c(0, 0)) +
theme_classic() +
dissertation_plot_theme +
white_facet_theme +
labs(
title = "Final Pronouns Produced",
x = "Character Pronouns",
y = "Proportion of Responses",
alpha = "Pronoun Position",
fill = "Pronoun Produced"
)
# They/them total----
exp3_p_they <- exp3_load_data_dist() %>%
mutate(IsThey = ifelse(
PronounProduced == "their", 1, 0
)) %>%
group_by(CondLabels, ParticipantID) %>%
summarise(nThey = sum(IsThey)) %>%
mutate(
Col = "",
nThey = nThey %>%
as.factor() %>%
fct_recode(
"1–3" = "1", "1–3" = "2", "1–3" = "3", "4–6" = "4", "4–6" = "5",
"4–6" = "6", "7–9" = "7", "7–9" = "8", "7–9" = "9",
"10 (Correct)" = "10", "11+" = "11", "11+" = "14", "11+" = "20"
) %>%
factor(
ordered = TRUE,
levels = c("0", "1–3", "4–6", "7–9", "10 (Correct)", "11+")
)
) %>%
ggplot(aes(x = Col, fill = nThey)) +
facet_wrap(~CondLabels) +
geom_bar(position = "fill") +
scale_fill_manual(values = c("#666666", brewer.pal(5, "Purples"))) +
scale_x_discrete(expand = c(0, 0)) +
scale_y_continuous(expand = c(0, 0)) +
theme_classic() +
dissertation_plot_theme +
white_facet_theme +
theme(
legend.box.margin = margin(b = 0.25, unit = "in"),
plot.margin = margin(b = -0.20, unit = "in"),
plot.title = element_markdown(lineheight = 1.1, size = 12, face = "bold"),
) +
guides(fill = guide_legend(
byrow = TRUE, keywidth = unit(0.25, "in"),
keyheight = unit(0.245, "in")
)) +
labs(
title = "<i>Their</i> Responses",
x = element_blank(),
y = "Proportion of Participants",
fill = "Total Per Participant"
)
# Combine----
exp3_p_dist + exp3_p_they +
plot_layout(heights = c(1.25, 1)) +
plot_annotation(
title = "Experiment 3: Distribution of Responses",
tag_levels = "A",
theme = patchwork_theme
)
```
### Pronoun Accuracy
The primary analysis measured accuracy of pronouns referring to the target character (@fig-exp3-acc). Trials where participants produced different pronouns (`r exp3_prop_multiple`%) were coded based on the final pronoun (e.g., *Jaime gave the apple to her bro---to their brother* would be coded based on the accuracy of *their*); trials with no pronouns (`r exp3_prop_none`%) were excluded from this analysis. Pronoun was manipulated between both the character described (target) and the other character pictured on the screen (distractor). The first Pronoun Pair contrast compared trials with they/them target characters to trials with he/him and she/her target characters (They\|HeShe vs HeShe\|They + HeShe\|They). Within he/him and she/her character trials, the second contrast compared trials with they/them distractors to trials with he/him and she/her distractors (HeShe\|They vs HeShe\|They). There were no significant effects of the second Pronoun Pair contrast, so for simplicity's sake, the first Pronoun Pair contrast is referred to as the effect of Pronoun from here on. The fixed effects of Nametag and Introduction (between-participants) were both mean-center effects coded. The maximal model justified by the experimental design [@baayen2008; @barr2013] included by-participant slopes for Pronoun and by-item intercepts. Item was defined as the combinations of names, images, and pronouns that varied across the 6 lists of characters; because these combinations did not fully vary across pronouns, by-item random slopes were not included. The final model (@tbl-exp3-acc) included all interactions between fixed effects, plus by-item and by-participant intercepts [@bates2015; @rcoreteam2023; @voeten2023].
```{r}
#| label: fig-exp3-acc
#| fig-cap: "Experiment 3: Production Accuracy, split by Nametag and Introduction conditions. Trials using no pronouns are excluded. By-participant means are shown as points; error bars indicate 95% CIs calculated over the by-participant means."
#| fig-asp: 0.6
#| output: true
#| cache: true
exp3_load_data_dist() %>%
group_by(ParticipantID, CondLabels, Pronoun_Pair, T_Pronoun) %>%
summarise(SubjMean = mean(Accuracy, na.rm = TRUE)) %>%
filter(!is.na(SubjMean)) %>% # one subj who used 0 pronouns
ggplot(aes(
x = T_Pronoun, fill = T_Pronoun, color = T_Pronoun,
y = SubjMean)) +
stat_summary(
fun.data = mean_cl_boot, geom = "bar",
alpha = 0.4, color = "white"
) +
geom_point(
position = position_jitter(height = 0.02, width = 0.4, seed = 3),
size = 0.5
) +
stat_summary(
fun.data = mean_cl_boot, geom = "errorbar",
color = "black", linewidth = 0.5, width = 0.5
) +
facet_wrap(~CondLabels) +
scale_color_brewer(palette = "Dark2") +
scale_fill_brewer(palette = "Dark2") +
scale_x_discrete(expand = c(0, 0)) +
theme_classic() +
dissertation_plot_theme +
white_facet_theme +
guides(color = guide_none(), fill = guide_none()) +
labs(
title =
"Experiment 3: Production Accuracy by Pronoun Information Condition",
x = "Character Pronouns",
y = "By-Participant Mean Accuracy"
)
```
```{r}
#| label: exp3-mean-acc
exp3_r_means <- exp3_d_acc %>%
mutate(Pronoun = ifelse(Pronoun == "T_HS", "T", "HS")) %>%
group_by(Pronoun, Nametag, Intro) %>%
summarise( # they and he/she for each condition
mean = mean(Accuracy, na.rm = TRUE),
sd = sd(Accuracy, na.rm = TRUE)
) %>%
ungroup() %>%
add_row( # they across conditions
Pronoun = "T", Nametag = "All", Intro = "",
mean = exp3_d_acc %>%
filter(Pronoun == "T_HS") %>%
pull(Accuracy) %>%
mean(),
sd = exp3_d_acc %>%
filter(Pronoun == "T_HS") %>%
pull(Accuracy) %>%
sd()
) %>%
add_row( # he+she across conditions
Pronoun = "HS", Nametag = "All", Intro = "",
mean = exp3_d_acc %>%
filter(Pronoun != "T_HS") %>%
pull(Accuracy) %>%
mean(),
sd = exp3_d_acc %>%
filter(Pronoun != "T_HS") %>%
pull(Accuracy) %>%
sd()
) %>%
mutate(.keep = c("unused"),
Condition = str_c(Pronoun, Nametag, Intro, sep = " ")
) %>%
column_to_rownames("Condition") %>%
round(2) %>%
format(nsmall = 2)
exp3_r_means
```
```{r}
#| label: exp3-model-buildmer
#| cache: true