STEI-estimates/diff.tex at main · USFWS/STEI-estimates · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
% Options for packages loaded elsewhere
%DIF LATEXDIFF DIFFERENCE FILE
%DIF DEL STEI__report_plos_reformat.tex           Thu Jan 22 14:45:55 2026
%DIF ADD STEI__report_plos_reformat_revised.tex   Thu Mar 26 09:31:08 2026
\PassOptionsToPackage{unicode}{hyperref}
\PassOptionsToPackage{hyphens}{url}
%


\PassOptionsToPackage{table}{xcolor}

\documentclass[
  10pt,
  letterpaper,
]{article}

\usepackage{amsmath,amssymb}
\usepackage{iftex}
\ifPDFTeX
  \usepackage[T1]{fontenc}
  \usepackage[utf8]{inputenc}
  \usepackage{textcomp} % provide euro and other symbols
\else % if luatex or xetex
  \usepackage{unicode-math}
  \defaultfontfeatures{Scale=MatchLowercase}
  \defaultfontfeatures[\rmfamily]{Ligatures=TeX,Scale=1}
\fi
\usepackage{lmodern}
\ifPDFTeX\else
    % xetex/luatex font selection
\fi
% Use upquote if available, for straight quotes in verbatim environments
\IfFileExists{upquote.sty}{\usepackage{upquote}}{}
\IfFileExists{microtype.sty}{% use microtype if available
  \usepackage[]{microtype}
  \UseMicrotypeSet[protrusion]{basicmath} % disable protrusion for tt fonts
}{}
\makeatletter
\@ifundefined{KOMAClassName}{% if non-KOMA class
  \IfFileExists{parskip.sty}{%
    \usepackage{parskip}
  }{% else
    \setlength{\parindent}{0pt}
    \setlength{\parskip}{6pt plus 2pt minus 1pt}}
}{% if KOMA class
  \KOMAoptions{parskip=half}}
\makeatother
\usepackage{xcolor}
\usepackage[top=0.85in,left=2.75in,footskip=0.75in]{geometry}
\setlength{\emergencystretch}{3em} % prevent overfull lines
\setcounter{secnumdepth}{-\maxdimen} % remove section numbering


\providecommand{\tightlist}{%
  \setlength{\itemsep}{0pt}\setlength{\parskip}{0pt}}\usepackage{longtable,booktabs,array}
\usepackage{calc} % for calculating minipage widths
% Correct order of tables after \paragraph or \subparagraph
\usepackage{etoolbox}
\makeatletter
\patchcmd\longtable{\par}{\if@noskipsec\mbox{}\fi\par}{}{}
\makeatother
% Allow footnotes in longtable head/foot
\IfFileExists{footnotehyper.sty}{\usepackage{footnotehyper}}{\usepackage{footnote}}
\makesavenoteenv{longtable}
\usepackage{graphicx}
\makeatletter
\newsavebox\pandoc@box
\newcommand*\pandocbounded[1]{% scales image to fit in text height/width
  \sbox\pandoc@box{#1}%
  \Gscale@div\@tempa{\textheight}{\dimexpr\ht\pandoc@box+\dp\pandoc@box\relax}%
  \Gscale@div\@tempb{\linewidth}{\wd\pandoc@box}%
  \ifdim\@tempb\p@<\@tempa\p@\let\@tempa\@tempb\fi% select the smaller of both
  \ifdim\@tempa\p@<\p@\scalebox{\@tempa}{\usebox\pandoc@box}%
  \else\usebox{\pandoc@box}%
  \fi%
}
% Set default figure placement to htbp
\def\fps@figure{htbp}
\makeatother

% Use adjustwidth environment to exceed column width (see example table in text)
\usepackage{changepage}

% marvosym package for additional characters
\usepackage{marvosym}

% cite package, to clean up citations in the main text. Do not remove.
% Using natbib instead
% \usepackage{cite}

% Use nameref to cite supporting information files (see Supporting Information section for more info)
\usepackage{nameref,hyperref}

% line numbers
\usepackage[right]{lineno}

% ligatures disabled
\usepackage{microtype}
\DisableLigatures[f]{encoding = *, family = * }

% create "+" rule type for thick vertical lines
\newcolumntype{+}{!{\vrule width 2pt}}

% create \thickcline for thick horizontal lines of variable length
\newlength\savedwidth
\newcommand\thickcline[1]{%
  \noalign{\global\savedwidth\arrayrulewidth\global\arrayrulewidth 2pt}%
  \cline{#1}%
  \noalign{\vskip\arrayrulewidth}%
  \noalign{\global\arrayrulewidth\savedwidth}%
}

% \thickhline command for thick horizontal lines that span the table
\newcommand\thickhline{\noalign{\global\savedwidth\arrayrulewidth\global\arrayrulewidth 2pt}%
\hline
\noalign{\global\arrayrulewidth\savedwidth}}

% Text layout
\raggedright
\setlength{\parindent}{0.5cm}
\textwidth 5.25in
\textheight 8.75in

% Bold the 'Figure #' in the caption and separate it from the title/caption with a period
% Captions will be left justified
\usepackage[aboveskip=1pt,labelfont=bf,labelsep=period,justification=raggedright,singlelinecheck=off]{caption}
\renewcommand{\figurename}{Fig}

% Remove brackets from numbering in List of References
\makeatletter
\renewcommand{\@biblabel}[1]{\quad#1.}
\makeatother

% Header and Footer with logo
\usepackage{lastpage,fancyhdr}
\usepackage{epstopdf}
%\pagestyle{myheadings}
\pagestyle{fancy}
\fancyhf{}
%\setlength{\headheight}{27.023pt}
%\lhead{\includegraphics[width=2.0in]{PLOS-submission.eps}}
\rfoot{\thepage/\pageref{LastPage}}
\renewcommand{\headrulewidth}{0pt}
\renewcommand{\footrule}{\hrule height 2pt \vspace{2mm}}
\fancyheadoffset[L]{2.25in}
\fancyfootoffset[L]{2.25in}
\lfoot{\today}
\usepackage{booktabs}
\usepackage{caption}
\usepackage{longtable}
\usepackage{colortbl}
\usepackage{array}
\usepackage{anyfontsize}
\usepackage{multirow}
\usepackage{setspace}
\doublespacing
\makeatletter
\@ifpackageloaded{caption}{}{\usepackage{caption}}
\AtBeginDocument{%
\ifdefined\contentsname
  \renewcommand*\contentsname{Table of contents}
\else
  \newcommand\contentsname{Table of contents}
\fi
\ifdefined\listfigurename
  \renewcommand*\listfigurename{List of Figures}
\else
  \newcommand\listfigurename{List of Figures}
\fi
\ifdefined\listtablename
  \renewcommand*\listtablename{List of Tables}
\else
  \newcommand\listtablename{List of Tables}
\fi
\ifdefined\figurename
%DIF 173c173
%DIF <   \renewcommand*\figurename{Figure}
%DIF -------
  \renewcommand*\figurename{Fig} %DIF >
%DIF -------
\else
%DIF 175c175
%DIF <   \newcommand\figurename{Figure}
%DIF -------
  \newcommand\figurename{Fig} %DIF >
%DIF -------
\fi
\ifdefined\tablename
  \renewcommand*\tablename{Table}
\else
  \newcommand\tablename{Table}
\fi
}
\@ifpackageloaded{float}{}{\usepackage{float}}
\floatstyle{ruled}
\@ifundefined{c@chapter}{\newfloat{codelisting}{h}{lop}}{\newfloat{codelisting}{h}{lop}[chapter]}
\floatname{codelisting}{Listing}
\newcommand*\listoflistings{\listof{codelisting}{List of Listings}}
\makeatother
\makeatletter
\makeatother
\makeatletter
\@ifpackageloaded{caption}{}{\usepackage{caption}}
\@ifpackageloaded{subcaption}{}{\usepackage{subcaption}}
\makeatother

\usepackage[numbers,square,comma]{natbib}
\bibliographystyle{plos2025}
\usepackage{bookmark}

\IfFileExists{xurl.sty}{\usepackage{xurl}}{} % add URL line breaks if available
\urlstyle{same} % disable monospaced font for URLs
\hypersetup{
  pdftitle={Periodicity in Steller's eider (Polysticta stelleri) population size and density on the Arctic Coastal Plain, Alaska, revealed using generalized additive models},
  pdfauthor={Erik E. Osnas},
  hidelinks,
  pdfcreator={LaTeX via pandoc}}
%DIF PREAMBLE EXTENSION ADDED BY LATEXDIFF
%DIF UNDERLINE PREAMBLE %DIF PREAMBLE
\RequirePackage[normalem]{ulem} %DIF PREAMBLE
\RequirePackage{color}\definecolor{RED}{rgb}{1,0,0}\definecolor{BLUE}{rgb}{0,0,1} %DIF PREAMBLE
\providecommand{\DIFaddtex}[1]{{\protect\color{blue}\uwave{#1}}} %DIF PREAMBLE
\providecommand{\DIFdeltex}[1]{{\protect\color{red}\sout{#1}}} %DIF PREAMBLE
%DIF SAFE PREAMBLE %DIF PREAMBLE
\providecommand{\DIFaddbegin}{} %DIF PREAMBLE
\providecommand{\DIFaddend}{} %DIF PREAMBLE
\providecommand{\DIFdelbegin}{} %DIF PREAMBLE
\providecommand{\DIFdelend}{} %DIF PREAMBLE
\providecommand{\DIFmodbegin}{} %DIF PREAMBLE
\providecommand{\DIFmodend}{} %DIF PREAMBLE
%DIF FLOATSAFE PREAMBLE %DIF PREAMBLE
\providecommand{\DIFaddFL}[1]{\DIFadd{#1}} %DIF PREAMBLE
\providecommand{\DIFdelFL}[1]{\DIFdel{#1}} %DIF PREAMBLE
\providecommand{\DIFaddbeginFL}{} %DIF PREAMBLE
\providecommand{\DIFaddendFL}{} %DIF PREAMBLE
\providecommand{\DIFdelbeginFL}{} %DIF PREAMBLE
\providecommand{\DIFdelendFL}{} %DIF PREAMBLE
%DIF HYPERREF PREAMBLE %DIF PREAMBLE
\providecommand{\DIFadd}[1]{\texorpdfstring{\DIFaddtex{#1}}{#1}} %DIF PREAMBLE
\providecommand{\DIFdel}[1]{\texorpdfstring{\DIFdeltex{#1}}{}} %DIF PREAMBLE
\providecommand{\DIFscaledelfig}{0.5}
%DIF HIGHLIGHTGRAPHICS PREAMBLE %DIF PREAMBLE
\RequirePackage{settobox} %DIF PREAMBLE
\RequirePackage{letltxmacro} %DIF PREAMBLE
\newsavebox{\DIFdelgraphicsbox} %DIF PREAMBLE
\newlength{\DIFdelgraphicswidth} %DIF PREAMBLE
\newlength{\DIFdelgraphicsheight} %DIF PREAMBLE
% store original definition of \includegraphics %DIF PREAMBLE
\LetLtxMacro{\DIFOincludegraphics}{\includegraphics} %DIF PREAMBLE
\providecommand{\DIFaddincludegraphics}[2][]{{\color{blue}\fbox{\DIFOincludegraphics[#1]{#2}}}} %DIF PREAMBLE
\providecommand{\DIFdelincludegraphics}[2][]{% %DIF PREAMBLE
\sbox{\DIFdelgraphicsbox}{\DIFOincludegraphics[#1]{#2}}% %DIF PREAMBLE
\settoboxwidth{\DIFdelgraphicswidth}{\DIFdelgraphicsbox} %DIF PREAMBLE
\settoboxtotalheight{\DIFdelgraphicsheight}{\DIFdelgraphicsbox} %DIF PREAMBLE
\scalebox{\DIFscaledelfig}{% %DIF PREAMBLE
\parbox[b]{\DIFdelgraphicswidth}{\usebox{\DIFdelgraphicsbox}\\[-\baselineskip] \rule{\DIFdelgraphicswidth}{0em}}\llap{\resizebox{\DIFdelgraphicswidth}{\DIFdelgraphicsheight}{% %DIF PREAMBLE
\setlength{\unitlength}{\DIFdelgraphicswidth}% %DIF PREAMBLE
\begin{picture}(1,1)% %DIF PREAMBLE
\thicklines\linethickness{2pt} %DIF PREAMBLE
{\color[rgb]{1,0,0}\put(0,0){\framebox(1,1){}}}% %DIF PREAMBLE
{\color[rgb]{1,0,0}\put(0,0){\line( 1,1){1}}}% %DIF PREAMBLE
{\color[rgb]{1,0,0}\put(0,1){\line(1,-1){1}}}% %DIF PREAMBLE
\end{picture}% %DIF PREAMBLE
}\hspace*{3pt}}} %DIF PREAMBLE
} %DIF PREAMBLE
\LetLtxMacro{\DIFOaddbegin}{\DIFaddbegin} %DIF PREAMBLE
\LetLtxMacro{\DIFOaddend}{\DIFaddend} %DIF PREAMBLE
\LetLtxMacro{\DIFOdelbegin}{\DIFdelbegin} %DIF PREAMBLE
\LetLtxMacro{\DIFOdelend}{\DIFdelend} %DIF PREAMBLE
\DeclareRobustCommand{\DIFaddbegin}{\DIFOaddbegin \let\includegraphics\DIFaddincludegraphics} %DIF PREAMBLE
\DeclareRobustCommand{\DIFaddend}{\DIFOaddend \let\includegraphics\DIFOincludegraphics} %DIF PREAMBLE
\DeclareRobustCommand{\DIFdelbegin}{\DIFOdelbegin \let\includegraphics\DIFdelincludegraphics} %DIF PREAMBLE
\DeclareRobustCommand{\DIFdelend}{\DIFOaddend \let\includegraphics\DIFOincludegraphics} %DIF PREAMBLE
\LetLtxMacro{\DIFOaddbeginFL}{\DIFaddbeginFL} %DIF PREAMBLE
\LetLtxMacro{\DIFOaddendFL}{\DIFaddendFL} %DIF PREAMBLE
\LetLtxMacro{\DIFOdelbeginFL}{\DIFdelbeginFL} %DIF PREAMBLE
\LetLtxMacro{\DIFOdelendFL}{\DIFdelendFL} %DIF PREAMBLE
\DeclareRobustCommand{\DIFaddbeginFL}{\DIFOaddbeginFL \let\includegraphics\DIFaddincludegraphics} %DIF PREAMBLE
\DeclareRobustCommand{\DIFaddendFL}{\DIFOaddendFL \let\includegraphics\DIFOincludegraphics} %DIF PREAMBLE
\DeclareRobustCommand{\DIFdelbeginFL}{\DIFOdelbeginFL \let\includegraphics\DIFdelincludegraphics} %DIF PREAMBLE
\DeclareRobustCommand{\DIFdelendFL}{\DIFOaddendFL \let\includegraphics\DIFOincludegraphics} %DIF PREAMBLE
%DIF AMSMATHULEM PREAMBLE %DIF PREAMBLE
\makeatletter %DIF PREAMBLE
\let\sout@orig\sout %DIF PREAMBLE
\renewcommand{\sout}[1]{\ifmmode\text{\sout@orig{\ensuremath{#1}}}\else\sout@orig{#1}\fi} %DIF PREAMBLE
\makeatother %DIF PREAMBLE
%DIF END PREAMBLE EXTENSION ADDED BY LATEXDIFF

\begin{document}
\vspace*{0.2in}

% Title must be 250 characters or less.
\begin{flushleft}
{\Large
\textbf\newline{Periodicity in Steller's eider (\emph{Polysticta
stelleri}) population size and density on the Arctic Coastal Plain,
Alaska, revealed using generalized additive
models} % Please use "sentence case" for title and headings (capitalize only the first word in a title (or heading), the first word in a subtitle (or subheading), and any proper nouns).
}
\newline
\\
% Insert author names, affiliations and corresponding author email (do not include titles, positions, or degrees).
Erik E. Osnas\textsuperscript{1*}
\\
\bigskip
\DIFdelbegin \textbf{\DIFdel{1}} %DIFAUXCMD
\DIFdelend \DIFaddbegin \DIFadd{\textsuperscript{1} }\DIFaddend Division of Migratory Bird Management, \DIFdelbegin \DIFdel{US }\DIFdelend \DIFaddbegin \DIFadd{United States }\DIFaddend Fish and Wildlife Service, Anchorage, \DIFdelbegin \DIFdel{AK, USA,
}\DIFdelend \DIFaddbegin \DIFadd{Alaska, United States of America
}\DIFaddend \bigskip

* \DIFaddbegin \DIFadd{Corresponding author }\newline
\DIFadd{E-mail: }\DIFaddend erik\_osnas@fws.gov \DIFaddbegin \DIFadd{(EO)
}\DIFaddend

\end{flushleft}

\section*{Abstract}
Annual population and spatial density estimates are needed for the
threatened Alaska-breeding population of Steller's eiders
(\emph{Polysticta stelleri}) to assess recovery status and guide
recovery actions but these quantities are poorly estimated in this rare
species using traditional methods. Therefore, population size and
spatial variation in density were estimated across the Arctic Coastal
Plain (ACP) and Utqiagvik Triangle (Triangle) survey areas using
spatio-temporal generalized additive models and compared to traditional
design-based estimates. Compared to design-based estimates, model-based
estimates were more precise and less variable between years. Moreover,
data sets can be combined to produce common estimates, detection
probability can be incorporated to estimate population size, and spatial
density maps can be produced from model-based estimates. Across both
data sets and when combined, Steller's eider populations fluctuated with
an approximate 6.53-year period (95\% CI: \DIFdelbegin \DIFdel{5.49, 7.72}\DIFdelend \DIFaddbegin \DIFadd{5.46, 7.93}\DIFaddend ) with populations
cycling from modelled posterior lows of 25 to 500 individuals and highs
from 230 to \DIFdelbegin \DIFdel{\textgreater2000 }\DIFdelend \DIFaddbegin \DIFadd{\textgreater 2000 }\DIFaddend individuals across the ACP. Over the long
term, the posterior 25-year geometric mean growth rate was -0.02 (\DIFaddbegin \DIFadd{95\% }\DIFaddend CI:
-0.07, 0.02), and shorter term growth rates were less well-estimated and
fluctuated between positive and near zero. Density maps showed a high
concentration in the northern part of the Triangle area and lower
densities southward and across the ACP. Models fit to just the Triangle
area indicated that eider density has been shifting northward though
time, but this pattern was not supported in the sparse ACP data set, nor
was it well-estimated when the ACP and Triangle data sets were combined.
Given the strong cycle in this population, estimates of population size
at similar cycle phases should be used for trend estimates.

\linenumbers

\section{Introduction}\label{introduction}

The Pacific population of Steller's eider (\emph{Polysticta stelleri})
is a seaduck that nests in northeastern Russia and Alaska, with the
Alaska breeding population currently listed as Threatened under the
Endangered Species Act. As such, frequent status assessments are needed
to determine correct listing status and to guide recovery actions.
Unfortunately, the rarity and low density of this eider in Alaska make
inferences of population size, trend, and distribution especially
difficult. Moreover, observations of Steller's eider on surveys are
extremely variable among years, with some years having no observed
eiders \DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{obritschkewitsch2008steller} }\hskip0pt%DIFAUXCMD
\mbox{%DIFAUXCMD
\citep{wilson2025population}}\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{obritschkewitsch2008steller, wilson2025population}}\hskip0pt%DIFAUXCMD
}\DIFaddend .
It has been hypothesized that these eiders forgo breeding in some years
when \DIFdelbegin \DIFdel{when }\DIFdelend brown lemming (\emph{Lemmus trimucronatus}) abundance and
their avian predators are low \citep{quakenbush2004breeding}. Such
cycles or intermittent breeding would further complicate methods to
estimate long term trends or model population viability
\citep{dunham2017evaluating}. The effort described here is an attempt to
make the most of the available data using modern model-based methods to
distinguish sampling variation from the underlying signal of population
differences between years and locations.

The approach here is inspired by \DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{miller2013} }\hskip0pt%DIFAUXCMD
and
}\DIFdelend \DIFaddbegin \DIFadd{Miller et al \mbox{%DIFAUXCMD
\citep{miller2013} }\hskip0pt%DIFAUXCMD
and
Amundson et al. }\DIFaddend \citep{amundson2019}, where generalized additive models
\DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{hastie1986generalized} }\hskip0pt%DIFAUXCMD
\mbox{%DIFAUXCMD
\citep{wood2017} }\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{hastie1986generalized, wood2017} }\hskip0pt%DIFAUXCMD
}\DIFaddend are used to estimate
temporal and spatial variation in eider density. This approach to
estimating population trend also borrows from the work of
\DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{sauer2002hierarchical}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{rosenberg2019decline}}\hskip0pt%DIFAUXCMD
, and
\mbox{%DIFAUXCMD
\citep{smith2021north} }\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{sauer2002hierarchical, rosenberg2019decline, smith2021north} }\hskip0pt%DIFAUXCMD
}\DIFaddend among others, although the focus here is only one species. In general, the advantage of model-based estimates are that they help to separate noise (i.e., sampling variation) from the true underlying signal (i.e., temporal or spatial patterns in density \DIFdelbegin \DIFdel{,
\mbox{%DIFAUXCMD
\citep{BDA3}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{hooten2015guide}}\hskip0pt%DIFAUXCMD
, }\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{BDA3, hooten2015guide}}\hskip0pt%DIFAUXCMD
, }\DIFaddend many others) and is closely related to the concept of shrinkage of random effects
\DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{efron1977stein}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{BDA3}}\hskip0pt%DIFAUXCMD
, }\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{efron1977stein, BDA3}}\hskip0pt%DIFAUXCMD
, }\DIFaddend where information is shared across
samples in time, space, or other groups. This contrasts with pure
design-based estimates, which make minimal assumptions, but suffer from
high variability in this rare species. Specifically, sampling variation
alone might lead to observations of zero eiders even when eiders did
exist in the survey area. While correcting for the detection process is
possible for design-based estimates, in the case of zero observations,
no correction can be made, and these years will tend to under represent
the true animal density. Sampling variation also inflates the
year-to-year variance in estimates and will tend to make population
trend estimates less precise and potentially more extreme, especially
when multiple species are compared or statistical significance tests are
used to detect trends \citep{sauer2002hierarchical}. In contrast,
model-based estimates require the specification of a probability model
for observations and help distinguish sampling from non-sampling
variation. In the spatial and temporal context, where correlation is
generally high and positive between nearby measurements, models that
exploit this feature are especially helpful, and nearly all modern
methods to detect trends in time and space use such models (see
citations above, and \DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{kery2015applied}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{kery2020applied}}\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{kery2015applied, kery2020applied}}\hskip0pt%DIFAUXCMD
}\DIFaddend ).

Below, I apply spatio-temporal models to provide the best available
estimates of Steller's eider density and annual population size on the
Arctic Coastal Plain (hereafter, ACP) and a smaller but highly sampled
triangle-shaped area (Triangle survey) near Utqiagvik, Alaska. I first
describe the data (\S Survey areas and data source). I then describe the
calculations of design-based estimates (\S Design-based estimates). This
is the first report of design-based estimates for the Triangle data that
include an estimate of uncertainty. These provide a reference point
against model-based estimates. I then describe the data formatting and a
variety of spatio-temporal generalized additive models fit to the data
(\S Model-based estimates). Posterior simulations from the fitted model
estimates are then used to calculate total population size and trend
(\S Prediction and posterior simulation). I also describe the detection
estimate used during posterior simulations (\S Incorporating detection).
Finally (\S Wavelet analysis), I conduct a wavelet analysis of the
posterior mean population size across years to estimate and
statistically test for a periodic cycle in the eider population. This is
of practical significance because it has been hypothesized that nesting
effort of Steller's eiders is highest when brown lemming populations are
at or near peak of their boom-bust cycles, and if there is a strong
cycle, estimates of trend will depend on the relative endpoints used in
building the estimate. Thus, if the population is cyclic, consistent
relative positions in the cycle should be used for trend estimates.
Throughout the results I provide some interpretation and provide
comparisons to past work (\S Results and Interpretation). I then provide
some recommendations for model-based estimation of population size and
trends, compare these methods to related efforts, and discuss the
importance of the population cycles and detection estimates for species
status assessment under the US Endangered Species Act (\S Discussion,
\S Conclusion).

\section{Methods}\label{methods}

\subsection{Survey areas and data
source}\label{survey-areas-and-data-source}

Data used in this report came from the ACP Survey conducted by the
United States Fish and Wildlife Service, Division of Migratory Bird
Management, Alaska Region, and a survey conducted by ABR, Inc.-
Environmental Research and Services (ABR) near Utqiagvik, Alaska, under
contract by the United States Fish and Wildlife Service, Ecological
Services Field Office, Fairbanks, Alaska, (hereafter, the Triangle
survey, Fig~\ref{fig-area}). The ACP survey has been described in
\citep{amundson2019} and \citep{wilson2025population}. Unlike in
\citep{amundson2019}, here only data from the actual ACP survey (2007 to
2019 and 2022 to 2024) are used. \DIFaddbegin \DIFadd{Amundson et al. }\DIFaddend \citep{amundson2019} also included data from a different survey (before 2007) with different seasonal timing that causes a difference in observed response (a major subject of the effort in \citep{amundson2019}). Data collected before 2007 have also not undergone the same level of quality control, which was a major effort for this analysis. The ACP data from 2007 to 2024 used in this report, a description of quality control processes, and a description of data manipulations are available at \DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{osnas-github}
}\hskip0pt%DIFAUXCMD
\mbox{%DIFAUXCMD
\citep{osnasACP} }\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{osnas-github, osnasACP} }\hskip0pt%DIFAUXCMD
}\DIFaddend (see \nameref{s1-acpdata}).

The Triangle survey is described in reports from ABR
\DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{obritschkewitsch2008steller} }\hskip0pt%DIFAUXCMD
\mbox{%DIFAUXCMD
\citep{triangleABR}}\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{obritschkewitsch2008steller, triangleABR}}\hskip0pt%DIFAUXCMD
}\DIFaddend . Data for the
Triangle survey were obtained from ABR and are available at
\nameref{s2-tridata}. A lengthy quality control process was applied to
make data available for use in this report (documented in the file
\texttt{wrangle\_ABR.R}, available at \nameref{s3-code}).

Important differences between the surveys include the much higher
sampling coverage of the Triangle survey (25-50\%) compared to the ACP
survey (approximately 1 - 8\%), the much larger area of the ACP survey,
and the sampling effort is stratified in the ACP survey
(Fig~\ref{fig-area}). Hen eiders, birds occurring off of defined
transects, and behavior (flying/not flying) are also recorded on the
Triangle survey, but these are not generally recorded during the ACP
survey. In addition, the ACP survey records all waterbird species, but
the Triangle survey records a smaller subset (king {[}\emph{Somateria
spectabilis}{]} and spectacled {[}\emph{Somateria fischeri}{]} eiders in
addition to Steller's, other species in some years). Otherwise, the two
surveys follow standard aerial waterfowl survey protocols
\citep{cws1987}. No flocked Steller's eiders were observed on either
survey, and females outside of male-female pairs and all off-transect
observations were dropped from the Triangle data for all analyses. There
was one case of an \DIFdelbegin \DIFdel{`}\DIFdelend \DIFaddbegin \DIFadd{"}\DIFaddend open 1\DIFdelbegin \DIFdel{' }\DIFdelend \DIFaddbegin \DIFadd{" }\DIFaddend Steller's eider in the ACP data set (a
general category for a group of unknown sex or pair status that is not
appropriate for an observation of a single), and it was assumed to be a
single male.

\begin{figure}

\caption{\label{fig-area}\DIFdelbeginFL \DIFdelFL{Arctic Coastal Plain (ACP) and Triangle survey
areas. East-West transect lines are shown in black for one year on the
ACP. Strata with different sampling intensity for the ACP are shown in
thicker black lines and different fill colors. The Triangle area is
shown as a stratum, but it is completely contained within the ACP
stratum `High'. Transects in the Triangle area are very close (800m in
most years) so would appear as a solid color at this scale. On the
Arctic Coastal Plain survey transects are rotated north-south over a
four year period to increase spatial coverage (not shown).}\DIFdelendFL \DIFaddbeginFL \textbf{\DIFaddFL{Arctic Coastal Plain (ACP) and Triangle survey areas.}} \newline{East-west transect lines are shown in black for one year on the ACP. Strata with different transect sampling intensities for the ACP are shown by different fill colors. The Triangle area is shown as a stratum, but it is completely contained within the ACP High stratum. Transects for the Triangle survey are very close (800m in most years) so would appear as a solid color at this scale. On the Arctic Coastal Plain survey, transects are rotated north-south over a four year period to increase spatial coverage (not shown). All map data are products of the U.S. Government and are in the Public Domain.}\DIFaddendFL }

\end{figure}%

All general data manipulation and analysis was done with program R
\citep{r-base} in RStudio \citep{RStudio2024} with the tidyverse
packages \citep{tidyverse}. This manuscript was produced using Quarto
(https://quarto.org/) and the PLOS One journal template found at
https://github.com/quarto-journals/plos in an effort to maximize
reproducibility. Code for this analysis, results, and production of this
manuscript is maintained at https://github.com/USFWS/STEI-estimates.

\subsection{Design-based estimates}\label{design-based-estimates}

I calculated a design-based estimate using formula R3 of Fewster et
al. \citep{fewster2009} \DIFdelbegin \DIFdel{, }\DIFdelend (also see \citep{buckland2001}, p.~79)
\DIFdelbegin \DIFdel{,
}\DIFdelend modified for strip transects. A ratio estimator, which is more common
for strip-transect surveys \DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{cochran1977} }\hskip0pt%DIFAUXCMD
\mbox{%DIFAUXCMD
\citep{williams2002}
}\hskip0pt%DIFAUXCMD
\mbox{%DIFAUXCMD
\citep{thompson2012}}\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{cochran1977, williams2002, thompson2012}}\hskip0pt%DIFAUXCMD
}\DIFaddend , was investigated but found to be poor \DIFdelbegin \DIFdel{due to the
distribution of observations and the triangle shape of the survey area,
where most observations }\DIFdelend \DIFaddbegin \DIFadd{(very high variance) because most observations of Steller's eiders }\DIFaddend are on short transects in the \DIFdelbegin \DIFdel{north }\DIFdelend \DIFaddbegin \DIFadd{northern end of the triangular-shaped area }\DIFaddend and longer transects in the south rarely have observed \DIFdelbegin \DIFdel{animals. This nullifies any
advantage of a ratio estimator , which can produce a better estimate when the transect length and number of encounters are positively related
\mbox{%DIFAUXCMD
\citep{cochran1977}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{thompson2012}}\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{eiders. The ratio estimator can provide lower variance estimates when there is a positive correlation between the two variables (here, animal count and transect length or area) \mbox{%DIFAUXCMD
\citep{cochran1977, thompson2012}}\hskip0pt%DIFAUXCMD
. In this survey area, however, there is a negative correlation between count and transect length (or area). This makes the ratio estimator worse than a simple plot-based estimator or the R3 estimator of Fewster \mbox{%DIFAUXCMD
\citep{fewster2009}}\hskip0pt%DIFAUXCMD
}\DIFaddend . The point estimate was calculated as

\begin{equation}\phantomsection\label{eq-1}{\hat N = A \frac{\Sigma_i n_i}{\Sigma_i a_i}}\end{equation}
and the variance of \(\hat N\) was calculated as
\DIFdelbegin %DIFDELCMD <

%DIFDELCMD < %%%
\DIFdelend \begin{equation}\phantomsection\label{eq-2}{var(\hat N) = \left( \frac{A}{a} \right)^2 \frac{a}{k-1} \sum_i a_i\left( \frac{n_i}{a_i} - \frac{n}{a} \right)^2}\end{equation}
where \(A\) is the total area of the study area, \(a_i\) is the area of
strip transect \(i\), \(n_i\) is the number of encountered single males
or pairs on strip transect \(i\), and \(n\) is the total encounters on
the \(k\) surveyed strips, and \(a\) is the total area of the \(k\)
surveyed strips. It is arguable if a finite population correction,
\((1 - a/A)\), is appropriate, so I left it out as it is not used by
Fewster et al. \citep{fewster2009} or Buckland et al.
\citep{buckland2001} because observations on transects are not
repeatable due to movement of birds and the detection process. Fewster
et al. \citep{fewster2009} showed that \DIFdelbegin \DIFdel{the above }\DIFdelend \DIFaddbegin \DIFadd{Eq (2) }\DIFaddend can overestimate the
variance of systematic surveys when there is a strong gradient in
density, as there is in this area. In \DIFdelbegin \DIFdel{any case, }\DIFdelend \DIFaddbegin \DIFadd{this specific case, however, }\DIFaddend the estimator above is much better than a standard ratio estimator\DIFdelbegin \DIFdel{in this specific case}\DIFdelend .

\subsection{Model-based estimates}\label{model-based-estimates}

I used generalized additive models (GAMs, \DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{hastie1986generalized}}\hskip0pt%DIFAUXCMD
,
\mbox{%DIFAUXCMD
\citep{wood2017}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{pedersen2019hierarchical}}\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{hastie1986generalized, wood2017, pedersen2019hierarchical}}\hskip0pt%DIFAUXCMD
}\DIFaddend ) to estimate eider density as a function of location and time. A GAM can be thought of as a generalized linear mixed model that fits smooth functions (splines) of covariates to predict the response, in addition to standard linear mixed model terms if specified. The optimal degree of smoothing is determined during model fitting through a model selection-like process. The smoothed temporal or spatial effect, thus, can account for autocorrelation in these domains \DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{wood2017}}\hskip0pt%DIFAUXCMD
,
\mbox{%DIFAUXCMD
\citep{pedersen2019hierarchical}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{hefley2017basis}}\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{wood2017, pedersen2019hierarchical, hefley2017basis}}\hskip0pt%DIFAUXCMD
}\DIFaddend . GAMs are
widely used in animal density surface modeling (e.g., \DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{miller2013}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{amundson2019}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{hollmen2023climate}}\hskip0pt%DIFAUXCMD
,
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{miller2013, amundson2019, hollmen2023climate} }\hskip0pt%DIFAUXCMD
}\DIFaddend and many others).

To set up the data for model fitting, I divided sampled transects into 1
(Triangle survey) or 6 (ACP survey) km segments and assigned
observations of eiders (including observation of zero eiders) to segment
centroids. Segments on the boundary of the study area were often smaller
due to boundary issues. I then assumed a half-strip width of 200 m and
calculated an area for each segment. Total number of eider observations
(pairs and males) were summed for each segment and the coordinates (in \DIFdelbegin \DIFdel{isomorphic UTMs}\DIFdelend \DIFaddbegin \DIFadd{Alaska Albers Equal Area projection, EPSG:3338}\DIFaddend ) of the centroid were used for spatial location. Year was used as the covariate for temporal effects. The same procedure was used for both the entire ACP and for the Triangle survey, but for the ACP-only model (see below) the segment size for model fitting was 6 km. This was done for computational reasons (time) related to fitting many different models and to be consistent with \citep{amundson2019}. When Triangle and ACP data were combined into one model, a common 1 km segment size was used. All spatial data manipulation was done using the R package \texttt{sf} \citep{sf}.

I fit a variety of models to explore spatial and temporal effects. The
linear predictor for each model was:

\[M0: Count \sim s(X, Y)\] \[M1: Count \sim s(X, Y) + s(Year)\]
\[M2: Count \sim s(X, Y) + s(Year) + ti(X, Y, Year)\]
\[M3: Count \sim s(X, Y) + s(Year) + s_{re}(fYear)\]
\[M4: Count \sim s(X, Y) + s_{re}(fYear)\] In the above, \(Count\) is
the total number of pairs or males observed in a transect segment,
\(s()\) indicates a smooth function, \(ti()\) indicates a ``tensor
product smooth'' (a multidimensional smooth that allows the units \DIFdelbegin \DIFdel{for
}\DIFdelend \DIFaddbegin \DIFadd{of the }\DIFaddend dimensions to differ), and \(s_{re}()\) is a random effect in the usual
mixed model sense (in
\texttt{mgcv:\ s(...,\ bs\ =\ \textquotesingle{}re\textquotesingle{})}).
\(Year\) is calendar year as a continuous numeric variable, and
\(fYear\) is calendar year as a factor variable. Model \(M0\) is just a
smooth of location that does not change through time. Model \(M1\) is a
smooth of location and a separate smooth of year. This model means that
on the log scale the spatial smooth does not change its relative shape
through time but the overall height changes as a smooth function of
year. Model \(M2\) is a smooth of location, year, and a spatio-temporal
interaction between location and year. Model \(M2\) allows the shape of
the spatial pattern to change through time and allows the time trend to
depend on location. Model \(M3\) estimates a smooth of location, a
smooth of year, and a separate random effect of year, which allows
abrupt non-smooth deviations from an underlying smooth trend
\citep{smith2021north}. Model \(M4\) estimates a smooth of location and
treats year as a simple random effect. The model with year as a random
effect still imposes smoothing on the year effect, just as in the usual
mixed model, where year effects are pulled or ``shrunk'' toward an
overall grand mean. In the models above, each effect is written as an
``average'' or ``partial'' effect relative to the others and all contain
an intercept (not shown). Thus, \(s(X,Y) + s(Year)\) is an average
effect of location and an average effect of Year as a deviation from an
overall intercept. All models used a negative binomial response, a log
link function, and the log segment area as an offset, which controlled
for varying areas of segments near study area boundaries. Thus, the
model is estimating the expected response in 1 \(km^2\) of area. The
scale parameter of the negative binomial was estimated during model
fitting. Other response models were fit (Poisson, Tweedie) and all were
found to be substantially worse fitting than the negative binomial. I
used a \DIFdelbegin \DIFdel{a }\DIFdelend `thin plate regression spline' (\texttt{s(...,\ bs\ =\ "tp")}
in \texttt{mgcv}, \citep{r-mgcv}) as the spline basis function for all
smooth effects in all models. All model fitting and prediction was done
using the R package \texttt{mgcv} \citep{r-mgcv}. Model diagnostics were
inspected using the residual simulation methods in R package
\texttt{DHARMa} \citep{DHARMa} and visualizations using the R package
\texttt{gratia} \citep{r-gratia}. Special attention was given to
quantile-quantile plots and over-dispersion and zero-inflation metrics.
Residual simulations suggested that the negative binomial distribution
appropriately model\DIFaddbegin \DIFadd{l}\DIFaddend ed the large number of response zeros in these data.
To select the best model, the \texttt{\DIFdelbegin \DIFdel{mgcv::}\DIFdelend AIC} function was used \DIFaddbegin \DIFadd{with the correct degrees of freedom for a GAM (see }\texttt{\DIFadd{?mgcv::AIC.gam}} \DIFadd{in \mbox{%DIFAUXCMD
\citep{r-mgcv}}\hskip0pt%DIFAUXCMD
)}\DIFaddend .

For modelling the ACP data alone, additional models were fit that
contained a random effect for observer. The response for these models
was observer-specific; therefore, each segment was only 200 m wide
(i.e., each side of the plane was a separate observation 200 m wide). An
additional five models were fit where each model above also contained an
observer effect, \(s_{re}(Observer)\). Observer effects were not
estimated for the Triangle data because they were not recorded in most
years. When I combined the Triangle data with the ACP data, I used a
fixed factor effect for survey (Triangle or ACP) to model any average
difference between surveys and used a model with spatial and temporal
smooths as in \(M1\). A model with a spatio-temporal interaction
(\(M2\)) was also explored for the combined Triangle and ACP data, but
rejected. The two data series do not overlap during the period of
1999-2006, so the interaction term was not well estimated and produced
widely variable population estimates during posterior simulations for
the years 1999 to 2006. During posterior simulation (see below), the
survey covariate was set to predict the Triangle survey because this is
the area where detection was estimated. R code giving the details of
model fitting can be found in the supplemental information
(\nameref{s3-code}).

\subsection{Prediction and posterior
simulation}\label{prediction-and-posterior-simulation}

I used the \texttt{predict.gam} function from \texttt{mgcv} package
\DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{r-mgcv}}\hskip0pt%DIFAUXCMD
, \mbox{%DIFAUXCMD
\citep{wood2017} }\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{r-mgcv, wood2017} }\hskip0pt%DIFAUXCMD
}\DIFaddend to predict the expected density of
eiders across the study area (Triangle or ACP) in each year, from 1999
to 2023 for the Triangle and from 2007 to 2024 for the ACP. Note that
years with no data collection are included in these predictions. To do
this, the study area was gridded into 1 \(km^2\) or smaller
cells--smaller when the cells intersect the boundary of the study
area--and centroids and areas of each cell were calculated. A data set
was then created by replicating these point locations and areas for each
year. This large data set was then used in the \texttt{predict} function
along with the model object from the best fitting GAM model. For spatial
maps to represent relative differences in eider density, predictions
were made on the response scale (\texttt{predict} option
\texttt{type\ =\ "response"}) and the year effect was excluded
(\texttt{exclude\ =\ "s(Year)"} or
\texttt{exclude\ =\ c("s(Year)",\ "ti(X,Y,Year)")}). Predictions at cell
centroids were used for the entire cell, that is, the continuous smooth
density surface was rasterized into 1 \(km^2\) or smaller cells for
display in maps.

Results of fitting a GAM in \texttt{mgcv} provide a posterior
distribution of model parameters \DIFdelbegin \DIFdel{\mbox{%DIFAUXCMD
\citep{wood2017}
}\hskip0pt%DIFAUXCMD
\mbox{%DIFAUXCMD
\citep{miller2025bayesian}}\hskip0pt%DIFAUXCMD
}\DIFdelend \DIFaddbegin \DIFadd{\mbox{%DIFAUXCMD
\citep{wood2017, miller2025bayesian}}\hskip0pt%DIFAUXCMD
}\DIFaddend . Therefore, posterior simulation was used to calculate population totals over the study area for each year (see examples in help files for \texttt{mgcv::predict} in \citep{r-mgcv} or \citep{wood2017}, p.~342-343). Predictions were made once on the same grid and years as described above but \texttt{type\ =\ lpmatrix} was specified so that a design matrix, \(\textbf X\), was returned with one row for each prediction location-year and one column for each term in the model. Multivariate normal samples of the model parameters, \(\textbf b_i\) were then simulated using the fitted model parameter vector and variance-covariance matrix. For the Triangle study area, direct simulation from a multivariate normal distribution was used. For all simulations on the ACP study area, a Metropolis-Hastings algorithm was used to obtain samples because large areas of zero observations caused poor performance based on direct multivariate normal simulation using the parameter estimates and covariance matrix (see
\texttt{?mgcv::gam.mh} in \citep{r-mgcv} or \citep{gratiaPost}). A
posterior sample on the response scale was then calculated as
\begin{equation}\phantomsection\label{eq-3}{\textbf y_i = \textbf a exp(\textbf X \textbf b_i )}\end{equation}
where \(\textbf a\) is a vector of the area of each grid cell and
\(\textbf y_i\) is a vector of the expected responses. Note that
\(\textbf y_i\) is the expectation of the negative binomial distribution
and not an actual realization; thus, it is \(>0\) for all predictions.
The above simulation was repeated a large number of times (500) and
results were stored.

Various derived quantities of the posterior samples can also be
calculated. To find the expected population total in a given year, the
sampled vector can be summed over all cells for a given year. Let \(i\)
index the posterior sample, \(j\) index year, and \(k\) index the cell,
then a posterior sample for the expected population total in year \(j\)
is
\begin{equation}\phantomsection\label{eq-4}{\hat Y_{ij} = \sum_k y_{ijk}.}\end{equation}
Because the model was fit to pairs and single males, the above gives the
total ``indicated pairs''. To transform this to birds and ``indicated
birds'', the above posterior sample would be multiplied by 2. A
detection corrected population total for ``indicated birds'' can be
found as
\begin{equation}\phantomsection\label{eq-5}{\hat N_{ij} = 2 \hat Y _{ij}/d_{ij}}\end{equation}
if detection varies only by year, where \(d_{ij}\) is a posterior sample
of detection in year \(j\). If detection varies with location or other
covariates, then the adjustment needs to take place at a lower level of
\(y_{ijk}\).

The posterior trend on the log scale from year \(j\) to \(j+t\) can be
found as
\begin{equation}\phantomsection\label{eq-6}{T_{it} = log \left[ (\hat N_{ij+t}/\hat N_{ij})^{1/t} \right] = \frac{log(\hat N_{ij+t}) - log(\hat N_{ij})}{t}.}\end{equation}
Note that this measure of trend is identical to the slope parameter in a
``log-linear'' regression when the smooth of year in the GAM model,
\(s(Year)\), gives a straight line. The advantage of the GAM is that the
notion of trend can be generalized to non-linear cases where the trend
may be increasing, decreasing, or changing cyclically through time. The
posterior distribution for any quantity can then be displayed using a
histogram or summarized with various metrics. I summarized the posterior
with the mean and the 0.025, 0.5 (median), and 0.975 quantiles. For
trend, I only used detection corrected posterior estimates (see below).
Full detail of the posterior simulations can be found in the
supplemental information (\nameref{s3-code}).

\subsection{Incorporating detection}\label{incorporating-detection}

I used a preliminary detection rate estimated from the second year
(2018) of an on-going field study using artificial decoys to estimate
detection. The detection analysis was completed by Catherine Bradley
(USFWS, retired) and showed that detection rate in 2018 depended only on
distance from transect (see \nameref{s4-bradley}). Detection was also
estimated during 2017, the first year of the study, but field protocol
issues caused problems during this pilot year, and the protocol was
stabilized in 2018. Because distance was not available for observations
outside the decoy detection study area (a sub-set of the Triangle area),
I calculated the average `unconditional' detection rate over the
transect half-strip width (\DIFdelbegin \DIFdel{Table 3 from }\DIFdelend \nameref{s4-bradley}). In this
context, `unconditional' is the detection rate estimated from
double-observer sightability trials that include decoys not observed by
either observer (a `00' capture history). I also used this same
detection rate for the ACP because no better estimate for Steller's
eider is available. The detection rate used here should be viewed as
provisional until a more complete analysis can be conducted
incorporating data from across multiple years and crews. In any case, it
is meant to be the average detection rate over all observations,
including the covariates of distance, year, observer, sun angle, etc.,
and was in fact used for the Steller's eider Species Status Assessment
of 2025 \citep{steiSSA2025}.

To calculate an average detection rate, I assumed that eiders (detected
and undetected) were expected to be uniformly distributed with distance
from the transect, which is true given the design of the Triangle and
ACP surveys. I then averaged detection and the variance of the detection
estimate over each of the four distance bins in \DIFdelbegin \DIFdel{Table 3 of
}\DIFdelend \nameref{s4-bradley}. Because distance bins were of equal width, detection was estimated as a factor of bin (i.e, a continuous distance function was not estimated), and no other covariates were found important, the mean and variance are a simple equally weighted average over the distance bins. In \DIFdelbegin \DIFdel{Table 3 of }\DIFdelend \nameref{s4-bradley} only the mean and ninety-five percent credible interval was given, so I approximated the standard error of the estimate in each bin by the range divided by 2*1.96, which is the typical number of standard deviations in the range of a symmetric credible interval.

This worked out to a detection rate of 0.307 with a standard deviation
of 0.092 or a Beta(7.41, 16.72). Note that this detection prior will
result in a large amount of uncertainty in the estimated number of
eiders. At detection rates of 0.16 and 0.47 (the fifth and ninety-fifth
percentile of the distribution, respectively), the eider population
estimate will be increased about 6- and 2-fold, respectively. Thus,
increased information on detection would be valuable for improving our
knowledge of the eider population size. Interestingly, this detection
rate prior has a very similar mean but is much more variable compared to
that used in the past based on expert judgment
\citep{dunham2017evaluating}.

The posterior population estimate for ``indicated breeding birds''
(single males and pairs), accounting for constant detection, was then
calculated as
\begin{equation}\phantomsection\label{eq-7}{\hat N_{ij} = 2\hat Y _{ij}/d_{i}.}\end{equation}
with \(d_i\) sampled from a Beta distribution with the mean and standard
deviation above. Thus, detection was assumed constant across years and
other covariates (e.g., crews, singles, pairs). If detection varies with
year, location or other covariates, then the adjustment needs to take
place at a lower level as in (Eq~\ref{eq-5}).

In general, quantities \(\hat Y\) are designated as ``indicated pairs''
because single males are assumed to ``indicate'' an observed female on
the nest (the male-female sex ratio is assumed equal). (Technically,
within the tradition of waterfowl biology, ``indicated pairs'' include
flocked drakes in groups of less than 5. However, none of these were
observed in either data set; thus, ``indicated breeding pairs'' and
``indicated pairs'' are the same.) When ``indicated pairs'' are
multiplied by 2, \(2\hat Y\), then the quantity becomes ``indicated
birds'' because each pair is 2 individuals. Hereafter, I use ``indicated
breeding birds'', and I use the word ``index'' to distinguish quantities
that are not corrected for detection. Thus, \(2\hat Y\) is the
``indicated breeding bird index,'' and \(2\hat Y/d\) is simply
``indicated breeding birds,'' to reflect that it is a population
estimate, at least conditional on the assumptions inherent with
``indicated.''

\subsection{Wavelet analysis}\label{wavelet-analysis}

In order to formally estimate the period of a repeating cycle in the
Steller's eider population, I used wavelet analysis to detect and
statistically test for the presence of a cycle. Wavelet analysis is
similar to a Fourier transform of a time series where the time domain is
expressed in the frequency domain. Unlike a basic Fourier transform,
however, a wavelet transform localizes the frequency information in time
so that changes in the frequency of a signal with time can be examined.
The main product of a wavelet analysis is a ``power spectrum'' (also
know as a spectrogram) that is a three dimensional surface showing the
``power'' (z-axis or a measure of the strength of a particular frequency
or period) in a time series as a function of the wave period (y-axis)
and time (x-axis). High ``power'' ridges across time correspond to a
large signal at that frequency (or period) in the time series. If the
period is changing through time, the position of the ridge will change
relative to the period axis as time increases. An accessible
introduction can be found in \citep{cazelles2008wavelet} and in the
documentation to the R package \texttt{WaveletComp} \citep{r-wavelet}. I
used the function \texttt{analyze.wavelet} from the \texttt{WaveletComp}
package \citep{r-wavelet} to calculate the wavelet properties of the
posterior mean population time series estimate from the model that
combined both Triangle and ACP data. I used the null hypothesis of white
noise and 200 bootstrap simulations to test for statistical departure
form white noise (a flat or uniform frequency spectrum) and to calculate
a confidence interval for the period. I then used the functions
\texttt{wt.image} to visualize the power spectrum and \texttt{wt.avg} to
visualize the average power spectrum across years. To find the full
posterior of the dominant wave frequency, I calculated the wavelet
properties of 500 posterior samples of the population time series from
the best fitting GAM model and saved the wave period at the maximum
average power across time for each sample. I then used the mean and 95\%
credible interval to summarize this posterior.

\section{Results and Interpretation}\label{results-and-interpretation}

\subsection{Observations of Steller's
eider}\label{observations-of-stellers-eider}

Observed locations of Steller's eiders across the study area are shown
in Fig~\ref{fig-observations}. Most observations are in the northern
coastal area of the Triangle and Teshekpuk area. No observations of
Steller's eiders have been made in the two southernmost ACP strata.
Observations from the Triangle survey abruptly stop at the southern edge
of the Triangle survey area, suggesting that eiders sometimes exist
south of that area more often than observations from either survey
suggest. Fig~\ref{fig-count} shows the count of Steller's eiders by year
for both the Triangle and ACP surveys.

\begin{figure}

\caption{\label{fig-observations}\DIFdelbeginFL \DIFdelFL{Observed Steller's eider during the
Arctic Coastal Plain (2007-2024) and Triangle (1999-2023) surveys.}\DIFdelendFL \DIFaddbeginFL \textbf{\DIFaddFL{Observed Steller's eider during the Arctic Coastal Plain (2007-2024) and Triangle (1999-2023) surveys.}} \newline{Arctic Coastal Plain (ACP) strata are shown by black lines. Locations of eider observations by survey are given by the purple (ACP) or orange (Triangle) dots. All map data are products of the U.S. Government and are in the Public Domain.}\DIFaddendFL }

\end{figure}%

\begin{figure}

\caption{\label{fig-count}\DIFdelbeginFL \DIFdelFL{Number of Steller's eider observations by year
for the Arctic Coastal Plain and Triangle surveys.}\DIFdelendFL \DIFaddbeginFL \textbf{\DIFaddFL{Number of Steller's eider observations by year for the Arctic Coastal Plain and Triangle surveys.}}\DIFaddendFL }

\end{figure}%

\subsection{Design-based estimates}\label{design-based-estimates-1}

Design-based estimates for the both survey areas are shown in
Fig~\ref{fig-design}. No survey was conducted in 2020 for the Triangle
survey or in 2020 and 2021 for the ACP. Note the higher mean and
variance of estimates for the ACP compared to the Triangle survey and
that estimates for the ACP often overlap zero. This is due to the larger
area and smaller sampling fraction of the ACP design. Design-based
estimates make minimal assumptions and provide an important check on
model-based estimates. Two important assumptions behind design-based
estimates are that (1) the survey design is unbiased (random or
systematic selection of sampling units, here transects) and (2) the
survey was implemented as designed. These assumptions are met in these
surveys. An additional often unstated assumption is that the response is
measured without error. In this case, measurement errors include a large
detection bias and, presumably less often, species mis\DIFdelbegin \DIFdel{s-}\DIFdelend identification .
Detection bias causes a lower mean response and increased variance in
response. Finally, design-based estimates are based on estimating a mean
response across all sampled transects, and then use statistical sampling
theory to derive estimator variance. This works well for common species
and large sample size (many transects), but for rare species that might
not be encountered on any transects during a sample, the estimate and
its variance are necessarily zero when there are no detection events,
even when the species might have existed in the survey area. This might
have been the case in 2009 on the Triangle area (Fig~\ref{fig-design}A) and in 2010 for all strata of the ACP (Fig~\ref{fig-design}B), and
was the case in 2, 10, 16 and 16 years out of 16 for the High,
Teshekpuk, \DIFdelbegin \DIFdel{and }\DIFdelend Medium, and Low strata of the ACP, respectively.

\begin{figure}

\caption{\label{fig-design}\DIFdelbeginFL \DIFdelFL{Design-based estimates in the Triangle survey
area (A) and Arctic Coastal Plain survey area (B). Confidence intervals
(95\%, orange band) have been truncated at zero. No detection correction
was applied.}\DIFdelendFL \DIFaddbeginFL \textbf{\DIFaddFL{Design-based estimates for each survey.}}\newline{(A) Triangle survey area and (B) Arctic Coastal Plain survey area. Point estimates for each year are given by black dots contected by black lines across years. Confidence intervals (95\%, orange band) have been truncated at zero. No detection correction was applied.}\DIFaddendFL }

\end{figure}%

\subsection{Model-based Estimates:
Triangle}\label{model-based-estimates-triangle}

Models fit to data from the Triangle showed that the best model contains
a spatial smooth, a year smooth, and a spatio-temporal smooth (model M2,
Table~\ref{tbl-modelsTri}). The model with a separate space and time
smooth (M1) and all other models were worse (\(\Delta AIC >5\)). For all
results below, I used model M2.

\begin{table}

\caption{\label{tbl-modelsTri}\DIFdelbeginFL \DIFdelFL{AIC table for models fit to Triangle data.
Model structures are described in the main text.}\DIFdelendFL \DIFaddbeginFL \textbf{\DIFaddFL{AIC table for models fit to Triangle data.}}\DIFaddendFL }

\DIFdelbeginFL %DIFDELCMD < \centering{
%DIFDELCMD <

%DIFDELCMD < \fontsize{12.0pt}{14.4pt}\selectfont
%DIFDELCMD < \begin{tabular*}{\linewidth}{@{\extracolsep{\fill}}llrrr}
%DIFDELCMD < \toprule
%DIFDELCMD < Model & Linear Predictor & df & AIC & DeltaAIC \\
%DIFDELCMD < \midrule\addlinespace[2.5pt]
%DIFDELCMD < M2 & s(X,Y) + s(Year) + ti(X,Y,Year) & 35.48 & 2876.13 & 0.00 \\
%DIFDELCMD < M1 & s(X,Y) + s(Year) & 33.63 & 2881.94 & 5.81 \\
%DIFDELCMD < M3 & s(X,Y) + s(Year) + s(fYear) & 39.89 & 2884.29 & 8.15 \\
%DIFDELCMD < M4 & s(X,Y) + s(fYear) & 38.18 & 2888.06 & 11.92 \\
%DIFDELCMD < M0 & s(X,Y) & 19.78 & 2979.11 & 102.98 \\
%DIFDELCMD < \bottomrule
%DIFDELCMD < \end{tabular*}
%DIFDELCMD <

%DIFDELCMD < }
%DIFDELCMD <

%DIFDELCMD < %%%
\DIFdelendFL \DIFaddbeginFL \centering{