-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathindex.qmd
1532 lines (1221 loc) · 114 KB
/
index.qmd
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
---
title: "Determinants of Plant Species Richness along Elevational Gradients: Insights with Climate, Energy and Water-Energy Dynamics"
date: last-modified
date-format: "DD MMM YYYY"
author:
- name: Abhishek Kumar
url: https://akumar.netlify.app/
orcid: 0000-0003-2252-7623
email: abhikumar.pu@gmail.com
affiliation: Panjab University, Chandigarh
- name: Meenu Patil
orcid: 0000-0002-7664-7877
affiliation: Panjab University, Chandigarh
- name: Pardeep Kumar
orcid: 0000-0001-6707-1485
affiliation: Panjab University, Chandigarh
- name: Anand Narain Singh
orcid: 0000-0002-0148-8680
affiliation: Panjab University, Chandigarh
bibliography: refs.bib
csl: apa7.csl
format:
html:
default-image-extension: svg
number-sections: true
toc: true
toc-depth: 2
pdf:
documentclass: scrartcl
papersize: a4
number-sections: true
mainfont: Arial
fontsize: 10pt
linestretch: 1.5
sansfont: Arial
colorlinks: true
link-citations: true
citecolor: blue
default-image-extension: pdf
code-block-bg: true
crossref:
fig-title: "Figure"
fig-prefix: "Figure"
tbl-title: "Table"
tbl-prefix: "Table"
title-delim: ": "
custom:
- kind: float
key: suppfig
latex-env: suppfig
reference-prefix: "Figure S"
caption-location: bottom
space-before-numbering: false
latex-list-of-description: Supplementary Figure
- kind: float
key: supptbl
latex-env: supptbl
reference-prefix: "Table S"
caption-location: top
space-before-numbering: false
latex-list-of-description: Supplementary Table
---
```{r setup, include=FALSE}
knitr::opts_chunk$set(
comment = "#>", echo = FALSE, eval = TRUE, message = FALSE, warning = FALSE
)
## load packages
library(DHARMa) ## GLM model diagnostics
library(flextable)
library(ggpubr)
library(rstatix) ## statistical hypothesis testing
library(sf) ## vector data handling
library(terra) ## raster data handling
library(tidyverse) ## general data manipulation and visualisation
library(tmap) ## visualising spatial data
## colour palette for study sites
mycol <- c("Morni" = "#e69f00", "Chail" = "#009e73",
"Churdhar" = "#cc79a7", "All" = "#0072b2")
myfill <- c("Morni" = "#fff7e6", "Chail" = "#d9fff5",
"Churdhar" = "#f7ebf2", "All" = "#d9f1ff")
## function for relative label positions
mypos <- function(xnpc, xmin, xmax){
xnpc*(xmax - xmin) + xmin
}
## theme for ggplot
theme_set(
theme_bw(base_size = 14) +
theme(panel.grid = element_blank(),
strip.background = element_blank(),
strip.text = element_text(hjust = 0, face = "bold"))
)
# biome_pal <- c(
# "#c1e1dd", "#a5c790", "#97b669", "#75a95e", "#317a22",
# "#a09700", "#dcbb50", "#fcd57a", "#d16e3f"
# )
set_flextable_defaults(font.size = 10)
```
# Abstract {.unnumbered}
**Background** Understanding the patterns and processes of species distributions has long remained a central focus of biogeographical and ecological research. While the evidence for elevational patterns in species richness is widespread, our understanding of underlying causes and mechanisms remained limited. Therefore, this study aimed to entangle the influence of environmental variables on plant species richness along elevational gradients in the Western Himalayas.
**Methods** We compiled elevational distribution for about 1150 vascular plants using the published literature and available database. The species richness was estimated in 100-m elevational bands using the range interpolation method. We used the generalised linear model and structural equation modelling (SEM) framework to identify the direct and indirect effects of climatic factors on species richness.
**Results** Our results indicated that primary environmental correlates of species richness varied with elevational gradients. Climatic variables combined with energy and water availability were more important than the topographic heterogeneity. Further, the direct and interaction effects of climatic variables were more substantial than their indirect effects. The indirect effects of climate are more strongly mediated by water--energy dynamics than the energy alone.
**Conclusions** Overall, our findings emphasise the importance of considering direct effects and interactions among environmental variables while studying the underlying mechanisms governing elevational biodiversity gradients. Species richness appeared to be shaped by climatic tolerances rather than habitat diversity at regional scales. This information can have implications for biodiversity dynamics under environmental change.
**Keywords:** Elevational Gradient, Species Richness, Vascular Plants, Western Himalayas
# Background
The variation in species richness along geographical gradients is a well-established phenomenon [@Dani2023; @Guo2013; @Lomolino2001; @McCain2010; @Rosenzweig1995]. Latitudinal and elevational gradients are two widely studied geographical gradients for understanding the patterns and processes of species distribution [@Cox2020; @Rosenzweig1995]. While latitudinal gradients have received historical attention [@Cox2020; @Rosenzweig1995; @Willig2003], elevational gradients gained importance only during past the few decades [@Dani2023; @Lomolino2001; @McCain2010]. Compared to latitudinal gradients, elevational gradients offer a unique advantage by providing diverse climatic and vegetational zones over shorter distances. Such condensed vegetation zones can facilitate the study of species distributions regulated by ecological processes, including dispersal, adaptation, and species interactions.
Available studies suggest that species richness does not vary randomly but exhibits predictable patterns along elevational gradients. However, these studies showed that species richness could follow a unimodal, decreasing, increasing or other complex patterns [@Costa2023; @Guo2013; @Rahbek1995; @Rahbek2005]. These variations in elevational patterns indicate that multiple factors can synergistically shape the patterns of species richness [@Rahbek2019a; @Rahbek2019b]. Understanding these factors is crucial for predicting how biodiversity will respond to future climate change and anthropogenic disturbances. Such knowledge is essential for not only identifying high biodiversity areas but also for their management under global environmental change.
Species distribution primarily determined by dispersal, habitat suitability and biotic interactions [@Guisan2017]. The distribution of a species is related to its ecological niche, which in turn depends on tolerance to several environmental variables, including abiotic and biotic factors [@Hutchinson1957]. While biotic factors are important at local scales, the climatic variables are principal determinants of species distribution at broader scales [@McGill2010]. Numerous hypotheses have been proposed to explain the broad-scale patterns of species richness [@Gaston2000; @Willig2003], some of these also apply to elevational gradients [@McCain2010].
A group of hypotheses propose climatic factors as direct determinants of species richness at broader scales [@Currie2004; @Francis2003; @Price2010]. Firstly, the *metabolic theory of ecology* links temperature to metabolic rates through chemical kinetics [@Price2010] and predicts a positive relationship between species richness and temperature [@Wang2009]. Similarly, precipitation has been suggested to be positively linked with species richness [@Ahmadi2023; @Hawkins2003]. However, available evidence indicates that neither temperature nor precipitation solely determines the species richness [@Currie2004; @Hawkins2007]. The *climatic tolerance hypothesis* states that each species can tolerate only a limited range of climatic conditions beyond which its survival becomes difficult [@Currie2004]. Thus, temperature and precipitation can jointly influence species richness by regulating the physiological tolerance of each species.
The second group of hypotheses suggest that climate indirectly governs species richness patterns by regulating energy and water availability [@OBrien1993; @Wright1983]. The *species--energy hypothesis* predicts a positive relationship between species richness and energy availability [@Bhatta2021; @Hawkins2003; @Vetaas2019; @Wright1983]. One mechanism is proposed by the *more individual hypothesis* [@Srivastava1998], which states that higher energy availability can increase species richness by supporting more individuals and reducing the extinction risk. However, available literature indicates mixed support for this hypothesis [@Evans2005; @Storch2018]. Further, the *water--energy dynamics hypothesis* proposes that biological activity depends on the availability of liquid water, which is regulated by thermal energy. Thus, water--energy dynamics jointly determine the species richness by controlling the availability of liquid water, especially in the case of plants [@OBrien2006]. This water--energy dynamics (WED) model has been supported by recent studies on the elevational pattern of plant species [@Bhatta2021; @Thakur2022; @Tolmos2022; @Vetaas2019]. While the direct influence of climatic factors is increasingly recognised, indirect effects of climate are variable and multiple mechanisms have been proposed to explain climatic control of plant species richness [@Currie2004; @Evans2005; @Hawkins2003].
Another group of hypotheses link non-climatic factors to species richness patterns at broader scales. The *heterogeneity--richness hypothesis* posits that environmental heterogeneity determines species richness by influencing resource and habitat diversity [@Stein2014]. The underlying idea is that diverse habitats or resource-rich environments provide more niches or opportunities for species to occupy. This increased niche availability can support more species with different ecological requirements, increasing species richness. Thus, species richness appeared to be regulated by a complex interaction of multiple factors. Further, the variations in determinants of species richness indicate that our understanding of the causes and mechanisms of species richness patterns remained limited.
```{r}
## html graphviz
# DiagrammeR::grViz("gv/hypothetical_sem.gv")
```
![A priori conceptual model representing the possible pathways that may determine the species richness along elevational gradients. Species richness may be regulated by (a) metabolic theory of ecology; (a, b, c) climatic tolerance hypothesis; (d) species-energy hypothesis; (e) heterogeneity richness hypothesis; and (f) water--energy dynamics hypothesis](figs/fig1_hypothetical-sem){#fig-hypo-sem width=70%}
A complex interplay of environmental factors with multiple mechanisms regulates species richness. In this study, we aim to untangle the contributions of different hypotheses shaping the plant species richness patterns along elevational gradients in the Himalayas (@fig-hypo-sem). Specifically, we sought to (1) identify primary environmental variables influencing species richness, (2) establish models of plant species richness along elevational gradients, (3) compare identified with existing models, and (4) explore mechanisms determining plant species richness along elevational gradients. Our investigation will not only elaborate our understanding of richness patterns but also have implications for biodiversity management in mountain ecosystems, under the pressures of environmental change and anthropogenic influence.
# Methods
## Study area
Our study aimed to investigate the significant determinants of plant species richness along elevational gradients. For this research, we selected three protected to semi-protected sites, each representing different elevational gradients within the Western Himalayas (@fig-sites). Specifically, our study sites included the Morni Hills (76.877--77.177°E and 30.574--30.753°N), Chail Wildlife Sanctuary (77.126--77.279°E and 30.889--31.012°N), and Churdhar Wildlife Sanctuary (77.389--77.497°E and 30.810--30.910°N), which corresponded to lower (300--1500 m), intermediate (900--2100 m), and upper (1600--3600 m) elevational gradients, respectively. These study sites provided us with a diverse and extensive elevational gradient, ranging from the lower foothills at 300 meters to the Churdhar Peak exceeding 3600 meters. The wide range of ecological zones and variations in topography across these sites established an ideal setting to investigate the driving factors behind plant species richness along elevational gradients in the Western Himalayas. In addition to the broad elevational gradient, our study area also exhibited notable differences in climate conditions due to their diverse elevation and topographical characteristics. Generally, the climate could be categorised into three seasons: summer, monsoon, and winter. These regions experienced a spectrum of climates, ranging from hot semi-arid (BSh) in the foothills to monsoonal warm-summer humid continental (Dwb) climate near the Churdhar Peak. The Morni Hills presented a transition from hot semi-arid (BSh) to monsoonal dry-winter humid subtropical climates (Cwa). The Chail Wildlife Sanctuary exhibited a shift from a monsoonal humid subtropical (Cwa) to a monsoonal dry-winter subtropical highland (Cwb) climate. Finally, the Churdhar Wildlife Sanctuary showcased a transition from a monsoonal dry-winter subtropical highland (Cwb) to a monsoonal warm-summer humid continental (Dwb) climate near the Churdhar Peak [@Beck2018].
```{r eval=FALSE}
## prepare and save the site map
# source("R/01_make-site-map.R")
```
![Geographic location of Morni Hills, Chail WLS and Churdhar WLS in Western Himalayas. The inset map shows the location of the study area in the Indian Western Himalayas.](figs/fig2_site-map.png){#fig-sites}
The Morni Hills host a variety of plant communities, including tropical mixed dry deciduous forests at lower elevations and Siwalik Chir Pine forests at higher elevations. The Chail Wildlife Sanctuary consists of subtropical Pine forests at lower elevations, transitioning to Oak forests and moist Deodar forests at higher elevations, with occasional Blue Pines interspersed. Meanwhile, the Churdhar Wildlife Sanctuary encompasses mixed coniferous forests at lower elevations, followed by Kharsu Oak forests and alpine pastures at higher elevations [@Champion1968]. Thus, our sites boast a rich diversity of plant communities, ranging from temperate forests of oak and rhododendron to alpine meadows adorned with vibrant wild-flowers. Within these diverse forests, numerous vascular plant species are found, with some species listed as Endangered (e.g., *Aconitum heterophyllum*, *Angelica glauca*, *Cypripedium himalaicum*, *Dactylorhiza hatagirea*, *Picrorhiza kurroa*, *Taxus wallichiana* and *Trillium govanianum*), Vulnerable (e.g., *Cypripedium cordigerum*, *Malaxis muscifera* and *Paris polyphylla*), and Near Threatened (e.g., *Abies spectabilis*) according to recent assessments of threatened species [@IUCN2023]. Additionally, these study areas provide vital habitats for numerous endemic wild animals, such as the Himalayan musk deer and Himalayan brown bears. Both the Chail Wildlife Sanctuary and Churdhar Wildlife Sanctuary are designated as Important Bird and Biodiversity Areas by BirdLife International [@Rahmani2016]. These areas are also home to some threatened bird species, including the Cheer Pheasant (*Catreus wallichii*), Himalayan Monal (*Lophophorus impejanus*), Indian Vulture (*Gyps indicus*), Koklass Pheasant (*Pucrasia macrolopha*), Red-headed Vulture (*Sarcogyps calvus*), and White-rumped Vulture (*Gyps bengalensis*).
## Data compilation
We compiled a comprehensive species checklist for each site by integrating data collected from field surveys and relevant literature. During 2021–2022, two to four field visits were conducted to each site in different seasons. The plant species encountered during the trek followed were recorded in the field notebook. Unknown plants were photographed because we were not permitted to sample plant due to legal protection of these sites. These plants were identified with the help of the herbarium (PAN) of the Panjab University, Chandigarh, and Janaki Ammal Herbarium (RRLH) of Indian Institute of Integrative Medicine, Jammu (<https://iiim.res.in/herbarium/index.htm>), and online database like eFlora of India (<https://efloraofindia.com/>) and Flowers of India (<http://www.flowersofindia.net/>).
To improve identification accuracy and complement our species list, the relevant studies were identified by searching [Google Scholar](https://scholar.google.co.in/) for its ability to retrieve the most obscure publications. The search was performed using the keywords "Morni," "Chail," and "Churdhar" in September 2021 and subsequently updated in August 2022. Then, we recorded all plant species reported in the identified studies for Morni Hills [@Balkrishna2018a; @Balkrishna2018b; @Dhiman2020; @Dhiman2021; @Singh2014], Chail Wildlife Sanctuary [@Bhardwaj2014; @Bhardwaj2017; @Kumar2013], and Churdhar Wildlife Sanctuary [@Choudhary2007; @Choudhary2012; @Gupta1998; @Radha2019; @Subramani2014; @Thakur2021a]. Each plant species record was manually standardised for its taxonomic name and botanical authority using the *Plants of the World Online* [@POWO2022]. Infra-specific taxa (variety and subspecies levels) were generally treated as species for the analysis to ensure consistency among the taxa. Each recorded plant species was further screened for distribution by matching with @POWO2022, and taxa with distribution outside the study sites were excluded. Finally, we updated all botanical names and their families by matching them with a static copy of the *World Checklist of Vascular Plants (WCVP)* version 10 dated 27 October 2022 [@Govaerts2021] using the `r packageVersion("rWCVP")` version of `rWCVP` package [@R-rWCVP].
```{r eval=FALSE}
## standardise plant names with WCVP
# source("R/02_standardise-plant-names.R")
```
We obtained the elevational distribution of our catalogued species from the *Database of Vascular Plants of Himalaya* [@Rana2017; @Rana2019gbif] published on the Global Biodiversity Information Facility ([GBIF](https://www.gbif.org/)). This dataset assembled the elevational distribution of over 10,500 Himalayan plant species from the published floras [@Rana2017]. It compiled the elevational ranges of over 3,000 plant species reported from Himachal Pradesh from published floras [@Chowdhery1984; @Collett1902]. We downloaded this dataset on 28 July 2023 using the `rgbif` package version `r packageVersion("rgbif")` [@R-rgbif] and standardised the botanical names using the `rWCVP` package [@R-rWCVP]. After standardising plant names, this dataset provided elevational data for more than 1,000 plants in our checklist. Further, elevational data for some species was extracted from a separate study [@Rana2019ecs] and the remaining species with unavailable or uncertain elevational data were excluded. For duplicates, we considered the maximum upper limit and the minimum lower limit of the elevational range. We preferentially taken the elevational distribution from Himachal Pradesh because our sites primarily fall within this Indian state. Finally, we adjusted the elevational limits of species distribution according to the full elevational extent of our study sites [@Colwell1994].
```{r eval=FALSE}
## get elevation range data
# source("R/03_get-elevation-ranges.R")
```
## Species richness
We first resampled the elevation data to a 30 arc-sec (~1 km) resolution using bilinear interpolation to assess species richness at different elevations. The resampling was performed using the `terra` package version `r packageVersion("terra")` [@R-terra]. This process updated the elevational extents for our study sites: lower elevational gradient at Morni Hills (300--1300 m), intermediate elevational gradient at Chail WLS (900--2100 m), higher elevational gradient at Churdhar WLS (1600--3400 m), and the entire elevational gradient for All Sites (300--3400 m). Next, we divided each elevational gradient into 100-m elevational bands for each site. This approach of using 100-m elevational bands has been previously employed in studying elevational patterns of species richness in plants [@Li2022; @Qian2022; @Rana2019ecs]. Each elevational band is represented by its upper elevational limit, both in the text and figures. To estimate species richness for each elevational band, we used the range interpolation approach [@Colwell1994]. This method assumes range continuity so that each species can be found everywhere within its distribution range [@Grytnes2002]. Such range interpolation has been frequently used to study the elevational distribution of species richness [@Hu2017; @Manish2021; @Rana2019ecs]. While this approach may bias species richness estimation [@Hu2017], it is commonly employed to address sampling issues and ensure methodological consistency [@McCain2010; @Rana2019ecs]. In this study, we focused only one-dimensional range interpolation as simple range-filling along elevational gradients. Following the range continuity, each species was assumed to exist in all elevational bands that entirely or partially covered its known range [@Grytnes2002; @Qian2022; @Rana2019ecs]. Species richness was then estimated by counting the total species within each 100-m elevational band. Thus, our calculated species richness represents the $\gamma$-diversity because it represents the total number of species present corresponding to the entire elevational band [@Lomolino2001].
```{r eval=FALSE}
## calculate species richness for each elevational band
# source("R/04_calculate-richness.R")
```
## Explanatory variables
We used four climatic variables mean annual temperature (MAT), temperature seasonality (TSE), mean total annual precipitation (MAP) and precipitation seasonality (PSE) to examine the influence of climate on plant species richness (@fig-hypo-sem). These climatic variables have been suggested as major determinants of plant species richness at broader scales [@Kreft2007; @OBrien1993; @Qian2022; @Wang2009]. We extracted these climatic variables at 30-arc-sec (~1 km) resolution from the CHELSA (<https://chelsa-climate.org/>) database version 2.1 [@Karger2017]. Since this database is developed using statistical downscaling methods [@Karger2017], it is considered more suitable for modelling complex ecosystems like the Himalayas [@Bobrowski2017; @Rana2019ecs]. Further, we used two energy variables, the net primary productivity (NPP) and soil organic carbon (SOC), to test the species--energy hypothesis [@Clarke2006; @Wang2022; @Wright1983]. The net primary productivity (NPP) estimated from the Miami model [@Lieth1973], was obtained from the CHELSA database. The mean value of soil organic carbon (SOC) for topsoil (0--5 cm) was downloaded at 250 m resolution from the SoilGrids database [@Hengl2017].
We used the actual evapotranspiration (AET), potential evapotranspiration (PET) and water deficit (WDF) as the variables representing the water--energy dynamics [@Currie1987; @OBrien1993; @Stephenson1990]. The AET [@Trabucco2019] and PET [@Zomer2022] data were obtained at 30-arc-sec (~1 km) resolution from the CGIAR-CSI database (<https://cgiarcsi.community/>). We calculated the water deficit (WDF) as the difference between the PET and AET [@Francis2003; @Stephenson1990]. Additionally, we used two metrics of environmental heterogeneity to test the heterogeneity--richness hypothesis [@Stein2014]. We obtained the median terrain ruggedness index (TRI) representing topographic heterogeneity [@Amatulli2018] and the EVI (enhanced vegetation index) homogeneity index (EHM) as a measure of vegetation heterogeneity [@Tuanmu2015] at 30-arc-sec (~1 km) from the EarthEnv database
(<https://www.earthenv.org/>). Thus, we used a total of 11 initial candidate explanatory variables consisting of four climatic (MAT, TSE, MAP and PSE), two energy (NPP and SOC), three water availability (AET, PET and WDF) and two environmental heterogeneity (EHM and TRI) variables (@fig-hypo-sem). All the raster data of explanatory variables were resampled to 30-arc-sec (~1 km) resolution using the `resample()` function from the `terra` package [@R-terra]. Then, the mean value of each explanatory variable was calculated for each 100-m elevational band using the `zonal()` function from the `terra` package [@R-terra]. The primary reason for calculating mean was to capture the average environmental conditions within each elevational band, thereby reducing the influence of variability in the explanatory variables. Further, this method allowed us to explore the determinants of species richness at a consistent elevational scale across our study sites.
```{r}
## calculate planar and 3d for each elevational band
# source("R/05_extract-explanatory-variables.R")
```
## Data analysis
```{r}
## prepare data for each site
site_morni <- read.csv("output/site_env.csv") |>
filter(site == "Morni") |>
select(-site) |>
mutate(across(!S, ~scale(.x)))
site_chail <- read.csv("output/site_env.csv") |>
filter(site == "Chail") |>
select(-site) |>
mutate(PET = sqrt(PET)) |>
mutate(across(!S, ~scale(.x)))
site_churdhar <- read.csv("output/site_env.csv") |>
filter(site == "Churdhar") |>
select(-site) |>
mutate(across(!S, ~scale(.x)))
site_all <- read.csv("output/site_env.csv") |>
filter(site == "All") |>
select(-site) |>
mutate(WDF = log(WDF)) |>
mutate(across(!S, ~scale(.x)))
```
Our primary aim was to investigate the potential determinants of plant species richness along the elevational gradients. We defined plant species richness as the number of unique species present within each 100-m elevational band. Given the discrete and non-negative nature of our response variable, we used the generalised linear model (GLM) by specifying the Poisson distribution with the log-link function [@Hilbe2014]. We used nine environmental variables representing climate, energy, heterogeneity and water availability as the potential predictors of plant species richness [@Cheng2023; @Kreft2007]. The potential evapotranspiration (PET) for Chail WLS was square-root transformed, whereas the water deficit (WDF) for full elevational gradient was log-transformed to remove the effect of extreme observations and skewness in data [@Legendre2012]. All explanatory variables were standardised to have mean = 0 and standard deviation = 1 using the z-transformation. The estimated species richness (S) was regressed against each proposed explanatory variable, assuming the Poisson error distribution with the log-link function. This regression was implemented in `R` statistical environment version `r packageVersion("stats")` using the `glm()` function from the `stats` package version `r packageVersion("stats")` [@R-base]. The explanatory variable with the highest deviance-squared (D^2^) was considered the 'primary' explanatory variable [@Field2009; @Hawkins2003]. The deviance-squared (D^2^) for the explanatory variable was estimated using the @eq-glm-r2:
$$
D^2 = \frac{D_{null} - D_{resid}}{D_{null}}; \quad
D^2_{adj} = 1 - \frac{(1-D^2) \times (n-1)}{n-k-1}
$$ {#eq-glm-r2}
where the $D_{null}$ represents the deviance of the null model (model with only an intercept) and the $D_{resid}$ represents the deviance of the model under study (model with explanatory variables). A higher value of deviance-squared indicates a model with better fit. Further, we estimated the adjusted deviance-squared ($D^2_{adj}$) by applying a correction for the small sample size (@eq-glm-r2). Then, we computed Spearman's correlation coefficient ($\rho$) for the identified primary variable and all other remaining explanatory variables. The explanatory variables with an absolute Spearman's correlation coefficient of greater than 0.7 were considered correlated and excluded from further analysis [@Dormann2013]. The final set of uncorrelated explanatory variables was used for developing regression models.
We build an initial full model consisting of species richness (S) as the response variable and all uncorrelated explanatory variables as predictor variables (@suppfig-correlation). The possible candidate models were identified using the `dredge()` function from the `MuMIn` package version `r packageVersion("MuMIn")` [@R-MuMIn]. The candidate models were compared using the Akaike's Information Criterion (AIC) with a correction for the small sample size [@Burnham2002; @Hurvich1989]. The corrected Akaike's Information Criterion (AICc) was calculated using the @eq-aicc:
$$
AIC = -2 \mathcal{L} + 2k; \quad
AICc = AIC + \frac{2k(k+1)}{n-k-1}
$$ {#eq-aicc}
where, $k$ is the number of parameters to be estimated by the model and $n$ is the total number of response observations in the model. We identified a top candidate model with lowest AICc for each site. This top candidate model was then compared with 15 previously proposed models of species richness (@tbl-richness-models). The model with the lowest AICc value was considered the best, and models with a difference of two AICc units were considered equally competitive [@Burnham2002]. We used model averaging if multiple models were identified as competitive. Since we aimed to investigate determinants of species richness, we used the full average instead of the conditional average [@Burnham2002]. The model averaging was implemented using the `model.avg()` function from the `MuMIn` package [@R-MuMIn].
```{r}
#| label: tbl-richness-models
#| tbl-cap: Previously proposed models for explaining the variation in species richness (S). The predictor variables are abbreviated as AET, actual evapotranspiration; MAT, mean annual temperature; TSE, temperature seasonality; MAP, mean total annual precipitation; ELE, elevation; NPP, net primary productivity; PET, potential evapotranspiration; TRI, terrain ruggedness index; and WDF, water deficit.
rbind(
c("@Currie1987", "S ~ AET"),
c("@Wang2009", "S ~ MAT"),
c("@OBrien1993", "S ~ MAP"),
c("@Wright1983", "S ~ NPP"),
c("@Stephenson1990", "S ~ WDF"),
c("@Bhatta2021", "S ~ MAP + PET^2^"),
c("@OBrien2006", "S ~ MAP + (PET − PET^2^)"),
c("@Bhatta2021", "S ~ NPP + NPP^2^"),
c("@OBrien1993", "S ~ PET + PET^2^"),
c("@OBrien1998", "S ~ ELE + MAP + PET"),
c("@OBrien1998", "S ~ ELE + MAP + TSE"),
c("@OBrien1993", "S ~ MAP + PET + PET^2^"),
c("@OBrien2006", "S ~ MAP + (PET − PET^2^) + TRI"),
c("@Francis2003", "S ~ MAT + WDF + MAT×WDF"),
c("@Francis2003", "S ~ WDF + PET + PET^2^")
) |>
as.data.frame() |>
rename("Reference" = V1, "Model" = V2) |>
select(Model, Reference) |>
knitr::kable()
```
The overall goodness-of-fit of the model was assessed using the deviance-based Chi-squared test. A non-significant p-value (*p* > 0.05) indicates no significant difference between the predictions of the model and observed data, i.e., the data is adequately fitted to the model. Then, the model was validated by analysing the dispersion and distributional assumptions of the fitted model. The simulated residuals (n = 1000) from the Poisson distribution were tested against the residuals of the fitted model [@Dunn1996]. The uniformity was tested using the Kolmogorov-Smirnov test, whereas the dispersion was tested using a simulation-based dispersion test. The outliers were tested by generating a simulation-based expectation for the outliers using bootstrapping. The model validation was performed using the `simulateResiduals()` function from the `DHARMa` package version `r packageVersion("DHARMa")` [@R-DHARMa].
Another aim of the present study was to disentangle the potential mechanisms for environmental determinants of plant species richness along the elevational gradients. We used the structural equation modelling (SEM) framework to reveal the complex relationships among variables and test theoretical models for species richness [@Grace2006]. Since the piecewise SEM approach solves each equation separately (local estimation), it allows model fitting for smaller datasets with non-normal error distribution [@Shipley2000]. Therefore, we used the piecewise SEM approach to analyse the direct and indirect effects of climate (MAT, TSE, MAP and PSE), energy (NPP and SOC), environmental heterogeneity (EHM and TRI) and water--energy dynamics (AET, PET, WDF) variables on species richness.
The proposed conceptual model (@fig-hypo-sem) was transformed into hypothetical causal models. Specifically, we used climatic variables in all models and sequentially added selected environmental variables representing energy, heterogeneity and water--energy dynamics (mediator variables). Each hypothetical causal model was translated into structural equations. The species richness was modelled using the generalised linear model by specifying the Poisson family with a log-link function. In contrast, all other variables were modelled using the general linear model. Before fitting the SEM, all variables except species richness were standardised by z-transformation (mean = 0 and standard deviation = 1) using the function `scale()` from the `stats` package [@R-base]. Then, each proposed hypothetical model was fitted using the `psem()` function from the `piecewiseSEM` package version `r packageVersion("piecewiseSEM")` [@R-piecewiseSEM].
The overall goodness-of-fit was assessed using Shipley's test of *directed separation* (d-sep test) based on Fisher's *C* statistic with *p* > 0.05, indicating a good model fit [@Shipley2000]. Shipley's test of directed separation tests the conditional independence of all included variables, i.e., missing relationships between included variables. The Fisher's *C* statistic is calculated by @eq-fisher-c as follows:
$$
C = -2 \sum_{i = 1}^K \ln(p_i)
$$ {#eq-fisher-c}
where $p_i$ is the $i$th independence claim in a basis set consisting of $K$ claims. This Fisher's *C* can be compared to a chi-squared distribution with $2K$ degrees of freedom. Closely related models were compared with Fisher's *C*-based Akaike's information criteria with a small sample size correction [@Shipley2013], which can be represented by @eq-sem-aicc as follows:
$$
AICc = C + \frac{2K \times n}{n - K - 1}
$$ {#eq-sem-aicc}
where $C$ is the Fisher's C statistic, $n$ is the total sample size and $K$ is the likelihood degrees of freedom. The strengths of each direct and indirect relationship were estimated if the model exhibited an adequate fit. If the model did not fit well, the non-significant paths were removed, and additional significant paths were added based on Shipley's d-sep test. The models exhibiting adequate fit were compared using the corrected Akaike's information criteria (AICc), and model with the lowest AICc value was considered the best model (@eq-sem-aicc). Given the relatively small sample size (n < 20) for each individual site, the SEM was performed only for the entire elevation gradient (n = 31). All analyses were implemented in `R` statistical environment version `r packageVersion("stats")` [@R-base], and the package `tidyverse` version `r packageVersion("tidyverse")` was used for general data wrangling and visualisation [@R-tidyverse].
# Results
Our dataset consisted of elevational distribution limits for 1159 plant species from All Sites, including 568 from Morni Hills, 377 from Chail WLS and 561 from Churdhar WLS. The species richness was estimated for ten elevational bands in Morni Hills, 12 in Chail WLS, 18 in Churdhar WLS and 31 in All Sites (@fig-richness). The species richness ranged from 60 to 226 in Morni Hills, 124 to 220 in Chail WLS, 106 to 520 in Churdhar WLS and 79 to 588 across the full elevational gradient (All Sites). The maximum species richness was observed around 800–900 m in Morni Hills, 1300–1400 m in Chail WLS, 1700–1800 m in Churdhar WLS and 1300–1400 m for All Sites (@fig-richness).
```{r fig.width=7, fig.height=5}
#| label: fig-richness
#| fig-cap: Distribution of plant species richness across elevational bands for (a) Morni Hills, (b) Chail WLS, (c) Churdhar WLS, and (d) All Sites combined. The value in parenthesis indicates the upper limit of the elevational band with the highest species richness (richness peak) for each panel.
p1 <- read.csv("output/band_richness.csv") |>
filter(site == "Morni") |>
#filter(richness == max(richness))
ggplot(aes(x = elevation, y = richness)) +
geom_line(color = "#e69f00") +
geom_point(shape = 21, size = 3,
fill = "#fff7e6", color = "#e69f00") +
annotate(geom = "text", x = 900, y = 245, hjust = 0.5,
label = "(900, 226)", color = "#e69f00") +
theme(legend.position = "none", axis.title = element_blank())
p2 <- read.csv("output/band_richness.csv") |>
filter(site == "Chail") |>
#filter(richness == max(richness))
ggplot(aes(x = elevation, y = richness)) +
geom_line(color = "#009e73") +
geom_point(shape = 21, size = 3,
fill = "#d9fff5", color = "#009e73") +
annotate(geom = "text", x = 1400, y = 230, hjust = 0.5,
label = "(1400, 220)", color = "#009e73") +
theme(legend.position = "none", axis.title = element_blank())
p3 <- read.csv("output/band_richness.csv") |>
filter(site == "Churdhar") |>
#filter(richness == max(richness))
ggplot(aes(x = elevation, y = richness)) +
geom_line(color = "#cc79a7") +
geom_point(shape = 21, size = 3,
fill = "#f7ebf2", color = "#cc79a7") +
annotate(geom = "text", x = 1850, y = 520, hjust = 0,
label = "(1800, 520)", color = "#cc79a7") +
theme(legend.position = "none", axis.title = element_blank())
p4 <- read.csv("output/band_richness.csv") |>
filter(site == "All") |>
# filter(richness == max(richness))
ggplot(aes(x = elevation, y = richness)) +
geom_line(color = "#0072b2") +
geom_point(shape = 21, size = 3,
fill = "#d9f1ff", color = "#0072b2") +
annotate(geom = "text", x = 1400, y = 640, hjust = 0.5,
label = "(1400, 588)", color = "#0072b2") +
theme(legend.position = "none", axis.title = element_blank())
## arrange plots
ggpubr::ggarrange(
p1, p2, p3 + xlim(1500, 3400), p4,
labels = c("a)", "b)", "c)", "d)"), align = "hv",
label.x = 0.11, label.y = 0.975
) |>
annotate_figure(
left = text_grob("Species richness", rot = 90, size = 14),
bottom = text_grob("Elevation (m)", size = 14)
)
# ggsave("figs/fig3_richness.pdf", width = 7, height = 5)
# ggsave("figs/fig3_richness.png", width = 7, height = 5)
```
## Primary variables
```{r}
## function to calculate corrected aic (AICc) -----
aicc <- function(model) {
n <- length(model$y)
k <- length(model$coefficients)
aic <- AIC(model)
return(aic + 2*k*(k+1)/(n-k-1))
}
## function to calculate corrected deviance explained -----
d2.adj <- function(model) {
n <- length(model$y)
k <- length(model$coefficients)
d2 <- 1 - (summary(model)$deviance / summary(model)$null.deviance)
d2a <- (1 - ((1 - d2)*(n - 1) / (n - k - 1)))*100
return(d2a)
}
## function to calculate deviance explained -----
d2.glm <- function(model){
g <- summary(model)
round((1 - g$deviance/g$null.deviance)*100, 2)
}
## function to estimate Chi p-value for model fit
p.glm <- function(model){
p <- pchisq(model$deviance, model$df.residual, lower.tail = FALSE)
p.format <- ifelse(
p > 0.001, paste0("= ", round(p, 3)), "< 0.001"
)
return(p.format)
}
```
Out of the initially proposed eleven explanatory variables, the univariate models suggested that water deficit (WDF) explained the highest deviance (D^2^ = 88.63%) for species richness in Morni Hills (@supptbl-primary-var). On the other hand, the terrain ruggedness index (TRI) appeared to be the most important predictor of species richness in Chail WLS (@supptbl-primary-var). In the case of Churdhar WLS, AET explained the highest deviance in species richness (D^2^ = 94.59%). When all sites are considered together, the net primary productivity (NPP) emerged as the important univariate predictor of species richness across the full elevational gradient (@supptbl-primary-var). It explained about 46% of the total variation in species richness. Water deficit (WDF), terrain ruggedness index (TRI), actual evapotranspiration (AET), and net primary productivity (NPP) were found to be the primary explanatory variables for lower (Morni Hills), intermediate (Chail WLS), upper (Churdhar WLS), and full elevational gradient (All Sites), respectively (@fig-primary-var).
```{r fig.width=7, fig.height=5}
#| label: fig-primary-var
#| fig-cap: Variation in percent deviance-squared (D^2^) for identified primary environmental variables across lower (Morni), intermediate (Chail), higher (Churdhar) and full (All) elevational gradient in Western Himalayas. The highest deviance-squared was observed for water deficit (WDF) in Morni Hills, terrain ruggedness index (TRI) in Chail WLS, actual evapotranspiration (AET) in Churdhar and net primary productivity (NPP) across full elevational gradient (All Sites).
compare.primary.var <- function(env.var){
data.frame(
Variable = env.var,
Morni = glm(paste0("S ~ ", env.var) |> as.formula(),
family = "poisson", data = site_morni) |> d2.glm(),
Chail = glm(paste0("S ~ ", env.var) |> as.formula(),
family = "poisson", data = site_chail) |> d2.glm(),
Churdhar = glm(paste0("S ~ ", env.var) |> as.formula(),
family = "poisson", data = site_churdhar) |> d2.glm(),
All = glm(paste0("S ~ ", env.var) |> as.formula(),
family = "poisson", data = site_all) |> d2.glm()
)
}
bind_rows(
compare.primary.var("WDF"),
compare.primary.var("TRI"),
compare.primary.var("AET"),
compare.primary.var("NPP")
) |>
pivot_longer(cols = -Variable, names_to = "Site", values_to = "y") |>
mutate(Site = factor(Site, c("Morni", "Chail", "Churdhar", "All"))) |>
ggplot(aes(x = Site, y = y, fill = Variable)) +
geom_bar(stat = "identity", position = "dodge", width = 0.8) +
geom_text(
aes(label = round(y, 1)), position = position_dodge(0.8),
size = 3.5, vjust = -0.35, show.legend = FALSE
) +
scale_fill_brewer(palette = "OrRd") +
ylim(0, 115) +
labs(x = "", y = expression(D^2~" (%)")) +
theme(legend.position = c(0.995, 0.99),
legend.justification = c(1, 1),
legend.direction = "horizontal",
legend.background = element_blank(),
legend.box.background = element_rect(color = "grey", linewidth = 0.25))
# ggsave("figs/fig4_primary-var.pdf", width = 7, height = 5, units = "in")
# ggsave("figs/fig4_primary-var.png", width = 7, height = 5)
```
The Spearman's correlation coefficient suggested that WDF is weakly correlated with PSE, EHM, and AET in Morni Hills (@suppfig-correlation a). Similarly, Spearman's correlation coefficient indicated that MAP, PET and TRI had weak inter-correlation in Chail WLS (@suppfig-correlation b). For Churdhar WLS, five weakly correlated explanatory variables (AET, EHM, MAP, TRI, and TSE) were selected for further modelling based on Spearman's correlation coefficient (@suppfig-correlation c). Across the entire elevational gradient, only EHM and TRI were found as the other weakly correlated predictors (@suppfig-correlation d). Out of the initially proposed eleven explanatory variables, only three environmental variables were found to be uncorrelated for Chail WLS and All Sites, while four variables were uncorrelated for Morni Hills and five for Churdhar WLS (@suppfig-correlation).
## Richness models
```{r top-model-morni-chail}
## prepare data for each site
bmod_morni <- glm(S ~ AET + WDF, family = "poisson", data = site_morni)
bmod_chail <- glm(S ~ TRI, family = "poisson", data = site_chail)
```
The top model identified for Morni Hills included actual evapotranspiration (AET) and water deficit (WDF) as predictors (@supptbl-mod-sel). This model exhibited an overall good fit (deviance = `r round(bmod_morni$deviance, 2)`, *df* = `r bmod_morni$df.residual`, *p* `r p.glm(bmod_morni)`) and explained `r round(d2.adj(bmod_morni), 2)`% of the total variation in species richness. The bivariate model with AET and WDF for Morni Hills performs better than most of the previously proposed models of plant species richness (@tbl-mod-comp). This model is jointly the best among the considered 15 previously proposed models for species richness. The model describing a quadratic relationship with potential evapotranspiration (PET) had slightly better AICc (ΔAICc = 0.01). In Chail WLS, the terrain ruggedness index (TRI) was included in the top model (@supptbl-mod-sel). The model exhibited an overall good fit (deviance = `r round(bmod_chail$deviance, 2)`, *df* = `r bmod_chail$df.residual`, *p* `r p.glm(bmod_chail)`) and explained `r round(d2.adj(bmod_chail), 2)`% of the total variation in species richness. While this univariate model with TRI performed better than many previously proposed models of plant species richness, water--energy dynamics models were better fitted to species richness in Chail WLS (@tbl-mod-comp). The best model suggested a quadratic relationship between species richness and potential evapotranspiration in Chail WLS and it was better than our univariate top model with TRI (ΔAICc = 3.82).
```{r}
#| label: tbl-mod-comp
#| tbl-cap: Comparison of the top model (shown in bold) with previously proposed models for determinants of species richness. The table shows the log-likelihood (logLik), corrected Akaike's Information Criteria (AICc), the difference in AICc (ΔAICc) and adjusted deviance-squared (D^2^~adj~) for each model. The difference in AICc was calculated against the top model (shown in bold) and negative values indicate a better model. Only models with a difference of two AICc units from the top model are presented for each site. Each model represents a generalised linear model (GLM) with Poisson distribution and the log-link function. The response variable was species richness (S). The predictor variables were actual evapotranspiration (AET), enhanced vegetation index homogeneity (EHM), elevation (ELE), mean total annual precipitation (MAP), mean annual temperature (MAT), potential evapotranspiration (PET), precipitation seasonality (PSE), temperature seasonality (TSE), terrain ruggedness index (TRI) and water deficit (WDF).
## compare top model with previous models
# source("R/06_compare-top-model.R")
read.csv("output/top_mod_comparison.csv") |>
filter(daicc < 2) |>
mutate(across(
is.double, ~ round(.x, 2)
)) |>
mutate(Model = ifelse(daicc == 0, paste0("**", Model, "**"), Model)) |>
relocate(Site) |>
rename("ΔAICc" = daicc, "D^2^~adj~ (%)" = dev.adj) |>
knitr::kable()
```
```{r top-model-churdhar-all}
bmod_churdhar <- glm(S ~ AET + MAP, family = "poisson", data = site_churdhar)
bmod_all <- glm(S ~ EHM + NPP + TRI, family = "poisson", data = site_all)
bmod_all1 <- glm(S ~ WDF + PET + I(PET^2), family = "poisson", data = site_all)
bmod_all2 <- glm(S ~ WDF + MAT + WDF:MAT, family = "poisson", data = site_all)
# site_all |> select(WDF, PET) |> cor(method = "spearman")
# car::vif(bmod_all1)
```
The top model for Churdhar WLS included actual evapotranspiration (AET) and mean total annual precipitation (MAP) as potential predictors of species richness (@supptbl-mod-sel). The model exhibited an overall good fit (deviance = `r round(bmod_churdhar$deviance, 2)`, *df* = `r bmod_churdhar$df.residual`, *p* `r p.glm(bmod_churdhar)`) and explained `r round(d2.adj(bmod_churdhar), 2)`% of the total variation in species richness for Churdhar WLS. This bivariate model with AET and MAP was better than all of the considered previous models of plant species richness (@tbl-mod-comp), and all other models differed from this model by at least four AICc units. When the full elevational gradient (All Sites) was considered, all three uncorrelated predictors, i.e., enhanced vegetation index homogeneity (EHM), net primary productivity (NPP) and terrain ruggedness index (TRI), were included in the top model (@supptbl-mod-sel). Although this model explained `r round(d2.adj(bmod_all), 2)`% deviance in species richness, it did not exhibit an overall good fit (deviance = `r round(bmod_all$deviance, 2)`, *df* = `r bmod_all$df.residual`, *p* `r p.glm(bmod_all)`). However, some models outperformed this top model (ΔAICc = 40.27 to 192.73), though this model performed better than many previously proposed models (@tbl-mod-comp). The model with the lowest AICc included WDF and quadratic terms of PET and explained about `r round(d2.adj(bmod_all1), 2)`% deviance in species richness. This model also indicated an overall good fit (deviance = `r round(bmod_all1$deviance, 2)`, *df* = `r bmod_all1$df.residual`, *p* `r p.glm(bmod_all1)`). However, the WDF and PET were highly correlated ($\rho$ = 0.95) and showed high variance inflation factor (VIF > 7), and therefore, we inferred this model as biased and overfitted. The second best model included an interaction between WDF and MAT (@tbl-mod-comp). This model explained `r round(d2.adj(bmod_all2), 2)`% deviance in species richness and indicated an adequate fit to our data (deviance = `r round(bmod_all2$deviance, 2)`, *df* = `r bmod_all2$df.residual`, *p* `r p.glm(bmod_all2)`). Further, model diagnostics and validation did not indicate any potential deviations from model assumptions. Therefore, we considered this model as best fitted to our data. Among all compared species richness models (n = 19), the climate-richness models proposed by @Francis2003 explained the highest deviance in plant species richness patterns across all four elevational gradients (@supptbl-mod-d2). Further, the water--energy dynamics model of @OBrien1993 was also equally good at explaining broad-scale patterns of plant species richness along elevational gradients. However, the model with topographic heterogeneity exhibited a good fit at lower and intermediate elevations, but failed at higher elevations and full elevational gradient (@supptbl-mod-d2).
## Best model
```{r}
bmod_morni2 <- glm(S ~ PET + I(PET^2), family = "poisson", data = site_morni)
# ## coefficient interpretation
# data.frame(
# IRR = coef(bmod_morni2) |> exp() |> round(2),
# confint(bmod_morni2) |> exp() |> round(2)
# )
# read.csv("output/site_env.csv") |>
# filter(site == "Morni") |>
# ggplot(aes(x = PET, y = S)) +
# geom_point() +
# geom_smooth(method = "glm", formula = y ~ x + I(x^2),
# method.args = list(family = "poisson"))
```
The single best model for Morni Hills suggested a quadratic relationship between potential evapotranspiration (PET) and species richness (@tbl-mod-comp). This model exhibited an overall good fit (deviance = `r round(bmod_morni2$deviance, 2)`, *df* = `r bmod_morni2$df.residual`, *p* `r p.glm(bmod_morni2)`) and explained `r round(d2.adj(bmod_morni2), 2)`% of the total variation in species richness. Further, analysis of model residuals and diagnostics indicated that the model adequately fits to our data (@suppfig-qqplot a, @suppfig-residual-plot a). Both linear and quadratic coefficients for potential evapotranspiration (PET) were negatively and significantly associated with species richness in Morni Hills (@tbl-bmod2). The linear term indicates species richness tends to decrease with an increase in PET. Specifically, for every unit increase in standard deviation (SD) of PET, species richness is expected to decrease by a factor of 0.75 (95% CI: 0.70--0.79) if all other factors remain constant. Further, the statistically significant quadratic term denotes the curvature of the relationship between species richness and PET. The negative coefficient of the quadratic term suggests the relationship may follow a concave pattern with an initial increase in species richness followed by a rapid decrease. Additionally, the confidence intervals for all predictors included zero, indicating little support for the effects of predictors on species richness in Morni Hills (@supptbl-morni-avg).
```{r}
#| label: tbl-bmod2
#| tbl-cap: Summary of the best Poisson GLM with log-link function for selected sites in the Western Himalayas. The species richness (S) was regressed against predictor variables including actual evapotranspiration (AET), mean total annual precipitation (MAP), mean annual temperature (MAT), potential evapotranspiration (PET) and water deficit (WDF). The interaction of water deficit (WDF) and mean annual temperature (MAT) was included for full elevational gradient. The table displays the estimated regression coefficients (Estimate), standard errors (SE), z-value (Z) and p-values (p) for each regression coefficient in the model.
bmod_morni2 <- glm(S ~ PET + I(PET^2), family = "poisson", data = site_morni)
bmod_chail2 <- glm(S ~ PET + I(PET^2), family = "poisson", data = site_chail)
bmod_churdhar2 <- glm(S ~ AET + MAP, family = "poisson", data = site_churdhar)
bmod_all2 <- glm(S ~ WDF + MAT + WDF:MAT, family = "poisson", data = site_all)
bind_rows(
summary(bmod_morni2)$coefficients |>
as.data.frame() |>
rownames_to_column("Parameters") |>
mutate(Site = "Morni"),
summary(bmod_chail2)$coefficients |>
as.data.frame() |>
rownames_to_column("Parameters") |>
mutate(Site = "Chail"),
summary(bmod_churdhar2)$coefficients |>
as.data.frame() |>
rownames_to_column("Parameters") |>
mutate(Site = "Churdhar"),
summary(bmod_all2)$coefficients |>
as.data.frame() |>
rownames_to_column("Parameters") |>
mutate(Site = "All")
) |>
rename("SE" = `Std. Error`, "Z" = `z value`, "p" = `Pr(>|z|)`) |>
mutate(across(is.double & !p, ~round(.x, 2))) |>
mutate(p = ifelse(p < 1e-3, "<0.001", as.character(round(p, 3))),
Parameters = gsub("I\\(|\\(|\\)", "", Parameters)) |>
relocate(Site) |>
knitr::kable(align = c("l", "r", "r", "r", "r", "r"))
```
```{r}
## coefficient interpretation
# data.frame(
# IRR = coef(bmod_chail2) |> exp() |> round(2),
# confint(bmod_chail2) |> exp() |> round(2)
# )
# read.csv("output/site_env.csv") |>
# filter(site == "Chail") |>
# ggplot(aes(x = PET, y = S)) +
# geom_point() +
# geom_smooth(method = "glm", formula = y ~ x + I(x^2),
# method.args = list(family = "poisson"))
```
The best model for Chail WLS suggested a quadratic relationship between species richness and potential evapotranspiration (PET) in Chail WLS (@tbl-mod-comp). This model exhibited an overall good fit (deviance = `r round(bmod_chail2$deviance, 2)`, *df* = `r bmod_chail2$df.residual`, *p* `r p.glm(bmod_chail2)`) and explained `r round(d2.adj(bmod_chail2), 2)`% of the total variation in species richness. Further, analysis of model assumptions indicated no significant problems (@suppfig-qqplot b), however, model residuals suggested significant quantile deviations (@suppfig-residual-plot b). In contrast to Morni Hills, the coefficient for linear PET term ($\beta$ = −0.02, SE = 0.02) was not statistically significant (*p* = 0.317). This small negative coefficient for linear term indicates that there will be little effects of PET on species richness if all other factors remain constant. However, the quadratic coefficient for PET was found to be negatively and significantly associated with species richness (@tbl-bmod2). This negative coefficient suggests that the relationship between species richness and PET follows a concave pattern, though the magnitude of curvature was lower than the Morni Hills. Taken together, these coefficient suggests a unimodal relationship between species richness and PET with a peak at intermediate levels of PET.
```{r}
# ## coefficient interpretation
# data.frame(
# IRR = coef(bmod_churdhar) |> exp() |> round(2),
# confint(bmod_churdhar) |> exp() |> round(2)
# )
```
Our top model identified for Churdhar WLS was the best model among all 15 models (@tbl-mod-comp). This bivariate model with actual evapotranspiration (AET) and mean total annual precipitation (MAP) exhibited an overall good fit (deviance = `r round(bmod_churdhar$deviance, 2)`, *df* = `r bmod_churdhar$df.residual`, *p* `r p.glm(bmod_churdhar)`). It explained `r round(d2.adj(bmod_churdhar), 2)`% of the total variation in species richness for Churdhar WLS. Further, model residuals and diagnostics analysis indicated that the model adequately fitted our data (@suppfig-qqplot c, @suppfig-residual-plot c). This model suggested that AET ($\beta$ = 0.42, SE = 0.02) was positively and significantly (*p* < 0.001) associated, whereas MAP ($\beta$ = −0.09, SE = 0.01) was negatively and significantly (*p* < 0.001) with species richness in Churdhar WLS (@tbl-bmod2). Specifically, this model suggests that for every unit increase in SD of AET, species richness is expected to increase by a factor of 1.52 (95% CI: 1.48--1.57). Similarly, for every one-unit increase in MAP, species richness is expected to decrease by a factor of 0.91 (95% CI: 0.89--0.94).
```{r}
bmod_all2 <- glm(S ~ WDF + MAT + WDF:MAT, family = "poisson", data = site_all)
## coefficient interpretation
# data.frame(
# IRR = coef(bmod_all2) |> exp() |> round(2),
# confint.default(bmod_all2) |> exp() |> round(2)
# ) |>
# ## convert in percentage
# apply(2, function(.x){(.x - 1)*100}) |>
# as.data.frame()
```
Across the full elevational gradient, the selected best model included water deficit (WDF), mean annual temperature (MAT) and their interaction (@tbl-mod-comp). This interaction model indicated a good fit to our data (deviance = `r round(bmod_all2$deviance, 2)`, *df* = `r bmod_all2$df.residual`, *p* `r p.glm(bmod_all2)`) and explained `r round(d2.adj(bmod_all2), 2)`% of the total variation in species richness. Further, model residuals and diagnostics analysis also indicated no potential problems (@suppfig-qqplot d, @suppfig-residual-plot d). The significant negative coefficient for WDF (@tbl-bmod2) suggests that the species richness is expected to decrease by 7% (95% CI: 2--13) for every unit increase in SD of WDF if MAT is held constant. Similarly, the significant positive coefficient for MAT indicated that for every unit increase in SD of MAT, the species richness is expected to increase by 22% (95% CI: 15--29) if WDF is held constant. The statistically significant coefficient for interaction between WDF and MAT (@tbl-bmod2), suggests that the effect of water deficit (WDF) on the species richness depends on the levels of mean annual temperature (MAT). The effect of water deficit on species richness decreases by 43% (95% CI: 42--45) for every unit increase of SD in mean annual temperature (@tbl-bmod2). We plotted the species richness against water deficit (WDF) with four temperature levels to visualise this interaction. The plot showed that the effect of WDF on species richness was stronger at lower temperatures as compared to higher temperatures. With increasing levels of water deficit, the species richness tended to increase at lower temperatures, whereas it tended to decrease at higher temperatures (@fig-intrplot-all).
```{r fig.width=7, fig.height=5}
#| label: fig-intrplot-all
#| fig-cap: Interaction plot showing the effect of water deficit (WDF) on plant species richness at different levels of mean annual temperature (MAT) for the full elevational gradient. The temperature levels were defined as cold (less than 10°C), cool (between 10°C to 15°C), warm (between 15°C to 20°C) and hot (more than 20°C). The smooth line was fitted using a Poisson generalised linear model (GLM) with log-link function and the 95% confidence interval is represented as shades around the predicted smooth lines.
pal_temp <- c("Cold" = "#2c7bb6", "Cool" = "#abd9e9",
"Warm" = "#fdae61", "Hot" = "#d7191c")
read.csv("output/site_env.csv") |>
filter(site == "All") |>
mutate(Temperature = case_when(
MAT < 10 ~"Cold",
between(MAT, 10, 15) ~"Cool",
between(MAT, 15, 20) ~"Warm",
MAT > 20 ~"Hot"
),
Temperature = factor(Temperature , c("Cold", "Cool", "Warm", "Hot"))) |>
ggplot(aes(x = WDF, y = S, colour = Temperature ,
fill = Temperature, shape = Temperature)) +
geom_smooth(method = "glm", method.args = list(family = "poisson"),
alpha = 0.1) +
geom_point(colour = "black", size = 3, alpha = 0.75) +
labs(x = "Water deficit (mm)",
y = "Species richness") +
scale_color_manual(values = pal_temp) +
scale_fill_manual(values = pal_temp) +
scale_shape_manual(values = c(23, 24, 22, 21)) +
theme(legend.position = c(1, 1), legend.justification = c(1, 1),
#legend.direction = "horizontal",
legend.title = element_text(size = 12),
legend.background = element_rect(fill = NA),
axis.title = element_text(colour = "black"))
# ggsave("figs/fig5_interaction.pdf", width = 7, height = 5)
# ggsave("figs/fig5_interaction.png", width = 7, height = 5)
```
## Richness mechanisms
```{r}
library(piecewiseSEM)
## read all data
site_env <- read.csv("output/site_env.csv") |>
mutate(WDF = log(WDF), MTP = MAT*MAP)
## filter data for All Sites
site_all <- bind_cols(
site_env |> filter(site == "All") |> select(S),
site_env |> filter(site == "All") |> select(-c(site, S)) |>
apply(2, scale)
)
bmod_sem <- psem(
glm(S ~ MAT + MAP + PSE + MTP + PET + NPP,
family = "poisson", data = site_all),
lm(MTP ~ MAT + TSE + MAP + PSE, data = site_all),
lm(PET ~ MAT + TSE + MAP + PSE, data = site_all),
lm(NPP ~ MAT + TSE + MAP + MTP, data = site_all)
)
```
The identified best SEM model included climatic variables (MAT, TSE, MAP, PSE and MAT×MAP), net primary productivity (NPP) as the energy variable and potential evapotranspiration (PET) representing water--energy dynamics (@supptbl-sem-mods). This model for the species richness showed an overall good fit to the observed data as indicated by the Fisher's C statistic (*C* = 13.59, *df* = 8, *p* = 0.093) and also by the Chi-square goodness-of-fit test ($\chi^2$ = 9.11, *df* = 4, *p* = 0.058). These goodness-of-fit tests indicate that we fail to reject the null hypothesis, i.e., there are no significant differences between the proposed model and observed data. In other words, our data adequately represent the proposed hypothetical causal model. The best path model revealed that the mean annual temperature (MAT), mean total annual precipitation (MAP), interaction between MAT and MAP (MAT×MAP), precipitation seasonality (PSE), net primary productivity (NPP) and potential evapotranspiration (PET) directly regulate the species richness across the entire elevational gradient (@fig-sem). On the other hand, mean annual temperature (MAT), temperature seasonality (TSE), mean total annual precipitation (MAP) and precipitation seasonality (PSE) indirectly affect the species richness. Among the climate variables, MAT, MAP and PSE have direct and indirect effects on the species richness, whereas TSE has indirect effects on species richness. Further, the effect of climatic variables appears to be mediated by net primary productivity, potential evapotranspiration and an interaction between mean annual temperature and mean total annual precipitation (@fig-sem).
```{r}
# ## function to scale
# lwd01 <- function(x){x/max(x)}
#
# bmod_sem |>
# coefs() |>
# select(-9) |>
# mutate(lwd = lwd01(abs(Std.Estimate))) |>
# mutate(across(is.double & !P.Value, ~round(.x, 2))) |>
# mutate(p.signif = case_when(
# P.Value <= 1e-3 ~"***",
# P.Value <= 1e-2 & P.Value > 1e-3 ~"**",
# P.Value <= 0.05 & P.Value > 1e-2 ~"*",
# P.Value >= 0.05 ~""
# )) |>
# mutate(est.label = paste0('"', Std.Estimate, p.signif, '"')) |>
# mutate(linecol = ifelse(Std.Estimate > 0, '"#0072b2"', '"#d55e00"'),
# linetyp = ifelse(Std.Estimate > 0, '"solid"', '"dashed"')) |>
# mutate(sempath = paste0(
# Predictor, " -> ", Response, "[label=", est.label,
# ", penwidth=", lwd*5,
# ", style=", linetyp,
# ", color = ", linecol,
# "]"
# )) |>
# select(sempath)
```
![Final path model illustrating the direct and indirect environmental determinants of plant species richness. The model highlights the direct and indirect effects of mean annual temperature (MAT), temperature seasonality (TSE), precipitation seasonality (PSE), mean total annual precipitation (MAP), net primary productivity (NPP), the interaction between mean annual temperature and mean total annual precipitation (MAT×MAP) and potential evapotranspiration (PET) on the species richness. The standardised path coefficients and associated significance level indicate the strength and direction of each relationship. Each path coefficient represents the expected change in the standard deviation of response with a one-unit standard deviation change in the predictor. Solid blue arrows represent the positive effects, whereas negative effects are represented by dashed brown arrows. The width of each arrow is proportional to the standardised path coefficients. The significance levels represented as `***`, `**` and `*` correspond to *p*-values of <0.001, <0.01 and <0.05, respectively. The goodness of fit was assessed using the chi-squared test and Shipley's test of directed separation based on Fisher's C statistic.](figs/fig6_bmod-sem){#fig-sem}
```{r}
# percent.effect <- function(coef.value, se){
# est <- (exp(coef.value) - 1)*100
# ci.upper <- (exp(coef.value + 2*se) - 1)*100
# ci.lower <- (exp(coef.value - 2*se) - 1)*100
# data.frame(est, ci.lower, ci.upper) |>
# round(2)
# }
#
# ## interpret coefficients
# rbind(
# MAP = percent.effect(-1.08, 0.16), ## MAP
# MAT = percent.effect(-1.65, 0.20), ## MAT
# MATMAP = percent.effect(1.11, 0.13), ## MAT*MAP
# PET = percent.effect(-0.77, 0.28), ## PET
# NPP = percent.effect(0.40, 0.08), ## NPP
# PSE = percent.effect(0.14, 0.04) ## PSE
# )
```
The path analysis revealed that the mean total annual precipitation ($\beta$ = −1.08, *p* < 0.001) and the mean annual temperature ($\beta$ = −1.65, *p* < 0.001) had significant negative direct effects on species richness across the elevational gradient (@tbl-sem-coefs). These negative coefficients suggest that species richness is expected to decrease by 66% (95% CI: 53--75) for every unit increase in the standard deviation of MAP if all other variables held constant. Similarly, for every unit increase in the standard deviation of MAT, the species richness is expected to decrease by 81% (95% CI: 71--87), holding all other variables constant. The significant positive coefficient for MAT×MAP interaction indicate that the effects of precipitation on species richness depends on the temperature levels. With increased precipitation the species richness tends to increase at higher temperatures (more than 15°C) but decreases at lower temperatures (less than 15°C). The significant positive magnitude ($\beta$ = 1.11, *p* < 0.001) of interaction coefficient suggests that the effect of MAP on species richness increases by 203% (95% CI: 134--293) for every unit increase in SD of mean annual temperature. Further, the PET had a significant negative direct effect, whereas NPP and PSE significantly positively affected species richness. The species richness is expected to decrease by 53.7% (95% CI: 19--73) for every unit increase in the SD of PET, holding other variables constant. Similarly, the species richness is expected to increase by 49% (95% CI: 27--75) for every unit increase in SD of NPP, whereas it increases by 15% (95% CI: 6--24) for every unit increase in SD of precipitation seasonality (@tbl-sem-coefs).
```{r}
#| label: tbl-sem-coefs
#| tbl-cap: Summary of estimated path coefficients from structural equation modelling for species richness along the elevational gradient. The table displays the standardised path coefficient (Std.Estimate), unstandardised path coefficient (Estimate), standard error (SE), degrees of freedom (df), critical z-scores (Z), and p-values (p) for each path from independent (Predictor) to dependent (Response) variable in the model. The path coefficients represent the strength and direction of the relationships between variables. The standardised path coefficients (Std.Estimate) represent the expected change in dependent variable as a function of the change in independent variable in standard deviation (SD) units.
bmod_sem |>
coefs() |>
select(-9) |>
mutate(P.Value = ifelse(P.Value < 1e-3, "<0.001", as.character(round(P.Value, 3)))) |>
mutate(across(where(is.double) & !P.Value, ~round(.x, 2))) |>
mutate(Predictor = ifelse(Predictor == "MTP", "MAT×MAP", Predictor),
Response = ifelse(Response == "MTP", "MAT×MAP", Response)) |>
rename("SE" = Std.Error, "df" = DF, "Z" = Crit.Value, "p" = P.Value) |>
select(Predictor, Response, Std.Estimate, Estimate, SE, df, Z, p) |>
arrange(desc(Response), Predictor) |>
knitr::kable(align = c("l", "l", "r", "r", "r", "r", "r", "r"))
```
In addition to direct effects, the mean total annual precipitation (MAP), mean annual temperature (MAT), their interaction (MAT×MAP) and precipitation seasonality (PSE) influence species richness through their indirect effects mediated by NPP, PET and MAT×MAP (@fig-sem). These effects captured the influence of each variable on species richness mediated through other variables in the path model. The indirect effects of MAT on species richness are mediated through its significant negative influence on the NPP ($\gamma$ = −0.90, *p* < 0.001) and significant positive influence on MAT×MAP ($\gamma$ = 2.20, *p* < 0.001) and PET ($\gamma$ = 0.68, *p* < 0.001). Similarly, the indirect effects of MAP on species richness are mediated through its significant positive influence on the MAT×MAP ($\gamma$ = 0.67, *p* < 0.001) and significant negative influence on NPP ($\gamma$ = −1.44, *p* < 0.001) and PET ($\gamma$ = −0.23, *p* < 0.001). Further, the interaction between MAT and MAP (MAT×MAP) showed a significant indirect effect on species richness mediated through a strong positive influence on NPP ($\gamma$ = 1.02, *p* < 0.001). Similarly, the indirect effects of precipitation seasonality (PSE) on species richness are mediated through its significantly positive influence on PET ($\gamma$ = 0.06, *p* = 0.010) and significantly negative influence on MAT×MAP ($\gamma$ = −0.24, *p* = 0.022). Further, the temperature seasonality (TSE) indicated significant indirect effects on species richness that are mediated through NPP, PET and MAT×MAP (@fig-sem). The temperature seasonality indirectly affects the species richness through its significantly positive effect on PET ($\gamma$ = 0.05, *p* = 0.017) and significantly negative effect on NPP ($\gamma$ = −0.60, *p* < 0.001) and MAT×MAP ($\gamma$ = −0.50, *p* < 0.001).
```{r}
## function to calculate direct and indirect effects
calc.effs <- function(sem_mod, y){
## extract standardised coefs from sem model
df <- coefs(sem_mod) |> select(Predictor, Response, Std.Estimate)
## filter direct effect estimates
df_direct <- df |>
filter(Response == y) |>
rename("Direct" = Std.Estimate) |>
select(-Response)
## filter indirect effect estimates
df_indirect <- df |> filter(Response != y)
## calculate indirect estimates
left_join(
df_indirect, df_direct, by = join_by(Response == Predictor)
) |>
mutate(indirect_estimate = Std.Estimate * Direct) |>
group_by(Predictor) |>
summarise(Indirect = sum(indirect_estimate)) |>
full_join(df_direct, by = join_by(Predictor)) |>
mutate(Total = Indirect + Direct) |>
select(Predictor, Direct, Indirect, Total)
}
```
```{r fig.width=7, fig.height=5}
#| label: fig-sem-effects
#| fig-cap: Direct and indirect effects of environmental variables on plant species richness. The effect estimates are derived from the standardised path coefficients and represent the expected change in the standard deviation of species richness as a function of unit change in the standard deviation of the predictor variable.
bmod_sem |>
calc.effs("S") |>
mutate(Predictor = ifelse(Predictor == "MTP", "MAT×MAP", Predictor)) |>
pivot_longer(cols = -c(Predictor, Total), names_to = "Effect",
values_to = "Estimate") |>
ggplot(aes(x = Predictor, y = Estimate, fill = Effect)) +
geom_bar(stat = "identity", width = 0.7) +
geom_hline(yintercept = 0, linetype = 3) +
geom_text(aes(label = round(Estimate, 2)),
position = position_stack(vjust = 0.5),
size = 3.5, show.legend = FALSE) +
labs(x = "Predictor", y = "Standardised estimate") +
scale_fill_manual(values = c("Direct" = "#9ecae1", "Indirect" = "#deebf7")) +
theme_bw(base_size = 14) +
theme(legend.position = c(0.98, 0.98),
legend.justification = c(1, 1),
legend.background = element_rect(fill = NA),
panel.grid = element_blank())
# ggsave("figs/fig7_sem-effects.pdf", width = 7, height = 5)
# ggsave("figs/fig7_sem-effects.png", width = 7, height = 5)
```
The path analysis suggested that the climatic variables, except temperature seasonality (TSE), showed both direct and indirect effects on species richness (@fig-sem-effects). The temperature seasonality indicated only indirect effects, whereas net primary productivity (NPP) and potential evapotranspiration (PET) depicted only direct effects on species richness. The NPP showed direct positive, whereas PET showed direct negative effects on species richness. However, the effects of PET are more substantial than the NPP. Further, mean annual temperature (MAT) had the strongest direct and indirect effects on species richness among all environmental variables. However, the total net effects are strongest for the interaction between MAT and MAP (2.04 + 0.75 = 2.79), followed by the mean total annual precipitation (−1.97 + 0.63 = −1.34), precipitation seasonality (0.26 − 0.56 = −0.30) and mean annual temperature (−3.02 + 2.87 = −0.15). All climatic variables (MAT, TSE, MAP, and PSE) had a net negative effect on species richness whereas the MAT×MAP interaction had a strong net positive effect on plant species richness (@fig-sem-effects).
# Discussion
The present study aimed to explore the determinants of plant species richness along elevational patterns. Our results suggested that the water deficit (WDF) was important at the lower elevational gradient, the terrain ruggedness index (TRI) was important at the intermediate elevational gradient, actual evapotranspiration (AET) was important at the higher elevational gradient, and net primary productivity (NPP) was important across the entire elevational gradient for explaining variation in plant species richness (Question 1). A univariate model with TRI was identified for intermediate elevational gradient, a bivariate model with AET and WDF was identified for lower elevational gradient, a bivariate model with AET and mean total annual precipitation (MAP) was identified for higher elevational gradient, and the model for entire elevational gradient included NPP, enhanced vegetation index homogeneity (EHM) and TRI (Question 2). The identified model for higher elevational gradient performed best whereas the model for lower elevational gradient was second best among the compared models (Question 3). Further, our results highlighted that plant species richness is directly and indirectly influenced by climate, energy, and water–energy dynamics across the elevational gradients (Question 4). Overall, our findings contribute to a better understanding of the determinants of plant species richness along elevational gradients.
The most important finding of the present study is the consistent relationship of species richness with climatic variables representing water--energy dynamics across different elevational gradients (@supptbl-mod-d2). While the variables measuring energy and water availability differed across elevational gradients, all models included variables representing energy and water availability. Since thermal energy determines the availability of liquid water, the variables representing an interaction between water--energy availability are important determinants of species richness [@OBrien2006; @Stephenson1990]. These environmental variables have also been previously suggested as major determinants of species richness [@Currie1987; @Francis2003; @OBrien1993; @Stephenson1990].
Consistent with earlier studies [@OBrien1993; @Bhatta2021; @Vetaas2019], the potential evapotranspiration (PET) exhibited a quadratic relationship with species richness at lower and intermediate elevational gradients. This relationship suggests that species richness is influenced by both linear and non-linear effects of evapotranspiration, indicating potentially complex ecological dynamics. With an increase in PET, the species richness initially increases to reach a maximum and then starts decreasing at higher values of PET. Since PET measures the amount of surface water loss under sufficient water availability, it represents a combination of thermal energy and water availability. Higher PET values indicate higher thermal energy leading to water scarcity, whereas lower PET values indicate lower thermal energy leading to water freezing [@OBrien2006]. Thus, optimal thermal energy and water availability combination support maximum species richness. This explanation also applies to the decreasing species richness at higher elevational gradient, which can attributed to water scarcity due to lower thermal energy. This observation aligns with previous studies highlighting the importance of water--energy dynamics in determining broad-scale species richness of plants [@Bhatta2021; @Thakur2022; @Tolmos2022; @Vetaas2019]. However, the interaction between thermal energy (mean annual temperature) and water availability (water deficit) was more important for determining species richness across the full elevational gradient. The relationship between species richness and temperature depends on the levels of water deficit levels. Similarly, the relationship between species richness and water deficit depended on the temperature levels. These observations agree with richness-climate models of species richness, as @Francis2003 described, highlighting the joint effects of energy and water availability. It appears that mean annual temperature becomes more important than the PET as a measure of environmental energy for determining species richness at larger scales [@Francis2003]. Thus, our results indicate that climate is consistently related to species richness across the elevational gradient.
Our second important result highlights the direct and indirect effects of climatic variables on species richness across the full elevational gradient. Our analysis suggested species richness is shaped by both direct and indirect effects of climatic variables except temperature seasonality. However, the direct effects of climatic variables (MAT, MAP and MAT×MAP) were stronger than their indirect effects on species richness. This observation suggests that the climatic variables may regulate species richness by directly influencing the metabolism and physiology of organisms. Since more species can tolerate warm--wet climates, species richness is higher in warm--wet environments than the cold--dry climates [@Currie2004; @Hawkins2003]. The higher species richness at intermediate elevations (1300--1500 m) and the significant direct effects of climatic variables support the *climatic tolerance hypothesis* for broad-scale patterns of species richness. However, our results indicated little support for the *metabolic theory of ecology* as the direct effects of mean annual temperature were strongly negative on species richness [@Price2010; @Wang2009]. Contrary to the predictions of this theory, species richness decreased with increasing temperature in reduced water availability. Thus, the effects of temperature depended on the water availability. Therefore, it is unlikely that species richness is determined by temperature or precipitation separately.
Climate can indirectly influence species richness by controlling the water--energy availability across the elevational gradients [@OBrien1993; @OBrien2006]. This observation is supported by the significant negative relationship between species richness and potential evapotranspiration (PET) found in this study. The high levels of thermal energy led to high potential evapotranspiration (PET), which reduces the availability of liquid water (drought). In contrast, low levels of thermal energy led to low PET, which also results in reduced availability of liquid water (frozen water at higher elevations). Thus, our study supports the *water--energy dynamics hypothesis*, which posits that intermediate energy (thermal) levels result in higher water availability, which supports more species through biological activity [@OBrien1993; @OBrien2006]. This water--energy dynamics (WED) model has found support from recent studies on the elevational pattern of species for plants [@Bhatta2021; @Thakur2022; @Tolmos2022; @Vetaas2019].
Alternatively, climate can indirectly regulate species richness by influencing energy availability [@Currie2004; @Hawkins2003; @Jiang2022; @Wright1983]. We observed a direct positive relationship between species richness and net primary productivity (NPP) across the full elevational gradient. A positive relationship between species richness and energy variables like NPP has been previously observed across broad scales [@Bhatta2021; @Jiang2022]. One proposed mechanism to explain this species-energy relationship is called the *more individuals hypothesis* [@Srivastava1998], which states that higher energy availability can support a greater number of individuals leading to higher number of species with viable population sizes. Thus, energy availability can maintain species richness by preventing extinction due to smaller population size [@Wright1983]. This explanation of species richness based on energy availability has sometimes been referred to as the *species-energy hypothesis* [@Wright1983]. Our results apparently support this hypothesis, though energy can control species richness through multiple mechanisms [@Evans2005]. However, the effects of NPP were weaker than the environmental variables representing joint effects of water--energy availability (@fig-sem-effects). This weak magnitude of NPP effects indicates that NPP is not a primary variable controlling species richness at larger scales. Thus, our findings align with earlier studies showing little evidence for this hypothesis [@Adler2011; @Gaston2000; @Storch2018].
One notable finding of the present analysis is that environmental heterogeneity was not included in our identified models of species richness. We used enhanced vegetation index homogeneity index (EHM) to measure vegetation heterogeneity and terrain ruggedness index (TRI) to measure topographic heterogeneity. While both EHM and TRI generally increased with elevation, neither metric emerged as a significant predictor of species richness in our final models. These results suggest that the role of heterogeneity in shaping richness patterns depend on other factors. Alternatively, these metrics may not be sufficient to capture the environmental heterogeneity, or these are correlated with climatic variables. Thus, our study did not indicate support for the *heterogeneity richness hypothesis*, which posits that regions with higher heterogeneity tend to have more species due to increased habitat diversity [@Stein2014]. However, the topographic heterogeneity seems to regulate species richness at intermediate elevational gradients where water and energy are sufficiently available. Overall, our results suggest that environmental heterogeneity may play an important role in regions where climatic conditions are optimised, but it can not be the sole predictor of species richness at larger scales. Consistent with previous observations [@Field2009], our study indicated that climatic factors are more important than environmental heterogeneity for species richness, at least in the case of plants.
Our models indicated that energy (NPP), topographic heterogeneity (TRI), and water–energy dynamics (AET and WDF) were the primary environmental variables associated with species richness. These variables have been previously identified as the major environmental factors influencing plant species richness [@Hawkins2003; @Stein2014]. However, the importance of these variables varied with the extent and position of elevational gradients, highlighting the importance of spatial scale for ecological processes [@Field2009]. The water–energy dynamics appeared to be more important at lower and higher elevational gradients, whereas the topographic heterogeneity is important at intermediate elevational gradients. This observation suggests that liquid water availability is an important driver of plant species richness [@OBrien2006]. When the demand for liquid water is met (e.g., at intermediate elevations), topographic heterogeneity becomes an important determinant of plant species richness. Energy availability seemed to influence species richness across the full elevational gradient primarily. Thus, the influence of primary environmental factors can vary with the position and extent of the elevational gradients.
While our study has global implications for understanding determinants of species richness at larger scales, it is not free from limitations. First, we used the range interpolation method to estimate species richness [@Grytnes2002], which has been criticised for its assumption of continuous species distribution within the geographical range and biased estimation of species richness [@Hu2017]. Second, the environmental predictors used in this study are secondarily derived using statistical algorithms and scaling [@Karger2017], which might not capture the actual environment in complex environments such as Himalayan mountains. Third, the present study was based on the data compiled from the published flora, which can not be considered free from bias. Specifically, incomplete flora or biased estimation of distribution ranges can influence the observed patterns of species richness. Fourth, the results of this study can be biased because it did not considered the potential statistical non-independence and spatial autocorrelation introduced due to range interpolation and elevational gradient. Despite these known limitations, the range interpolation method and data from published floras have been used for exploring ecological and biogeographical patterns [@Bhatta2021; @Qian2022; @Rana2019ecs]. Overall, our findings highlight the importance of direct and indirect effects of climatic variables and our results agree well with the general climate-richness model proposed by @Francis2003 in determining species richness along elevational gradients. Future investigations should consider the field data with in-situ environmental variables across spatial scales to improve our understanding of the determinants and mechanisms underlying elevational patterns of species richness. Furthermore, we must be cautious while generalising these findings to other regions or ecosystems because ecological processes and mechanisms may vary with spatial-temporal scales.
# Conclusions
The present study revealed that climatic factors combining energy and water availability are important determinants of plant species richness at broader spatial scales. Our findings extend previous research by highlighting the direct, interaction, and indirect effects of climatic variables on species richness. While determinants of species richness may vary on different ecological scales, our study indicated an interplay of climatic, energy, and water-related variables as the primary determinant of species richness across elevational gradients. The significant effects of temperature, precipitation, net primary productivity, water deficit, and potential evapotranspiration highlight the multifaceted nature of plant species richness patterns. The observed interaction effects emphasise the need to consider the synergistic effects of energy (heat) and water variables when studying the patterns and processes of plant species richness. These insights contribute to a more holistic understanding of the mechanisms shaping plant species richness in complex ecosystems like the Himalayas. By unravelling the relationship between environmental factors and species richness, our study provides a foundation for developing strategies to conserve and manage the biodiversity in mountainous regions under global environmental change.
# Abbreviations {.unnumbered}
**AET:** Actual Evapotranspiration; **AIC:** Akaike's Information Criteria; **AICc:** Corrected Akaike's Information Criteria; **EHM:** Enhanced Vegetation Index Homogeneity Index; **GBIF:** Global Biodiversity Information Facility; **GLM:** Generalised Linear Model; **MAP:** Mean Total Annual Precipitation; **MAT:** Mean Annual Temperature; **NPP:** Net Primary Productivity; **PET:** Potential Evapotranspiration; **POWO:** Plants of the World Online; **PSE:** Precipitation Seasonality; **S:** Species Richness; **SD:** Standard Deviation; **SE:** Standard Error; **SEM:** Structural Equation Modelling; **SOC:** Soil Organic Carbon; **TRI:** Terrain Ruggedness Index; **TSE:** Temperature Seasonality; **WCVP:** World Checklist of Vascular Plants; **WDF:** Water Deficit; **WED:** Water–Energy Dynamics; **WLS:** Wildlife Sanctuary
# Declarations {.unnumbered}
**Ethics approval and consent to participate** Not applicable
**Consent for publication** Not applicable
**Availability of data and material** The data and `R` codes that support the findings of this study are available from figshare repository <https://figshare.com/s/3728be3aa8153653da93>. We will publish to figshare with DOI after acceptance.
**Competing interests** The authors declare that they have no competing interests
**Funding** This work was supported by the University Grants Commission (UGC), Government of India, New Delhi in the form of Senior Research Fellowships to Abhishek Kumar [507/ (OBC) (CSIR-UGC NET DEC. 2016)], Meenu Patil [492/ (CSIR-UGC NET JUNE 2017)], and Pardeep Kumar [443/ (CSIR-UGC NET DEC. 2017)].
**Authors' contributions**
```{r eval=TRUE}
auth.cont <- function(author){
df_auth <- read.csv("credit_author.csv") |>
select(Contribution, all_of(author)) |>
drop_na()
paste0(df_auth[, 1], " (", df_auth[, 2], ")", collapse = ", ")
}
```
**Abhishek Kumar:** `r auth.cont("AK")`. **Meenu Patil:** `r auth.cont("MP")`. **Pardeep Kumar:** `r auth.cont("PK")`. **Anand Narain Singh:** `r auth.cont("ANS")`.
**Acknowledgements** The authors are grateful to the Principal Chief Conservator of Forests (PCCF) of the Haryana Forest Department and the Himachal Pradesh Forest Department for kindly permitting them to visit the selected protected areas. We are also thankful to the Chairperson, Department of Botany, Panjab University, Chandigarh, for providing all the necessary facilities required for the work. We want to express our heartfelt gratitude to Sabir Hussain, Alok Sharma, Kamal Rana, Pravesh Bhardwaj, and Sukhveer Cheema for their invaluable assistance and support during the fieldwork phase of this research. Additionally, we appreciate the Forest Department of Himachal Pradesh staff and authorities, who facilitated the logistics and permits required for the fieldwork. We acknowledge the constructive feedback of two anonymous reviewers on our previous draft.
\newpage
# Supplementary Information {.unnumbered}
```{r}
## prepare data for each site
site_morni <- read.csv("output/site_env.csv") |>
filter(site == "Morni") |>
select(-site) |>
mutate(across(!S, ~scale(.x)))
site_chail <- read.csv("output/site_env.csv") |>
filter(site == "Chail") |>
select(-site) |>
mutate(PET = sqrt(PET)) |>
mutate(across(!S, ~scale(.x)))
site_churdhar <- read.csv("output/site_env.csv") |>
filter(site == "Churdhar") |>
select(-site) |>
mutate(across(!S, ~scale(.x)))
site_all <- read.csv("output/site_env.csv") |>
filter(site == "All") |>
select(-site) |>
mutate(WDF = log(WDF)) |>
mutate(across(!S, ~scale(.x)))
```
:::{#supptbl-primary-var}
```{r}
## function to find primary variable -----
primary.var <- function(site_x){
## vector of predictors
varall <- names(site_x)[-1]
## data list to collect
datalist <- list()
## for loop for all variables
for (i in 1:length(varall)){
## formula for model
fm <- paste0("S ~ ", varall[i]) |> as.formula()
## poisson model
mod <- glm(fm, family = "poisson", data = site_x)
## model parameters
datalist[[i]] <- data.frame(
Variable = varall[i],
d2 = (1 - summary(mod)$deviance / summary(mod)$null.deviance)*100
)
}
## combine results
do.call(dplyr::bind_rows, datalist)
}
## find primary variable
primary.var(site_morni) |>
rename("Morni" = d2) |>
left_join(
primary.var(site_chail) |> rename("Chail" = d2)
) |>
left_join(
primary.var(site_churdhar) |> rename("Churdhar" = d2)
) |>
left_join(
primary.var(site_all) |> rename("All" = d2)
) |>
arrange(Variable) |>
flextable() |>
colformat_double(digits = 2) |>
bold(~Morni == max(Morni), c(1, 2)) |>
bold(~Chail == max(Chail), c(1, 3)) |>
bold(~Churdhar == max(Churdhar), c(1, 4)) |>
bold(~All == max(All), c(1, 5)) |>
add_footer_lines(
as_paragraph("The species richness (S) was regressed against each explanatory variable using Poisson GLM with a log-link function. The values represent the estimated deviance-squared (D", as_sup('2'), ") in percent units and higher values indicate a better model fit. The variables with maximum D", as_sup('2'), " values are highlighted with bold text.")
) |>
fontsize(size = 9, part = "footer") |>
flextable::width(width = 5.7/5)
```
Summary of primary variable selection for explaining species richness at lower (Morni), intermediate (Chail), higher (Churdhar) and full (All) elevational gradient.
:::
\newpage
:::{#supptbl-mod-sel}
```{r}
options(na.action = "na.fail")
mods_morni <- glm(S ~ AET + PSE + EHM + WDF,
family = "poisson", data = site_morni) |>
MuMIn::dredge() |>
subset(delta < 4) |>
tibble() |>
mutate(AET = ifelse(is.na(AET), NA, "AET"),
EHM = ifelse(is.na(EHM), NA, "EHM"),
PSE = ifelse(is.na(PSE), NA, "PSE"),
WDF = ifelse(is.na(WDF), NA, "WDF")) |>
unite(col = "Model", AET:WDF) |>
mutate(Model = gsub("_NA", "", Model),
Model = paste0("S ~ ", gsub("_", " + ", Model))) |>
select(-"(Intercept)")
mods_chail <- glm(S ~ MAP + PET + TRI,
family = "poisson", data = site_chail) |>
MuMIn::dredge() |>
subset(delta < 4) |>
tibble() |>
mutate(MAP = ifelse(is.na(MAP), NA, "MAP"),
PET = ifelse(is.na(PET), NA, "PET"),
TRI = ifelse(is.na(TRI), NA, "TRI")) |>
unite(col = "Model", MAP:TRI) |>
mutate(Model = gsub("NA_|_NA", "", Model),
Model = paste0("S ~ ", gsub("_", " + ", Model))) |>
select(-"(Intercept)")
mods_churdhar <- glm(S ~ AET + EHM + MAP + TRI + TSE,
family = "poisson", data = site_churdhar) |>
MuMIn::dredge() |>
subset(delta < 4) |>
tibble() |>
mutate(AET = ifelse(is.na(AET), NA, "AET"),
EHM = ifelse(is.na(EHM), NA, "EHM"),
MAP = ifelse(is.na(MAP), NA, "MAP"),
TRI = ifelse(is.na(TRI), NA, "TRI"),
TSE = ifelse(is.na(TSE), NA, "TSE")) |>
unite(col = "Model", AET:TSE) |>
mutate(Model = gsub("_NA", "", Model),
Model = paste0("S ~ ", gsub("_", " + ", Model))) |>
select(-"(Intercept)")
mods_all <- glm(S ~ EHM + NPP + TRI,
family = "poisson", data = site_all) |>
MuMIn::dredge() |>
subset(delta < 4) |>
tibble() |>
mutate(EHM = ifelse(is.na(EHM), NA, "EHM"),
NPP = ifelse(is.na(NPP), NA, "NPP"),
TRI = ifelse(is.na(TRI), NA, "TRI")) |>
unite(col = "Model", EHM:TRI) |>
mutate(Model = paste0("S ~ ", gsub("_", " + ", Model))) |>
select(-"(Intercept)")