Full text
49,705 characters
· extracted from
preprint-html
· click to expand
Invisible people: Exploring how well remote-sensed datasets reveal the distribution of forest-proximate populations | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Invisible people: Exploring how well remote-sensed datasets reveal the distribution of forest-proximate populations Mirindra Rakotoarisoa , Julia P. G. Jones , View ORCID Profile O. Sarobidy Rakotonarivo , Manoa Rajaonarivelo , View ORCID Profile Dominik Schüßler doi: https://doi.org/10.1101/2024.09.23.614649 Mirindra Rakotoarisoa 1 École Supérieure des Sciences Agronomiques, Université d’Antananarivo , Madagascar Find this author on Google Scholar Find this author on PubMed Search for this author on this site Julia P. G. Jones 2 School of Natural Sciences, College of Environmental Sciences and Engineering, Bangor University , UK Find this author on Google Scholar Find this author on PubMed Search for this author on this site O. Sarobidy Rakotonarivo 1 École Supérieure des Sciences Agronomiques, Université d’Antananarivo , Madagascar Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for O. Sarobidy Rakotonarivo Manoa Rajaonarivelo 1 École Supérieure des Sciences Agronomiques, Université d’Antananarivo , Madagascar Find this author on Google Scholar Find this author on PubMed Search for this author on this site Dominik Schüßler 3 Institute of Biology and Chemistry, University of Hildesheim , Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Dominik Schüßler For correspondence: dominik.schuessler{at}posteo.de Abstract Full Text Info/History Metrics Preview PDF Abstract Accurate information on the location and density of people living at the forest frontier is vital for effective and equitable forest conservation. We compare the location of settlements and estimated population density from three global-scale, remote-sensed datasets (World Settlement Footprint 2015, Open Buildings, WorldPop) with a fine-scale, manually-derived dataset of 3,136 human settlements, of which 95% had fewer than 150 households. The study region is located in north-eastern Madagascar, contains three protected areas and the largest unprotected block of humid forest of the island. The Open Buildings dataset detected a much higher proportion (94%) of settlements than did World Settlement Footprint (15%). Population density from WorldPop matches poorly with that estimated from our manually-derived dataset. The accuracy of all three datasets is worse in more remote, forested areas, further away from basic infrastructure. Open Buildings appears to best reveal the distribution of low density scattered populations in forested areas. However, further testing in other climatic regions is still needed. Making good use of appropriate remote-sensed data could revolutionize the inclusion of local communities in conservation policy and practice, improve the quality of inference in conservation research, particularly in times of a planned expansion of the global protected area network. Introduction Land use change is a major driver of biodiversity decline ( IPBES, 2019 ; Jaureguiberry et al., 2022 ). Subsistence farming, mostly carried out by poor people living in scattered settlements along the forest frontier, is an important driver of land use change ( Foley et al., 2005 ), especially in Africa ( Curtis et al., 2018 ). Ensuring that biodiversity conservation goals can be met without exacerbating poverty of these often already politically marginalized people ( Fisher & Christopher, 2007 ), therefore requires high-quality information on the distribution of populations in these frontier regions. Unfortunately, the location and population density of forest-proximate people is poorly known and often badly captured by existing datasets including national gazetteers ( Newton et al., 2020 ; Thomson et al., 2022 ) meaning many people are essentially invisible to conservation policy and practice ( Poudyal et al 2016 ). Understanding the distribution of human populations is needed to ensure conservation policy and practice is appropriately participatory and does not harm local people. A major expansion of area-based conservation measures is underway, following the agreement by nearly 200 countries to conserve 30% of the earth for nature by 2030 (CBD, 2022). Policymakers need to consider where people already live to reduce the opportunity costs, and potential conflict, associated with protected area establishment ( Adams et al., 2010 ). The importance of genuine consultation with local people during the process of establishing new protected areas is recognized (Pimbert & Petty, 1997; Dawson et al., 2017 ), and requires information on the distribution of settlements. Conservation researchers also need data on the density and distribution of human populations for a variety of purposes. This includes the selection of appropriate controls for exploring the impact of area-based conservation interventions on conservation outcomes (e.g. species populations; Wauchope et al., 2022 , or tree cover loss; Desbureaux, 2021 ), or extrapolation from small-scale studies about the opportunity costs of conservation to the landscape scale, whether these costs arise through restrictions on agricultural expansion ( Poudyal et al., 2018 ), or wildlife-human interactions ( Drake et al., 2020 ). A suite of open access global-scale datasets provide information on the distribution of human settlements. These are for example the World Settlement Footprint 2015 ( Marconcini et al., 2020 ), the Open Buildings dataset ( Sirko et al., 2021 ) or the WorldPop population density map ( Tatem, 2017 ). However, several factors can limit the detectability of people living in forest-frontier regions including the often small size of settlements and potentially the lack of contrast between building materials and the surrounding environment ( Ji et al., 2020 ; Van Den Hoek & Friedrich, 2021 ). There are few, if any, studies which explicitly test how well these datasets perform at detecting the distribution of forest-proximate people. Detailed manually-derived data on the distribution of hamlets, villages and towns in the north-east of Madagascar (see Schüßler et al., 2020 ) offer an opportunity to test the reliability of global-scale remote-sensed datasets at capturing the density and distribution of human populations in a frontier area of great importance for biodiversity conservation. Madagascar’s highly threatened biodiversity is mostly located in the rapidly shrinking forests across the island ( Ralimanana et al., 2022 ; Vieilledent et al., 2018 ), with shifting cultivation representing a major driver of ongoing forest loss ( Curtis et al., 2018 , though see McConnell and Kull, 2014 ). Sixty-five percent of the Malagasy population live in rural areas ( UNDP, 2016 ), where food insecurity is particularly rife ( Harvey et al., 2014 ; Thompson et al., 2023 ). Nationally-available datasets of the distribution of rural populations are largely absent ( Ihantamalala et al., 2020 ). The country has undergone a substantial expansion of its protected area network ( Gardner et al., 2018 ) which has sometimes negatively affected poor and already marginalized households living in forested areas ( Jones et al., 2021 ; Rakotonarivo et al., 2017 ). However, previous attempts to compensate the local costs of conservation have failed ( Brimont et al., 2015 ; Hockley et al., 2018 ; Poudyal et al., 2018 ), partly because of the limited available information on the location of forest-proximate people ( Poudyal et al., 2016 ). We evaluate the suitability of three global-scale remote-sensed datasets in detecting settlements and the density of forest-proximate people in north-eastern Madagascar. By comparing these datasets with a fine-scale manually-derived dataset ( Schüßler et al., 2020 ), we explore the performance of the World Settlement Footprint and the Open Buildings Dataset at capturing the location of settlements, and WorldPop at capturing the density of human populations across the landscape. We discuss the factors associated with the detectability of forest-proximate people and the implications of these results for conservation policy, practice and research. Methods Study region North-eastern Madagascar is characterized by the largest remaining rainforests of the island and a mosaic of regenerating fallows and farmland ( Zähringer et al., 2015 ). While there are larger towns and cities along the more accessible coastline, inland there are scattered villages and hamlets. The main agriculture is shifting cultivation of rice, maize and manioc, supplemented with agroforestry production of cash crops such as vanilla, cloves or coffee ( Llopis et al., 2019 ; Zähringer et al., 2015 ; Schüßler et al., 2020 ). We focus specifically on the Analanjirofo region which at 22,000 km² is of an equivalent size to El Salvador, Israel or Slovenia and which contains three major protected areas: Makira Natural Park, Mananara Nord National Park and Ambatovaky Special Reserve. Datasets The World Settlement Footprint 2015 (hereafter WSF2015; Marconcini et al., 2020 ), indicates the presence or absence of human settlements in each grid cell of a raster at 10 m resolution. The Open Buildings Data ( Sirko et al., 2021 ), provides the location of single buildings as shapefile data for the African continent. WorldPop ( Tatem, 2017 ), is widely used raster data representing estimated population density at a resolution of 1 km. Details of the datasets, including the timestamp for data acquisition, is given in Table S1 . The fine-scale, manually-derived dataset was produced by Schüßler et al. (2020) to investigate the drivers of forest change in the Analanjirofo region. Schüßler et al. (2020) digitized the location of all villages detected visually from high-resolution images in Google Earth. The area was subdivided into seven parts and carefully scanned along north-south running transects for indications of human housing. The best quality and most cloud-free images were selected ranging in time between 2012 and 2018 ( Table S1 ; Schüßler et al., 2020 ). Every settlement was marked as a point in its center and accompanied with its size (i.e., number of houses) in 8 size classes, ranging from 5-50 to 51-100 etc. to >350 houses per settlement. Many people in the study region have temporary houses in their agricultural fields but which are not permanent dwellings. Settlements with 1-4 houses were therefore not recorded. This resulted in a total number of 3,136 settlements of which 59% consist of less than 50 houses, and a further 38% between 50 and 150 houses. Larger villages and cities made up the remaining 3% of all settlements of the area. While of course errors can be made in any dataset, for this analysis we treat this data as a measure of truth against which to compare the global datasets. Treatment of data The three global-scale remote-sensed and the fine-scale manually-derived reference dataset are of different resolutions and of different data types (i.e., 10 m vs. 1 km, raster vs. shapefile). To explore the accuracy of the datasets at detecting settlements, we modified the data as follows. For comparability with WSF2015 (1x1 km raster data), we converted the fine-scale data to the same grid cell size, and recorded whether a grid cell size of 1km² contained a manually-derived settlement or not. The Open Buildings dataset was first converted from single buildings to settlements by creating 100 m buffers around all buildings and dissolving them to settlements (excluding groupings of fewer than 5 households as these had been excluded when preparing the manually-derived dataset). This buffer size was selected based on visual interpretation of satellite images overlaid with the Open Buildings dataset; increased buffer sizes of 200 or 300m did not change the results. Overlap of settlement locations between Open Buildings and our fine-scale manually derived dataset could then be measured and analyzed, as points of the latter dataset were located in village centers, warranting overlap with Open Buildings buffer polygons. For comparability with the WorldPop population density map, we calculated a kernel density map (Silverman, 2018) based on the number of houses per settlement in the fine-scale manually-derived dataset (and an estimate of 5.5 persons per household from Poudyal et al., 2018 ). These two population density datasets were then log-transformed and z-standardized to achieve a normal distribution and to increase comparability among datasets. Due to artefacts in the WorldPop data (indicated with strong outliers in the dataset and sharp edges in Figure 4 ), we removed outlier raster cells beforehand based on the 1.5*interquartile range rule ( Yang et al., 2019 ). For comparability and illustrative purposes, we also produced a population density map from the Open Buildings dataset (again using an average estimate of 5.5 persons per household from Poudyal et al., 2018 ). We do not test this dataset against the data from the manually-derived dataset as we do not necessarily believe that for population density, the manually-derived data (based on point locations for settlements of varied size) is inherently better. Analysis We used generalized linear models with a binary response variable (i.e., settlement detected or not) to compare both the WSF2015 and the Open Buildings datasets with the manually-derived fine-scale dataset. We used a linear model with the deviance between the population density estimates per grid cell as response variable for the comparison of WorldPop and the kernel density map from the manually-derived fine-scale data. To explain variation in detectability and density estimates of the three datasets we ran our models with six explanatory variables (described in Schüßler et al., 2020 ): (1) the density of forest per km² (in 2018) as a measure of proximity to the forest frontier (distance to the forest edge could not be used, as it does not distinguish between small forest fragments and the major forest blocks); (2) distance to major pathways of the study area (which represents accessibility); (3) distance to valley bottoms; (4) distance to major rivers (as preferred places for settlement formation); (5) the elevation and (6) the slope. Distance measures were calculated as Euclidean distances given in m. All explanatory variables were z-standardized to account for high variability in the scale of values. Correlations among explanatory variables were r < 0.65. Odds Ratios are presented for generalized linear models and standardized coefficients for the linear model. A further multi-model inference approach is detailed in the supplementary methods below. Results The accuracy of global-scale remote-sensed datasets at detecting settlements Visual comparison of the two global-scale remote-sensed datasets with our fine-scale, manually-derived data suggests that the Open Buildings dataset detects a higher proportion of the settlements in our study area than the World Settlement Footprint data (WSF2015; Figure 1 ). The Open Buildings dataset detected a much higher proportion of the settlements than did the WSF2015 (94% or 2,914 of the settlements, compared to 15% or 484, Figure 2 ). WSF2015, performed particularly badly at identifying settlements of between 5 and 100 houses: 79% (2,477) were not detected while the Open Buildings dataset missed only 10% (177) of these small settlements ( Figure 2 ). Download figure Open in new tab Figure 1: Distribution of settlements in the Analanjirofo region of north-eastern Madagascar as detected by I) World Settlement Footprint (WSF2015; raster data, 10 m resolution), II) Open Buildings (shape file of individual buildings) and III) our fine-scale manual-derived dataset (shape file with points of settlement locations). Download figure Open in new tab Figure 2: Number of settlements detected in different size categories by (I) World Settlement Footprint 2015 and (II) Open Buildings compared to the fine-scale manually derived dataset. While WSF2015 clearly missed a lot of settlements across the landscape, the dataset was particularly likely to miss settlements in areas with high forest density, which were far from paths, at high elevation and further from valley bottoms ( Figure 3I ). Distance to major rivers did not contribute to the detectability of settlements and this variable was not included in the best performing model ( Table S2 in SI). Given the higher agreement of the Open Buildings dataset with our manually-derived dataset in general ( Figure 2 ), it is unsurprising that fewer variables significantly predict the detection of settlements by this dataset. However lower detection was similarly associated with areas of higher forest and higher elevations ( Figure 3II ). All other variables contributed to a lesser extent and were insignificant ( Figure 3II ; Table S2 ). Download figure Open in new tab Figure 3: Effect sizes of the seven explanatory variables in explaining detection of settlements by the global-scale data (I, II) and the deviance in population density estimates (III). I: Odds Ratios of World Settlement Footprint 2015, II: Odds Ratios of Open Buildings dataset, II: Standardized coefficients of WorldPop. Calculation of Odds Ratios and standardized coefficients is based on global models containing all 7 explanatory variables (multi-model inference in Table S2 ). Note: Significant parameters are those not overlapping with the dashed line of no effect; values oriented in negative direction from the dashed line indicate lower detectability based on an increase in this parameter while values in positive direction from the dashed line show parameters that contributed to higher detectability of settlements based on the increase of this parameter. The accuracy of global-scale remote-sensed datasets at characterizing the variation in population density across the landscape We were able to produce density estimates across the landscape from the Open Buildings dataset ( Figure 4II ) and the fine-scale manually-derived dataset ( Figure 4III ) and compared the latter to the density raster provided by WorldPop ( Figure 4I ). WSF2015 could not be easily converted into a comparable population density as it is presence/absence of settlements in a raster so it is not included in Figure 4 . Apparent inaccuracies with sharp lines were found for many places in the WorldPop dataset ( Figure 4I , cells C3 and C5). The density map estimates from the Open Buildings dataset displayed a pattern comparable to our manually derived dataset ( Figure 4II, III ). We did not model this relationship, as we produced the population density map ourselves, which may not directly allow to judge about the original dataset and the comparison of the original data was already conducted above ( Figure 1 - 3 ). Download figure Open in new tab Figure 4: Population density in north-eastern Madagascar at 1 km resolution as derived from WorldPop (I), Open Buildings (II) and the fine-scale manually-derived dataset (III). WorldPop was particularly poor at characterizing the population density in areas of lower forest density, at higher elevations, on steeper slopes and further away from valley bottoms ( Figure 3III ). Correct detection was higher in areas closer to the main rivers of the region. The best model did not include distance to pathways, but all other explanatory variables ( Table S2 ) and explained only 3.4% of the variation. Although a high population density along the coast was found by WorldPop, it failed to estimate population density correctly further inland ( Figure 4I, III ). Discussion Which dataset performed best? In many less developed countries, maps of human settlements are unavailable or inaccurate ( Ihantamalala et al., 2020 ). Remote-sensed global datasets can help fill gaps, however, for such datasets to be used to inform conservation practice, policy or research, they need to accurately capture the location and density of human populations. Our results show that for detecting the distribution of human populations in a forest frontier region of Madagascar, the available remote-sensed datasets are of variable quality. The Open Buildings dataset was particular promising in detecting both the location, and potentially density, of forest-proximate people. The Open Buildings dataset detected a much higher proportion of settlements in our manually-derived dataset than the World Settlement Footprint. This was especially true for the smallest settlements where Open Buildings dataset detected 90% compared to just 21% for World Settlement Footprint. Both datasets were particularly likely to miss settlements in more remote, forested areas and it is important to note that even the Open Buildings dataset missed 7% (177) of them. While WorldPop is very widely used as an estimate of the distribution of human population density (at 1km resolution, Tatem, 2017 ), we found it performed rather poorly in our highly-forested study region. It further included sharp edges; an artefact from the processing of underlying datasets. Although the coastal regions were correctly shown to have high population densities, inland areas were inaccurate in both the visual interpretation ( Figure 4 ) and the linear model explaining the deviations ( Figure 3III ). We did not formally test the performance of the density layer derived from the Open Buildings dataset. However, as this is based on detection of single buildings (rather than a classification of the approximate size of settlement as in our manually-derived dataset; Schüßler et al., 2020 ), this, when combined with a regionally-appropriate estimate of household size, may capture human population density most accurately (see Figure 4II ). Limitations There are a few limitations to our study. While we treat the manually-derived dataset as representing the truth for the purpose of this analysis, there will inevitably be some inaccuracies in this dataset. Firstly there is some discrepancy in the timestamp associated with the various datasets. As settlements can appear (and less commonly disappear) relatively rapidly in frontier regions ( Foley et al., 2005 ), lack of accuracy detected in the remote-sense datasets may relate to inconsistencies in which settlements were present at a moment in time, rather than ability of certain approaches to detect settlements of a given size. However, all datasets used in this study (with the exception of the Open Buildings dataset for which not date is defined) come from a relatively short period (see Table S1 ), so that we do not consider this to be a major problem. Another limitation with the manually-derived dataset is that it does not include individual isolated homesteads. While many isolated buildings represent temporary shelters for use when tending crops at certain times of the year, others will represent permanent dwellings. By not recording settlements with fewer than 5 houses our dataset risks missing some of the most isolated people in the landscape. Our results may further only be applicable to settlement detectability in humid tropical regions. Similar analysis would be needed to explore the extent to which the findings are transferable to arid regions. This is because single houses (as in the Open Buildings dataset) and settlements (as in the WSF2015 dataset) likely contrast better with the surrounding evergreen vegetation than might be true in more arid environments. Implications for forest-proximate communities There are at least 1 billion forest-proximate people in tropical countries ( Newton et al., 2020 ). Such people are often marginalized politically and economically (e.g., Levers et al., 2021 ) and conservation has often proceeded without appropriate involvement of these key stakeholders ( Adams et al., 2010 ). The lack of high-quality information about the distribution of people at the forest frontier has effectively made such people invisible. The aim of the study was to highlight the potential for remote-sensed datasets to make them more visible: easier to consider in conservation policy, easier to reach for consultation or involvement in conservation practice, and easier to take into account in conservation research. Our findings confirm the value of such datasets, and suggest that the Open Buildings dataset has particular value (at least in a forest frontier region of north-eastern Madagascar). However even the best dataset struggles to capture settlements in the most forested areas. If this isn’t addressed, there is a risk of these people continuing to be overlooked. Author contribution statement JPGJ and DS conceived of the ideas for this manuscript. MR and DS collated and analyzed the data and lead the manuscript writing. All authors contributed to previous drafts of the manuscript, and approved the final version for publication. Data availability statement The global datasets (WorldPop, WSF2015, Open Buildings) used in this manuscript are freely available. The fine-scale manually-derived dataset can be shared upon request to the corresponding author. Funding statement This work was funded by the UK Government CLARE programme (Climate Resilience and Adaptation) and the International Development Research Centre, Ottawa, Canada through their support for the Forest4Climate&People project. Further statements The authors declare no conflict of interests. Supplementary information Supplementary methods The spatial data was freely available from Tatem (2017) , Sirko et al. (2021) and Marconcini et al. (2020) and provided by Schüßler et al. (2020) . Spatial data was prepared in ArcGIS 10.6 (ArcGIS Desktop 10.6.1, ESRI, Redlands, USA) and QGIS 3.10 (QGIS Development Team, 2020 ) and later analyses were conducted in R v4.4.2 and RStudio v2022.12.0.353 (R Core Team, 2022; Posit Team, 2022). We checked for collinearity of the seven explanatory variables beforehand using the “psych” package v2.2.9 in R ( Revelle, 2022 ) and all correlations were below r = 0.65. Supplementary Table S1 . provides details on the used datasets and their specifications. Using a multi-model inference approach ( Burnham & Anderson, 2002 ) for each comparison (i.e., WSF2015 and Open Buildings with the manually-derived dataset, WorldPop with the kernel density estimates from the manually-derived dataset), we fitted a global model first with all six explanatory variables (i.e., forest density, distance to major pathways, distance to main rivers, distance to valley bottoms, slope and elevation). Models containing all possible combinations of variables were then calculated using the “MuMIn” package v1.47.1 ( Barton, 2022 ). Candidate models based on the lowest AIC values and those deviating less than 2 units from the best model (ΔAIC<2) are reported in this study ( Burnham & Anderson, 2002 ). Akaike weights (i.e., conditional probability of a certain model) were calculated based on all possible models ( Wagenmakers & Farrell, 2004 ). Model results from the generalized linear models are presented as Odds Ratios calculated using the “effectsize” package v0.8.2 ( Ben-Shachar et al., 2020 ) and visualized using “ggplot2” v.3.4.0 ( Wickham, 2016 ) and “patchwork” v1.1.2 (Pedersen, 2020). For the linear model, standardized coefficients are presented. Supplementary results Forest density and elevation were the only variables present in all candidate models as a predictor of the detectability of settlements or correct estimation of population densities ( Table S2 ); the other variables were less often involved. The best model on the detectability of settlements of WSF2015 involved elevation, forest density, distance to valley bottoms, distance to pathways and slope as explanatory variables and yielded the highest Akaike weight with 0.682. The other candidate model was of subordinate quality ( Table S2 ). For Open Buildings, the best model involved forest density, elevation, distance to valley bottoms and slope as explanatory variables. However, multiple further candidate models with only slightly lower Akaike weights involved also all other variables at some point. The best model concerning correct estimation of population density by WorldPop included all explanatory variables, except distance to pathways and yielded an Akaike weight of 0.693, markedly higher compared to the second best and only other candidate model ( Table S2 ). View this table: View inline View popup Supplementary Table S1: Details on the remote-sensed datasets used in this study. View this table: View inline View popup Download powerpoint Supplementary Table S2: Multi-model comparison to explain differences in village detectability (WSF2015 and Open Buildings via GLMs) and deviance in population density estimates (WorldPop via LM). Candidate models with ΔAIC<2.0 are shown here with the best model given in bold. Akaike weights were calculated on all possible models and indicate how well this model performs in comparison to the other candidate models. Empty cells indicate that these parameters were not included in the respective model. Abbreviations: Int. = intercept, elev = elevation, for. dens. = forest density, AIC = Akaike Information Criterion. Acknowledgement This work was funded by the UK Government CLARE programme (Climate Resilience and Adaptation) and the International Development Research Centre, Ottawa, Canada through their support for the Forest4Climate&People project. We thank Neal Hockley and Bruno Ramamonjisoa for support during this project and Ute Radespiel for supervision during the generation of the manually-derived fine-scale dataset. We further thank Dr. Enrico Di Minin for valuable comments on an earlier version of the manuscript. The authors declare not conflict of interests. References ↵ Adams , V.M. , Pressey , R.L. & Naidoo , R . ( 2010 ). Opportunity costs: Who really pays for conservation? Biological Conservation , 143 ( 2 ), 439 – 448 . OpenUrl CrossRef Web of Science ↵ Brimont , L. , Ezzine-de Blas , D. , Karsenty , A. & Toulon , A. ( 2015 ). Achieving conservation and equity amidst extreme poverty and climate risk: the Makira REDD+ project in Madagascar . Forests , 6 ( 3 ), 748 – 768 . OpenUrl ↵ Curtis , P.G. , Slay , C.M. , Harris , N.L. , Tyukavina , A. & Hansen , M.C . ( 2018 ). Classifying drivers of global forest loss . Science , 361 ( 6407 ), 1108 – 1111 . OpenUrl Abstract / FREE Full Text ↵ Dawson , N. , Martin , A. & Danielsen , F . ( 2017 ). Assessing equity in protected area governance: Approaches to promote just and effective conservation . Conservation Letters , 11 ( 2 ), e12388 . OpenUrl ↵ Desbureaux , S . ( 2021 ). Subjective modeling choices and the robustness of impact evaluations in conservation science . Conservation Biology , 35 ( 5 ), 1615 – 1626 . OpenUrl CrossRef ↵ Drake , M.D. , Salerno , J. , Langendorf , R.E. , Cassidy , L. , Gaughan , A.E. , Stevens , F.R. , Pricope , N.G. & Hartter , J . ( 2020 ). Costs of elephant crop depredation exceed the benefits of trophy hunting in a community-based conservation area of Namibia . Conservation Science and Practice , 3 ( 1 ). OpenUrl ↵ Fisher , B. & Christopher , T . ( 2007 ). Poverty and biodiversity: Measuring the overlap of human poverty and the biodiversity hotspots . Ecological Economics , 62 ( 1 ), 93 – 101 . OpenUrl CrossRef Web of Science ↵ Foley , J.A. , DeFries , R. , Asner , G.P. , Barford , C. , Bonan , G. , Carpenter , S.R. , Chapin , F.S. , Coe , M.T. , Daily , G.C. , Gibbs , H.K. , Helkowski , J.H. , Holloway , T. , Howard , E.A. , Kucharik , C.J. , Monfreda , C. , Patz , J.A. , Prentice , I.C. , Ramankutty , N. & Snyder , P.K . ( 2005 ). Global consequences of land use . Science , 309 ( 5734 ), 570 – 574 . OpenUrl Abstract / FREE Full Text ↵ Gardner , C.J. , Nicoll , M.E. , Birkinshaw , C. , Harris , A. , Lewis , R.E. , Rakotomalala , D. & Ratsifandrihamanana , A.N . ( 2018 ). The rapid expansion of Madagascar’s protected area system . Biological Conservation , 220 , 29 – 36 . OpenUrl ↵ Harvey , C.A. , Rakotobe , Z.L. , Rao , N.S. , Dave , R. , Razafimahatratra , H. , Rabarijohn , R.H. , Rajaofara , H. & MacKinnon , J.L. ( 2014 ). Extreme vulnerability of smallholder farmers to agricultural risks and climate change in Madagascar . Phil. Trans. R. Soc. B , 369 ( 1639 ), 20130089 . OpenUrl CrossRef PubMed ↵ Hockley , N. , Mandimbiniaina , R. & Rakotonarivo , O.S . ( 2018 ). Fair and equitable conservation: do we really want it, and if so, do we know how to achieve it? Madagascar Conservation Development , 13 ( 1 ), 3 . OpenUrl ↵ Hoek , J.V.D. & Friedrich , H.K . ( 2021 ). Satellite-based human settlement datasets inadequately detect refugee settlements: A critical assessment at thirty refugee settlements in Uganda . Remote Sensing , 13 ( 18 ), 3574 . OpenUrl ↵ Ihantamalala , F.A. , Herbreteau , V. , Révillion , C. , Randriamihaja , M. , Commins , J. , Andréambeloson , T. , Rafenoarimalala , F.H. , Randrianambinina , A. , Cordier , L.F. , Bonds , M.H. & Garchitorena , A . ( 2020 ). Improving geographical accessibility modeling for operational use by local health actors . International Journal of Health Geographics , 19 , 27 . OpenUrl ↵ IPBES ( 2019 ). Global assessment report on biodiversity and ecosystem services of the intergovernmental science-policy platform on biodiversity and ecosystem services . IPBES secretariat, Bonn, Germany . ↵ Jaureguiberry , P. , Titeux , N. , Wiemers , M. , Bowler , D.E. , Coscieme , L. , Golden , A.S. , Guerra , C.A. , Jacob , U. , Takahashi , Y. , Settele , J. , Díaz , S. , Molnár , Z. & Purvis , A . ( 2022 ). The direct drivers of recent global anthropogenic biodiversity loss . Science Advances , 8 ( 49 ) , DOI: 10.1126/sciadv.adf9317 . OpenUrl CrossRef ↵ Ji , H. , Li , X. , Wei , X. , Liu , W. , Zhang , L. & Wang , L . ( 2020 ). Mapping 10-m resolution rural settlements using multi-source remote sensing datasets with the google earth engine platform . Remote Sensing , 12 ( 17 ), 2832 . OpenUrl ↵ Jones , J.P. , Rakotonarivo , S. & Razafimanahaka , J . ( 2021 ). The New Natural History of Madagascar, Kapitel: Forest Conservation in Madagascar: Past, Present, Future . Princeton University Press . ↵ Levers , C. , Romero-Muñoz , A. , Baumann , M. , Marzo , T.D. , Fernández , P.D. , Gasparri , N.I. , Gavier-Pizarro , G.I. , le Polain de Waroux , Y. , Piquer-Rodríguez , M. , Semper-Pascual , A. & Kuemmerle , T. ( 2021 ). Agricultural expansion and the ecological marginalization of forest-dependent people . Proceedings of the National Academy of Sciences , 118 ( 44 ). OpenUrl ↵ Llopis , J.C. , Harimalala , P.C. , Bär , R. , Heinimann , A. , Rabemananjara , Z.H. & Zähringer , J.G . ( 2019 ). Effects of protected area establishment and cash crop price dynamics on land use transitions 1990-2017 in northeastern Madagascar . Journal of Land Use Science , 14 ( 1 ), 52 – 80 . OpenUrl Marconcini , M. , Metz-Marconcini , A. , Ãreyen , S. , Palacios-Lopez , D. , Hanke , W. , Bachofer , F. , Zeidler , J. , Esch , T. , Gorelick , N. , Kakarla , A. , Paganini , M. & Strano , E . ( 2020 ). Outlining where humans live, the world settlement footprint 2015 . Scientific Data , 7 ( 1 ), 242 . OpenUrl ↵ McConnell , W.J. & Kull , C.A . ( 2014 ). Deforestation in Madagascar: Debates over the island’s forest cover and challenges of measuring forest change . In Conservation and Environmental Management in Madagascar. Routledge , ( 91 – 128 ) ↵ Newton , P. , Kinzer , A.T. , Miller , D.C. , Oldekop , J.A. & Agrawal , A. ( 2020 ). The number and spatial distribution of forest-proximate people globally . One Earth , 3 ( 3 ), 363 – 370 . OpenUrl Convention on Biological Diversity (CBD). ( 2022 ). Conference of the parties draft decision cbd/cop/15/l.25 issued 18 December 2022. Pimbert , M.P. & Pretty , J.N . ( 1997 ). Parks, people and professionals: putting "participation" into protected area management . Social Change and Conservation , 16 , 297 – 330 . OpenUrl ↵ Poudyal , M. , Jones , J.P. , Rakotonarivo , O.S. , Hockley , N. , Gibbons , J.M. , Mandimbiniaina , R. , Rasoamanana , A. , Andrianantenaina , N.S. & Ramamonjisoa , B.S . ( 2018 ). Who bears the cost of forest conservation? PeerJ 6 , e5106 . OpenUrl ↵ Poudyal , M. , Ramamonjisoa , B.S. , Hockley , N. , Rakotonarivo , O.S. , Gibbons , J.M. , Mandimbiniaina , R. , Rasoamanana , A. & Jones , J.P . ( 2016 ). Can REDD+ social safeguards reach the ‘right’ people? Lessons from Madagascar . Global Environmental Change , 37 , 31 – 42 . OpenUrl ↵ Rakotonarivo , O.S. , Jacobsen , J.B. , Larsen , H.O. , Jones , J.P. , Nielsen , M.R. , Ramamonjisoa , B.S. , Mandimbiniaina , R.H. & Hockley , N . ( 2017 ). Qualitative and quantitative evidence on the true local welfare costs of forest conservation in Madagascar: Are discrete choice experiments a valid ex ante tool? World Development , 94 , 478 – 491 . OpenUrl ↵ Ralimanana , H. , Perrigo , A.L. , Smith , R.J. , Borrell , J.S. , Faurby , S. , Rajaonah , M.T. , Randriamboavonjy , T. , Vorontsova , M.S. , Cooke , R.S.C. , Phelps , L.N. , Sayol , F. , Andela , N. , Andermann , T. , Andriamanohera , A.M. , Andriambololonera , S. , Bachman , S.P. , Bacon , C.D. , Baker , W.J. , Belluardo , F. , Birkinshaw , C. , Cable , S. , Canales , N.A. , Carrillo , J.D. , Clegg , R. , Clubbe , C. , Crottini , A. , Damasco , G. , Dhanda , S. , Edler , D. , Farooq , H. , de Lima Ferreira , P. , Fisher , B.L. , Forest , F. , Gardiner , L.M. , Goodman , S.M. , Grace , O.M. , Guedes , T.B. , Hackel , J. , Henniges , M.C. , Hill , R. , Lehmann , C.E.R. , Lowry , P.P. , Marline , L. , Matos-Maraví , P. , Moat , J. , Neves , B. , Nogueira , M.G.C. , Onstein , R.E. , Papadopulos , A.S.T. , Perez-Escobar , O.A. , Phillipson , P.B. , Pironon , S. , Przelomska , N.A.S. , Rabarimanarivo , M. , Rabehevitra , D. , Raharimampionona , J. , Rajaonary , F. , Rajaovelona , L.R. , Rakotoarinivo , M. , Rakotoarisoa , A.A. , Rakotoarisoa , S.E. , Rakotomalala , H.N. , Rakotonasolo , F. , Ralaiveloarisoa , B.A. , Ramirez-Herranz , M. , Randriamamonjy , J.E.N. , Randrianasolo , V. , Rasolohery , A. , Ratsifandrihamanana , A.N. , Ravololomanana , N. , Razafiniary , V. , Razanajatovo , H. , Razanatsoa , E. , Rivers , M. , Silvestro , D. , Testo , W. , Jiménez , M.F.T. , Walker , K. , Walker , B.E. , Wilkin , P. , Williams , J. , Ziegler , T. , Zizka , A. & Antonelli , A . ( 2022 ). Madagascar’s extraordinary biodiversity: Threats and opportunities . Science , 378 ( 6623 ) , DOI: 10.1126/science.adf1466 . OpenUrl CrossRef Schüßler , D. , Mantilla-Contreras , J. , Stadtmann , R. , Ratsimbazafy , J.H. & Radespiel , U . ( 2020 ). Identification of crucial stepping stone habitats for biodiversity conservation in northeastern Madagascar using remote sensing and comparative predictive modeling . Biodiversity and Conservation , 29 ( 7 ), 2161 – 2184 . OpenUrl Sirko , W. , Kashubin , S. , Ritter , M. , Annkah , A. , Bouchareb , Y. , Dauphin , Y. , Keysers , D. , Neumann , M. , Cisse , M. & Quinn , J. ( 2021 ). Continental-scale building detection from high resolution satellite imagery . Tech. Rep., Google Research . URL https://arxiv.org/abs/2107.12283 Tatem , A.J . ( 2017 ). WorldPop, open data for spatial demography . Scientific Data , 4 ( 1 ), 170004 . OpenUrl ↵ Thompson , K.E.T. , Borgerson , C. , Wright , P.C. , Randriamanetsy , J.M. , Andrianantenaina , M.Y. , Andriamavosoloarisoa , N.N.M. , Razafindrahasy , T.A. , Rothman , R.S. , Surkis , C. , Bankoff R.J. , Daniels , C. & Twiss , K.C . ( 2023 ). A coupled humanitarian and biodiversity crisis in western Madagascar . International Journal of Primatology . DOI: 10.1007/s10764-022-00338-3 OpenUrl CrossRef ↵ Thomson , D.R. , Leasure , D.R. , Bird , T. , Tzavidis , N. & Tatem , A.J . ( 2022 ). How accurate are WorldPop-global-unconstrained gridded population data at the cell-level? A simulation analysis in urban Namibia . PLOS ONE , 17 ( 7 ), e0271504 . OpenUrl ↵ UNDP ( 2016 ). Human development report 2016. URL http://hdr.undp.org/sites/default/files/2016humandevelopmentreport.pdf ↵ Vieilledent , G. , Grinand , C. , Rakotomalala , F.A. , Ranaivosoa , R. , Rakotoarijaona , J.R. , Allnutt , T.F. & Achard , F . ( 2018 ). Combining global tree cover loss data with historical national forest-cover maps to look at six decades of deforestation and forest fragmentation in Madagascar . Biological Conservation , 222 , 189 – 197 . OpenUrl CrossRef ↵ Wauchope , H.S. , Jones , J.P.G. , Geldmann , J. , Simmons , B.I. , Amano , T. , Blanco , D.E. , Fuller , R.A. , Johnston , A. , Langendoen , T. , Mundkur , T. , Nagy , S. & Sutherland , W.J . ( 2022 ). Protected areas have a mixed impact on waterbirds, but management helps . Nature , 605 ( 7908 ), 103 – 107 . OpenUrl CrossRef ↵ Yang , J. , Rahardja , S. & Fränti , P. ( 2019 ). Outlier detection. In Proceedings of the International Conference on Artificial Intelligence, Information Processing and Cloud Computing - AIIPCC ’19 . ACM Press . ↵ Zähringer , J.G. , Eckert , S. & Messerli , P . ( 2015 ). Revealing regional deforestation dynamics in north-eastern Madagascar: Insights from multi-temporal land cover change analysis . Land , 4 ( 2 ), 454 – 474 . OpenUrl Supplementary references ↵ Barton , K . ( 2022 ). MuMIn: Multi-Model Inference . R package version 1 . 47 . 1 OpenUrl ↵ Ben-Shachar , M. , Lüdecke , D. & Makowski , D . ( 2020 ). effectsize: Estimation of effect size indices and standardized parameters . Journal of Open Source Software , 5 ( 56 ), 2815 . doi: 10.21105/joss.02815 OpenUrl CrossRef ↵ Burnham , K.P. & Anderson , D.R. ( 2002 ). Model selection and multimodel inference: a practical information-theoretic approach . Springer Science & Business Media , 2 Edition ↵ Marconcini , M. , Metz-Marconcini , A. , Ãreyen , S. , Palacios-Lopez , D. , Hanke , W. , Bachofer , F. , Zeidler , J. , Esch , T. , Gorelick , N. , Kakarla , A. , Paganini , M. & Strano , E . ( 2020 ). Outlining where humans live, the world settlement footprint 2015 . Scientific Data , 7 ( 1 ). doi: 10.1038/s41597-020-00580-5 OpenUrl CrossRef Pedersen , T.L. ( 2022 ). patchwork: The Composer of Plots . URL https://CRAN.R-project.org/package=patchwork , r package version 1.1.2 Posit team (2022). RStudio: Integrated Development Environment for R. Posit Software, PBC , Boston, MA . URL http://www.posit.co/ ↵ QGIS Development Team ( 2020 ). QGIS Geographic Information System . QGIS Association . URL https://www.qgis.org R Core Development Team ( 2020 ). R: A Language and Environment for Statistical Computing. R Foundation for Statistical Computing , Vienna, Austria . URL: http://www.R-project.org/ ↵ Revelle , W. ( 2022 ). psych: Procedures for Psychological, Psychometric, and Personality Research . Northwestern University, Evanston, Illinois . URL https://CRAN.R-project.org/package=psych , r package version 2.2.9 ↵ Schüßler , D. , Mantilla-Contreras , J. , Stadtmann , R. , Ratsimbazafy , J.H. & Radespiel , U . ( 2020 ). Identification of crucial stepping stone habitats for biodiversity conservation in northeastern Madagascar using remote sensing and comparative predictive modeling . Biodiversity and Conservation , 29 ( 7 ), 2161 – 2184 . doi: 10.1007/s10531-020-01965-z OpenUrl CrossRef ↵ Sirko , W. , Kashubin , S. , Ritter , M. , Annkah , A. , Bouchareb , Y. , Dauphin , Y. , Keysers , D. , Neumann , M. , Cisse , M. & Quinn , J. ( 2021 ). Continental-scale building detection from high resolution satellite imagery. Tech. Rep ., Google Research . URL https://arxiv.org/abs/2107.12283 ↵ Tatem , A.J . ( 2017 ). WorldPop, open data for spatial demography . Scientific Data , 4 ( 1 ). doi: 10.1038/sdata.2017.4 OpenUrl CrossRef ↵ Wagenmakers , E.J. & Farrell , S . ( 2004 ). AIC model selection using Akaike weights . Psychonomic Bulletin & Review , 11 ( 1 ), 192 – 196 . doi: 10.3758/bf03206482 OpenUrl CrossRef PubMed Web of Science ↵ Wickham , H. ( 2016 ). ggplot2: Elegant Graphics for Data Analysis . Springer-Verlag New York . URL https://ggplot2.tidyverse.org View the discussion thread. Back to top Previous Next Posted September 25, 2024. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Invisible people: Exploring how well remote-sensed datasets reveal the distribution of forest-proximate populations Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Invisible people: Exploring how well remote-sensed datasets reveal the distribution of forest-proximate populations Mirindra Rakotoarisoa , Julia P. G. Jones , O. Sarobidy Rakotonarivo , Manoa Rajaonarivelo , Dominik Schüßler bioRxiv 2024.09.23.614649; doi: https://doi.org/10.1101/2024.09.23.614649 Share This Article: Copy Citation Tools Invisible people: Exploring how well remote-sensed datasets reveal the distribution of forest-proximate populations Mirindra Rakotoarisoa , Julia P. G. Jones , O. Sarobidy Rakotonarivo , Manoa Rajaonarivelo , Dominik Schüßler bioRxiv 2024.09.23.614649; doi: https://doi.org/10.1101/2024.09.23.614649 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Ecology Subject Areas All Articles Animal Behavior and Cognition (7653) Biochemistry (17763) Bioengineering (13944) Bioinformatics (42101) Biophysics (21509) Cancer Biology (18667) Cell Biology (25592) Clinical Trials (138) Developmental Biology (13413) Ecology (19969) Epidemiology (2067) Evolutionary Biology (24393) Genetics (15647) Genomics (22582) Immunology (17791) Microbiology (40524) Molecular Biology (17222) Neuroscience (88860) Paleontology (667) Pathology (2848) Pharmacology and Toxicology (4841) Physiology (7670) Plant Biology (15182) Scientific Communication and Education (2048) Synthetic Biology (4312) Systems Biology (9843) Zoology (2274)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.