<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "https://jats.nlm.nih.gov/publishing/1.3/JATS-journalpublishing1-3.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="1.3" article-type="research-article" xml:lang="en"><front><journal-meta><journal-id journal-id-type="issn">2460-3945</journal-id><journal-title-group><journal-title>Forum Geografi</journal-title><abbrev-journal-title>For. Geo.</abbrev-journal-title></journal-title-group><issn pub-type="epub">2460-3945</issn><issn pub-type="ppub">0852-0682</issn><publisher><publisher-name>Universitas Muhammadiyah Surakarta</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.23917/forgeo.v39i3.13611</article-id><article-categories/><title-group><article-title>Flood Risk Analysis Using Spatial Synthetic Population in the Upper Bengawan Solo Watershed, Indonesia</article-title></title-group><contrib-group><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0009-0005-5133-5884</contrib-id><name><surname>Musiyam</surname><given-names>Muhammad</given-names></name><address><country>Indonesia</country><email>mm102@ums.ac.id</email></address><xref ref-type="aff" rid="AFF-1"/><xref ref-type="corresp" rid="cor-0"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-1002-3084</contrib-id><name><surname>Jumadi</surname><given-names>Jumadi</given-names></name><address><country>Malaysia</country></address><xref ref-type="aff" rid="AFF-2"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-2869-3657</contrib-id><name><surname>Fikriyah</surname><given-names>Vidya Nahdhiyatul</given-names></name><address><country>Netherlands</country></address><xref ref-type="aff" rid="AFF-3"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-6752-4536</contrib-id><name><surname>Masruroh</surname><given-names>Heni</given-names></name><address><country>Indonesia</country></address><xref ref-type="aff" rid="AFF-4"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0009-0009-5813-8022</contrib-id><name><surname>Septiyani</surname><given-names>Ema Dwi</given-names></name><address><country>Indonesia</country></address><xref ref-type="aff" rid="AFF-5"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-4174-1740</contrib-id><name><surname>Amin</surname><given-names>Choirul</given-names></name><address><country>Indonesia</country></address><xref ref-type="aff" rid="AFF-6"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-4143-2523</contrib-id><name><surname>Hadibasyir</surname><given-names>Hamim Zaky</given-names></name><address><country>Australia</country></address><xref ref-type="aff" rid="AFF-7"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-7070-8715</contrib-id><name><surname>Sattar</surname><given-names>Farha</given-names></name><address><country>Australia</country></address><xref ref-type="aff" rid="AFF-8"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-1504-4706</contrib-id><name><surname>Nawaz</surname><given-names>Muhammad</given-names></name><address><country>Singapore</country></address><xref ref-type="aff" rid="AFF-9"/></contrib></contrib-group><aff id="AFF-1">Department of Geography Education, Faculty of Education, Universitas Muhammadiyah Surakarta</aff><aff id="AFF-2"><institution-wrap><institution>INTI International University</institution><institution-id institution-id-type="ror">https://ror.org/03fj82m46</institution-id></institution-wrap><addr-line>71800 Nilai</addr-line><country>Negeri Sembilan</country></aff><aff id="AFF-3"><institution content-type="dept">Department of Geography, Faculty of Geography, Universitas Muhammadiyah Surakarta, Indonesia, Faculty of Geo information Science and Earth Observation</institution><institution-wrap><institution>University of Twente</institution><institution-id institution-id-type="ror">https://ror.org/006hf6230</institution-id></institution-wrap><country country="NL">The Netherlands</country></aff><aff id="AFF-4"><institution content-type="dept">Department of Geography</institution><institution-wrap><institution>Universitas Negeri Malang</institution><institution-id institution-id-type="ror">https://ror.org/00ypgyy34</institution-id></institution-wrap><country country="ID">Indonesia</country></aff><aff id="AFF-5">Department of Geographic Information Science, Faculty of Geography, Universitas Muhammadiyah Surakarta</aff><aff id="AFF-6">Department of Geography, Faculty of Geography, Universitas Muhammadiyah Surakarta, Indonesia</aff><aff id="AFF-7"><institution content-type="dept">Department of Geography, Faculty of Geography, Universitas Muhammadiyah Surakarta, Indonesia, School of Built Environment</institution><institution-wrap><institution>University of New South Wales</institution><institution-id institution-id-type="ror">https://ror.org/03r8z3t63</institution-id></institution-wrap><addr-line>Sydney</addr-line><country>New South Wales 2052</country></aff><aff id="AFF-8"><institution content-type="dept">Faculty of Arts and Society</institution><institution-wrap><institution>Charles Darwin University</institution><institution-id institution-id-type="ror">https://ror.org/048zcaj52</institution-id></institution-wrap><country country="AU">Australia</country></aff><aff id="AFF-9"><institution content-type="dept">Department of Geography</institution><institution-wrap><institution>National University of Singapore</institution><institution-id institution-id-type="ror">https://ror.org/01tgyzw49</institution-id></institution-wrap><addr-line>AS#3-03-11, 1 Arts Link</addr-line><country>Kent Ridge</country></aff><author-notes><corresp id="cor-0"><bold>Corresponding author: Muhammad Musiyam</bold>, Department of Geography Education, Faculty of Education, Universitas Muhammadiyah Surakarta .Email:<email>mm102@ums.ac.id</email></corresp></author-notes><pub-date date-type="pub" iso-8601-date="2025-12-30" publication-format="electronic"><day>30</day><month>12</month><year>2025</year></pub-date><pub-date date-type="collection" iso-8601-date="2025-9-18" publication-format="electronic"><day>18</day><month>9</month><year>2025</year></pub-date><volume>39</volume><issue>3</issue><fpage>383</fpage><lpage>397</lpage><history><date date-type="received" iso-8601-date="2025-11-22"><day>22</day><month>11</month><year>2025</year></date><date date-type="rev-recd" iso-8601-date="2025-12-4"><day>14</day><month>12</month><year>2025</year></date><date date-type="accepted" iso-8601-date="2025-12-14"><day>14</day><month>12</month><year>2025</year></date></history><permissions><copyright-statement>Copyright (c) 2025 Muhammad Musiyam, Jumadi Jumadi, Vidya Nahdhiyatul Fikriyah, Heni Masruroh, Ema Dwi Septiyani, Choirul Amin, Hamim Zaky Hadibasyir, Farha Sattar, Muhammad Nawaz</copyright-statement><copyright-year>2025</copyright-year><copyright-holder>Muhammad Musiyam, Jumadi Jumadi, Vidya Nahdhiyatul Fikriyah, Heni Masruroh, Ema Dwi Septiyani, Choirul Amin, Hamim Zaky Hadibasyir, Farha Sattar, Muhammad Nawaz</copyright-holder><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><ali:license_ref xmlns:ali="http://www.niso.org/schemas/ali/1.0/">https://creativecommons.org/licenses/by/4.0/</ali:license_ref><license-p>This work is licensed under a Creative Commons Attribution 4.0 International License.</license-p></license></permissions><self-uri xlink:href="https://journals2.ums.ac.id/fg/article/view/13611" xlink:title="Flood Risk Analysis Using Spatial Synthetic Population in the Upper Bengawan Solo Watershed, Indonesia">Flood Risk Analysis Using Spatial Synthetic Population in the Upper Bengawan Solo Watershed, Indonesia</self-uri><abstract><p>This study develops a spatial synthetic population (SSP)-based computational model to produce realis-tic, high-resolution flood-risk maps for the Upper Bengawan Solo Watershed. It combines Global Hu-man Settlement (spatial distribution) with local population statistics (attributes). The SSP is created for flood risk mapping in the Upper Bengawan Solo Watershed (BSH) using a 100 m grid from the Global Human Settlement Layer (GHSL) GHS-POP R2023A. Synthetic individuals are strategically placed around the pixel centre (radius ≤ 100 m), and each is assigned demographic attributes (age, gender, ed-ucation, occupation) validated against official county-level data. Social vulnerability is calculated through weighted aggregation (AHP) across four attributes; individual scores are combined with flood hazard intensity at each location to produce a risk index for each person. Validation shows that (i) the SSP aligns closely with reference statistics: gender and age are nearly identical (MAE ≈ 0.01–0.02%), with slight deviations in occupation (MAE 6.52%) and education (MAE 4.89%), (ii) the overall suita-bility of the SSP compared to GHS counts at pixel samples, and (iii) location plausibility testing using ESRI Sentinel‑2 Land Cover (10 m). Results indicate that (i) the SSP aligns well for gender, moderately for education and occupation, but shows significant misalignment in age, (ii) 91.96% of SSP points are in built-up land, suggesting high spatial accuracy. Medium- to high-risk patterns are mainly along the main river corridors and peri-urban areas, while rural non-built zones are mostly low- to medium-risk. These findings suggest that this methodology is scalable, reproducible, and suitable for data limited regions, enabling the production of detail risk maps that can guide mitigation and preparedness efforts.</p></abstract><kwd-group><kwd>Spatial synthetic population</kwd><kwd>Global Human Settlement Layer</kwd><kwd>Flood risk</kwd><kwd>Upper Bengawan Solo</kwd><kwd>AHP</kwd><kwd>Social vulnerability</kwd><kwd>flood mitigation</kwd></kwd-group><custom-meta-group><custom-meta><meta-name>File created by JATS Editor</meta-name><meta-value><ext-link ext-link-type="uri" xlink:href="https://jatseditor.com" xlink:title="JATS Editor">JATS Editor</ext-link></meta-value></custom-meta><custom-meta><meta-name>issue-created-year</meta-name><meta-value>2025</meta-value></custom-meta></custom-meta-group></article-meta></front><body><sec><title>1. Introduction</title><p>Floods are the most common hydrometeorological disasters in Indonesia and have significant socio-economic impacts, especially in fast-growing urban and rural areas such as the Upper Bengawan Solo River Basin (Jumadi et al., 2024a;Jumadi et al., 2024b;<xref ref-type="bibr" rid="BIBR-30">(Purwanto et al., 2023)</xref><xref ref-type="bibr" rid="BIBR-32">(Sahid, 2024)</xref><xref ref-type="bibr" rid="BIBR-37">(Tellman et al., 2021)</xref>. Accurate flood risk mapping requires integrating hazards and vulnerabilities; however, the quality of mapping is often limited by the lack of detailed. Population-based raster methods-such as medium-resolution global datasets-help estimate exposure but usually overlook demographic structures and household traits that influence resilience and recovery after disasters. This is where spatial synthetic population (SSP) becomes a breakthrough: it assigns realistic attributes and locations to individual and household units without jeopardizing privacy, thus connecting aggregate data with detailed demographic information for better risk assessment <xref ref-type="bibr" rid="BIBR-3">(Agriesti et al., 2022)</xref><xref ref-type="bibr" rid="BIBR-11">(Chapuis &amp; Taillandier, 2019)</xref><xref ref-type="bibr" rid="BIBR-17">(Jiang et al., 2024)</xref><xref ref-type="bibr" rid="BIBR-18">(Jumadi et al., 2019)</xref><xref ref-type="bibr" rid="BIBR-29">(Prédhumeau &amp; Manley, 2023)</xref>.</p><p>Recent research shows rapid progress in creating SSPs at scales from urban to national, emphasizing reproducibility, data openness, and computational efficiency. Earlier studies have focused on building national synthetic populations, highlighting transparent pipelines and statistical alignment between synthetic data and census figures <xref ref-type="bibr" rid="BIBR-29">(Prédhumeau &amp; Manley, 2023)</xref>. Similar endeavours at a larger scale demonstrate that assembling a geographically explicit synthetic population (SSP) is achievable by combining microdata, spatial constraints, and realistic housing placement strategies <xref ref-type="bibr" rid="BIBR-17">(Jiang et al., 2024)</xref>. In mobility planning and public services, assignment and placement techniques for SSPs underscore the importance of matching individual attributes, household structures, and spatial activity patterns to ensure population representations remain accurate and practical <xref ref-type="bibr" rid="BIBR-3">(Agriesti et al., 2022)</xref>. Methodologically, a brief review of synthetic population creation methods identifies Iterative Proportional Fitting/Updating (IPF/IPU), microsimulation, and machine learning as the primary approaches, each suited to varying data availability and research goals (<xref ref-type="bibr" rid="BIBR-7">(Balac &amp; Hörl, 2021)</xref>; <xref ref-type="bibr" rid="BIBR-8">(Bigi et al., 2024)</xref>; <xref ref-type="bibr" rid="BIBR-9">(Burger et al., 2017)</xref>; <xref ref-type="bibr" rid="BIBR-14">(Mooij et al., 2024)</xref>; <xref ref-type="bibr" rid="BIBR-16">(Jiang et al., 2022)</xref>; <xref ref-type="bibr" rid="BIBR-20">(Jumadi et al., 2018)</xref>, <xref ref-type="bibr" rid="BIBR-18">(Jumadi et al., 2019)</xref>)</p><p>In the context of hydrometeorological disasters, the main challenge is not only in representing the number of exposed individuals but also in accounting for their demographic structure, employment, and socio-economic conditions, which influence vulnerability. Many studies use social vulnerability indices (e.g., derivatives of SoVI) to summarize sensitivity and adaptive capacity at the community level; however, at the village level in developing countries, data gaps are common, requiring the synthesis of indicators from incomplete distributions <xref ref-type="bibr" rid="BIBR-10">(Chakraborty et al., 2023)</xref><xref ref-type="bibr" rid="BIBR-12">(Cutter et al., 2003)</xref><xref ref-type="bibr" rid="BIBR-13">(Cutter &amp; Finch, 2008)</xref><xref ref-type="bibr" rid="BIBR-21">(Jumadi et al., 2020)</xref>. At the same time, flood hazard information can be analyzed based on several parameters by combining indicators such as slope gradient, rainfall, drainage density, soil moisture, land use/land cover (LULC), elevation, distance to rivers, normalized difference vegetation index (NDVI), curvature, flow accumulation, and topographic wetness index (TWI); these indicators can be calibrated with historical event records and/or remotely sensed rainfall if available (<xref ref-type="bibr" rid="BIBR-22">(Jumadi et al., 2024)</xref>;<xref ref-type="bibr" rid="BIBR-22">(Jumadi et al., 2024)</xref>;<xref ref-type="bibr" rid="BIBR-26">(Musiyam et al., 2020)</xref>).</p><p>Although global population grid maps support macro-level analysis, several studies show that flood exposure results are sensitive to the choice of population datasets and their distribution schemes. These findings highlight the importance of methodological transparency in selecting and creating population representations, as minor differences in inputs can significantly affect risk estimates <xref ref-type="bibr" rid="BIBR-1">(Abdelkareem &amp; Mansour, 2023)</xref><xref ref-type="bibr" rid="BIBR-6">(Arnell &amp; Gosling, 2016)</xref><xref ref-type="bibr" rid="BIBR-10">(Chakraborty et al., 2023)</xref><xref ref-type="bibr" rid="BIBR-15">(Diriba et al., 2024)</xref><xref ref-type="bibr" rid="BIBR-22">(Jumadi et al., 2024)</xref>. This methodological awareness is especially relevant for floods, as demographic structures and settlement patterns can determine who is exposed to flooding, where flooding occurs, and its severity.</p><p>In Thailand, for instance, flood risk assessments have become increasingly important as the population ages rapidly <xref ref-type="bibr" rid="BIBR-40">(Waiyasusri et al., 2021)</xref><xref ref-type="bibr" rid="BIBR-34">(Sawangnate et al., 2022)</xref><xref ref-type="bibr" rid="BIBR-39">(Waiyasusri et al., 2023)</xref>. On the other hand, informal settlements and regional terrain variations pose a high risk of flooding in the Philippines <xref ref-type="bibr" rid="BIBR-38">(Usamah et al., 2014)</xref>. Similar challenges are also evident in other coastal regions, such as peninsular Malaysia <xref ref-type="bibr" rid="BIBR-25">(Maqtan et al., 2025)</xref>, highlighting the need to consider population context in flood risk mapping.</p><p>In Indonesia, including the Upper Bengawan Solo River Basin, there are practical gaps in three areas. First, the lack of microdata at the village level limits the use of IPF/IPU; as a result, many studies depend on an aggregate population raster that may be biased in areas with mixed settlements and open land. Second, the spatial distribution of populations often ignores the actual settlement structure (building footprints and road networks), so exposure at the unit level (buildings and households) is not accurately reflected. Third, combining SSP with composite multi indicator hazard and social vulnerability indices in a reproducible format is not yet a common practice at the village level, making cross regional and temporal comparison difficult (<xref ref-type="bibr" rid="BIBR-3">(Agriesti et al., 2022)</xref>; <xref ref-type="bibr" rid="BIBR-11">(Chapuis &amp; Taillandier, 2019)</xref>; <xref ref-type="bibr" rid="BIBR-17">(Jiang et al., 2024)</xref>; <xref ref-type="bibr" rid="BIBR-29">(Prédhumeau &amp; Manley, 2023)</xref>).</p><p>This research addresses the gap identified above by developing an SSP model that utilizes the GHS-POP R2023A (<xref ref-type="bibr" rid="BIBR-28">(Pesaresi et al., 2024)</xref>; <xref ref-type="bibr" rid="BIBR-35">(Schiavina et al., 2023)</xref>) using lightweight computing. It incorporates directed stochastic allocation around settlement centers (based on GHS-POP pixels) to match local spatial patterns. Population attributes such as age, gender, education, occupation, and income are synthesized from official frequency distributions, with their margins enforced for consistency across districts. Flood hazard is modelled using eleven measurable risk factors (slope, rainfall, drainage density, soil moisture, land use/land cover, elevation, distance to river, NDVI, curvature, flow accumulation, TWI) through ordinal reclassification and normalized weighted overlay.</p><p>Meanwhile, social vulnerability is summarized into a composite index based on tested demographic, social, and economic indicators. Risk is then calculated as a composite or multiplicative function of hazard and vulnerability at an operational resolution. This framework is built on best practices for SSP generation—ensuring transparency and evaluating statistical congruence—while remaining adaptable to regions with data limitations. This design produces an individual-based flood risk map that more accurately reflects local demographic and socio-economic conditions, making it ready for stakeholders in the Upper Bengawan Solo region to prioritize mitigation and risk communication. Finally, the rest of the paper is organized as follows: the Research Methods section explains the construction of the SSP, the composite hazard and vulnerability, and the validation processes. The Results and Discussion section displays the risk maps and validation outcomes. The Conclusion section discusses contributions, limitations, and future research directions.</p></sec><sec><title>2. Research Methods</title><p>The study develops SSP modelling, which uses demographic data, gender, education, and occupation, with randomized spatial allocation centered on GHS-POP pixels to determine individual distributions. The accuracy of the SSP is validated against official statistics (using MAE and RMSE metrics), spatial fit with population grids, and placement tests on built-up land based on ESRI Sentinel 2 Land Cover. The social vulnerability index (V) is calculated as a linear weighted sum using AHP. Flood risk (R) is derived by multiplying the standardized hazard (H) by V, then classified into five categories using natural breaks (Jenks). The Getis-Ord Gi hotspot analysis identifies significant risk clusters, which are then interpreted in relation to river corridors and urban areas. All steps are performed in a geographic information system (GIS) environment with a reproducible workflow <xref ref-type="fig" rid="figure-1">Figure 1</xref>.</p><fig id="figure-1" ignoredToc=""><label>Figure 1</label><caption><p>Research Framework.</p></caption><graphic xlink:href="For_Geo-39-3-383-g1.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig><sec><title>2.1. Study Area</title><p>The study area is the Upper Bengawan Solo Watershed (BSH), the upstream part of the Bengawan Solo system, the largest river basin on Java Island <xref ref-type="fig" rid="figure-2">Figure 2</xref>. Geographically, this area is located in Central Java and covers the upstream region, supplied by the Merapi–Merbabu volcanic complex to the west and the Lawu to the east. Generally, the area's terrain is dominated by relatively flat plains; however, the northeastern and northwestern sections feature undulating to rolling terrain near the mountain foothills. The hydrological segmentation classifies BSH as one of the three main sub-watersheds within the Bengawan Solo system. The study boundaries are defined by hydrological (watershed) boundaries based on the digital elevation model (DEM) and align with administrative borders (<xref ref-type="bibr" rid="BIBR-2">(Absori et al., 2023)</xref>; <xref ref-type="bibr" rid="BIBR-5">(Anna et al., 2023)</xref>; <xref ref-type="bibr" rid="BIBR-4">(Anna &amp; Priyana, 2015)</xref>; <xref ref-type="bibr" rid="BIBR-33">(Santhyami et al., 2025)</xref>).</p><p>The topographic conditions and river networks primarily influence flood dynamics in BSH. Past studies have shown varying vulnerability to flooding: areas around Surakarta (the urban core) tend to be more susceptible, while certain regions in Wonogiri, Karanganyar, and Boyolali are comparatively less at risk. This pattern aligns with the morphological gradient (flat versus undulating or steep terrain), drainage density, and land use/cover structure along the main river corridor. Variations in vulnerability among districts highlight the need for locally tailored management, especially during the rainy season when increased rainfall strains urban drainage systems <xref ref-type="bibr" rid="BIBR-23">(Jumadi et al., 2025)</xref>. Administratively, BSH includes at least six districts/cities: Boyolali, Surakarta, Karanganyar, Sukoharjo, Klaten, and Wonogiri. The Surakarta urban area acts as a hub for population and economic activity, leading to higher exposure of residents and property in this region <xref ref-type="bibr" rid="BIBR-33">(Santhyami et al., 2025)</xref>.</p><fig id="figure-2" ignoredToc=""><label>Figure 2</label><caption><p>Study Area.</p></caption><graphic xlink:href="For_Geo-39-3-383-g2.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig></sec><sec><title>2.2. Data and Sources</title><p>1. Population Centers (GHS-POP R2023A)</p><p>The population center dataset is derived from the latest Global Human Settlement Layer (GHSL) release (GHS global population grid multitemporal, GHS-POP R2023A) <xref ref-type="bibr" rid="BIBR-28">(Pesaresi et al., 2024)</xref><xref ref-type="bibr" rid="BIBR-35">(Schiavina et al., 2023)</xref>. The population pixel values from GHSL, typically at 100 m resolution, were converted into point centers using Raster to Point in ArcGIS Pro. Each point retains a center_id, pixel center coordinates, and population count (the number of residents in that pixel). These points are used as references to generate synthetic individuals within a 100 m radius.</p><p>2. Attribute Frequency Tables (Age, Gender, Education, Occupation)</p><p>Four tables display the proportions of demographic and social categories at the watershed level, which combines four districts or cities, for age, gender, education, and occupation. For age, the labels are given as age ranges; during synthesis, these are converted to specific ages by sampling integers within each range. For gender, education, and occupation, category selection is weighted by frequency. Substantive rules are applied to maintain social realism, such as automatically assigning individuals under 15 years old to the occupation 0 (no occupation).</p><p>3. Flood Hazard Data Based on RS–GIS</p><p>The hazard index <xref ref-type="fig" rid="figure-3">Figure 3</xref> is compiled from physical-environmental parameters derived from open-access spatial data (<xref ref-type="bibr" rid="BIBR-22">(Jumadi et al., 2024)</xref>; <xref ref-type="bibr" rid="BIBR-22">(Jumadi et al., 2024)</xref>). The core framework uses eleven parameters: elevation (El), slope (Sl), flow accumulation (FA), distance to river (DR), drainage density (DD), topographic wetness index (TWI), curvature (Cu), land cover/use (LULC), NDVI, rainfall (Rf), and soil moisture (SM). The primary data sources include SRTM 30 m (El, Sl, FA, DR, DD, TWI, Cu), Sentinel-2 10 m (LULC, NDVI), GPM v6 (Rf), and SMAP (SM). All parameters are projected to the working CRS, standardized in spatial resolution, and then reclassified to an ordinal scale of 1–5 (very low – very high) with local thematic thresholds. Weights among parameters are explicitly assigned (e.g., El/Sl/FA/DR as major controlling factors), and the weighted overlay results in a hazard surface H. Physically, low or flat locations and those near rivers tend to experience flow accumulation and low flow velocity; high NDVI values indicate vegetative cover that may delay runoff; TWI and SM capture soil saturation; flat or concave curvature leads to pooling (see further explanations in <xref ref-type="bibr" rid="BIBR-22">(Jumadi et al., 2024)</xref>; <xref ref-type="bibr" rid="BIBR-22">(Jumadi et al., 2024)</xref>).</p><fig id="figure-3" ignoredToc=""><label>Figure 3</label><caption><p>Flood hazard map (source: <xref ref-type="bibr" rid="BIBR-22">(Jumadi et al., 2024)</xref>; <xref ref-type="bibr" rid="BIBR-22">(Jumadi et al., 2024)</xref>).</p></caption><graphic xlink:href="For_Geo-39-3-383-g3.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig><p>3. Supporting Data</p><p>The research uses administrative boundaries (districts), river networks, watershed boundaries, and ESRI Sentinel 2 Land Cover. Administrative boundaries are essential for reporting, especially when comparing results with different regions. The river network helps interpret the results. ESRI Sentinel-2 land cover is needed to validate the distribution of SSP.</p><p>The characteristics and sources of all datasets are summarised in <xref ref-type="table" rid="table-1">Table 1</xref>.</p><table-wrap id="table-1" ignoredToc=""><label>Table 1</label><caption><p>Data Description and Sources.</p></caption><table frame="box" rules="all"><thead><tr><th colspan="1" rowspan="1" style="" align="left" valign="top">No</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Data</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Description</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Source</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Derived data</th></tr></thead><tbody><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">1</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Population</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Global Human Settlement Layer (GHS-POP R2023A). Pixel at 100 m resolution</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Earth Engine Data Catalogue</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Population center_id, coordinates, and count (number of residents)</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">2</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Demographic and social categories</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Regency /city statistics data</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Central Bureau of Statistics</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Age, gender, education, occupation</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">3</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Images</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Sentinel-2 at 10 m resolution</td><td colspan="1" rowspan="1" style="" align="left" valign="top">ESA</td><td colspan="1" rowspan="1" style="" align="left" valign="top">LULC, NDVI</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">4</td><td colspan="1" rowspan="1" style="" align="left" valign="top">DEM</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Shuttle Radar Topography Mission (SRTM) at 30 m resolution</td><td colspan="1" rowspan="1" style="" align="left" valign="top">USGS</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Elevation, slope, flow accumulation, distance to river, drainage density, TWI, and curvature</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">5</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Rainfall</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Global Precipitation Measurement (GPM) v6 at 10 km resolution</td><td colspan="1" rowspan="1" style="" align="left" valign="top">NASA</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Rainfall</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">6</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Soil moisture</td><td colspan="1" rowspan="1" style="" align="left" valign="top">NASA-USDA Enhanced Soil Moisture Active Passive (SMAP) at 10 km resolution</td><td colspan="1" rowspan="1" style="" align="left" valign="top">NASA</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Soil moisture</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">7</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Land cover</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Based on the ESA Sentinel-2 image at 10 m resolution</td><td colspan="1" rowspan="1" style="" align="left" valign="top">ESRI</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Land cover</td></tr></tbody></table></table-wrap></sec><sec><title>2.3. Data Pre-processing</title><p>1. Spatial Harmonization</p><p>Preprocessing starts with aligning the coordinate system and analysis grid so that all layers function properly without distortion. All data is projected to UTM 49S (EPSG:32749) as a standard CRS to ensure consistency in distance and area measurements. The extent is defined by the mask of the Upper Solo River Basin (BSH), which is then used as a clipping boundary for all raster and vector data.</p><p>2. Extraction of GHSL Population Data</p><p>The GHSL population raster is converted into points using ArcGIS Pro (Raster to Point). These points are clipped by the watershed mask and assigned a unique ID (center_id). The population attribute (number of people per pixel) is cleaned by removing negative or empty values. Points with a population of zero are discarded to improve computational efficiency. If there is an off by one issue at the watershed boundary where GHSL cells cross it, a small adjustment is applied to the analysis grid. All points are stored in the working CRS and exported to CSV for use in the Python pipeline (SSP Algorithm).</p></sec><sec><title>2.4. Spatial Synthetic Population (SSP) Development</title><p>1. Principles and Assumptions</p><p>The development of SSP aims to represent the population at the individual level in a synthetic way while maintaining overall consistency with official statistics and spatial accuracy regarding settlement areas. The main principles are: (i) aggregate consistency—matching the number of individuals generated at each center point to the population count from GHS-POP; (ii) micro-spatial realism—dispersing individuals around the pixel center within a fixed radius (100 m) with a denser radial distribution at the center; (iii) attribute consistency—sampling age, gender, education, and occupation based on weighted standardized frequency tables; and (iv) substantive rules—to avoid unrealistic attribute combinations (e.g., children working), such as age &lt; 15 → education = 0, occupation = 0. Other key assumptions include: (a) category frequencies reflect the population makeup at the watershed level; (b) micro-spatial dispersion within a 100 m radius sufficiently represents the intrapixel variability observed in GHS-POP; (c) ages within intervals are assumed uniform unless additional information is available.</p><p>2. Spatial Algorithm (Individual Placement)</p><p>For each center point (cx, cy) with a population n, generate n individual positions using radial jitter, where the angle theta is uniformly distributed between 0 and 2π, and the radius r is drawn from a Beta(2, 2,5) distribution scaled by RADIUS_M. This creates a denser clustering around the center. Offsets are calculated as dx = r* cos (theta) and dy = r* sin (theta).</p><p>3. Demographic-Social Attribute Sampling</p><p>Individual attributes are assigned through weighted random sampling based on frequency tables. For age, the ID label can indicate a range (e.g., “a–b”), a single value, or “a+.” The range “a–b” is converted into specific ages by selecting a random integer within [a, b]; labels “a+” are limited to [a, a+4] to avoid an infinite tail; single values are used directly. For gender, education, and occupation, categories are selected based on their relative probability (frequency divided by total). After age is assigned, the rule age &lt; 15 is applied to disable education and occupation (set to “0”).</p><p>4. Computational Implementation</p><p>The implementation uses Python on Google Colab Pro (High-RAM). It reads population centers from DBF files with dbfread and converts data types to numeric. The source code for SSP generation is available at https://doi.org/10.17605/OSF.IO/2KEJQ.</p><p>5. Validation of Aggregate Consistency and Spatial Distribution</p><p>Validation involves three layers. (i) Aggregate count: the number of SSP per point must match the GHSL count; a difference greater than 0 indicates anomalies (e.g., non integer population values or casting issues). (ii) Attribute distribution: calculate the proportion of results for age, gender, education, and occupation, then compare these with frequency tables using MAE and RMSE (Equations 1 and 2), where y is the observed proportion and ŷ is SSP proportion in category i, and n is the number of categories. (iii) Compatibility of the spatial distribution of SSP with the built-up land positions according to ESRI Sentinel-2 Land Cover.</p><p><inline-formula><tex-math id="math-1"><![CDATA[ \documentclass{article} \usepackage{amsmath} \begin{document} \displaystyle MAE = \frac{1}{n} \sum_{i=1}^{n} |y_i - \hat{y}_i| \end{document} ]]></tex-math></inline-formula>       (1)</p><p><inline-formula><tex-math id="math-2"><![CDATA[ \documentclass{article} \usepackage{amsmath} \begin{document} \displaystyle RMSE = \sqrt{\frac{1}{n} \sum_{i=1}^{n} (y_i - \hat{y}_i)^2} \end{document} ]]></tex-math></inline-formula>       (2)</p></sec><sec><title>2.5. Vulnerability Analysis</title><p>1. Determination of Scores per Attribute Class</p><p>The method for calculating scores per class follows the schema you established in the table. To ensure consistency and facilitate multicriteria aggregation, all scores are expressed within the range [0, 1]. If an initial score column falls outside [0, 1], linear normalization can be applied without altering the actual ordering: sᵢ(norm) = (sᵢ − min sᵢ) / (max sᵢ − min sᵢ). <xref ref-type="table" rid="table-2">Table 2</xref> illustrates this basic schema.</p><table-wrap id="table-2" ignoredToc=""><label>Table 2</label><caption><p>Criteria and Scoring of Vulnerability.</p></caption><table frame="box" rules="all"><thead><tr><th colspan="1" rowspan="1" style="" align="left" valign="top">No</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Criteria</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Category</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Description</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Vulnerability Score</th></tr></thead><tbody><tr><td colspan="1" rowspan="7" style="" align="left" valign="top">1</td><td colspan="1" rowspan="7" style="" align="left" valign="top">Age</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0-10</td><td colspan="1" rowspan="1" style="" align="left" valign="top">extremely vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">11-20</td><td colspan="1" rowspan="1" style="" align="left" valign="top">strongly vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.85</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">21-30</td><td colspan="1" rowspan="1" style="" align="left" valign="top">vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.7</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">31-40</td><td colspan="1" rowspan="1" style="" align="left" valign="top">less vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.4</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">41-50</td><td colspan="1" rowspan="1" style="" align="left" valign="top">vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.7</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">51-60</td><td colspan="1" rowspan="1" style="" align="left" valign="top">strongly vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.85</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">&gt;60</td><td colspan="1" rowspan="1" style="" align="left" valign="top">extremely vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1</td></tr><tr><td colspan="1" rowspan="4" style="" align="left" valign="top">2</td><td colspan="1" rowspan="4" style="" align="left" valign="top">Education</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Elementary School</td><td colspan="1" rowspan="1" style="" align="left" valign="top">extremely vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Yunior High School</td><td colspan="1" rowspan="1" style="" align="left" valign="top">strongly vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.85</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Senior High School</td><td colspan="1" rowspan="1" style="" align="left" valign="top">vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.7</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">University Graduate</td><td colspan="1" rowspan="1" style="" align="left" valign="top">less vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.4</td></tr><tr><td colspan="1" rowspan="3" style="" align="left" valign="top">3</td><td colspan="1" rowspan="3" style="" align="left" valign="top">Occupation</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Informal Worker</td><td colspan="1" rowspan="1" style="" align="left" valign="top">extremely vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Self-employed/entrepreneur</td><td colspan="1" rowspan="1" style="" align="left" valign="top">strongly vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.85</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Employee</td><td colspan="1" rowspan="1" style="" align="left" valign="top">vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.7</td></tr><tr><td colspan="1" rowspan="2" style="" align="left" valign="top">4</td><td colspan="1" rowspan="2" style="" align="left" valign="top">Gender</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Man</td><td colspan="1" rowspan="1" style="" align="left" valign="top">less vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.4</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Woman</td><td colspan="1" rowspan="1" style="" align="left" valign="top">vulnerable</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.7</td></tr></tbody></table></table-wrap><p>Regarding age groups, the young (0–10 years) and elderly (&gt;60 years) are assigned the highest scores due to mobility limitations, dependency, and increased support needs during emergency responses. The middle working age group (31–40 years) receives a lower score because of its relatively high responsiveness. This mapping also assumes that higher levels of education are linked to greater risk literacy, better access to information, and improved ability to use services—thereby reducing vulnerability scores. Jobs with low income stability or high physical exposure are assigned higher scores (e.g., category 3) because of increased economic and operational risks during flood disruptions. From a gender perspective, women are considered more vulnerable than men.</p><p>2. Determination of Vulnerability Parameter Weights</p><p>The established core preferences are: Age (very important), Occupation (important), Education (somewhat important), Gender (less important) <xref ref-type="table" rid="table-3">Table 3</xref>. These preferences are linked to the Saaty scale as anchor vectors s = [7, 5, 3, 1]. The paired comparison matrix A = [aᵢⱼ] is created as anchor ratios, where aᵢⱼ = sᵢ/sⱼ, ensuring the matrix's transitivity and mathematical consistency <xref ref-type="table" rid="table-4">Table 4</xref>.</p><table-wrap id="table-3" ignoredToc=""><label>Table 3</label><caption><p>Summary of Saaty Scale.</p></caption><table frame="box" rules="all"><thead><tr><th colspan="1" rowspan="1" style="" align="left" valign="top">Value</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Meaning</th></tr></thead><tbody><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">1</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Equally important</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">3</td><td colspan="1" rowspan="1" style="" align="left" valign="top">A little more important</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">5</td><td colspan="1" rowspan="1" style="" align="left" valign="top">More/stronger important</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">7</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Very strong important</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">9</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Extreme importance</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">2,4,6,8</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Intermediate value</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">1/x</td><td colspan="1" rowspan="1" style="" align="left" valign="top">Opposite preference</td></tr></tbody></table></table-wrap><table-wrap id="table-4" ignoredToc=""><label>Table 4</label><caption><p>Pairwise comparison matrix A.</p></caption><table frame="box" rules="all"><thead><tr><th colspan="1" rowspan="1" style="" align="left" valign="top"/><th colspan="1" rowspan="1" style="" align="left" valign="top">Age</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Work</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Education</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Gender</th></tr></thead><tbody><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Age</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1.0</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1.4</td><td colspan="1" rowspan="1" style="" align="left" valign="top">2.333</td><td colspan="1" rowspan="1" style="" align="left" valign="top">7.0</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Occupation</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.714</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1.0</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1.667</td><td colspan="1" rowspan="1" style="" align="left" valign="top">5.0</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Education</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.429</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.6</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1.000</td><td colspan="1" rowspan="1" style="" align="left" valign="top">3.0</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Gender</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.143</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.2</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.333</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1.0</td></tr></tbody></table></table-wrap><p>The AHP weights w are derived from the normalized principal eigenvector of matrix A <xref ref-type="table" rid="table-5">Table 5</xref>. When constructing anchor ratios, the maximum eigenvalue becomes λmax = n; as a result, the consistency index and ratio are: CI = (λmax − n)/(n − 1) = 0 and CR = CI/RI = 0 (with RI for n = 4 being 0.90).</p><table-wrap id="table-5" ignoredToc=""><label>Table 5</label><caption><p>AHP Weights Between Attributes.</p></caption><table frame="box" rules="all"><thead><tr><th colspan="1" rowspan="1" style="" align="left" valign="top">Attribute</th><th colspan="1" rowspan="1" style="" align="left" valign="top">Weight (wᵢ)</th></tr></thead><tbody><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Age</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.4375</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Occupation</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.3125</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Education</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.1875</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Gender</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.0625</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Total</td><td colspan="1" rowspan="1" style="" align="left" valign="top">1.0</td></tr></tbody></table></table-wrap><p>3. Determination of Vulnerability Index</p><p>Vulnerability (V) is the tendency of a population to experience adverse impacts when exposed to hazards, influenced by demographic characteristics and socio-economic conditions. In this context, V does not measure the likelihood of floods (hazard domain), but rather the internal capacity of individuals to anticipate, absorb, and recover. The scope of indicators is limited to attributes directly available from the SSP-namely, age, gender, education level, and employment status -where Si is the score for the i-th attribute category and Wi is the weight for the i-th attribute (Equation 3).</p><p><inline-formula><tex-math id="math-3"><![CDATA[ \documentclass{article} \usepackage{amsmath} \begin{document} \displaystyle V = \sum_{i=1}^{m} S_i W_i \end{document} ]]></tex-math></inline-formula>       (3)</p></sec><sec><title>2.6. Risk Analysis (R)</title><p>Risk analysis combines hazards (H) and vulnerabilities (V) to evaluate the potential impact of flooding on populations. We use a complementary approach: (1) Relative Risk Index: R = H × V, with H and V scaled from 0 to 1.</p></sec></sec><sec><title>3. Results and Discussion</title><sec><title>3.1. Spatial Synthetic Population (SSP)</title><p>The SSP modeling result is shown in <xref ref-type="fig" rid="figure-4">Figure 4</xref>. The resulting SSP includes 4,459,936 individual entities geolocated on a 100 m grid in the Upper Bengawan Solo watershed, derived from GHS-POP R2023. Each individual is assigned directional jitter within a radius of ≤100 m of the pixel center and is assigned attributes such as age, sex, education, and occupation, which are calibrated against official district or city level statistics via marginal alignment (IPF) until they are consistent.</p><fig id="figure-4" ignoredToc=""><label>Figure 4</label><caption><p>Spatial Synthetic Population Map.</p></caption><graphic xlink:href="For_Geo-39-3-383-g4.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig></sec><sec><title>3.2. Attributes Validation</title><p>The results of attribute validation are shown in <xref ref-type="table" rid="table-5">Table 5</xref> and <xref ref-type="fig" rid="figure-5">Figure 5</xref>. Based on these results, the errors for each attribute are as follows: education (MAE 4.89%; RMSE 5.19%), occupation (MAE 6.52%; RMSE 6.93%), gender (MAE 0.0103%; RMSE 0.0103%), and age (MAE 0.0137%; RMSE 0.0163%). Notably, gender and age are nearly identical to the observed values (a difference of about 0.01), highlighting the success of mapping age bins and maintaining consistent category labels. This alignment is important because these attributes are often key factors in flood vulnerability indices (such as the proportion of children and the elderly as vulnerable groups); therefore, the stability of their values helps prevent errors from affecting the overall risk results.</p><table-wrap id="table-6" ignoredToc=""><label>Table 6</label><caption><p>Error Metrics.</p></caption><table frame="box" rules="all"><thead><tr><th colspan="1" rowspan="1" style="" align="left" valign="top">Attribute</th><th colspan="1" rowspan="1" style="" align="left" valign="top">MAE (%)</th><th colspan="1" rowspan="1" style="" align="left" valign="top">RMSE (%)</th></tr></thead><tbody><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Education</td><td colspan="1" rowspan="1" style="" align="left" valign="top">4.892</td><td colspan="1" rowspan="1" style="" align="left" valign="top">5.186</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Occupation</td><td colspan="1" rowspan="1" style="" align="left" valign="top">6.522</td><td colspan="1" rowspan="1" style="" align="left" valign="top">6.926</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Gender</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.010</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.010</td></tr><tr><td colspan="1" rowspan="1" style="" align="left" valign="top">Age</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.014</td><td colspan="1" rowspan="1" style="" align="left" valign="top">0.016</td></tr></tbody></table></table-wrap><fig id="figure-5" ignoredToc=""><label>Figure 5</label><caption><p>Comparison of Population Distribution by: (a) Gender, (b) Occupation, (c) Education, (d) Age.</p></caption><graphic xlink:href="For_Geo-39-3-383-g5.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig><p>Regarding education and occupation, the MAE of 4.9–6.5 reflects different dynamics: the SSP distribution closely matches the observed distribution (the pattern of comparisons between categories is preserved), but there is an offset in some high frequency categories. In practice, this often happens when category ontologies are not perfectly aligned, such as combining High School/Vocational School into a single source and distinguishing High School from Vocational School in another. In these cases, a few percentage points difference in one category is usually offset by a comparable difference in a nearby category.</p></sec><sec><title>3.3. Spatial Error Analysis</title><p>The SSP validation results against GHS-POP for 30 sample pixels show a plausible pattern <xref ref-type="fig" rid="figure-6">Figure 6</xref>. The relationship between the two is strong (r = 0.935), yet there is a systematic overcount with a bias of +10.4 people per pixel (MAE 12.93; RMSE 22.22), and a 95% agreement limit that remains wide (−28.74 to 49.54), indicating significant residual uncertainty in some pixels. Structurally, the regression slope is less than 1, and increasing error at higher density bin points to heteroskedasticity and the potential for spatial “bleeding” caused by jitter points extending beyond pixel limits and non mass preserving allocations per pixel. The SSP has successfully captured the density gradient but needs scale calibration, and jitter restrictions within pixel polygons and allocations hinder consistency at 100 m. With these adjustments, especially for aggregations ≥300 m, the accuracy is expected to improve, but expanding the sample will be necessary to stabilize the metrics and reduce the Level of Acceptance range.</p><fig id="figure-6" ignoredToc=""><label>Figure 6</label><caption><p>Comparison between GHS and SSP Pixel Values (n = 30).</p></caption><graphic xlink:href="For_Geo-39-3-383-g6.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig><p>Additionally, the distribution of SSP locations compared to ESRI Sentinel-2 Land Cover (10 m) shows high consistency: out of a total of 4,235,296 points, 91.95% (3,894,372) are on built-up land and 8.05% (340,924) on non-built-up areas. Treating this as an estimate of binomial proportions, its statistical uncertainty is minimal (95% confidence interval approximately 91.92–91.98%), indicating a strong “location accuracy” signal for the SSP. Substantively, the roughly 8% off-built-up figure remains reasonable given (i) thematic errors in land cover maps (such as commission/omission of built classes, especially in rural residential areas mixed with vegetation), (ii) the impact of the 10 m boundary—misregistration and mixed pixels at settlement edges, and (iii) jitter or bleeding of SSP points near class boundaries. These results strongly support the conclusion that the placement of SSP aligns with built-up spaces; the remaining 8% likely results from class boundary issues and thematic uncertainties, which could be minimized through small buffering, datum/registration alignment, or the use of building footprints in the test zone.</p></sec><sec><title>3.4. Population Vulnerability Analysis based on SSP</title><p>The demographic vulnerability analysis indicates a very “low” profile (<xref ref-type="fig" rid="figure-7">Figure 7</xref> and <xref ref-type="fig" rid="figure-8">Figure 8</xref>). The average weighted population is 0.2160 (scale 0–1), with 99.63% of the population categorized as Very Low (44.43%) and Low (55.20%), while only 0.37% falls into the Moderate category. The AHP weights are consistent (CR=0), confirming that age is the primary factor (w=0.5333), followed by occupation (0.2667), education (0.1333), and gender (0.0667).</p><p>Consequently, pockets of vulnerability mainly develop in areas with higher proportions of children and the elderly, or in areas dominated by low adaptive capacity jobs (informal/daily workers) and low education levels, even though their overall contribution is smaller than their share of the population. Spatially, the impact is that vulnerability hotspots are limited but operationally significant: although they account for only 0.37% of the population, the intersection of moderate pockets with high hazard zones (H) could prioritize interventions such as increasing household preparedness, improving access to emergency services, and strengthening social networks. These results highlight that most regions possess reasonable demographic resilience reserves; however, risk management must continue to focus on micro locations with vulnerable age groups and job/education vulnerabilities to deploy mitigation resources effectively.</p><fig id="figure-7" ignoredToc=""><label>Figure 7</label><caption><p>Distribution of Population by Vulnerability Class.</p></caption><graphic xlink:href="For_Geo-39-3-383-g7.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig><fig id="figure-8" ignoredToc=""><label>Figure 8</label><caption><p>Spatial Distribution of Population by Vulnerability Class.</p></caption><graphic xlink:href="For_Geo-39-3-383-g8.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig></sec><sec><title>3.4. Risk</title><p>The distribution of the population's flood risk based on SSP (approximately 4.23 million entities) is heavily concentrated in the Low Risk category (3,391,760; 80.21%), with a substantial portion in the Moderate Risk category (830,469; 19.64%). Meanwhile, the tail distribution is nearly zero for the Very Low (5,026; 0.12%) and High (1,602; 0.04%) categories, indicating that overall exposure is primarily in the low risk class. However, about 832,071 (±19.68%) of the population falls into the moderate high risk category, which should be the focus of priority interventions, such as improvements to early warning systems, micro infrastructure protection, and spatial planning in hotspots (see <xref ref-type="fig" rid="figure-9">Figure 9</xref>).</p><fig id="figure-9" ignoredToc=""><label>Figure 9</label><caption><p>Spatial Distribution of Population by Risk Index.</p></caption><graphic xlink:href="For_Geo-39-3-383-g9.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig><p>The Getis–Ord Gi analysis reveals that risk hotspots form significant clusters along river network corridors and in urban core areas <xref ref-type="fig" rid="figure-10">Figure 10</xref>. The directional pattern along water pathways indicates the dominance of river flooding in floodplains, while the clustering in urban zones reflects pluvial flooding caused by high impervious surfaces and limited drainage capacity; both are worsened by high exposure (population/asset density) and local vulnerabilities (informal settlements, fragile buildings, service inequality). Therefore, the interaction of H×V explains the consistently positive z-score of Gi observed in riverbanks and urban pockets. Operationally, this involves addressing setbacks and restoring floodplain connectivity, improving drainage systems and green-blue infrastructure in cities, and prioritizing early warning systems and protecting critical facilities in hotspots. To ensure the accuracy of these conclusions, sensitivity testing should be performed on spatial neighbor weighting schemes (including river network based methods), along with corrections for multiple testing and cross validation using historical flood records.</p><fig id="figure-10" ignoredToc=""><label>Figure 10</label><caption><p>Risk Hotspots.</p></caption><graphic xlink:href="For_Geo-39-3-383-g10.png" mimetype="image" mime-subtype="png"><alt-text>Image</alt-text></graphic></fig></sec><sec><title>3.4. Discussion</title><p>The metrics findings show that the synthetic population distribution (SSP) has been accurately reconstructed regarding attribute spread and spatial distribution, although some residual errors remain in several categories. In high resolution population mapping, harmonizing category definitions and maintaining consistent classification schemes are essential steps to reduce artifact related residual bias <xref ref-type="bibr" rid="BIBR-31">(Rubinyi et al., 2022)</xref>.</p><p>Substantively, age and gender attributes exhibit practical errors of approximately 0.01% (≈0.01%). This confirms the success of age bin mapping, the consistency of category labels, and the normalization of proportions. High accuracy in these two attributes is essential because the proportions of children and the elderly often influence response capacity and evacuation needs, while demographic structure also impacts risk projection by incorporating population dynamics and climate change <xref ref-type="bibr" rid="BIBR-36">(Shu et al., 2023)</xref>. Therefore, the propagation of errors to the overall vulnerability index should be minimal. Conversely, in education and employment, a mean absolute error (MAE) of around 5-7 percentage points was observed. While this is generally considered a good fit for categorical shape, some dominant classes still show offset levels. From a policy standpoint, such deviations tend to affect thematic evaluations-such as post flood job training programs or school level disaster literacy initiatives-more than they impact spatial risk rankings between zones, provided these two attribute weights do not dominate the composite index.</p><p>From a utilization standpoint, current performance is sufficient for operational risk mapping at a resolution of ≥100 m (or village level). The research on composite based flood risk assessment models indicates that aggregate outcomes are fairly resilient to minor variations in less sensitive components, as long as the most sensitive factors-in this case, age and gender-are accurately measured. However, it is also important to note that fluctuations in population datasets alone have been shown to alter flood exposure estimates across different regions <xref ref-type="bibr" rid="BIBR-24">(Li et al., 2024)</xref><xref ref-type="bibr" rid="BIBR-42">(Zhang et al., 2025)</xref><xref ref-type="bibr" rid="BIBR-42">(Zhang et al., 2025)</xref>. Consequently, documenting and monitoring residual patterns remain essential for quality control, especially in urban and peri urban areas, which often display greater social and economic diversity.</p><p>Regarding sources of bias, three main factors should be noted. First, misalignment between category lexicons (observed vs. SSP) could cause discrepancies of several percentage points in large categories. Second, imperfections in conditioning employment attributes on demographic predictors and regional contexts (e.g., age, education, and urban rural typologies) may lead to small but systematic distortions. Third, rounding in reference data can mathematically amplify differences in high frequency classes without changing the overall shape of the distribution. Two low cost steps are recommended that do not alter the SSP architecture: (i) post synthesis ranking or Iterative Proportional Fitting (IPF) in each territorial unit to "attach" margins to the targets; this method is common and effectively reduces the mean absolute error (MAE) of categories to &lt;3 percentage points <xref ref-type="bibr" rid="BIBR-27">(Nejad et al., 2021)</xref>, and (ii) one to one category ontology harmonization (consistently merging or crossing "similar" classes), as recommended in high resolution synthetic population mapping <xref ref-type="bibr" rid="BIBR-31">(Rubinyi et al., 2022)</xref>. Both steps improve accuracy without sacrificing spatial consistency or computational efficiency.</p><p>As an additional measure, two more tests are recommended. First, a sensitivity analysis of the weight assigned to the vulnerability index: assessing the stability of spatial rankings across reasonable variations in educational and employment weights will confirm the robustness of the results. Second, constructing a residual map (observed – SSP, in %) for each main category can help identify spatial bias patterns—such as residual concentration in urban cores versus peri urban areas—that may influence the next ranking stage. This can also help distinguish between methodological bias and actual demographic heterogeneity <xref ref-type="bibr" rid="BIBR-42">(Zhang et al., 2025)</xref>. In relation to medium to long term planning, combining demographic structure accuracy with these light balancing mechanisms is also important for a risk projection framework that considers future population dynamics and climate related hazard scenarios <xref ref-type="bibr" rid="BIBR-36">(Shu et al., 2023)</xref>. Overall, these results support the conclusion that the SSP has adequately captured key demographic structures for area prioritization and operational level mitigation planning, with room for improvement through IPF/ranking and category harmonization. This approach aligns with industry best practices and offers a way to increase precision without adding computational complexity or model architecture overhead (<xref ref-type="bibr" rid="BIBR-27">(Nejad et al., 2021)</xref>; <xref ref-type="bibr" rid="BIBR-31">(Rubinyi et al., 2022)</xref>; <xref ref-type="bibr" rid="BIBR-36">(Shu et al., 2023)</xref>; <xref ref-type="bibr" rid="BIBR-42">(Zhang et al., 2025)</xref>; <xref ref-type="bibr" rid="BIBR-41">(Zhang et al., 2025)</xref>).</p></sec></sec><sec><title>4. Conclusion</title><p>This study presents the development of SSP for flood risk analysis in the Upper Bengawan Solo Watershed. The developed SSP is valid in both a distributional and a spatial sense, with some suggestions for improvement. For attributes, the fit to reference data is very high for sex and age (MAE=0.0103; RMSE=0.0103 and MAE=0.0137; RMSE=0.0163). Education (MAE 4.89; RMSE 5.19) and employment (MAE 6.52; RMSE 6.93) preserve a similar distribution shape to the observed but show an offset in some high frequency categories. In spatial validation results, the SSP-GHS relationship is strong (r=0.935), but there is an overcount of +10.4 people per pixel (MAE 12.93; RMSE 22.22) and wide 95% Limits of Agreement (−28.74 to 49.54), indicating heteroskedasticity and possible issues from jitter and allocations not being mass preserving per 100 m. Limiting jitter within pixels, using conservative allocations, and aggregating at ≥300 m are expected to improve accuracy. Positional validation against ESRI Sentinel-2 shows that 91.95% of points are within built-up areas (CI95%≈91.92–91.98%). In comparison, about 8% outside built-up areas is likely due to thematic or edge uncertainty, which can be reduced through buffering, improved registration, or more precise building footprint definitions. The risk of residents is mainly in Low (80.21%) and Moderate (19.64%) categories. Getis-Ord Gi analysis confirms risk hotspots tend to run along river corridors and cluster in urban centers—reflecting the combined effects of river flood and pluvial processes—with operational implications: setback planning, floodplain restoration, improving drainage and green blue infrastructure, strengthening early warning systems, and protecting critical facilities, alongside spatial weight sensitivity tests, corrections for multiple testing, and cross validation against historical floods. In short, the research enables fine scale flood risk assessment, identifying hotspots for targeted interventions such as urban planning, drainage improvements, and early warning systems. Validated and robust, the SSP framework offers policymakers a practical tool to enhance resilience, optimize resources, and mitigate the societal impacts of rising flood hazards.</p></sec><sec><title>Acknowledgements</title><p>The author would like to express sincere gratitude to all parties who contributed to the research and completion of this manuscript, including mentors, funding supporters, and those who provided essential data and information. Their assistance has been invaluable to this work.</p></sec><sec><title>Author Contributions</title><p><bold>Conceptualization</bold>: Musiyam, M., Jumadi, J., Fikriyah, V. N., Masruroh, H., Septiyani, E. D., Amin, H., Hadibasyir, H. Z., Sattar, F., &amp; Nawaz, M.; <bold>methodology</bold>: Musiyam, M., &amp; Jumadi, J.; <bold>investigation</bold>: Musiyam, M., Fikriyah, V. N., &amp; Nawaz, M.; <bold>writing—original draft preparation</bold>: Musiyam, M., Jumadi, J., Septiyani, E. D., Amin, H., Hadibasyir, H. Z., Sattar, F., &amp; Nawaz, M.; <bold>writing—review and editing</bold>: Musiyam, M., &amp; Nawaz, M.; <bold>visualization</bold>: Musiyam, M. All authors have read and agreed to the published version of the manuscript.</p></sec><sec><title>Conflict of interest</title><p>All authors declare that they have no conflicts of interest.</p></sec><sec><title>Data availability</title><p>Data is available upon Request.</p></sec><sec><title>Funding</title><p>This research was funded by the Matching Fund Program of Universitas Muhammadiyah Surakarta (DRPPS) and Universitas Negeri Malang MoA Number 5.2.7/UN32.14/KS/2024 and 48/C.3-III/LRI/II/2024 through RKN Scheme.</p></sec></body><back><ref-list><title>References</title><ref id="BIBR-1"><element-citation publication-type="article-journal"><article-title>Risk assessment and management of vulnerable areas to flash flood ha-zards in arid regions using remote sensing and GIS-based knowledge-driven techniques</article-title><source>Natural Hazards</source><volume>117</volume><issue>3</issue><person-group person-group-type="author"><name><surname>Abdelkareem</surname><given-names>M.</given-names></name><name><surname>Mansour</surname><given-names>A.M.</given-names></name></person-group><year>2023</year><fpage>2269</fpage><lpage>2295</lpage><page-range>2269-2295</page-range><pub-id pub-id-type="doi">10.1007/s11069-023-05942-x</pub-id></element-citation></ref><ref id="BIBR-2"><element-citation publication-type="article-journal"><article-title>Analysis of the Issues on Bengawan Solo River Basin Management Policies</article-title><source>WSEAS Transactions on Environment and Development</source><volume>19</volume><person-group person-group-type="author"><name><surname>Absori</surname><given-names>A.</given-names></name><name><surname>Hernanda</surname><given-names>T.</given-names></name><name><surname>Fitriciada</surname><given-names>A.</given-names></name><name><surname>Wardiono</surname><given-names>K.</given-names></name><name><surname>Budiono</surname><given-names>A.</given-names></name></person-group><year>2023</year><fpage>25</fpage><lpage>32</lpage><page-range>25-32</page-range></element-citation></ref><ref id="BIBR-3"><element-citation publication-type="article-journal"><article-title>Assignment of a synthetic population for activity-based modeling employing publicly available data</article-title><source>ISPRS International Journal of Geo-Information</source><volume>11</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Agriesti</surname><given-names>S.</given-names></name><name><surname>Roncoli</surname><given-names>C.</given-names></name><name><surname>Nahmias-Biran</surname><given-names>B.</given-names></name></person-group><year>2022</year><page-range>148</page-range></element-citation></ref><ref id="BIBR-4"><element-citation publication-type="article-journal"><article-title>Kajian biofisik lahan untuk penilaian kerentanan banjir di DAS Bengawan Solo Hu-lu</article-title><source>Jurnal Pengelolaan Sumberdaya Alam dan Lingkungan</source><volume>8</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Anna</surname><given-names>A.N.</given-names></name><name><surname>Priyana</surname><given-names>Y.</given-names></name></person-group><year>2015</year><fpage>96</fpage><lpage>108</lpage><page-range>96-108</page-range><pub-id pub-id-type="doi">10.29244/jpsl.8.1.96-108</pub-id></element-citation></ref><ref id="BIBR-5"><element-citation publication-type="book"><article-title>Water resources management model based area (A case study in some areas of Bengawan Solo watershed</article-title><volume>2727</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Anna</surname><given-names>A.N.</given-names></name><name><surname>Priyana</surname><given-names>Y.</given-names></name><name><surname>Rudiyanto</surname></name><name><surname>Fikriyah</surname><given-names>V.N.</given-names></name></person-group><year>2023</year><page-range>050027</page-range><publisher-name>Proceeding Of International Summit On Education, Tech-nology, And Humanity</publisher-name></element-citation></ref><ref id="BIBR-6"><element-citation publication-type="article-journal"><article-title>The impacts of climate change on river flood risk at the global scale</article-title><source>Climatic Change</source><volume>134</volume><issue>3</issue><person-group person-group-type="author"><name><surname>Arnell</surname><given-names>N.W.</given-names></name><name><surname>Gosling</surname><given-names>S.N.</given-names></name></person-group><year>2016</year><fpage>387</fpage><lpage>401</lpage><page-range>387-401</page-range><pub-id pub-id-type="doi">10.1007/s10584-014-1084-5</pub-id></element-citation></ref><ref id="BIBR-7"><element-citation publication-type="paper-conference"><article-title>Synthetic population for the state of California based on open-data: Examples of San Francisco Bay area and San Diego County</article-title><source>100th Annual Meeting of the Transportation Research Board (TRB</source><person-group person-group-type="author"><name><surname>Balac</surname><given-names>M.</given-names></name><name><surname>Hörl</surname><given-names>S.</given-names></name></person-group><year>2021</year><ext-link xlink:href="https://hal.science/hal-03208848/" ext-link-type="uri" xlink:title="Synthetic population for the state of California based on open-data: Examples of San Francisco Bay area and San Diego County">Available from: https://hal.science/hal-03208848/</ext-link></element-citation></ref><ref id="BIBR-8"><element-citation publication-type="article-journal"><article-title>Synthetic Population: A Reliable Framework for Analysis for Agent-Based Modeling in Mobility</article-title><source>Transportation Research Record: Journal of the Transportation Research Board</source><volume>2678</volume><issue>11</issue><person-group person-group-type="author"><name><surname>Bigi</surname><given-names>F.</given-names></name><name><surname>Rashidi</surname><given-names>T.H.</given-names></name><name><surname>Viti</surname><given-names>F.</given-names></name></person-group><year>2024</year><fpage>1</fpage><lpage>15</lpage><page-range>1-15</page-range><pub-id pub-id-type="doi">10.1177/03611981241239656</pub-id></element-citation></ref><ref id="BIBR-9"><element-citation publication-type="paper-conference"><article-title>Generation of Realistic Mega-City Populations and Social Networks for Agent-Based Modeling</article-title><source>Proceedings of the 2017 International Conference of The Computatio-nal Social Science Society of the Americas</source><person-group person-group-type="author"><name><surname>Burger</surname><given-names>A.</given-names></name><name><surname>Oz</surname><given-names>T.</given-names></name><name><surname>Crooks</surname><given-names>A.</given-names></name><name><surname>Kennedy</surname><given-names>W.G.</given-names></name></person-group><year>2017</year><fpage>1</fpage><lpage>7</lpage><page-range>1-7</page-range><pub-id pub-id-type="doi">10.1145/3145574.3145593</pub-id></element-citation></ref><ref id="BIBR-10"><element-citation publication-type="article-journal"><article-title>Assessing social vulnerability and identifying spatial hotspots of flood risk to inform socially just flood management policy</article-title><source>Risk Analysis</source><volume>43</volume><issue>5</issue><person-group person-group-type="author"><name><surname>Chakraborty</surname><given-names>L.</given-names></name><name><surname>Thistlethwaite</surname><given-names>J.</given-names></name><name><surname>Scott</surname><given-names>D.</given-names></name><name><surname>Henstra</surname><given-names>D.</given-names></name><name><surname>Minano</surname><given-names>A.</given-names></name><name><surname>Rus</surname><given-names>H.</given-names></name></person-group><year>2023</year><fpage>1058</fpage><lpage>1078</lpage><page-range>1058-1078</page-range><pub-id pub-id-type="doi">10.1111/risa.13978</pub-id></element-citation></ref><ref id="BIBR-11"><element-citation publication-type="paper-conference"><article-title>A brief review of synthetic population generation practices in agent-based social simulation</article-title><source>Submitted to SSC2019, Social Simulation Conference</source><person-group person-group-type="author"><name><surname>Chapuis</surname><given-names>K.</given-names></name><name><surname>Taillandier</surname><given-names>P.</given-names></name></person-group><year>2019</year><ext-link xlink:href="https://www.researchgate.net/profile/Kevin-Chapuis/publication/335601121_A_brief_review_of_synthetic_population_generation_practices_in_agent-based_social_simulation/links/5d6f58e592851c1b3b279b9a/A-brief-review-of-synthetic-population-generation-practices-in-agent-based-social-simulation.pdf" ext-link-type="uri" xlink:title="A brief review of synthetic population generation practices in agent-based social simulation">Available from: https://www.researchgate.net/profile/Kevin-Chapuis/publication/335601121_A_brief_review_of_synthetic_population_generation_practices_in_agent-based_social_simulation/links/5d6f58e592851c1b3b279b9a/A-brief-review-of-synthetic-population-generation-practices-in-agent-based-social-simulation.pdf</ext-link></element-citation></ref><ref id="BIBR-12"><element-citation publication-type="article-journal"><article-title>Social Vulnerability to Environmental Hazards*</article-title><source>Social Science Quarterly</source><volume>84</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Cutter</surname><given-names>S.L.</given-names></name><name><surname>Boruff</surname><given-names>B.J.</given-names></name><name><surname>Shirley</surname><given-names>W.L.</given-names></name></person-group><year>2003</year><pub-id pub-id-type="doi">10.1111/1540-6237.8402002</pub-id></element-citation></ref><ref id="BIBR-13"><element-citation publication-type="article-journal"><article-title>Temporal and spatial changes in social vulnerability to natural hazards</article-title><source>Proceedings of the National Academy of Sciences</source><volume>105</volume><issue>7</issue><person-group person-group-type="author"><name><surname>Cutter</surname><given-names>S.L.</given-names></name><name><surname>Finch</surname><given-names>C.</given-names></name></person-group><year>2008</year><fpage>2301</fpage><lpage>2306</lpage><page-range>2301-2306</page-range><pub-id pub-id-type="doi">10.1073/pnas.0710375105</pub-id></element-citation></ref><ref id="BIBR-14"><element-citation publication-type="article-journal"><article-title>Gen-SynthPop: Generating a spatially explicit synthetic population of individuals and households from aggregated data</article-title><source>Autonomous Agents and Multi-Agent Systems</source><volume>38</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Mooij</surname><given-names>J.</given-names></name><name><surname>Sonnenschein</surname><given-names>T.</given-names></name><name><surname>Pellegrino</surname><given-names>M.</given-names></name><name><surname>Dastani</surname><given-names>M.</given-names></name><name><surname>Ettema</surname><given-names>D.</given-names></name><name><surname>Logan</surname><given-names>B.</given-names></name><name><surname>Verstegen</surname><given-names>J.A.</given-names></name></person-group><year>2024</year><page-range>48</page-range><pub-id pub-id-type="doi">10.1007/s10458-024-09680-7</pub-id></element-citation></ref><ref id="BIBR-15"><element-citation publication-type="article-journal"><article-title>Flood hazard analysis and risk assessment using remote sensing, GIS, and AHP techniques: A case study of the Gidabo Watershed, main Ethiopian Rift, Ethiopia</article-title><source>Geomatics, Natural Hazards and Risk</source><volume>15</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Diriba</surname><given-names>D.</given-names></name><name><surname>Takele</surname><given-names>T.</given-names></name><name><surname>Karuppannan</surname><given-names>S.</given-names></name><name><surname>Husein</surname><given-names>M.</given-names></name></person-group><year>2024</year><page-range>2361813</page-range><pub-id pub-id-type="doi">10.1080/19475705.2024.2361813</pub-id></element-citation></ref><ref id="BIBR-16"><element-citation publication-type="article-journal"><article-title>A method to create a synthetic population with social networks for geographically-explicit agent-based models</article-title><source>Computational Urban Science</source><volume>2</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Jiang</surname><given-names>N.</given-names></name><name><surname>Crooks</surname><given-names>A.T.</given-names></name><name><surname>Kavak</surname><given-names>H.</given-names></name><name><surname>Burger</surname><given-names>A.</given-names></name><name><surname>Kennedy</surname><given-names>W.G.</given-names></name></person-group><year>2022</year><page-range>7</page-range><pub-id pub-id-type="doi">10.1007/s43762-022-00034-1</pub-id></element-citation></ref><ref id="BIBR-17"><element-citation publication-type="article-journal"><article-title>A Large-Scale Geographically Explicit Synthetic Population with Social Networks for the United States</article-title><source>Scientific Data</source><volume>11</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Jiang</surname><given-names>N.</given-names></name><name><surname>Yin</surname><given-names>F.</given-names></name><name><surname>Wang</surname><given-names>B.</given-names></name><name><surname>Crooks</surname><given-names>A.T.</given-names></name></person-group><year>2024</year><page-range>1204</page-range></element-citation></ref><ref id="BIBR-18"><element-citation publication-type="article-journal"><article-title>An agent-based evaluation of varying evacuation scenarios in Merapi: Simultaneous and staged</article-title><source>Geosciences</source><volume>9</volume><issue>7</issue><person-group person-group-type="author"><name><surname>Jumadi</surname><given-names>J.</given-names></name><name><surname>Carver</surname><given-names>S.J.</given-names></name><name><surname>Quincey</surname><given-names>D.J.</given-names></name></person-group><year>2019</year><page-range>317</page-range></element-citation></ref><ref id="BIBR-19"><element-citation publication-type="article-journal"><article-title>Utilizing Open Access Spatial Data for Flood Risk Mapping: A Case Study in the Upper Solo Watershed</article-title><source>Geoplanning: Journal of Geomatics and Planning</source><volume>11</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Jumadi</surname><given-names>J.</given-names></name><name><surname>Danardono</surname><given-names>D.</given-names></name><name><surname>Priyono</surname><given-names>K.D.</given-names></name><name><surname>Roziaty</surname><given-names>E.</given-names></name><name><surname>Masruroh</surname><given-names>H.</given-names></name><name><surname>Rohman</surname><given-names>A.</given-names></name><name><surname>Amin</surname><given-names>C.</given-names></name><name><surname>Hadibasyir</surname><given-names>H.Z.</given-names></name><name><surname>Fikriyah</surname><given-names>V.N.</given-names></name><name><surname>Nawaz</surname><given-names>M.</given-names></name><name><surname>Sattar</surname><given-names>F.</given-names></name><name><surname>Lotfata</surname><given-names>A.</given-names></name></person-group><year>2024</year><fpage>189</fpage><lpage>204</lpage><page-range>189-204</page-range><pub-id pub-id-type="doi">10.14710/geoplanning.11.2.189-204</pub-id></element-citation></ref><ref id="BIBR-20"><element-citation publication-type="article-journal"><article-title>Modelling individual evacua-tion decisions during natural disasters: A case study of volcanic crisis in Merapi, Indonesia</article-title><source>Geosciences</source><volume>8</volume><issue>6</issue><person-group person-group-type="author"><name><surname>Jumadi</surname><given-names>J.</given-names></name><name><surname>Heppenstall</surname><given-names>A.</given-names></name><name><surname>Malleson</surname><given-names>N.</given-names></name><name><surname>Carver</surname><given-names>S.</given-names></name><name><surname>Quincey</surname><given-names>D.</given-names></name><name><surname>Manville</surname><given-names>V.</given-names></name></person-group><year>2018</year></element-citation></ref><ref id="BIBR-21"><element-citation publication-type="article-journal"><article-title>Estimating spatio-temporal risks from volcanic eruptions using an agent-based model</article-title><source>Journal of Artificial Societies and Social Simulation</source><volume>23</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Jumadi</surname><given-names>J.</given-names></name><name><surname>Malleson</surname><given-names>N.</given-names></name><name><surname>Carver</surname><given-names>S.</given-names></name><name><surname>Quincey</surname><given-names>D.</given-names></name></person-group><year>2020</year><page-range>2</page-range></element-citation></ref><ref id="BIBR-22"><element-citation publication-type="article-journal"><article-title>Remote Sensing and GIS-Driven Model for Flood Susceptibility Assessment in the Upper Solo River Watershed</article-title><source>Geo-graphia Technica</source><volume>19</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Jumadi</surname><given-names>J.</given-names></name><name><surname>Sari</surname><given-names>D.N.</given-names></name><name><surname>Umrotun</surname><given-names>U.</given-names></name><name><surname>Musiyam</surname><given-names>M.</given-names></name><name><surname>Nurmantyo</surname><given-names>C.</given-names></name><name><surname>Muhammad</surname><given-names>S.F.</given-names></name><name><surname>Ibrahim</surname><given-names>M.H.</given-names></name></person-group><year>2024</year></element-citation></ref><ref id="BIBR-23"><element-citation publication-type="article-journal"><article-title>AI-Driven Ensemble Learning for Spatio-Temporal Rainfall Prediction in the Bengawan Solo River Watershed, Indonesia</article-title><source>Sustainability</source><volume>17</volume><issue>20</issue><person-group person-group-type="author"><name><surname>Jumadi</surname><given-names>J.</given-names></name><name><surname>Danardono</surname><given-names>D.</given-names></name><name><surname>Roziaty</surname><given-names>E.</given-names></name><name><surname>Ulinuha</surname><given-names>A.</given-names></name><name><surname>Supari</surname><given-names>S.</given-names></name><name><surname>Choy</surname><given-names>L.K.</given-names></name><name><surname>Sattar</surname><given-names>F.</given-names></name><name><surname>Nawaz</surname><given-names>M.</given-names></name></person-group><year>2025</year><page-range>9281</page-range><pub-id pub-id-type="doi">10.3390/su17209281</pub-id></element-citation></ref><ref id="BIBR-24"><element-citation publication-type="article-journal"><article-title>Flood Risk Assessment of Areas under Urbanization in Chongqing, China, by Integrating Multi-Models</article-title><source>Remote Sensing</source><volume>16</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Li</surname><given-names>Y.</given-names></name><name><surname>Gao</surname><given-names>J.</given-names></name><name><surname>Yin</surname><given-names>J.</given-names></name><name><surname>Liu</surname><given-names>L.</given-names></name><name><surname>Zhang</surname><given-names>C.</given-names></name><name><surname>Wu</surname><given-names>S.</given-names></name></person-group><year>2024</year><page-range>2</page-range><pub-id pub-id-type="doi">10.3390/rs16020219</pub-id></element-citation></ref><ref id="BIBR-25"><element-citation publication-type=""><article-title>Flash flood data compilation and risk insights in Pe-ninsular Malaysia: a data-driven analysis</article-title><person-group person-group-type="author"><name><surname>Maqtan</surname><given-names>R.</given-names></name><name><surname>Othman</surname><given-names>F.</given-names></name><name><surname>Jaafar</surname><given-names>W.Z.W.</given-names></name><name><surname>Elshafie</surname><given-names>A.</given-names></name></person-group><year>2025</year><fpage>1</fpage><lpage>27</lpage><page-range>1-27</page-range></element-citation></ref><ref id="BIBR-26"><element-citation publication-type="article-journal"><article-title>Analysis of Flood-Affected Areas Due to Extreme Weather In Pacitan, Indonesia</article-title><source>Geomate Journal</source><volume>19</volume><issue>75</issue><person-group person-group-type="author"><name><surname>Musiyam</surname><given-names>M.</given-names></name><name><surname>Jumadi</surname><given-names>J.</given-names></name><name><surname>Wibowo</surname><given-names>Y.A.</given-names></name><name><surname>Widiyatmoko</surname><given-names>W.</given-names></name><name><surname>Hafida</surname><given-names>S.H.N.</given-names></name></person-group><year>2020</year><fpage>27</fpage><lpage>34</lpage><page-range>27-34</page-range></element-citation></ref><ref id="BIBR-27"><element-citation publication-type="article-journal"><article-title>A statistical approach to small area synthetic population generation as a basis for carless evacuation planning</article-title><source>Journal of Transport Geography</source><volume>90</volume><person-group person-group-type="author"><name><surname>Nejad</surname><given-names>M.M.</given-names></name><name><surname>Erdogan</surname><given-names>S.</given-names></name><name><surname>Cirillo</surname><given-names>C.</given-names></name></person-group><year>2021</year><page-range>102902</page-range></element-citation></ref><ref id="BIBR-28"><element-citation publication-type="article-journal"><article-title>Advances on the Global Human Settlement Layer by joint assessment of Earth Observation and population survey data</article-title><source>International Journal of Digital Earth</source><volume>17</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Pesaresi</surname><given-names>M.</given-names></name><name><surname>Schiavina</surname><given-names>M.</given-names></name><name><surname>Politis</surname><given-names>P.</given-names></name><name><surname>Freire</surname><given-names>S.</given-names></name><name><surname>Krasnodębska</surname><given-names>K.</given-names></name><name><surname>Uhl</surname><given-names>J.H.</given-names></name><name><surname>Carioli</surname><given-names>A.</given-names></name><name><surname>Corbane</surname><given-names>C.</given-names></name><name><surname>Dijkstra</surname><given-names>L.</given-names></name><name><surname>Florio</surname><given-names>P.</given-names></name><name><surname>Friedrich</surname><given-names>H.K.</given-names></name><name><surname>Gao</surname><given-names>J.</given-names></name><name><surname>Leyk</surname><given-names>S.</given-names></name><name><surname>Lu</surname><given-names>L.</given-names></name><name><surname>Maffenini</surname><given-names>L.</given-names></name><name><surname>Mari-Rivero</surname><given-names>I.</given-names></name><name><surname>Melchiorri</surname><given-names>M.</given-names></name><name><surname>Syrris</surname><given-names>V.</given-names></name><name><surname>Den Hoek</surname><given-names>J.</given-names></name><name><surname>Kemper</surname><given-names>T.</given-names></name></person-group><year>2024</year><page-range>2390454</page-range><pub-id pub-id-type="doi">10.1080/17538947.2024.2390454</pub-id></element-citation></ref><ref id="BIBR-29"><element-citation publication-type="article-journal"><article-title>A synthetic population for agent-based modelling in Canada</article-title><source>Scientific Data</source><volume>10</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Prédhumeau</surname><given-names>M.</given-names></name><name><surname>Manley</surname><given-names>E.</given-names></name></person-group><year>2023</year><page-range>148</page-range></element-citation></ref><ref id="BIBR-30"><element-citation publication-type="article-journal"><article-title>Validating the GIS-based flood susceptibility model using Synthetic Aperture Radar (SAR) data in sengah Temila watershed, Lan-dak Regency, Indonesia</article-title><source>Forum Geografi</source><volume>36</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Purwanto</surname><given-names>A.</given-names></name><name><surname>Andrasmoro</surname><given-names>D.</given-names></name><name><surname>Eviliyanto</surname><given-names>E.</given-names></name><name><surname>Rustam</surname><given-names>R.</given-names></name><name><surname>Ibrahim</surname><given-names>M.H.</given-names></name><name><surname>Rohman</surname><given-names>A.</given-names></name></person-group><year>2023</year><fpage>185</fpage><lpage>201</lpage><page-range>185-201</page-range><pub-id pub-id-type="doi">10.23917/forgeo.v36i2.16368</pub-id></element-citation></ref><ref id="BIBR-31"><element-citation publication-type="article-journal"><article-title>High-resolution synthetic population mapping for quantifying disparities in disaster impacts: An application in the Bangladesh Coastal Zone</article-title><source>Frontiers in Environmental Science</source><volume>10</volume><person-group person-group-type="author"><name><surname>Rubinyi</surname><given-names>S.</given-names></name><name><surname>Verschuur</surname><given-names>J.</given-names></name><name><surname>Goldblatt</surname><given-names>R.</given-names></name><name><surname>Gussenbauer</surname><given-names>J.</given-names></name><name><surname>Kowarik</surname><given-names>A.</given-names></name><name><surname>Mannix</surname><given-names>J.</given-names></name><name><surname>Bottoms</surname><given-names>B.</given-names></name><name><surname>Hall</surname><given-names>J.</given-names></name></person-group><year>2022</year><page-range>1033579</page-range></element-citation></ref><ref id="BIBR-32"><element-citation publication-type="article-journal"><article-title>Enhancing Digital Elevation Model Accuracy for Flood Modelling–A Case Study of the Ciberes River in Cirebon, Indonesia</article-title><source>Forum Geografi</source><volume>38</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Sahid</surname><given-names>S.</given-names></name></person-group><year>2024</year><fpage>40</fpage><lpage>56</lpage><page-range>40-56</page-range><pub-id pub-id-type="doi">10.23917/forgeo.v38i1.1839</pub-id></element-citation></ref><ref id="BIBR-33"><element-citation publication-type="article-journal"><article-title>Spatio-Temporal Mo-deling for the Analysis of Hydrological Drought and its Impact on Rice Production in the Upper Bengawan Solo Basin, Central Java, Indonesia</article-title><source>Geographia Technica</source><volume>20</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Santhyami</surname><given-names>S.</given-names></name><name><surname>Jumadi</surname><given-names>J.</given-names></name><name><surname>Priyono</surname><given-names>K.D.</given-names></name><name><surname>Rahayu</surname><given-names>T.</given-names></name><name><surname>Sari</surname><given-names>D.N.</given-names></name><name><surname>Othman</surname><given-names>M.</given-names></name><name><surname>Rudi</surname><given-names>R.</given-names></name></person-group><year>2025</year></element-citation></ref><ref id="BIBR-34"><element-citation publication-type="article-journal"><article-title>Flood hazard mapping and flood preparedness literacy of the elderly population residing in Bangkok, Thailand</article-title><source>Water</source><volume>14</volume><issue>8</issue><person-group person-group-type="author"><name><surname>Sawangnate</surname><given-names>C.</given-names></name><name><surname>Chaisri</surname><given-names>B.</given-names></name><name><surname>Kittipongvises</surname><given-names>S.</given-names></name></person-group><year>2022</year><page-range>1268</page-range></element-citation></ref><ref id="BIBR-35"><element-citation publication-type="article-journal"><article-title>GHS-POP R2023A-GHS population grid multitemporal (1975–2030</article-title><source>Joint Research Centre Data Catalogue</source><person-group person-group-type="author"><name><surname>Schiavina</surname><given-names>M.</given-names></name><name><surname>Freire</surname><given-names>S.</given-names></name><name><surname>MacManus</surname><given-names>K.</given-names></name></person-group><year>2023</year></element-citation></ref><ref id="BIBR-36"><element-citation publication-type="article-journal"><article-title>Integrating climate change induced flood risk into future population projections</article-title><source>Na-ture Communications</source><volume>14</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Shu</surname><given-names>E.G.</given-names></name><name><surname>Porter</surname><given-names>J.R.</given-names></name><name><surname>Hauer</surname><given-names>M.E.</given-names></name><name><surname>Sandoval Olascoaga</surname><given-names>S.</given-names></name><name><surname>Gourevitch</surname><given-names>J.</given-names></name><name><surname>Wilson</surname><given-names>B.</given-names></name><name><surname>Pope</surname><given-names>M.</given-names></name><name><surname>Melecio-Vazquez</surname><given-names>D.</given-names></name><name><surname>Kearns</surname><given-names>E.</given-names></name></person-group><year>2023</year><page-range>7870</page-range></element-citation></ref><ref id="BIBR-37"><element-citation publication-type="article-journal"><article-title>Satellite imaging reveals increased proportion of population exposed to floods</article-title><source>Nature</source><volume>596</volume><issue>7870</issue><person-group person-group-type="author"><name><surname>Tellman</surname><given-names>B.</given-names></name><name><surname>Sullivan</surname><given-names>J.A.</given-names></name><name><surname>Kuhn</surname><given-names>C.</given-names></name><name><surname>Kettner</surname><given-names>A.J.</given-names></name><name><surname>Doyle</surname><given-names>C.S.</given-names></name><name><surname>Brakenridge</surname><given-names>G.R.</given-names></name><name><surname>Erickson</surname><given-names>T.A.</given-names></name><name><surname>layback</surname><given-names>D.A.</given-names></name></person-group><year>2021</year><fpage>80</fpage><lpage>86</lpage><page-range>80-86</page-range><pub-id pub-id-type="doi">10.1038/s41586-021-03695-w</pub-id></element-citation></ref><ref id="BIBR-38"><element-citation publication-type="article-journal"><article-title>Can the vulnerable be resilient? Co-existence of vulnerabi-lity and disaster resilience: Informal settlements in the Philippines</article-title><source>International journal of disaster risk re-duction</source><volume>10</volume><person-group person-group-type="author"><name><surname>Usamah</surname><given-names>M.</given-names></name><name><surname>Handmer</surname><given-names>J.</given-names></name><name><surname>Mitchell</surname><given-names>D.</given-names></name><name><surname>Ahmed</surname><given-names>I.</given-names></name></person-group><year>2014</year><fpage>178</fpage><lpage>189</lpage><page-range>178-189</page-range></element-citation></ref><ref id="BIBR-39"><element-citation publication-type="article-journal"><article-title>Flood susceptibility mapping using logistic regression analysis in Lam Khan Chu watershed, Chaiyaphum Province, Thailand</article-title><source>Geography, Environment, Sustainability</source><volume>16</volume><issue>2</issue><person-group person-group-type="author"><name><surname>Waiyasusri</surname><given-names>K.</given-names></name><name><surname>Wetchayont</surname><given-names>P.</given-names></name><name><surname>Tananonchai</surname><given-names>A.</given-names></name><name><surname>Suwanmajo</surname><given-names>D.</given-names></name></person-group><year>2023</year><fpage>41</fpage><lpage>56</lpage><page-range>41-56</page-range></element-citation></ref><ref id="BIBR-40"><element-citation publication-type="article-journal"><article-title>Flood Prone Risk Area Analysis During 2005-2019 In Lam Se Bok Watershed, Ubon Ratchathani Province, Thailand</article-title><source>Geogra-phia Technica</source><volume>16</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Waiyasusri</surname><given-names>K.</given-names></name><name><surname>Kulpanich</surname><given-names>N.</given-names></name><name><surname>Worachairungreung</surname><given-names>M.</given-names></name><name><surname>Sae-Ngow</surname><given-names>P.</given-names></name><name><surname>Chaysmithikul</surname><given-names>P.</given-names></name></person-group><year>2021</year></element-citation></ref><ref id="BIBR-41"><element-citation publication-type="article-journal"><article-title>Integrating Remote Sensing and Machine Learning for Actionable Flood Risk Assessment: Multi-Scenario Projection in the Ili River Basin in China Under Climate Change</article-title><source>Remote Sen-sing</source><volume>17</volume><issue>7</issue><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>M.</given-names></name><name><surname>Fu</surname><given-names>X.</given-names></name><name><surname>Liu</surname><given-names>S.</given-names></name><name><surname>Zhang</surname><given-names>C.</given-names></name></person-group><year>2025</year><page-range>1189</page-range></element-citation></ref><ref id="BIBR-42"><element-citation publication-type="article-journal"><article-title>Global South shows higher urban flood exposures than the Global North under current and future scenarios</article-title><source>Communications Earth &amp; En-vironment</source><volume>6</volume><issue>1</issue><person-group person-group-type="author"><name><surname>Zhang</surname><given-names>Q.</given-names></name><name><surname>Li</surname><given-names>C.</given-names></name><name><surname>Wen</surname><given-names>D.</given-names></name><name><surname>Kang</surname><given-names>J.</given-names></name><name><surname>Chen</surname><given-names>T.</given-names></name><name><surname>Zhang</surname><given-names>B.</given-names></name><name><surname>Hu</surname><given-names>Y.</given-names></name><name><surname>Yin</surname><given-names>J.</given-names></name><name><surname>Slater</surname><given-names>L.</given-names></name></person-group><year>2025</year><page-range>594</page-range></element-citation></ref></ref-list></back></article>
