Rainfall, Mosquito Indices, and Dengue Outbreaks in Southern Taiwan: Reassessing Predictive Modeling with Machine Learning Approaches

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 33,106 characters · extracted from preprint-html · click to expand
Rainfall, Mosquito Indices, and Dengue Outbreaks in Southern Taiwan: Reassessing Predictive Modeling with Machine Learning Approaches | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Rainfall, Mosquito Indices, and Dengue Outbreaks in Southern Taiwan: Reassessing Predictive Modeling with Machine Learning Approaches Hsiang Hong doi: https://doi.org/10.1101/2025.09.10.25335502 Hsiang Hong 1 Department of Medicine, College of Medicine, National Taiwan University Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: 168hsiang{at}gmail.com Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Dengue remains a major public health challenge in southern Taiwan, where recurrent outbreaks are shaped by complex environmental and entomological drivers. Using nine years of surveillance data (2015–2024) comprising more than 70,000 dengue cases, daily rainfall, and six mosquito indices from Tainan, Kaohsiung, and Pingtung, we evaluated the predictive value of these indicators through lagged correlation and machine learning models. Rainfall showed little explanatory power, while entomological indices demonstrated only moderate, location-specific associations, with the Container Index in Kaohsiung peaking at r ≈ 0.38 at 4–6 week lags. Regression models failed to predict outbreak magnitude, with R 2 near zero on test data, but classification frameworks distinguishing outbreak from non-outbreak weeks achieved high accuracy (AUC up to 0.98), driven primarily by mosquito indices. These findings highlight the limited utility of regression forecasts for dengue, while supporting classification-based approaches as more practical tools for early outbreak detection and vector control planning. Introduction Dengue fever is a rapidly expanding vector-borne disease in tropical and subtropical regions, posing significant public health challenges worldwide 1 – 3 . In Taiwan, the southern counties of Tainan, Kaohsiung, and Pingtung consistently report the highest dengue burden, with recurring outbreaks exacerbated by complex environmental and entomological drivers 4 , 5 . Climatic factors, especially precipitation and temperature, are known to influence Aedes mosquito breeding and survival, creating a temporal window for increased transmission risk 6 – 8 . Entomological surveillance indices such as Container Index (CI), Breteau Index (BI), and Pupal Index are widely used for early detection of vector proliferation, yet their effectiveness in predicting human cases remains debated 9 – 11 . Several studies have employed machine learning (ML) techniques to forecast dengue incidence, often achieving high accuracy using meteorological and entomological predictors in retrospective analyses 12 – 14 . Notably, Kuo et al. (2024) obtained robust predictive performance (AUC ≈ 0.95) by training models on short-term (2013–2015) data splits, relying on rainfall, air quality, and UV indices 15 . However, model performance in such in-sample validations may overestimate generality, especially when future outbreaks are unprecedented in magnitude 16 . In this study, we address two critical gaps. First, we systematically evaluate the temporal relationships between rainfall, six entomological indices (CI, AI, BI, Containers per 100 households, House Index for Aedes aegypti , and Pupal Index), and dengue incidence across three southern Taiwanese counties from 2015 to early 2024. Second, we assess predictive modeling under two frameworks: regression to estimate case counts, and classification to distinguish outbreak versus non-outbreak weeks. By explicitly demonstrating the limitations of regression for forecasting rare outbreak magnitudes and highlighting the utility of ML classification for outbreak detection, we provide a more nuanced and realistic appraisal of prediction tools for dengue surveillance. Results Data Collection To investigate meteorological and entomological influences on dengue incidence in Taiwan, we compiled surveillance and environmental data from December 28, 2015 to December 30, 2024, covering a total of 9,863 daily observations. During this period, more than 70,000 laboratory-confirmed dengue cases were reported nationwide, of which we focused on the southern counties of Tainan, Kaohsiung, and Pingtung, the regions with the highest disease burden. Daily dengue case records, mosquito surveillance indices, and precipitation measurements were aggregated to the weekly level to align temporal resolution across datasets and to account for the time-lagged effects of climate and entomological drivers. This resulted in a dataset comprising 1,409 county-weeks of aligned observations, with variables including weekly case counts, cumulative precipitation (mm), and six entomological indices (Container Index [CI], Adult Index [AI], Breteau Index [BI], Containers per 100 households, House Index for Aedes aegypti , and Pupal Index). Temporal Dynamics of Dengue, Rainfall, and Mosquito Indices Having assembled and harmonized dengue case counts, rainfall, and mosquito surveillance indices into a common weekly framework, we next examined the temporal dynamics of these variables across the three high-burden counties of Tainan, Kaohsiung, and Pingtung ( Fig. 1a-c ). Download figure Open in new tab Figure 1. Temporal dynamics of dengue incidence, rainfall, and mosquito indices in southern Taiwan (2016–2024). (a) Tainan, (b) Kaohsiung, and (c) Pingtung. Weekly dengue cases (red, left y-axis), accumulated weekly rainfall (blue, right y-axis), and mosquito Container Index (CI; green, secondary right y-axis) are shown. Peaks in rainfall consistently occur during the summer monsoon, while CI fluctuates seasonally, reflecting Aedes aegypti breeding conditions. Large dengue outbreaks were observed in Tainan (2015–2016 and 2023–2024) and in Kaohsiung (2023–2024), whereas Pingtung reported relatively fewer cases. While increases in CI often followed rainfall peaks, their correspondence with dengue incidence was inconsistent, underscoring the multifactorial drivers of epidemic onset. From 2015 through 2023, dengue incidence in southern Taiwan displayed marked temporal and geographic heterogeneity. Tainan experienced the most severe outbreaks, including the nationwide epidemic of 2015 and another large resurgence in 2023, with weekly peaks exceeding 2,000 reported cases. Kaohsiung exhibited intermediate activity, with outbreaks reaching several hundred weekly cases, whereas Pingtung reported relatively lower case counts throughout the study period. These patterns reaffirm the disproportionate burden borne by the southernmost counties of Taiwan 5 . Rainfall followed a regular seasonal cycle, peaking during the summer monsoon months, while mosquito surveillance indices fluctuated within and across years. Although periods of elevated precipitation often coincided with increased values of indices such as the Container Index (CI), these trends did not consistently align with epidemic onset. Notably, elevated CI values in Kaohsiung were observed to precede local outbreaks, whereas similar increases in Tainan and Pingtung were not always accompanied by a rise in dengue incidence. This suggests that meteorological and entomological drivers provide only partial signals for outbreak potential, with other factors such as viral introduction, human mobility, and population immunity likely contributing to the timing and magnitude of epidemics 10 , 11 , 17 . Lagged Correlations: Rainfall and Mosquito Indices To assess whether environmental or entomological indicators precede dengue activity, we next examined lagged correlations between weekly dengue cases and rainfall or mosquito indices across the three southern counties. Across all three counties, rainfall demonstrated weak correlations with dengue incidence (r ≤ 0.1 in most cases). In Tainan and Pingtung, rainfall showed small positive associations at lags of 3–8 weeks, consistent with the expected delay between precipitation, mosquito breeding, and subsequent virus transmission, though the signal remained marginal. In Kaohsiung, rainfall correlations were negligible across all lags. Mosquito indices demonstrated similarly mixed results. Among the six entomological indices evaluated (Container Index [CI], House Index [HI], Breteau Index [BI], Con100HH, HI*Aeg, and pupal counts), the CI in Kaohsiung achieved the strongest association, peaking at r ≈ 0.38 with dengue cases at a lag of 4–6 weeks ( Fig. 2a–c ). However, in Tainan and Pingtung, none of the indices showed consistent or meaningful correlations, with most values fluctuating near zero or negative. Download figure Open in new tab Figure 2. Lagged correlations between dengue incidence and environmental predictors in southern Taiwan. (a) Line plots of Pearson correlations (r) between weekly dengue cases and precipitation (blue) or Container Index (CI; orange) at 0–8 week lags, shown separately for Tainan, Kaohsiung, and Pingtung. Kaohsiung demonstrated the strongest associations, with CI rising to r ≈ 0.38 at 5–6 week lags, while correlations in Tainan and Pingtung remained weak. (b) Heatmaps of lagged correlations for precipitation and CI across 0–8 week lags in each county. (c) Heatmap of the best correlation (maximum across 0–8 week lags) for all six mosquito indices (AI, BI, CI, Con100HH, HIAeg, Pupa). Moderate correlations (r ≈ 0.3– 0.4) were observed only for Kaohsiung (CI, HIAeg, Con100HH), while other indices and regions yielded negligible associations. These results highlight two key points: (i) traditional entomological indices do not reliably predict dengue activity in all settings, and (ii) correlations are highly location-dependent, with Kaohsiung showing moderate association but Tainan and Pingtung exhibiting weak or absent relationships. This underscores the challenge of using single predictors in isolation to anticipate outbreaks and suggests that integrative, multi-factorial models may be necessary. Regression Models Fail to Predict Outbreak Magnitude Given the weak and inconsistent associations observed when rainfall and mosquito indices were evaluated individually, we next asked whether combining multiple predictors within a machine learning framework could enhance forecasting performance. Specifically, we tested both regression approaches (predicting weekly dengue case counts directly) and classification approaches (predicting whether a given week would be an outbreak or non-outbreak week). For regression, we implemented three widely used ensemble methods, Random Forest, Gradient Boosting, and XGBoost, using rainfall and mosquito indices as lagged predictors ( Fig. 3 ). However, all three regressors failed to meaningfully capture outbreak magnitude, producing near-zero or negative explanatory power (R 2 ≈ –0.05 across models; RMSE ≈ 336). Instead of tracking the epidemic peaks, predictions collapsed toward the baseline, underestimating case counts during outbreak weeks and over-smoothing during inter-epidemic periods. Download figure Open in new tab Figure 3. Regression models fail to predict outbreak magnitude. Scatterplots comparing observed versus predicted weekly dengue cases in southern Taiwan using Random Forest, Gradient Boosting, and XGBoost regressors. Despite incorporating rainfall and mosquito indices as predictors, all models performed poorly (R 2 < 0, RMSE ≈ 336), with predictions clustered near zero and failing to capture epidemic peaks. The dashed red line indicates the 1:1 line of perfect prediction. This consistent failure underscores a key limitation of regression-based dengue forecasting: the statistical distribution of dengue incidence is highly imbalanced, with long stretches of zero or near-zero cases punctuated by sudden epidemic surges. Standard regression frameworks, which assume relatively stable variance, tend to regress toward the mean, rendering them poorly suited to predicting outbreak magnitudes. Importantly, this limitation was not alleviated by the choice of algorithm — tree-based methods that often excel in nonlinear relationships performed no better than gradient boosting approaches optimized for predictive accuracy. Taken together, these results demonstrate that simply adding multiple meteorological and entomological predictors into a regression model is insufficient for outbreak forecasting. Rather than capturing outbreak severity, the models defaulted to minimizing error during the much more frequent non-outbreak periods. Instead, it may be more effective to reframe the problem as a classification task (outbreak vs. non-outbreak weeks), where the skewed distribution of dengue incidence can be handled more appropriately and where categorical early-warning signals are more actionable for public health planning. Classification Models Distinguish Outbreak from Non-outbreak Weeks While regression approaches were unable to capture outbreak magnitudes, re-framing the problem as a binary classification task (outbreak vs. non-outbreak weeks) yielded substantially better performance. We trained logistic regression, Random Forest, Gradient Boosting, and XGBoost classifiers on lagged rainfall and mosquito indices, defining outbreak weeks as those exceeding the 90th percentile of weekly dengue cases. Receiver operating characteristic (ROC) curves demonstrated that tree-based ensemble methods strongly outperformed logistic regression ( Fig. 4a ). Random Forest achieved the highest discriminatory power (AUC = 0.98), followed by XGBoost (AUC = 0.93) and Gradient Boosting (AUC = 0.92), while logistic regression showed only moderate performance (AUC = 0.77). Download figure Open in new tab Figure 4. Classification performance for outbreak detection in southern Taiwan. (a) Receiver operating characteristic (ROC) curves for logistic regression, Random Forest, Gradient Boosting, and XGBoost classifiers distinguishing outbreak vs. non-outbreak weeks. Ensemble methods substantially outperformed logistic regression, with Random Forest achieving the highest AUC (0.98). (b) Confusion matrices of observed vs. predicted outbreak status on the held-out test set. Logistic regression misclassified nearly half of outbreak weeks, while tree-based models correctly identified most outbreak periods. (c) Feature importance rankings (averaged across ensemble models), highlighting lagged ento mological indices (CI, HIAeg, Con100HH, pupal counts) as the strongest predictors, while rainfall variables contributed little. Confusion matrices further underscored these differences ( Fig. 4b ). Logistic regression misclassified nearly half of outbreak weeks, whereas ensemble classifiers correctly identified the majority, albeit at the expense of some false positives. Random Forest, in particular, achieved nearly perfect separation of outbreak and non-outbreak weeks in the test set. Feature importance analysis indicated that lagged mosquito indices, especially container index (CI), HI*Aeg, and Con100HH, were the strongest drivers of classification ( Fig. 4c ). Pupal counts also contributed meaningfully, while rainfall lagged by up to 8 weeks showed lower and less consistent influence. This pattern suggests that entomological surveillance indicators may provide more immediate predictive value for outbreak detection than meteorological inputs alone. Discussion This study evaluated the predictive value of rainfall and entomological indices for dengue outbreaks in southern Taiwan across a nine-year period. While exploratory correlation analyses revealed weak and inconsistent associations between individual predictors and dengue incidence, our machine learning framework demonstrated two critical insights: (i) regression models cannot reliably forecast outbreak magnitude, and (ii) classification approaches offer greater promise for distinguishing outbreak versus non-outbreak periods. Our findings contrast with previous reports that achieved high predictive accuracy using regression-based approaches in Taiwan and other dengue-endemic setting 15 , 18 , 19 . We show that such results may reflect model overfitting within outbreak periods rather than generalizable predictive power across unseen data. By explicitly framing outbreak prediction as a classification task, we emphasize the non-linear and threshold-like nature of dengue transmission dynamics, where environmental and entomological conditions may be sufficient to tip systems into epidemic states but do not scale proportionally with case counts 20 . Importantly, the most informative predictors identified by our models were lagged entomological indices — particularly CI, HIAeg, Con100HH, and pupal counts — while rainfall contributed little explanatory value. This finding highlights the primacy of vector surveillance for early outbreak detection and aligns with broader entomological research suggesting that vector abundance is a more direct driver of transmission than meteorological conditions alone 10 , 11 , 21 . Nonetheless, correlations varied substantially by location, with moderate associations observed in Kaohsiung but negligible signals in Tainan and Pingtung. This heterogeneity underscores the challenge of extrapolating predictive models across regions and supports the need for localized calibration of early warning systems 6 , 7 . Several limitations should be noted. Our models relied only on rainfall and six standard mosquito indices, without incorporating other potentially important predictors such as temperature, humidity, human mobility, or land-use factors 22 – 25 . Moreover, all analyses were restricted to data from Tainan, Kaohsiung, and Pingtung between 2015 and 2024, and we did not validate the models on external datasets, limiting the generalizability of our findings to other regions or time periods 6 . Despite these limitations, our results provide an important corrective to overly optimistic regression-based forecasts 26 and demonstrate the value of classification-oriented approaches. Outbreak detection models may serve as practical tools for public health decision-making, helping to prioritize intensified surveillance or vector control during high-risk periods 27 , even if precise case numbers cannot be forecasted. Future studies should extend this work by integrating additional data sources, testing hybrid mechanistic–statistical frameworks, and evaluating performance prospectively in real-world public health systems. Methods Data Collection We compiled three datasets covering the period from December 28, 2015 to December 30, 2024: (i) daily dengue case counts from the Taiwan CDC’s National Notifiable Disease Surveillance System, (ii) daily rainfall records from the Central Weather Administration (CWA), and (iii) mosquito surveillance data from the Taiwan CDC entomological monitoring program. The latter included six indices: Container Index (CI), House Index (HI), Breteau Index (BI), Con100HH, HIAeg, and pupal counts. Data were restricted to the three southern counties of Tainan, Kaohsiung, and Pingtung, which consistently report the highest dengue burden in Taiwan. Preprocessing and aggregation Daily records were harmonized by county through standardized mapping of administrative divisions. For precipitation, station metadata were used to infer county-level assignments. All data were aggregated to epidemiological weeks beginning on Monday. Weekly dengue case counts were summed, precipitation was aggregated as the total weekly rainfall (mm), and mosquito indices were averaged across stations within each county. The final dataset comprised 1,409 county-week observations with non-missing data across all three sources. Machine learning models We evaluated both regression and classification frameworks. For regression, Random Forest, Gradient Boosting, and XGBoost were trained to predict weekly case counts from lagged rainfall and mosquito indices. Models were trained on the first 80% of weeks and tested on the final 20%. For classification, outbreak weeks were defined as those exceeding the 75th percentile of weekly case counts, and logistic regression, Random Forest, Gradient Boosting, and XGBoost classifiers were trained to distinguish outbreak versus non-outbreak weeks. Performance was assessed using R 2 for regression, and area under the receiver operating characteristic curve (AUC), confusion matrices, and feature importance rankings for classification. Statistical analysis All analyses were performed in Python (v3.11) on Google Colab using pandas, scikit-learn, xgboost, and matplotlib. Code for preprocessing, correlation analysis, and model training is available upon request. Data Availability All data produced in the present study are available upon reasonable request to the authors References 1. ↵ Paz-Bailey , G. , Adams , L. E. , Deen , J. , Anderson , K. B. & Katzelnick , L. C. Dengue . The Lancet 403 , 667 – 682 ( 2024 ). OpenUrl CrossRef PubMed 2. ↵ Bhatt , S. et al. The global distribution and burden of dengue . Nature 496 , 504 – 507 ( 2013 ). OpenUrl CrossRef PubMed Web of Science 3. ↵ WHO. Dengue and severe dengue . 4. ↵ Chuang , T.-W. , Ng , K.-C. , Nguyen , T. L. & Chaves , L. F. Epidemiological Characteristics and Space-Time Analysis of the 2015 Dengue Outbreak in the Metropolitan Region of Tainan City, Taiwan . Int. J. Environ. Res. Public. Health 15 , 396 ( 2018 ). OpenUrl PubMed 5. ↵ You , S.-H. , Chen , S.-C. Huang , Y.-H. & Tsai , H.-C. Dengue Meteorological Determinants during Epidemic and Non-Epidemic Periods in Taiwan . Trop. Med. Infect. Dis . 7 , 408 ( 2022 ). OpenUrl PubMed 6. ↵ Morin , C. W. , Comrie , A. C. & Ernst , K. Climate and dengue transmission: evidence and implications . Environ. Health Perspect . 121 , 1264 – 1272 ( 2013 ). OpenUrl CrossRef PubMed Web of Science 7. ↵ Hii , Y. L. et al. Climate variability and increase in intensity and magnitude of dengue incidence in Singapore . Glob. Health Action 2 , 10 .3402/gha.v2i0.2036 ( 2009 ). OpenUrl 8. ↵ Naish , S. et al. Climate change and dengue: a critical and systematic review of quantitative modelling approaches . BMC Infect. Dis . 14 , 167 ( 2014 ). OpenUrl CrossRef PubMed 9. ↵ Focks , D. A. & Alexander , N. Multicountry study of Aedes aegypti pupal productivity survey methodology: Findings and recommendations# . 10. ↵ Bowman , L. R. , Runge-Ranzinger , S. & McCall , P. J. Assessing the relationship between vector indices and dengue transmission: a systematic review of the evidence . PLoS Negl. Trop. Dis . 8 , e2848 ( 2014 ). OpenUrl CrossRef PubMed 11. ↵ Cromwell , E. A. et al. The relationship between entomological indicators of Aedes aegypti abundance and dengue virus infection . PLoS Negl. Trop. Dis . 11 , e0005429 ( 2017 ). OpenUrl CrossRef PubMed 12. ↵ Guo , P. et al. Developing a dengue forecast model using machine learning: A case study in China . PLoS Negl. Trop. Dis . 11 , e0005973 ( 2017 ). OpenUrl PubMed 13. Carvajal , T. M. et al. Machine learning methods reveal the temporal pattern of dengue incidence using meteorological factors in metropolitan Manila, Philippines . BMC Infect. Dis . 18 , 183 ( 2018 ). OpenUrl PubMed 14. ↵ Al Mobin , M. Forecasting dengue in Bangladesh using meteorological variables with a novel feature selection approach . Sci. Rep . 14 , 32073 ( 2024 ). OpenUrl PubMed 15. ↵ Kuo , C.-Y. Yang , W.-W. & Su , E.C.-Y. Improving dengue fever predictions in Taiwan based on feature selection and random forests . BMC Infect. Dis . 24 , 334 ( 2024 ). OpenUrl PubMed 16. ↵ Johansson , M. A. , Reich , N. G. , Hota , A. , Brownstein , J. S. & Santillana , M. Evaluating the performance of infectious disease forecasts: A comparison of climate-driven and seasonal dengue forecasts for Mexico . Sci. Rep . 6 , 33707 ( 2016 ). OpenUrl CrossRef PubMed 17. ↵ Naish , S. et al. Climate change and dengue: a critical and systematic review of quantitative modelling approaches . BMC Infect. Dis . 14 , 167 ( 2014 ). OpenUrl CrossRef PubMed 18. ↵ Racloz , V. , Ramsey , R. , Tong , S. & Hu , W. Surveillance of dengue fever virus: a review of epidemiological models and early warning systems . PLoS Negl. Trop. Dis . 6 , e1648 ( 2012 ). OpenUrl CrossRef PubMed 19. ↵ Lowe , R. et al. Nonlinear and delayed impacts of climate on dengue risk in Barbados: A modelling study . PLoS Med . 15 , e1002613 ( 2018 ). OpenUrl CrossRef PubMed 20. ↵ Johansson , M. A. , Cummings , D. A. T. & Glass , G. E. Multiyear climate variability and dengue--El Niño southern oscillation, weather, and dengue incidence in Puerto Rico, Mexico, and Thailand: a longitudinal data analysis . PLoS Med . 6 , e1000168 ( 2009 ). OpenUrl CrossRef PubMed 21. ↵ Brady , O. J. et al. Modelling adult Aedes aegypti and Aedes albopictus survival at different temperatures in laboratory and field settings . Parasit. Vectors 6 , 351 ( 2013 ). OpenUrl CrossRef PubMed 22. ↵ Wesolowski , A. et al. Impact of human mobility on the emergence of dengue epidemics in Pakistan . Proc. Natl. Acad. Sci. U. S. A . 112 , 11887 – 11892 ( 2015 ). OpenUrl Abstract / FREE Full Text 23. Reiner , R. C. et al. Time-varying, serotype-specific force of infection of dengue virus . Proc. Natl. Acad. Sci. U. S. A . 111 , E2694 – 2702 ( 2014 ). OpenUrl Abstract / FREE Full Text 24. Kraemer , M. U. G. et al. Past and future spread of the arbovirus vectors Aedes aegypti and Aedes albopictus . Nat. Microbiol . 4 , 854 – 863 ( 2019 ). OpenUrl PubMed 25. ↵ Kraemer , M. U. G. et al. The global distribution of the arbovirus vectors Aedes aegypti and Ae. albopictus . eLife 4 , e08347 ( 2015 ). OpenUrl CrossRef PubMed 26. ↵ Brady , O. J. et al. Vectorial capacity and vector control: reconsidering sensitivity to parameters for malaria elimination . Trans. R. Soc. Trop. Med. Hyg . 110 , 107 – 117 ( 2016 ). OpenUrl CrossRef PubMed 27. ↵ Lourenço , J. & Recker , M. Natural, Persistent Oscillations in a Spatial Multi-Strain Disease System with Application to Dengue . PLOS Comput. Biol . 9 , e1003308 ( 2013 ). OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted September 12, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Rainfall, Mosquito Indices, and Dengue Outbreaks in Southern Taiwan: Reassessing Predictive Modeling with Machine Learning Approaches Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Rainfall, Mosquito Indices, and Dengue Outbreaks in Southern Taiwan: Reassessing Predictive Modeling with Machine Learning Approaches Hsiang Hong medRxiv 2025.09.10.25335502; doi: https://doi.org/10.1101/2025.09.10.25335502 Share This Article: Copy Citation Tools Rainfall, Mosquito Indices, and Dengue Outbreaks in Southern Taiwan: Reassessing Predictive Modeling with Machine Learning Approaches Hsiang Hong medRxiv 2025.09.10.25335502; doi: https://doi.org/10.1101/2025.09.10.25335502 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Epidemiology Subject Areas All Articles Addiction Medicine (567) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4411) Dentistry and Oral Medicine (443) Dermatology (380) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1505) Epidemiology (15205) Forensic Medicine (30) Gastroenterology (1119) Genetic and Genomic Medicine (6574) Geriatric Medicine (666) Health Economics (994) Health Informatics (4511) Health Policy (1365) Health Systems and Quality Improvement (1608) Hematology (537) HIV/AIDS (1263) Infectious Diseases (except HIV/AIDS) (15903) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (666) Neurology (6573) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1139) Occupational and Environmental Health (954) Oncology (3319) Ophthalmology (968) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (662) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5422) Public and Global Health (9205) Radiology and Imaging (2191) Rehabilitation Medicine and Physical Therapy (1367) Respiratory Medicine (1191) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9febabf9bff44193',t:'MTc3OTI4MzU3Mg=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00