diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md index b0ea3ba7..2e12839f 100644 --- a/CONTRIBUTING.md +++ b/CONTRIBUTING.md @@ -63,7 +63,7 @@ to allow running of tests within the IDE. ## Releasing Actions are configured to release to PyPI on pushing a tag. In order to do this: - Update VERSION -- Create new annotated tag and push +- Create new annotated tag and push ``` git tag -a v1.0.0 -m "v1.0.0" git push --follow-tags diff --git a/docs/handbook/onboarding.rst b/docs/handbook/onboarding.rst index 04437838..23266b17 100644 --- a/docs/handbook/onboarding.rst +++ b/docs/handbook/onboarding.rst @@ -1,14 +1,14 @@ Onboarding a new model/data =========================== -Exceedance curves +Exceedance curves ----------------- -The starting point of the calculation is a curve of hazard event intensities, obtained at the location of one particular asset. The probability of occurrence is given either by the 'return period' or an 'exceedance probability'. The return period is the average time in years between occurrences of an event that exceeds a given intensity. The exceedance probability is the probability that in a year an event occurs that exceeds the given intensity. Exceedance probability is the reciprocal of the return period. +The starting point of the calculation is a curve of hazard event intensities, obtained at the location of one particular asset. The probability of occurrence is given either by the 'return period' or an 'exceedance probability'. The return period is the average time in years between occurrences of an event that exceeds a given intensity. The exceedance probability is the probability that in a year an event occurs that exceeds the given intensity. Exceedance probability is the reciprocal of the return period. .. image:: onboarding/return_periods.png :width: 500 - + .. image:: onboarding/exceedance_curve.png :width: 500 @@ -36,7 +36,7 @@ In general, a Vulnerability/Event Model is responsible for obtaining for a parti The damage or disruption is sometimes referred to as the 'impact'. The current implementation is non-parametric and based on discrete bins - although continuous versions of :code:`HazardEventDistrib`/:code:`VulnerabilityDistrib` could certainly be added, based on particular parametric distributions. - + :code:`HazardEventDistrib` is in this non-parametric version a histogram of hazard event intensities: defines a set of intensity bins and the annual probability of occurrence. :code:`VulnerabilityDistrib` is a matrix that provides the probability that if an event occurs with intensity falling in a particular intensity bin, an impact in a particular impact bin occurs. @@ -53,14 +53,14 @@ The model applies to: * A type of hazard event (Inundation, Wildfire, Drought, etc) * A type of asset (residential property, power generating asset, etc) -Decorators are used to 'tag' a model, so that an appropriate model can be selected for a given asset and hazard type; configuration allows types of :code:`Model` to be used in preference to other candidates. +Decorators are used to 'tag' a model, so that an appropriate model can be selected for a given asset and hazard type; configuration allows types of :code:`Model` to be used in preference to other candidates. Specific types of model also exist for common modelling approaches. In particular, although in general it is desirable that a model has the flexibility to define its hazard event distribution and vulnerability distribution, in many cases the former will be sourced directly from a data set and it only remains to define the vulnerability distribution. The :code:`Model` class allows the general form of the model to be implemented. The :code:`VulnerabilityModel` class is for cases where only the vulnerability is to be specified. On-boarding a model based on a damage/disruption curve ------------------------------------------------------ -A vulnerability distribution can be inferred directly from a damage/disruption curve: +A vulnerability distribution can be inferred directly from a damage/disruption curve: .. image:: onboarding/disruption_curve.png :width: 500 @@ -79,15 +79,13 @@ In some cases, even if a full vulnerability matrix is unavailable, an estimate o .. image:: onboarding/damage_with_uncertainty.png :width: 500 -source: Huizinga et al. 'Global flood depth-damage functions: methodology and the database with guidelines' - -In such cases :code:`VulnerabilityModel` can be used to specify the close-formed conditional probability distribution to be used for a given intensity level. The cumulative probability density function is expected, and is provided via an :code:`ImpactCurve` by implementing method :code:`get_impact_curve`. +source: Huizinga et al. 'Global flood depth-damage functions: methodology and the database with guidelines' + +In such cases :code:`VulnerabilityModel` can be used to specify the close-formed conditional probability distribution to be used for a given intensity level. The cumulative probability density function is expected, and is provided via an :code:`ImpactCurve` by implementing method :code:`get_impact_curve`. Example models are provided to illustrate this. A model that uses beta distributions to provide a distribution yields the following :code:`VulnerabilityDistrib` in the above case: .. image:: onboarding/vulnerability_with_uncertainty.png :width: 500 - -Note that a beta distribution is a commonly-used heuristic; its functional form is convenient for vulnerability distributions although there appears to be limited justification for its use beyond providing a convenient means to apply uncertainty to a vulnerability distribution. - +Note that a beta distribution is a commonly-used heuristic; its functional form is convenient for vulnerability distributions although there appears to be limited justification for its use beyond providing a convenient means to apply uncertainty to a vulnerability distribution. diff --git a/methodology/PhysicalRiskMethodology.tex b/methodology/PhysicalRiskMethodology.tex index ccf7c4ef..c78d7b12 100644 --- a/methodology/PhysicalRiskMethodology.tex +++ b/methodology/PhysicalRiskMethodology.tex @@ -104,7 +104,7 @@ \smallskip \newline% \indent The views expressed in this paper are those of the authors and do not necessarily reflect the views and policies of their respective employers.} - } + } \date{May 2023 [Draft]} @@ -140,46 +140,46 @@ \section{Introduction} The changing climate introduces new risks. These can be grouped into: \begin{enumerate} - \item Physical risks -- risks arising from the physical effects of climate change, - \item Transition risks -- risks arising from the transition to a low-carbon economy, - \item Liability risks -- considered a third by some \cite{WoetzelEtAl:2020}, these are the risks arising when those affected by anthropogenic climate change seek compensation. + \item Physical risks -- risks arising from the physical effects of climate change, + \item Transition risks -- risks arising from the transition to a low-carbon economy, + \item Liability risks -- considered a third by some \cite{WoetzelEtAl:2020}, these are the risks arising when those affected by anthropogenic climate change seek compensation. \end{enumerate} The methodology presented in this document concerns the assessment of physical risk. Physical risk comes from changes in climate \emph{\gls{hazard}s}. A hazard is the potential occurrence of a climate-related physical phenomenon that can impact human and ecological systems \cite{ReisingerEtAl:2020}\cite{WoetzelEtAl:2020}\cite{MitchellEtAl:2017}. More precisely, the impact may be loss of life, injury, or other health impact, as well as damage and loss to property, infrastructure, -livelihoods, service provision, ecosystems, and environmental resources (see Annex II of \cite{PortnerEtAl:2022}). Hazards can be divided into \emph{\gls{acute_hazard}s} and \emph{\gls{chronic_hazard}s}. An acute hazard is the potential occurrence of an \emph{event}, for example a heat wave, inundation (flood) or hurricane. A chronic hazard is the potential occurrence of a trend in climate parameters such as an increase in average temperature, sea-level or water stress indices. +livelihoods, service provision, ecosystems, and environmental resources (see Annex II of \cite{PortnerEtAl:2022}). Hazards can be divided into \emph{\gls{acute_hazard}s} and \emph{\gls{chronic_hazard}s}. An acute hazard is the potential occurrence of an \emph{event}, for example a heat wave, inundation (flood) or hurricane. A chronic hazard is the potential occurrence of a trend in climate parameters such as an increase in average temperature, sea-level or water stress indices. \newglossaryentry{hazard} { - name=hazard, - description=Climate-related physical phenonenon that can impact natural and socioeconomic systems. + name=hazard, + description=Climate-related physical phenonenon that can impact natural and socioeconomic systems. } \newglossaryentry{acute_hazard} { - name=acute hazard, - description={Hazard which is an event, for example a heat wave, inundation, hurricane or wild fire.} + name=acute hazard, + description={Hazard which is an event, for example a heat wave, inundation, hurricane or wild fire.} } \newglossaryentry{chronic_hazard} { - name=chronic hazard, - description={Hazard which is a long-term shift in a climate parameter such as average temperature, sea-level or a water stress index.} + name=chronic hazard, + description={Hazard which is a long-term shift in a climate parameter such as average temperature, sea-level or a water stress index.} } \newglossaryentry{hazard_event} { - name=hazard event, - description={Definition of the occurrence of a hazard which can be assigned a probability. For example, a flood occurring in the year 2050 at a certain location with a depth greater than 50 cm.} + name=hazard event, + description={Definition of the occurrence of a hazard which can be assigned a probability. For example, a flood occurring in the year 2050 at a certain location with a depth greater than 50 cm.} } \newglossaryentry{hazard_parameter} { - name=hazard parameter, - description=Definition of the shifting parameter of a chronic hazard. This is a time-varying quantity such as the average temperature or the average number of days per year over a certain temperature threshold. + name=hazard parameter, + description=Definition of the shifting parameter of a chronic hazard. This is a time-varying quantity such as the average temperature or the average number of days per year over a certain temperature threshold. } The authors of \cite{RangerEtAl:2022} argue that sudden accute events are the most likely to generate \emph{`material shocks to the financial sector in the near-term'} and note that techniques to generate probabilistic scenarios to inform financial decision making is well-developed in the insurance industry. This is taken as a guiding principle, that a methodology for the measurement of physical climate risk should be adapted from the techniques developed by catastrophe modellers. The authors also note that \emph{`the financial risks from physical climate shocks cannot be approximated by considering only average annual costs of weather extremes, even on long timescales. Larger, rarer events can cause significant damage and disruption and have long-lived impacts.'}. Another guiding principle is this handling of rare events. -A model designed to quantify physical risk must take into account: a) hazard likelihood of occurrence b) the damage or disruption caused c) the consequence of this damage/disruption. Damage/disruption caused by a hazard is determined by the \emph{vulnerability} of the asset that is exposed\footnote{\emph{Exposure} of an asset to a hazard is defined after \cite{MaskreyEtAl:2011}; for most purposes this is determined by asset location.}. With a focus on financial risk, damage/disruption refers to damage of financial assets and disruption to business activities. More generally, damage can refer to natural assets and disruption to populations and ecosystems. Hereafter we use the word `asset' to describe both physical assets and business activities. As an example, the physical infrastructure of a power generating asset may be damaged by inundation and its electricity production may be disrupted, leading to a loss in revenue. +A model designed to quantify physical risk must take into account: a) hazard likelihood of occurrence b) the damage or disruption caused c) the consequence of this damage/disruption. Damage/disruption caused by a hazard is determined by the \emph{vulnerability} of the asset that is exposed\footnote{\emph{Exposure} of an asset to a hazard is defined after \cite{MaskreyEtAl:2011}; for most purposes this is determined by asset location.}. With a focus on financial risk, damage/disruption refers to damage of financial assets and disruption to business activities. More generally, damage can refer to natural assets and disruption to populations and ecosystems. Hereafter we use the word `asset' to describe both physical assets and business activities. As an example, the physical infrastructure of a power generating asset may be damaged by inundation and its electricity production may be disrupted, leading to a loss in revenue. We assign explicit names to these three components, a), b) and c) for the financial risk case: \begin{enumerate}[a)] @@ -196,17 +196,17 @@ \section{Introduction} The purpose of this paper is to present the methodology of a framework that is sufficiently generic to be used for a wide range of physical climate risk models, both precise and approximate as required. The ability to perform precise, fine-grained calculations is an important requirement therefore. This paper serves as a specification for use in the \emph{`physrisk'} OS-Climate (OS-C) \cite{OSC} physical climate risk calculation module. -OS-C aims to provide a platform unconstrained by any one particular methodology choice, but takes inspiration from natural catastrophe modelling \cite{MitchellEtAl:2017} and in particular the \emph{Oasis Loss Modelling Framework} \cite{OasisLMF} (henceforth \emph{Oasis LMF}), which was designed to accommodate a wide range of catastrophe models and analyse physical risk in the context of the insurance market. Similarly to \emph{Oasis LMF}, we adopt a modular approach. This approach allows the user to change easily a particular modelling method, whilst maintaining the integration of the components. +OS-C aims to provide a platform unconstrained by any one particular methodology choice, but takes inspiration from natural catastrophe modelling \cite{MitchellEtAl:2017} and in particular the \emph{Oasis Loss Modelling Framework} \cite{OasisLMF} (henceforth \emph{Oasis LMF}), which was designed to accommodate a wide range of catastrophe models and analyse physical risk in the context of the insurance market. Similarly to \emph{Oasis LMF}, we adopt a modular approach. This approach allows the user to change easily a particular modelling method, whilst maintaining the integration of the components. In the following, models of hazards, vulnerability and financial impact are discussed in more detail. In a later section these are presented more formally. \paragraph{Hazard.} -As noted above, hazard models come in two varieties: models of acute hazards -- events -- and models of chronic hazards -- long-term shifts in climate parameters. In climate risk events are \emph{climate-conditioned}: based not just on historical events but also future projections under different assumptions. +As noted above, hazard models come in two varieties: models of acute hazards -- events -- and models of chronic hazards -- long-term shifts in climate parameters. In climate risk events are \emph{climate-conditioned}: based not just on historical events but also future projections under different assumptions. \begin{enumerate}[label=\Alph*.] \item{\emph{Accute hazard models.}} Accute hazard models may be \emph{event-based} or \emph{return-period-based}. -\emph{Event-based hazard models} are models of individual events and are common in natural catastrophe modelling. Typically, for a large number of events, a model provides spatial distributions (i.e. a map) of the probabilities of occurrence of different event intensities. These distributions are sometimes called `hazard footprints' \cite{OasisFinancialModule}. As an example, in the case of inundation, the hazard footprint would provide for different locations the probability of occurrence of different inundation depths -- associated with one particular inundation event. +\emph{Event-based hazard models} are models of individual events and are common in natural catastrophe modelling. Typically, for a large number of events, a model provides spatial distributions (i.e. a map) of the probabilities of occurrence of different event intensities. These distributions are sometimes called `hazard footprints' \cite{OasisFinancialModule}. As an example, in the case of inundation, the hazard footprint would provide for different locations the probability of occurrence of different inundation depths -- associated with one particular inundation event. Event-based hazard models are important when the \emph{correlation} of hazards to which assets are exposed is material to the analysis being performed. For example, if one house on a street is exposed to an inundation it is likely that the house two doors down will also be exposed. This is captured by event-based hazard models: both houses might well appear in the same hazard footprint. The models are therefore important in reinsurance risk calculations, say, where the ability to calculate accurately `worst-case' losses is highly desirable. @@ -216,12 +216,12 @@ \section{Introduction} \begin{itemize} -\item when correlation of hazards is not relevant to the calculation, for example when modelling a single asset, or for certain calculations, such as annual average ground-up loss\footnote{For calculation of certain measures only marginal probability of occurrence of a hazard at a given location is relevant. This is discussed in more detail later, but may be true for certain average measures; for measures of tail-risk, in contrast, joint probability is needed for the calculation.}, or -\item when it is satisfactory to model correlation using a heuristic approach (e.g. when obtaining a rough estimate based on 0\% ot 100\% correlation or some estimated average spatial correlation). This may be used in cases where it is desirable to separate low-risk from high risk lending portfolios for example. +\item when correlation of hazards is not relevant to the calculation, for example when modelling a single asset, or for certain calculations, such as annual average ground-up loss\footnote{For calculation of certain measures only marginal probability of occurrence of a hazard at a given location is relevant. This is discussed in more detail later, but may be true for certain average measures; for measures of tail-risk, in contrast, joint probability is needed for the calculation.}, or +\item when it is satisfactory to model correlation using a heuristic approach (e.g. when obtaining a rough estimate based on 0\% ot 100\% correlation or some estimated average spatial correlation). This may be used in cases where it is desirable to separate low-risk from high risk lending portfolios for example. \end{itemize} \item{\emph{Chronic hazards.}} -As discussed above, acute hazard models provide probability distributions for future events. In contrast chronic hazard models provide climate parameters only. The models are therefore non-probabilistic for a given scenario. For example, a model of average surface temperature would provide values for different latitudes and longitudes under a particular climate scenario (e.g. particular social-economic and representative concentration pathway). \emph{Under this particular scenario}, the assumption is that the climate parameter is certain to take the value. +As discussed above, acute hazard models provide probability distributions for future events. In contrast chronic hazard models provide climate parameters only. The models are therefore non-probabilistic for a given scenario. For example, a model of average surface temperature would provide values for different latitudes and longitudes under a particular climate scenario (e.g. particular social-economic and representative concentration pathway). \emph{Under this particular scenario}, the assumption is that the climate parameter is certain to take the value. \end{enumerate} @@ -234,11 +234,11 @@ \section{Introduction} \item{In many cases the properties of the asset sufficient to ascertain its vulnerability are, although in principle knowable, unknown. That is there is an \emph{epistemic uncertainty}\cite{MitchellEtAl:2017}.} \end{itemize} -Both these sources of uncertainty may be material to the calculation in hand and neglecting these is a potential source of model risk\footnote{We define model risk to be the risk that the model outputs lead to poor management information or cause bad decisions to be made. Note that model risk is \emph{not} the risk that a model is wrong: all models are in some sense `wrong', although some may be useful.}. In many climate risk calculations, epistemic uncertainty is particularly important: the vulnerability of assets in some portfolios may be uncertain but this does not prevent, say, the estimation of a likely upper bound to damage or disruption. Such a bound may be wrong however, if one does not allow for the possibility that the asset's nature is such that it may be significantly more vulnerable than some average level. +Both these sources of uncertainty may be material to the calculation in hand and neglecting these is a potential source of model risk\footnote{We define model risk to be the risk that the model outputs lead to poor management information or cause bad decisions to be made. Note that model risk is \emph{not} the risk that a model is wrong: all models are in some sense `wrong', although some may be useful.}. In many climate risk calculations, epistemic uncertainty is particularly important: the vulnerability of assets in some portfolios may be uncertain but this does not prevent, say, the estimation of a likely upper bound to damage or disruption. Such a bound may be wrong however, if one does not allow for the possibility that the asset's nature is such that it may be significantly more vulnerable than some average level. -At time of writing, physical risk calculations may make use of `bulk-assessment' approaches where accurate asset vulnerability information is unavailable and approximations are therefore required. The modelling framework aims to accommodate bulk-assessment-type models as well as approaches capable of modelling vulnerability more precisely, the assumption being that there is potentially great value in the results obtained from very simple models, as long as the model uncertainty is properly-quantified. The aim is to be able to accommodate both simple and complex models in combination. +At time of writing, physical risk calculations may make use of `bulk-assessment' approaches where accurate asset vulnerability information is unavailable and approximations are therefore required. The modelling framework aims to accommodate bulk-assessment-type models as well as approaches capable of modelling vulnerability more precisely, the assumption being that there is potentially great value in the results obtained from very simple models, as long as the model uncertainty is properly-quantified. The aim is to be able to accommodate both simple and complex models in combination. -\paragraph{Financial.} +\paragraph{Financial.} Finally, the financial component is concerned with translating a probability distribution of asset damage/disruption to a loss of profitability for a company, or a loss of value for a lender, insurer, equity stakeholder etc. Clearly, the models used in the Financial module answer questions specific to a certain user: is the ultimate objective that of measuring the physical risk for the company or for one of the asset's insurer? Depending on the answer to that question, a different financial model might be needed. One important feature of financial models is the role played by insurance. For example, for a lender, what is the impact of climate change on the level of risk of a commercial real estate portfolio? An increase in the frequency and severity of acute hazards may affect the value of the loan collateral but this can depend strongly on whether damage/disruption is covered by insurance and premiums remain low for example. @@ -257,7 +257,7 @@ \subsection{Overview} Data sets of \emph{hazard indicators}\footnote{a hazard indicator is measure used to quantify a hazard.} are obtained from a variety of sources. For modelling acute hazards, datasets typically comprise probability distributions of events such as inundations, periods of drought or periods of high wind. These data sets might, for example, specify the annual probability of occurrence of an event (e.g. high wind) of a certainty intensity (e.g. maximum wind speed) for some specified year in the future. An important class of such data sets are the \emph{hazard maps}, described later in this section. -\emph{Vulnerability models} are applied to different types of asset and different types of hazard. A vulnerability model will use information about an asset, typically its geolocation, type and relevant characteristics, and will source hazard indicator data using one or more \emph{hazard models}. The vulnerability model will construct from these inputs an impact distribution. +\emph{Vulnerability models} are applied to different types of asset and different types of hazard. A vulnerability model will use information about an asset, typically its geolocation, type and relevant characteristics, and will source hazard indicator data using one or more \emph{hazard models}. The vulnerability model will construct from these inputs an impact distribution. In the case of acute hazards, in order to derive the impact distribution vulnerability models will typically construct both: \begin{itemize} @@ -297,7 +297,7 @@ \subsection{Hazard model} Hazard indicator data sets are available from a number of sources both publicly-available and proprietary. A recent paper \cite{BavandiEtAl:2022} provides a review of sources of the \emph{`forward-looking climate-conditioned hazard data sets'}, as the authors describe the data, that are required by the methodology presented in this document. \cite{RichtersEtAl:2022} provides technical information on the data sets provided by the Network for Greening the Financial System (NGFS) scenarios and provides a useful introduction to scenarios and in particular Representative Concentration Pathways (RCPs) and Shared Socioeconomic Pathways (SSPs) as well as the Coupled Model Intercomparison Project (CMIP) of global climate models data sets. CMIP data sets are very often key inputs into the derivation of forward-looking climate-conditioned hazard indicators. -Subsequent sections include details of both vulnerability models and sources of hazard indicator data sets for each type of hazard. +Subsequent sections include details of both vulnerability models and sources of hazard indicator data sets for each type of hazard. \subsection{Vulnerability model} \label{SubSec:VulnerabilityModel} @@ -321,8 +321,8 @@ \subsubsection{Mathematical description of vulnerability models} The impact of hazards on a portfolio of $n$ assets is a (multivariate) probability distribution as a result of the primary and secondary uncertainties. The impact in a given year on a single asset is a random variable, $D$, with (marginal) probability density function $f_D(d)$. The probability of an impact exceeeding $d$ (the \emph{exceedance probability}), $F'_D(d) = \mathbb{P}[D > d]$ is given by: \begin{equation} - \label{Eq:ImpactExceed} - F'_D(d) = \int_d^{\infty} f_D(u) du + \label{Eq:ImpactExceed} + F'_D(d) = \int_d^{\infty} f_D(u) du \end{equation} This is related to the cumulative probability $F_{D}(d) = \mathbb{P}[D \le d]$ by $F'_D(d) = 1 - F_D(d)$. Exceedance probabilities are a popular measure in catastrophe model and the use of $F$ for cumulative probability and $F'$ for exceedance probability will be used hereafter to avoid confusion. @@ -331,53 +331,53 @@ \subsubsection{Mathematical description of vulnerability models} We define a conditional probability density function $f_{D|S}(d, s)$ to be the probability that given the occurrence of a hazard indicator $s$, an impact occurs of size $d$. This distribution captures the secondary uncertainty. -The impact distribution is then given by: - +The impact distribution is then given by: + \begin{equation} - \label{Eq:ImpactEffective} - f_D(d) = \int_{-\infty}^{\infty} f_S(s) f_{D|S}(d, s) ds + \label{Eq:ImpactEffective} + f_D(d) = \int_{-\infty}^{\infty} f_S(s) f_{D|S}(d, s) ds \end{equation} Note that $f_d(d)$ is identical to the {\it effective damageability} distribution of Oasis LMF\cite{OasisFinancialModule} and can be described as the `effective impact'. It is a marginal distribution and as such does not capture any correlation between events nor impacts. In the catastrophe models of Oasis LMF, impacts are sampled from this distribution \cite{OasisFinancialModule}, for example samples of fractional damage, which form the basis of a Monte Carlo calculation. This is done in order to apply insurance policy terms and conditions which can be complex and non-linear. -In the case of $n$ assets, multivariate random variables are defined $\mathbf{D} = (D_1,\ldots,D_d)$ and $\mathbf{S} = (S_1,\ldots,S_n)$. We henceforth use the single-asset index $i$ to denote marginal distributions: $f_{S_i}(s_i)$. +In the case of $n$ assets, multivariate random variables are defined $\mathbf{D} = (D_1,\ldots,D_d)$ and $\mathbf{S} = (S_1,\ldots,S_n)$. We henceforth use the single-asset index $i$ to denote marginal distributions: $f_{S_i}(s_i)$. \subsubsection{Return-period-based approach} -The \emph{return-period-based approach} -- sometimes called, a hazard-map-based approach -- makes use of marginal distributions $f_{S_i}$ for each (asset) location $i$, and not the joint distribution, $f_S(\mathbf{s})$. By definition, the marginals are related to the joint distribution by: +The \emph{return-period-based approach} -- sometimes called, a hazard-map-based approach -- makes use of marginal distributions $f_{S_i}$ for each (asset) location $i$, and not the joint distribution, $f_S(\mathbf{s})$. By definition, the marginals are related to the joint distribution by: \begin{equation} - \label{Eq:ImpactMarginal} - f_{S_i}(s_i) = \int_{-\infty}^{\infty} \int_{-\infty}^{\infty} \dots \int_{-\infty}^{\infty} f_S(s_1,s_2, \dots,s_n) \,ds_1 \dots ds_{i-1} ds_{i + 1} \dots ds_n + \label{Eq:ImpactMarginal} + f_{S_i}(s_i) = \int_{-\infty}^{\infty} \int_{-\infty}^{\infty} \dots \int_{-\infty}^{\infty} f_S(s_1,s_2, \dots,s_n) \,ds_1 \dots ds_{i-1} ds_{i + 1} \dots ds_n \end{equation} $f_{S_i}(s_i)$ is usually inferred from a type of hazard indicator data set which are known as \emph{hazard maps}. -\paragraph{Hazard maps.} Hazard maps are three-dimensional data sets from which intensities of hazard indicators can be looked up for different locations and different return periods, i.e. $H(x, y, \tau)$ provides hazard indicator intensity at location $(x, y)$ for return period $\tau$. That is, $H$ is the hazard indicator intensity such that the average time between events with intensity higher than $H$ is $\tau$. +\paragraph{Hazard maps.} Hazard maps are three-dimensional data sets from which intensities of hazard indicators can be looked up for different locations and different return periods, i.e. $H(x, y, \tau)$ provides hazard indicator intensity at location $(x, y)$ for return period $\tau$. That is, $H$ is the hazard indicator intensity such that the average time between events with intensity higher than $H$ is $\tau$. In order to use hazard maps to derive probabilities, we must, strictly, specify the model of probability of occurrence of events with intensity higher than $H$ assumed by the data set. Occurrence may be modelled by a Poisson distribution as in Equation~\ref{Eq:Poisson}. This gives the probability of $k$ occurrences in time interval $t$ where $\tau$ is the return period. \begin{equation} - \label{Eq:Poisson} - \mathbb{P}[X = k] = \frac{(t / \tau)^k}{k!} e^{-\frac{t}{\tau}} + \label{Eq:Poisson} + \mathbb{P}[X = k] = \frac{(t / \tau)^k}{k!} e^{-\frac{t}{\tau}} \end{equation} -Alternatively, the number of occurrences can be modelled as a Binomial distribution as in Equation~\ref{Eq:Binomial}, which provides the probability that $k$ occurrences occur in $n$ years, assuming that $\tau$ is specified in years. +Alternatively, the number of occurrences can be modelled as a Binomial distribution as in Equation~\ref{Eq:Binomial}, which provides the probability that $k$ occurrences occur in $n$ years, assuming that $\tau$ is specified in years. According to Equation~\ref{Eq:Binomial}, \emph{the probability that in a single year there is at least one event with intensity of $H$ or higher is $1/\tau$}. Unless otherwise specified, this is the interpretation used for $\tau$. Note that for Equation~\ref{Eq:Poisson} this relationship only applies approximately. \begin{equation} - \label{Eq:Binomial} - \mathbb{P}[X = k] = \binom{n}{k} (1/\tau)^k (1-1/\tau)^{n - k} + \label{Eq:Binomial} + \mathbb{P}[X = k] = \binom{n}{k} (1/\tau)^k (1-1/\tau)^{n - k} \end{equation} -$F_{S_i}$ can then be inferred from the hazard map for point-like assets. The curve $H(x_i, y_i, \tau)$ is looked up, providing $\tau$ and thereby annual exceedance probabilities for different intensities, $H$. In the case of a point-like asset, the look up is from spatial coordinates ($x_i$, $y_i$). A hazard map will have an associated co-ordinate reference system (CRS). For example the CRS of whole-globe maps is often the WGS84 World Geodetic System (EPSG:4326). In this case ($x_i$, $y_i$) represent longitude and latitude under that CRS. +$F_{S_i}$ can then be inferred from the hazard map for point-like assets. The curve $H(x_i, y_i, \tau)$ is looked up, providing $\tau$ and thereby annual exceedance probabilities for different intensities, $H$. In the case of a point-like asset, the look up is from spatial coordinates ($x_i$, $y_i$). A hazard map will have an associated co-ordinate reference system (CRS). For example the CRS of whole-globe maps is often the WGS84 World Geodetic System (EPSG:4326). In this case ($x_i$, $y_i$) represent longitude and latitude under that CRS. \paragraph{Effective impact.} Once $F_{S_i}$ and thereby $f_{S_i}$ is obtained, Equation~\ref{Eq:ImpactEffective} can be applied to obtain the impact distributions for each location $i$: \begin{equation} - \label{Eq:ImpactMarginal2} - f_{D_i}(d_i) = \int_{-\infty}^{\infty} f_{S_i}(s_i) f_{D_i|S_i}(d_i, s_i) ds_i + \label{Eq:ImpactMarginal2} + f_{D_i}(d_i) = \int_{-\infty}^{\infty} f_{S_i}(s_i) f_{D_i|S_i}(d_i, s_i) ds_i \end{equation} In order to aggregate impacts over a portfolio, the dependency structure must be provided; in general, such a dependency structure is specified by a copula\cite{Nelsen:2007}. This may be derived via a heuristic; for example a `worst case' dependency structure could be provided to obtain an upper bound, perhaps assuming 100\% correlation between impacts. In general the approach approach in this section is not intended for cases where accurate treatment of the dependence between the impacts is needed, but rather for: @@ -390,41 +390,41 @@ \subsubsection{Return-period-based approach} The Sklar theorem of copula theory states that for $n$ random variables~$(D_1, \dots, D_n)$ with joint cumulative density function~(CDF)~$F_D(d_1, \dots, d_n) = \mathbb{P}[D_1 \le d_1, \dots, D_n \le d_n]$, there exists a copula~\mbox{$C:[0,1]^n \rightarrow [0,1]$} such that \begin{equation} - \label{Eq:Copula} - F_D(d_1, \dots, d_n) = C \left( F_{D_1}(d_1), \dots, F_{D_n}(x_n) \right). + \label{Eq:Copula} + F_D(d_1, \dots, d_n) = C \left( F_{D_1}(d_1), \dots, F_{D_n}(x_n) \right). \end{equation} As a reminder, $F_{D_i}(d_i) = \mathbb{P}[D_i \le d_i]$ is the marginal distribution of random variable~$D_i$, \mbox{$i=1, \dots, n$}. In the general case, Monte Carlo approaches can be used to sample from $F_D$. The approach is: \begin{enumerate}[] - \item Sample vector $\mathbf{u}$ from $C$; - \item Calculate samples for vector $\mathbf{d}$ using the relationship $d_i = F_{D_i}^{-1}(u_i)$. + \item Sample vector $\mathbf{u}$ from $C$; + \item Calculate samples for vector $\mathbf{d}$ using the relationship $d_i = F_{D_i}^{-1}(u_i)$. \end{enumerate} The samples can then be used to construct a total damage, for example, via $\sum_i d_i$. Under heuristic approaches a Gaussian copula might be chosen: \begin{equation} - \label{Eq:CopulaGaussian} - C^{\text{Gaussian}}_K(\mathbf{u}) = \Phi_n(\Phi^{-1}(u_1), \dots, \Phi^{-1}(u_n);\mathbf{K}), + \label{Eq:CopulaGaussian} + C^{\text{Gaussian}}_K(\mathbf{u}) = \Phi_n(\Phi^{-1}(u_1), \dots, \Phi^{-1}(u_n);\mathbf{K}), \end{equation} where $\Phi(z)$ is the CDF of a standard normal variable, and $\Phi_n(\mathbf{z}; \mathbf{K})$ denotes a joint standard normal multivariate~CDF with mean zero and correlation matrix $\mathbf{K}$. Samples $\mathbf{u}$ can be obtained by the approach: \begin{enumerate}[] - \item Sample vector $\mathbf{z}$ of correlated normal random numbers, - \item Calculate samples for vector $\mathbf{u}$ using the relationship $u_i = \Phi_i(z_i)$. + \item Sample vector $\mathbf{z}$ of correlated normal random numbers, + \item Calculate samples for vector $\mathbf{u}$ using the relationship $u_i = \Phi_i(z_i)$. \end{enumerate} -As an example, if impact distributions represent damage to buildings as a result of inundation then one may attempt to model damage to two buildings in close proximity as being highly correlated. However catastrophe model practitioners might point out that even such considerations as the presence or absence of kerb stones and availability of sand bags are highly significant so any such assumption is prone to error. If the buildings are far apart (say in different continents) then the correlation is likely to be close to zero however. The two extremes of 0\% and 100\% correlation of impacts are special cases of this general approach and it may be appropriate to run calculations with such cases to obtain an estimate of the impact of correlation -- rather than to attempt to model correlation more precisely. +As an example, if impact distributions represent damage to buildings as a result of inundation then one may attempt to model damage to two buildings in close proximity as being highly correlated. However catastrophe model practitioners might point out that even such considerations as the presence or absence of kerb stones and availability of sand bags are highly significant so any such assumption is prone to error. If the buildings are far apart (say in different continents) then the correlation is likely to be close to zero however. The two extremes of 0\% and 100\% correlation of impacts are special cases of this general approach and it may be appropriate to run calculations with such cases to obtain an estimate of the impact of correlation -- rather than to attempt to model correlation more precisely. \subsubsection{Event-based approach} As mentioned in the previous section, where an accurate treatment of the dependence between impacts is needed, a heuristic is unlikely to be adequate. This can occur, for example, where it is required to model the occurrence of a 1 in 250 years `worst-case' event, the event being `worst-case' for a specific portfolio\footnote{In general, a `1 in 250 year' event for a portfolio is an ambiguous statement and requires the definition of a measure. For example the `1 in 250 year' \emph{ground-up loss} of a portfolio is unambiguous. For a single asset, `1 in 250 year' is unambiguous if impact is assumed to be a non-decreasing function of hazard intensity.}. In such cases, it is necessary to model the dependence of hazard intensity and vulnerability explicitly. In an event-based approach, this is achieved by calculating the impact of a large number of events. An event might, for example, be a flood or storm affecting a particular geographical region. Events can be: \begin{itemize} - \item historical events, or - \item synthetic, `plausible' events. + \item historical events, or + \item synthetic, `plausible' events. \end{itemize} In the case of synthetic events, the event may itself be probabilistic; at a particular time, in a particular part of the region, the intensity of the hazard might be represented by a probability distribution. However historical events are typically deterministic and synthetic event sets are often deterministic also; unless otherwise stated, this will be assumed to be the case. @@ -435,32 +435,32 @@ \subsubsection{Event-based approach} More formally, for each event, index $j$, a function $z_j$ is defined such that $\tau_{i, j} = z_j(x_i, y_i)$. Here $\tau_{i, j}$ is the severity of the event specified as a return period for asset index $i$ and event index $j$. $(x_i, y_i)$ are the coordinates of the asset in the relevant CRS. For the given event, $\tau_{i, j}$ is then used to look up a hazard intensity, from the hazard map: - + \begin{equation} - \label{Eq:Severity1} - s_{i, j} = H(x_i, y_i, \tau_{i, j}) + \label{Eq:Severity1} + s_{i, j} = H(x_i, y_i, \tau_{i, j}) \end{equation} Note that here $s_{i, j}$ is deterministic \emph{for a given event} and we have simply for the impact distribution for event $j$: \begin{equation} - \label{Eq:Severity2} - f_{D_i, j}(d_i) = f_{D_i|S_i}(d_i, s_{i, j}) + \label{Eq:Severity2} + f_{D_i, j}(d_i) = f_{D_i|S_i}(d_i, s_{i, j}) \end{equation} For each event and each asset, we can then draw $m$ samples from $f_{D_i, j}(d_i)$. The samples across all assets for a single event are drawn jointly using a copula as per Equation~\ref{Eq:Copula} to capture the dependence structure of impacts. Such an approach can be important if levels of damage sustained under a given hazard intensity are correlated between assets, which might be the case if the assets are similar in construction. However, by default samples are assumed to be independent. That is the approach is: For each of $n$ events, and for each of $m$ samples: \begin{enumerate}[] - \item sample vector $\mathbf{u}$ of uncorrelated random numbers $\mathbf{U} \stackrel{iid}{\sim} U[0, 1]$; - \item calculate vector $\mathbf{d}$ using the relationship $d_i = F_{D_i, j}^{-1}(u_i)$. + \item sample vector $\mathbf{u}$ of uncorrelated random numbers $\mathbf{U} \stackrel{iid}{\sim} U[0, 1]$; + \item calculate vector $\mathbf{d}$ using the relationship $d_i = F_{D_i, j}^{-1}(u_i)$. \end{enumerate} The resulting $n \times m$ sets of impacts for the portfolio of assets is the inputs into the financial model. \paragraph{Constant severity regions} Under a constant severity region approximation, $\tau_{i, j}$ is a constant across each asset $i$ for a particular event $j$. - + \subsubsection{Discrete form of acute vulnerability model} \label{Sec:MathematicalDescriptionOfAssetImpactModel} @@ -477,11 +477,11 @@ \subsubsection{Discrete form of acute vulnerability model} That is, $s^{(h, \text{lower})}_q$ and $s^{(h, \text{upper})}_q$ define the range of bin $q$. For the avoidance of doubt, $\sigma^{(h)}_q$ is related to the continuous probability density $f_S(s)$ by: \begin{equation} - \label{Eq:Discrete2} - \sigma^{(h)}_q = \int_ {s^{(h, \text{lower})}_q}^{s^{(h, \text{upper})}_q} f_S(s) ds + \label{Eq:Discrete2} + \sigma^{(h)}_q = \int_ {s^{(h, \text{lower})}_q}^{s^{(h, \text{upper})}_q} f_S(s) ds \end{equation} -We define $v^{(h, b)}_{pq}$ to be the conditional probability that \emph{given} the occurrence of an event associated with a hazard of type $h$ and with intensity $s^{(h)} \in (s^{(h, \text{lower})}_q, s^{(h, \text{upper})}_q]$ there is an impact of type $b$, $d^{(b)} \in (d^{(b,\text{lower})}_p, d^{(b,\text{upper})}_p]$. $b$ may be, for example, damage incurred expressed as a fraction of the asset present value. +We define $v^{(h, b)}_{pq}$ to be the conditional probability that \emph{given} the occurrence of an event associated with a hazard of type $h$ and with intensity $s^{(h)} \in (s^{(h, \text{lower})}_q, s^{(h, \text{upper})}_q]$ there is an impact of type $b$, $d^{(b)} \in (d^{(b,\text{lower})}_p, d^{(b,\text{upper})}_p]$. $b$ may be, for example, damage incurred expressed as a fraction of the asset present value. \begin{equation} @@ -507,36 +507,36 @@ \subsubsection{Discrete form of acute vulnerability model} If only the mean impact curve is available, then it is possible to create the matrix such that $v_{pq} \in \{0, 1\}$. The matrix then provides a simple mapping from intensity to impact; if the number of intensity and response bins is equal then matrix $\mathbf{v}$ is simply the identity matrix. However, note that these simplifications exclude from the model any uncertainty in the parameters\footnote{A better approach would be to estimate the standard deviation of the distributions from which the mean impact curve was calculated and to incorporate this.}. -\paragraph{Multiple occurrence of events.} Note that $\sigma^{(h)}_q$ is the probability of occurrence of \emph{at least one event} with intensity in bin $q$ in a year and the vulnerability, $v_{pq}$ gives the probability of impact given at least one event has occurred. Some care must therefore be taken when using probabilities $v_{pq}$ calibrated from single events as there is an implied approximation that either probability of multiple events is small and/or that impact is well-modelled as a single impact from the most intense event for a given year. +\paragraph{Multiple occurrence of events.} Note that $\sigma^{(h)}_q$ is the probability of occurrence of \emph{at least one event} with intensity in bin $q$ in a year and the vulnerability, $v_{pq}$ gives the probability of impact given at least one event has occurred. Some care must therefore be taken when using probabilities $v_{pq}$ calibrated from single events as there is an implied approximation that either probability of multiple events is small and/or that impact is well-modelled as a single impact from the most intense event for a given year. \subsubsection{Importance of secondary uncertainty} %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% \begin{figure}[ht] - - \begin{framed} - - \includegraphics[width=\textwidth]{plots/fig_intensity.pdf} - - \end{framed} - - \footnotesize - - \renewcommand{\arraystretch}{1.01} - - \vspace{-3ex} - - {\justify - The exceedance curve of event intensity at the asset location is shown on the right. The event intensity in this example is inundation depth in metres. Exceedance is a cumulative probability. As an example, the probability of an inundation event occurring within a single year of intensity 0.91m or greater is 0.2\%. An exceedance probability is the reciprocal of the return period; it could equivalently be said that the 0.91m intensity event occurs with a return period of 500 years. - The exceedance curve can be converted to a histogram of probabilities. Here the $n_h$ bins have ranges $(s^{(h, \text{lower})}_q, s^{(h, \text{upper})}_q]$. For example, the first bin has range (0.28m, 0.38m]. The second bin has range (0.38m, 0.43m]; that is $s^{(h, \text{lower})}_2 = 0.38$m and $s^{(h, \text{upper})}_2 = 0.43$m. $\sigma^{(h)}_2 = 0.02$. - \par} - - \vspace{-0.5ex} - - \caption{\small Event intensity exceedance curve (right) and corresponding histogram (left).} - \label{Fig:intensity} - + + \begin{framed} + + \includegraphics[width=\textwidth]{plots/fig_intensity.pdf} + + \end{framed} + + \footnotesize + + \renewcommand{\arraystretch}{1.01} + + \vspace{-3ex} + + {\justify + The exceedance curve of event intensity at the asset location is shown on the right. The event intensity in this example is inundation depth in metres. Exceedance is a cumulative probability. As an example, the probability of an inundation event occurring within a single year of intensity 0.91m or greater is 0.2\%. An exceedance probability is the reciprocal of the return period; it could equivalently be said that the 0.91m intensity event occurs with a return period of 500 years. + The exceedance curve can be converted to a histogram of probabilities. Here the $n_h$ bins have ranges $(s^{(h, \text{lower})}_q, s^{(h, \text{upper})}_q]$. For example, the first bin has range (0.28m, 0.38m]. The second bin has range (0.38m, 0.43m]; that is $s^{(h, \text{lower})}_2 = 0.38$m and $s^{(h, \text{upper})}_2 = 0.43$m. $\sigma^{(h)}_2 = 0.02$. + \par} + + \vspace{-0.5ex} + + \caption{\small Event intensity exceedance curve (right) and corresponding histogram (left).} + \label{Fig:intensity} + \end{figure} %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% @@ -561,15 +561,15 @@ \subsubsection{Importance of secondary uncertainty} The conditional probabilities can then be combined: \begin{equation} - \label{Eq:epistemic2} - v^{(h, b)}_{pq} = \sum_a v^{(h, b)}_{pqa} \mathbb{P}[A = a] + \label{Eq:epistemic2} + v^{(h, b)}_{pq} = \sum_a v^{(h, b)}_{pqa} \mathbb{P}[A = a] \end{equation} $\mathbb{P}[A = a]$ is the \emph{prior} probability that the asset is of type $a$. This may be obtained from knowledge of the make-up of a portfolio. Note that through the application of Equation~\ref{Eq:model} the impact distribution now depends on the prior probabilities. To illustrate why it is reasonable that this should be the case, say we have two types of assets in our portfolio. Type A is vulnerable to a hazard with an intensity that has a relatively short return period of 50 years, whereas type B is invulnerable to all hazards but those with a vanishing small probability of occurrence. To derive the probability that an asset is damaged by a certain amount in a given year using Equation~\ref{Eq:epistemic2}, we must allow for the possibility that the asset may be of type A and may therefore be damaged as a result of 50 year events. -\paragraph{Epistemic uncertainty as source of error.} An alternate approach is to treat epistemic uncertainty as a source of error rather than, or in addition to, including it in the vulnerability as we have done here. This might be driven by the observation that as information as to the identity of assets is improved then the exceedance probability of a certain impact will change. This can be achieved by running an ensemble of calculations, changing the prior probabilities in each case. +\paragraph{Epistemic uncertainty as source of error.} An alternate approach is to treat epistemic uncertainty as a source of error rather than, or in addition to, including it in the vulnerability as we have done here. This might be driven by the observation that as information as to the identity of assets is improved then the exceedance probability of a certain impact will change. This can be achieved by running an ensemble of calculations, changing the prior probabilities in each case. \subsubsection{Interpolation of probability distributions} Cases arise where the event distributions and vulnerability distributions are not defined for a common set of intensity bins and interpolation is therefore required. The question then arises of how probability density is distributed within bins. The choice is model-specific and customizable, but here two common cases are described. @@ -590,48 +590,48 @@ \subsubsection{Probability bins from hazard maps} From Equation~\ref{Eq:Discrete2} the probability of an event occurring with hazard intensity in bin $q$ is expressed in terms of the probability density $f_S$ (dropping superscript $h$ for clarity): \begin{equation} - \label{Eq:Discrete2Again} - \sigma_q = \int_ {s^{(\text{lower})}_q}^{s^{(\text{upper})}_q} f_S(u) du \ - = \int_ {s^{(\text{lower})}_q}^{\infty} f_S(u) du - \int_ {s^{(\text{upper})}_q}^{\infty} f_S(u) du + \label{Eq:Discrete2Again} + \sigma_q = \int_ {s^{(\text{lower})}_q}^{s^{(\text{upper})}_q} f_S(u) du \ + = \int_ {s^{(\text{lower})}_q}^{\infty} f_S(u) du - \int_ {s^{(\text{upper})}_q}^{\infty} f_S(u) du \end{equation} The exceedance probability $F_S'$ is defined as: \begin{equation} - \label{Eq:DiscreteExceed} - F'_S(s) = \int_s^{\infty} f_S(u) du + \label{Eq:DiscreteExceed} + F'_S(s) = \int_s^{\infty} f_S(u) du \end{equation} from which we can write: \begin{equation} - \label{Eq:DiscreteExceed2} - \sigma_q = F'_S({s^{(\text{lower})}_q}) - F'_S({s^{(\text{upper})}_q}) + \label{Eq:DiscreteExceed2} + \sigma_q = F'_S({s^{(\text{lower})}_q}) - F'_S({s^{(\text{upper})}_q}) \end{equation} Using Equation~\ref{Eq:DiscreteExceed2}, a set of probability bins for the hazard event can be inferred from an exceedance probability curve. An exceedance probability curve can readily be inferred from a return-period curve using the result that the annual exceedance probability is the reciprocal of the return period expressed in years. -As an example, suppose that we have a hazard map for flood which contains return periods of 2, 5, 10, 25, 50, 100, 250, 500 and 1000 years. For a certain latitude/longitude the flood depths corresponding to the 9 return periods are, in metres: 0.06, 0.33, 0.51, 0.72, 0.86, 1.00, 1.15, 1.16 and 1.16. The data is shown together with the exceedance probability in Table~\ref{Table:HazardData}. +As an example, suppose that we have a hazard map for flood which contains return periods of 2, 5, 10, 25, 50, 100, 250, 500 and 1000 years. For a certain latitude/longitude the flood depths corresponding to the 9 return periods are, in metres: 0.06, 0.33, 0.51, 0.72, 0.86, 1.00, 1.15, 1.16 and 1.16. The data is shown together with the exceedance probability in Table~\ref{Table:HazardData}. \begin{table}[ht] - \caption{Example hazard event data.} - \centering - \begin{tabular}{c c c c} - \hline - Return period (years) & Flood depth (m) & Exceedance probability \\ [0.5ex] - \hline - 2 & 0.06 & 0.5 \\ - 5 & 0.33 & 0.2 \\ - 10 & 0.51 & 0.1 \\ - 25 & 0.72 & 0.04 \\ - 50 & 0.86 & 0.02 \\ - 100 & 1.00 & 0.01 \\ - 250 & 1.15 & 0.004 \\ - 500 & 1.16 & 0.002 \\ - 1000 & 1.16 & 0.001 \\ - \hline - \end{tabular} - \label{Table:HazardData} + \caption{Example hazard event data.} + \centering + \begin{tabular}{c c c c} + \hline + Return period (years) & Flood depth (m) & Exceedance probability \\ [0.5ex] + \hline + 2 & 0.06 & 0.5 \\ + 5 & 0.33 & 0.2 \\ + 10 & 0.51 & 0.1 \\ + 25 & 0.72 & 0.04 \\ + 50 & 0.86 & 0.02 \\ + 100 & 1.00 & 0.01 \\ + 250 & 1.15 & 0.004 \\ + 500 & 1.16 & 0.002 \\ + 1000 & 1.16 & 0.001 \\ + \hline + \end{tabular} + \label{Table:HazardData} \end{table} The flood depths become the bin edges of the probability distribution and the probabilities are calculated from Equation~\ref{Eq:DiscreteExceed2}. For example, the probability of occurrence of a flood with depth in the range (0.86m, 1.00m] is $0.02 - 0.01 = 0.01$\footnote{Care is needed at either end of the curve. There is a 0.001 probability that flood depth exceeds 1.16m in this example; should this be included in the (point-like) 1.16m bin?}. Note that in defining a set of bins in this way, no assumption about the interpolation between the flood depths is required. However, if we assume this to be linear then this implies that the probability density is constant across each bin since $f_S = \frac{dF_S(s)}{ds}$. @@ -646,41 +646,41 @@ \subsubsection{Vulnerability distributions and heuristics} The cumulative probability function of a Beta distribution is given by: \begin{equation} - \label{Eq:Beta1} - F_{\text{Beta}}(x) = \frac{B(x; a, b)}{B(1; a, b)} , + \label{Eq:Beta1} + F_{\text{Beta}}(x) = \frac{B(x; a, b)}{B(1; a, b)} , \end{equation} where $0 < x < 1$ and $B(x; a, b)$ is the incomplete Beta function: \begin{equation} - \label{Eq:IncompleteBeta} - B(x; a, b) = \int_0^{x} t^{a-1} (1 - t)^{b-1} dt . + \label{Eq:IncompleteBeta} + B(x; a, b) = \int_0^{x} t^{a-1} (1 - t)^{b-1} dt . \end{equation} If the mean, $\mu$ and standard deviation, $\sigma$ of the impact distribution are known then \cite{MitchellEtAl:2017}: \begin{equation} - \label{Eq:BetaA} - a = \frac{(1 - \mu)}{c^2} - \mu , + \label{Eq:BetaA} + a = \frac{(1 - \mu)}{c^2} - \mu , \end{equation} \begin{equation} - \label{Eq:BetaB} - b = \frac{a(1 - \mu)}{\mu} + \label{Eq:BetaB} + b = \frac{a(1 - \mu)}{\mu} \end{equation} where \begin{equation} - \label{Eq:BetaC} - c = \frac{\sigma}{\mu} + \label{Eq:BetaC} + c = \frac{\sigma}{\mu} \end{equation} In order to calculate the impact, the set of bins $p$ that define the impact probabilities $\delta_p$ of interest are first defined. The vulnerability matrix $v_{pq}$ of Equation~\ref{Eq:vulnerability} is then calculated. In order to apply Equation~\ref{Eq:Beta1}, $a$ and $b$ are calculated using mean and standard deviations of impact calculated at the mid-point of each intensity bin. We then have: \begin{equation} - \label{Eq:BetaVuln} - v_{pq} = F_{\text{Beta}}(d_p^{(\text{upper})}; a_q, b_q) - F_{\text{Beta}}(d_p^{(\text{lower})}; a_q, b_q) + \label{Eq:BetaVuln} + v_{pq} = F_{\text{Beta}}(d_p^{(\text{upper})}; a_q, b_q) - F_{\text{Beta}}(d_p^{(\text{lower})}; a_q, b_q) \end{equation} $a_q$ and $b_q$ are the values of $a$ and $b$ calculated from means and standard deviations calculated at the intensity bin centre $s_q = \frac{s_q^{(lower)} + s_q^{(upper)}}{2}$. @@ -690,7 +690,7 @@ \subsubsection{Vulnerability distributions and heuristics} \begin{framed} - \includegraphics[width=\textwidth]{plots/vulnerability_lagace_2008.png} + \includegraphics[width=\textwidth]{plots/vulnerability_lagace_2008.png} \end{framed} @@ -728,11 +728,11 @@ \subsection{Aggregation of impacts} \subsection{Financial model} \subsubsection{Types of calculation.} -Vulnerability models were described in \ref{SubSec:VulnerabilityModel} as a means to calculate the damage and disruption to a portfolio of assets for different hazard models. How the resulting probability distributions of impact are then used in a financial model depends on the intent of the analysis. We distinguish between \emph{stress test} and \emph{portfolio analysis} use cases. +Vulnerability models were described in \ref{SubSec:VulnerabilityModel} as a means to calculate the damage and disruption to a portfolio of assets for different hazard models. How the resulting probability distributions of impact are then used in a financial model depends on the intent of the analysis. We distinguish between \emph{stress test} and \emph{portfolio analysis} use cases. \emph{Stress tests} make use of climate-related shocks -- severe acute events -- in order to assess an impact. This might for example be the impact on a financial institution. Stress tests may make use of narrative scenarios or may take the approach of simulating large number of extreme but plausible events in order to identify a worst-case which is \emph{a priori} unknown. Indeed the two approaches may be combined, assessing the impact of a severe acute event coupled with other aggravating factors. -In a \emph{portfolio analysis}, the aim is to assess which parts of a portfolio of assets are most subject to physical climate risk. +In a \emph{portfolio analysis}, the aim is to assess which parts of a portfolio of assets are most subject to physical climate risk. \subsubsection{Climate risk measures and importance of change.} Climate risk models generally differ from catastrophe models in more than their use of climate-conditioned and projected hazard models. In particular, physical climate risk arises from \emph{changes} in climate. @@ -740,8 +740,8 @@ \subsubsection{Climate risk measures and importance of change.} We take as an example a real estate asset that is collateral for a loan. The hypothetical asset is exposed to both hurricane and flood hazards today, however it is covered by an insurance policy and its current valuation takes into account both historical occurrence of hazards and the policy details. Risk managers concerned with climate risk are likely to be interested in potential changes in value of the asset over the full term of the loan: \begin{enumerate} - \item if acute events become more frequent and severe, assets may become more expensive to insure and less desirable {\textcolor{red}{\emph{[Citation]}}} \footnote{For example, to a resident of a house subject to regular flooding.}, which can decrease the asset value; - \item if an extremely severe and widespread event occurs, default may lead to a distressed sale and/or the full insurance payout may not be made. + \item if acute events become more frequent and severe, assets may become more expensive to insure and less desirable {\textcolor{red}{\emph{[Citation]}}} \footnote{For example, to a resident of a house subject to regular flooding.}, which can decrease the asset value; + \item if an extremely severe and widespread event occurs, default may lead to a distressed sale and/or the full insurance payout may not be made. \end{enumerate} For a portfolio analysis, it is therefore likely to be the change in frequency of events and the change in probability of extremely severe events that is particularly of interest; these are the risk drivers. @@ -792,23 +792,23 @@ \subsubsection{Data availability} \section{Inundation} \subsection{Hazard models} -Inundation is modelled as an acute risk using the approach of Section~\ref{SubSec:AcuteAssetImpactModel}. Hazard event models compatible with this method provide inundation depths for different annual probabilities of occurrence -- or equivalently return periods. The need for sufficient granularity in the set of return periods is discussed in \cite{WardEtAl:2011}. +Inundation is modelled as an acute risk using the approach of Section~\ref{SubSec:AcuteAssetImpactModel}. Hazard event models compatible with this method provide inundation depths for different annual probabilities of occurrence -- or equivalently return periods. The need for sufficient granularity in the set of return periods is discussed in \cite{WardEtAl:2011}. Inundation hazards are incorporated into physical risk calculations using the World Resource Institute (WRI) Aqueduct flood model \cite{WardEtAl:2020} which has relatively high return-period granularity. This is based on the global modelling approach of \cite{WardEtAl:2013}. {\textcolor{red}{\emph{[Discuss and include refs for approaches based on flooded area?]}}} \subsection{Vulnerability models} -Notable damage models for real estate assets include the FEMA FAST `HAZUS' model \cite{ScawthornEtAl:2006} and an European Commission Joint Research Centre (JRC) model \cite{HuizingaEtAl:2017}. The latter is implemented in the \emph{physrisk} library. - +Notable damage models for real estate assets include the FEMA FAST `HAZUS' model \cite{ScawthornEtAl:2006} and an European Commission Joint Research Centre (JRC) model \cite{HuizingaEtAl:2017}. The latter is implemented in the \emph{physrisk} library. + \section{Heat} Heat is classified as both a chronic and an acute hazard. For example, increased average temperature in a particular area can lower average productivity from labour or make the area less desirable as a place to live, lowering real estate prices. We classify these as risks from chronic hazards. Heat waves are examples of acute hazard events; a period of particularly high temperature might lead to the complete suspension of industrial activity. -Multiple indexes for quantifying heat hazards have been suggested and multiple approaches for the modelling of acute events are present in the literature, e.g. \cite{MazdiyasniEtAl:2019}. Similarly, various methods for modelling the vulnerability to heat hazards have been suggested. Analyses of heat wave events are commonly based on Global and Regional Circulation Model (GCM and RCM) outputs \cite{DosioEtAl:2018}. In \cite{Christidis:2021} and \cite{Christidis:2013} the authors analyse ensembles of CMIP6 simulations with and without anthropogenic forcings in order to determine if extreme heat events are attributable to (anthropogenic) climate change. Such attribution analysis is based in part on finding return periods of events (see also \cite{StottEtAl:2016}). This estimation of return periods for events is directly applicable to acute hazard models. +Multiple indexes for quantifying heat hazards have been suggested and multiple approaches for the modelling of acute events are present in the literature, e.g. \cite{MazdiyasniEtAl:2019}. Similarly, various methods for modelling the vulnerability to heat hazards have been suggested. Analyses of heat wave events are commonly based on Global and Regional Circulation Model (GCM and RCM) outputs \cite{DosioEtAl:2018}. In \cite{Christidis:2021} and \cite{Christidis:2013} the authors analyse ensembles of CMIP6 simulations with and without anthropogenic forcings in order to determine if extreme heat events are attributable to (anthropogenic) climate change. Such attribution analysis is based in part on finding return periods of events (see also \cite{StottEtAl:2016}). This estimation of return periods for events is directly applicable to acute hazard models. -In order to support a wide range of hazard and vulnerability models, \emph{physrisk} includes the derivation of heat statistics from CMIP6 data\footnote{This is somewhat in contrast to the use of the Aqueduct model of \cite{WardEtAl:2020} for modelling inundation where the complete hazard model is used as-is within \emph{physrisk} -- albeit reformatted to handle efficiently the access patterns needed for physical risk calculations.}. +In order to support a wide range of hazard and vulnerability models, \emph{physrisk} includes the derivation of heat statistics from CMIP6 data\footnote{This is somewhat in contrast to the use of the Aqueduct model of \cite{WardEtAl:2020} for modelling inundation where the complete hazard model is used as-is within \emph{physrisk} -- albeit reformatted to handle efficiently the access patterns needed for physical risk calculations.}. \subsection{Hazard Models} @@ -838,10 +838,10 @@ \subsubsection{Impact of Temperature on labour productivity} The paper main conclusions are: \begin{itemize} - \item A statistically significant impact of 2.6 minutes lost per degree of temperature above $90^\circ F$ during normal economic periods and no relationship during a recession. This result is converted into the Celsius scale as \emph{physrisk} decided to take that scale as a reference. The 2.6 minutes is multiplied by a scaling factor of 1.8, which returns \textbf{an impact of 4.7 minutes lost per degree of temperature above $32.2^\circ C$}. - \item When using an indicator variable and linear regression the estimated impact was 5.6 minutes under Fahrenheit scale (respectively 10.08 minutes under Celsius scale) during normal economic periods, but the parameter was insignificant. - \item No relationship between temperature and work allocation with temperatures below $32.2^\circ C$. - \item Focus on labour allocation decisions, it does not account for other impacts such as reducing productivity. + \item A statistically significant impact of 2.6 minutes lost per degree of temperature above $90^\circ F$ during normal economic periods and no relationship during a recession. This result is converted into the Celsius scale as \emph{physrisk} decided to take that scale as a reference. The 2.6 minutes is multiplied by a scaling factor of 1.8, which returns \textbf{an impact of 4.7 minutes lost per degree of temperature above $32.2^\circ C$}. + \item When using an indicator variable and linear regression the estimated impact was 5.6 minutes under Fahrenheit scale (respectively 10.08 minutes under Celsius scale) during normal economic periods, but the parameter was insignificant. + \item No relationship between temperature and work allocation with temperatures below $32.2^\circ C$. + \item Focus on labour allocation decisions, it does not account for other impacts such as reducing productivity. \end{itemize} While the results are relevant and significant, is it important to highlight the following disclaimers on the results: @@ -874,9 +874,9 @@ \subsubsection{Impact of Temperature on labour productivity} \subsubsection{Uncertainty around the vulnerability Heat model} \paragraph{Overview} -The assessment is based on the research performed by Zhang and Shindel, which reviews the uncertainty in the heat risk literature \cite{ZhangAndShindell:2021}. This paper provides context around the uncertainty that exists in the result discussed in previous section, which is mainly explained by the methodology used for the estimation of the impact of temperature on labour productivity. +The assessment is based on the research performed by Zhang and Shindel, which reviews the uncertainty in the heat risk literature \cite{ZhangAndShindell:2021}. This paper provides context around the uncertainty that exists in the result discussed in previous section, which is mainly explained by the methodology used for the estimation of the impact of temperature on labour productivity. \begin{itemize} - \item \cite{ZhangAndShindell:2021} provides an analysis of the \textbf{differential forecasts} between using the \textbf{GZN method} (as reference to Graff-Zivin and Neidell) documented in \cite{TemperatureAndWork:2021}, versus the WetBulb Globe Temperature methodology (\textbf{WBGT method}) which includes other climate factors in addition to temperature: humidity, wind speed and heat radiation -- figure \ref{fig:WBGT} \footnote{Extracted from \cite{ZhangAndShindell:2021} -- p.4} provides the WBGT detailed approach. + \item \cite{ZhangAndShindell:2021} provides an analysis of the \textbf{differential forecasts} between using the \textbf{GZN method} (as reference to Graff-Zivin and Neidell) documented in \cite{TemperatureAndWork:2021}, versus the WetBulb Globe Temperature methodology (\textbf{WBGT method}) which includes other climate factors in addition to temperature: humidity, wind speed and heat radiation -- figure \ref{fig:WBGT} \footnote{Extracted from \cite{ZhangAndShindell:2021} -- p.4} provides the WBGT detailed approach. \item Another major source of differentiation is that the GZN method focuses on changes in labour allocation decisions while the WBGT method focuses on the physiological impacts of rising temperatures. \end{itemize} @@ -896,7 +896,7 @@ \subsubsection{Uncertainty around the vulnerability Heat model} -Note that there are differences in the functional forms applied in the original GZN method \cite{TemperatureAndTheAllocationofTime:2014} and the approach presented in \cite{TemperatureAndWork:2021}, with original GZN method using one linear regression with dummy variables for temperature buckets, while \cite{TemperatureAndWork:2021} uses multiple linear regressions with one variable reflecting the breach of the maximum temperature around anchor points (less than $70^\circ F$, $90^\circ F$, $90^\circ F$ and above). The WBGT methodology uses a non-linear function to relate labour loss to the WBGT consolidated measure. +Note that there are differences in the functional forms applied in the original GZN method \cite{TemperatureAndTheAllocationofTime:2014} and the approach presented in \cite{TemperatureAndWork:2021}, with original GZN method using one linear regression with dummy variables for temperature buckets, while \cite{TemperatureAndWork:2021} uses multiple linear regressions with one variable reflecting the breach of the maximum temperature around anchor points (less than $70^\circ F$, $90^\circ F$, $90^\circ F$ and above). The WBGT methodology uses a non-linear function to relate labour loss to the WBGT consolidated measure. Figure \ref{fig:CostsByRCP} \footnote{Extracted from \cite{ZhangAndShindell:2021} -- p.11} provides the forecasts of labour lost millions of 2016 USD (constant USD value). Most notably the original GZN produces more optimistic forecasts of the cost of labour lost (lower) than the WBGT method. Note that RCP8.5\footnote{The Intergovernmental Panel on Climate Chance modelling are based on representative concentration pathways (RCPs), which represent different emissions projections under basic, plausible economic and social assumptions, while staying within physical constraints. RPCs are constructed by back-calculating the amount of emissions that would result in a given amount of radiative forcing (which is the difference between solar radiation (energy) absorbed by the Earth and energy radiated back into the space) that would then result in a given amount of warming} refers to the scenario of high emissions and RCP4.5 refers to the scenario of moderate emissions. @@ -913,15 +913,15 @@ \subsubsection{Uncertainty around the vulnerability Heat model} There are 2 identified areas where uncertainty in the forecasts in \cite{TemperatureAndWork:2021} paper: the economic cycle and the model parameter uncertainty. \newline -The \textbf{economic cycle} is one area where uncertainty exists in the forecasts. -The paper shows that labour allocation decisions are sensitive to where in the economic cycle the US is; during a recession there does not appear to be a relationship between labour allocation and temperature. In order to measure the uncertainty explained by the economic cycle, one might consider the probability of a recession as a Bernoulli random variable with a probability p. Based on this there are two possibly approaches. A first approach is a Monte-Carlo like approach where one can randomly sample the 1, 0 value whether a recession occurs at each period on a time path. A second approach would be to use the expected value of the probability of the recession and estimate the impact as: +The \textbf{economic cycle} is one area where uncertainty exists in the forecasts. +The paper shows that labour allocation decisions are sensitive to where in the economic cycle the US is; during a recession there does not appear to be a relationship between labour allocation and temperature. In order to measure the uncertainty explained by the economic cycle, one might consider the probability of a recession as a Bernoulli random variable with a probability p. Based on this there are two possibly approaches. A first approach is a Monte-Carlo like approach where one can randomly sample the 1, 0 value whether a recession occurs at each period on a time path. A second approach would be to use the expected value of the probability of the recession and estimate the impact as: \begin{equation} \label{Eq:economiccycle} - Forecasted \ Minutes \ Lost = p \times 0 + (1-p) \times EV(X) + Forecasted \ Minutes \ Lost = p \times 0 + (1-p) \times EV(X) \end{equation} Where $X$ is the variable that refers to Minutes Lost during normal economic cycle -The second approach is attractive in its simplicity and ensuring the model does not lose its focus. -One concern is that the probability of recession, in reality, may be related to the realisation of climate related risks. Hence, there might be a over/under estimation of the probability unless the impact of the climate risk is also considered. Historical model estimated recession probabilities can be sourced from \cite{SmoothedU.S.RecessionProbabilities:2022}. However, we did not go further in the measurement of the uncertainty explained by the economic cycle because it requires us to focus on the modelling of another parameter ($p$, the probability of the recession to occur), which is not the purpose of this work. +The second approach is attractive in its simplicity and ensuring the model does not lose its focus. +One concern is that the probability of recession, in reality, may be related to the realisation of climate related risks. Hence, there might be a over/under estimation of the probability unless the impact of the climate risk is also considered. Historical model estimated recession probabilities can be sourced from \cite{SmoothedU.S.RecessionProbabilities:2022}. However, we did not go further in the measurement of the uncertainty explained by the economic cycle because it requires us to focus on the modelling of another parameter ($p$, the probability of the recession to occur), which is not the purpose of this work. %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% % to add in the references: https://github.com/os-climate/physrisk/blob/main/methodology/PhysicalRiskMethodologyBibliography.bib @@ -932,14 +932,14 @@ \subsubsection{Uncertainty around the vulnerability Heat model} % publisher={University of Oregon} % year={2022}, %} -Instead, we focus on the \textbf{model parameter uncertainty approach}. In \cite{ZhangAndShindell:2021}, there is a linear relationship between temperature and work minutes lost ($\beta$),and a constraint is applied to ensure that total time allocation sums to 24 hours, which returns a non-linear regression model at the end. Given that the main coefficient of interest is denoted $\beta$, an inference is applied assuming that $\beta$ follows a $Student-T$ distribution: +Instead, we focus on the \textbf{model parameter uncertainty approach}. In \cite{ZhangAndShindell:2021}, there is a linear relationship between temperature and work minutes lost ($\beta$),and a constraint is applied to ensure that total time allocation sums to 24 hours, which returns a non-linear regression model at the end. Given that the main coefficient of interest is denoted $\beta$, an inference is applied assuming that $\beta$ follows a $Student-T$ distribution: \begin{equation} - \label{Eq:uncertaintyStudentT} + \label{Eq:uncertaintyStudentT} d\beta \sim T(\beta, SE, N-K) \end{equation} -Where $SE$ is the Standard Error of the coefficient and $(N-K)$ is the number of degrees of freedom, $N$ is the number of observations and $K$ is the number of model parameters. Hence, one can estimate the coefficients of the confidence interval (CI) at a given level of confidence $CI\%$: +Where $SE$ is the Standard Error of the coefficient and $(N-K)$ is the number of degrees of freedom, $N$ is the number of observations and $K$ is the number of model parameters. Hence, one can estimate the coefficients of the confidence interval (CI) at a given level of confidence $CI\%$: \begin{equation} - \label{Eq:CIStudent} + \label{Eq:CIStudent} d\beta_{CI\%} = \beta \pm T(p) \times SE \end{equation} Where $T(p)$ donates the probability density function (pdf) of the student $T$ distribution with probability $p$ which corresponds to the $CI\%$, the standard error $SE = 2.23 \ min$ and $\beta = - 4.68$. @@ -960,28 +960,28 @@ \subsubsection{Uncertainty around the vulnerability Heat model} As the degrees of freedom increases, the t distributions converge to the standard normal. Therefore, for simplicity reasons in the context of this work, it is assumed that that the daily labour productivity impact $\beta$ can be measured as: \begin{equation} \label{Eq:uncertainty1} - \beta \sim \mathcal{N}(m,\,SE^{2})\,\ where \ m = 4.68 \ min \ and \ SE = 2.23 \ min + \beta \sim \mathcal{N}(m,\,SE^{2})\,\ where \ m = 4.68 \ min \ and \ SE = 2.23 \ min \end{equation} -As an example, consider an $1.5^\circ C$ degree day increase in the temperature. We can then multiply through the normal distribution as shown below: +As an example, consider an $1.5^\circ C$ degree day increase in the temperature. We can then multiply through the normal distribution as shown below: %The buckets of the daily maximum temperature above $32.2^\circ C$ are defined as an incremental increase of $1.5^\circ %C$, starting from $0^\circ C$ to $18^\circ C$: $\begin{pmatrix} 0 & 1.5 & 3 & ... & 18 \end{pmatrix}$. For a $1.5^\circ %C$ daily temperature increase, the uncertainty around the daily labour productivity impact is given by the following %normal distribution: \begin{equation} \label{Eq:uncertainty2} - 1.5 \times \beta \sim \mathcal{N}(1.5 \times \beta,\, (1.5 \times SE)^{2})\, + 1.5 \times \beta \sim \mathcal{N}(1.5 \times \beta,\, (1.5 \times SE)^{2})\, \end{equation} -This can be generalised for a degree day increase of x using the following distribution: +This can be generalised for a degree day increase of x using the following distribution: \begin{equation} \label{Eq:uncertainty3} - x \times \beta \sim \mathcal{N}(x \times \beta,\, (x \times SE)^{2})\, + x \times \beta \sim \mathcal{N}(x \times \beta,\, (x \times SE)^{2})\, \end{equation} For example, there is 1\% chance that the lost labour productivity exceeds $29.6$ minutes per day if the maximum daily temperature exceeds at $32.2^\circ C$ by $3^\circ C$. This number is computed as $\mathcal{N}^{-1} (m',SE'^2)(1\%)$ where $m'= 3 \times m = -14.013 \ min$ and $SE'= 3 \times SE = 6.69 \ min$. The $99\%CI$ of the lost labour productivity per day if the maximum daily temperature exceeds at $32.2^\circ C$ by $3^\circ C$ is $[+1.6 \ min, -29.6 \ min]$. -%Adding point regarding impact as a percentage of total labour +%Adding point regarding impact as a percentage of total labour The estimated loss of labour time is then transformed into a percentage estimate: @@ -1006,7 +1006,7 @@ \subsubsection{Uncertainty around the vulnerability Heat model} \caption{WBGT and labour availability} \label{fig:WBGT-Hazard} \end{figure} -Note that another indicator deriving from the WBGT hazard model is the Work Loss (WL), which is computed as $WL = 1 - WA$. It is another way to do the assessment but leads to same results. +Note that another indicator deriving from the WBGT hazard model is the Work Loss (WL), which is computed as $WL = 1 - WA$. It is another way to do the assessment but leads to same results. \newline The aggregation of the outputs of the GZN vulnerability model (minutes of productivity labour loss) and the WBGT vulnerability model (WA), returns the effective number of working hours, which represents a way to measure the uncertainty around the GZN vulnerability model. Figure \ref{fig:Aggregation} provides the aggregation process and results: \begin{figure}[h] @@ -1017,11 +1017,11 @@ \subsubsection{Uncertainty around the vulnerability Heat model} \end{figure} If the WL was used instead of the WA, then it will be multiplied by the hours worked derived from the GZN model to get the annual total labor loss due to heat. -Given the modelling assumptions around the parameters used to compute the WA in the WBGT model, it is important to measure the uncertainty around these parameters, $\alpha1$ and $\alpha2$, which depend on the work intensities. +Given the modelling assumptions around the parameters used to compute the WA in the WBGT model, it is important to measure the uncertainty around these parameters, $\alpha1$ and $\alpha2$, which depend on the work intensities. The source paper provides the parameters $\alpha1$ and $\alpha2$ for three different work intensities low, medium and high with industries mapped to each intensity. These categories are broad and do not account for variance within and industry and between industries in the same category. To account for this uncertainty the WBGT approach was adjusted to include uncertainty around the industry. -Consider an asset which is market as in a high risk sector. We assume that the work ability is uniformly distributed with a mean equal to the $WA_H$ and a floor (a) and ceiling (b) equidistant from the mean. We assume that the floor a is halfway between $WA_H$ and $WA_M$. So a and b can be estimated based on the below formulae: +Consider an asset which is market as in a high risk sector. We assume that the work ability is uniformly distributed with a mean equal to the $WA_H$ and a floor (a) and ceiling (b) equidistant from the mean. We assume that the floor a is halfway between $WA_H$ and $WA_M$. So a and b can be estimated based on the below formulae: \begin{equation} \label{Eq:WBGT_Floor} @@ -1033,13 +1033,13 @@ \subsubsection{Uncertainty around the vulnerability Heat model} b = WA_H + \frac{WA_H - WA_M}{2}\, \end{equation} -And the WBGT work ability can be represented based on the below formula: +And the WBGT work ability can be represented based on the below formula: \begin{equation} \label{Eq:WBGT_Uniform} - WA \sim \mathcal{U}(a ,b)\, + WA \sim \mathcal{U}(a ,b)\, \end{equation} - + With this we can estimate the variance of the WBGT work ability using the standard formula for the variance of a Uniform distribution: \begin{equation} @@ -1060,7 +1060,7 @@ \subsubsection{Uncertainty around the vulnerability Heat model} \begin{aligned} \label{Eq:Var_Joint} Var(EffectiveWork) = (1- Estimated \ loss \ of \ labour \ time )^2 \times Var(WBGT) + \\ - WA_H^2 \times Var(GZN) + var(WBGT) \times Var(GZN) + WA_H^2 \times Var(GZN) + var(WBGT) \times Var(GZN) \end{aligned} \end{equation} diff --git a/methodology/PhysicalRiskMethodologyBibliography.bib b/methodology/PhysicalRiskMethodologyBibliography.bib index 8a7fe9a6..a47fa06c 100644 --- a/methodology/PhysicalRiskMethodologyBibliography.bib +++ b/methodology/PhysicalRiskMethodologyBibliography.bib @@ -183,12 +183,12 @@ @book{MitchellEtAl:2017 } @book{Nelsen:2007, - author = {Roger~B. Nelsen}, - title = {An Introduction to Copulas}, - year = {2007}, - edition = {2nd}, - publisher = {Princeton University Press}, - address = {New York~(NY)} + author = {Roger~B. Nelsen}, + title = {An Introduction to Copulas}, + year = {2007}, + edition = {2nd}, + publisher = {Princeton University Press}, + address = {New York~(NY)} } % TemperatureAndTheAllocationofTime @@ -358,4 +358,4 @@ @article{ZhangAndShindell:2021 pages={1--18}, year={2021}, publisher={Springer} -} \ No newline at end of file +} diff --git a/notebooks/vulnerability_onboarding/EU JRC global flood depth-damage functions/EU JRC global flood depth-damage functions.json b/notebooks/vulnerability_onboarding/EU JRC global flood depth-damage functions/EU JRC global flood depth-damage functions.json index 490c7228..6618bed7 100644 --- a/notebooks/vulnerability_onboarding/EU JRC global flood depth-damage functions/EU JRC global flood depth-damage functions.json +++ b/notebooks/vulnerability_onboarding/EU JRC global flood depth-damage functions/EU JRC global flood depth-damage functions.json @@ -708,4 +708,4 @@ "location": "Global" } ] -} \ No newline at end of file +} diff --git a/notebooks/vulnerability_onboarding/EU JRC global flood depth-damage functions/onboard.ipynb b/notebooks/vulnerability_onboarding/EU JRC global flood depth-damage functions/onboard.ipynb index 0e5ab42e..6fa5eab7 100644 --- a/notebooks/vulnerability_onboarding/EU JRC global flood depth-damage functions/onboard.ipynb +++ b/notebooks/vulnerability_onboarding/EU JRC global flood depth-damage functions/onboard.ipynb @@ -26,16 +26,25 @@ "import numpy as np\n", "import pandas as pd\n", "\n", - "df = pd.read_csv('raw.csv')\n", + "df = pd.read_csv(\"raw.csv\")\n", "\n", "# consistent with physrisk continent definition\n", - "location_mappings = { \"Europe\": \"Europe\", \"North America\": \"North America\", \"Central & South America\": \"South America\", \"Asia\": \"Asia\", \"Africa\": \"Africa\", \"Oceania\": \"Oceania\", \"Global\": \"Global\" }\n", - "type_mappings = { \"Residential buildings\": \"Buildings/Residential\",\n", + "location_mappings = {\n", + " \"Europe\": \"Europe\",\n", + " \"North America\": \"North America\",\n", + " \"Central & South America\": \"South America\",\n", + " \"Asia\": \"Asia\",\n", + " \"Africa\": \"Africa\",\n", + " \"Oceania\": \"Oceania\",\n", + " \"Global\": \"Global\",\n", + "}\n", + "type_mappings = {\n", + " \"Residential buildings\": \"Buildings/Residential\",\n", " \"Commercial buildings\": \"Buildings/Commercial\",\n", - " \"Industrial buildings\": \"Buildings/Industrial\"\n", + " \"Industrial buildings\": \"Buildings/Industrial\",\n", "}\n", "\n", - "data = { \"items\": [] }\n", + "data = {\"items\": []}\n", "\n", "curve_list = data[\"items\"]\n", "for mapping in type_mappings:\n", @@ -46,7 +55,7 @@ " zero_as_minimum = True if location == \"North America\" else False\n", " # for North America, the 0 depth damage is for flooding of any depth. We consider that a 1 cm inundation.\n", " depth = np.concatenate([[0, 0.01], flood_depth[1:]]) if zero_as_minimum else flood_depth\n", - " \n", + "\n", " mean = type_df[location + \"_Mean\"].to_numpy()\n", " std = type_df[location + \"_Std\"].to_numpy()\n", " mean = np.concatenate([[0], mean]) if zero_as_minimum else mean\n", @@ -54,10 +63,21 @@ " if np.any(np.isnan(mean)):\n", " mean = []\n", " if np.any(np.isnan(std)):\n", - " std = [] \n", - " curve_list.append({ \"asset_type\": type_mappings[mapping], \"event_type\": \"RiverineInundation\", \"location\": location_mappings[location], \"impact_type\": \"Damage\", \"intensity\": list(depth), \"intensity_units\": \"m\", \"impact_mean\": list(mean), \"impact_std\": list(std) }) \n", + " std = []\n", + " curve_list.append(\n", + " {\n", + " \"asset_type\": type_mappings[mapping],\n", + " \"event_type\": \"RiverineInundation\",\n", + " \"location\": location_mappings[location],\n", + " \"impact_type\": \"Damage\",\n", + " \"intensity\": list(depth),\n", + " \"intensity_units\": \"m\",\n", + " \"impact_mean\": list(mean),\n", + " \"impact_std\": list(std),\n", + " }\n", + " )\n", "\n", - "with open('EU JRC global flood depth-damage functions.json', 'w') as f:\n", + "with open(\"EU JRC global flood depth-damage functions.json\", \"w\") as f:\n", " vulnerability_json = json.dumps(data, sort_keys=True, indent=4)\n", " f.write(vulnerability_json)" ] diff --git a/notebooks/vulnerability_onboarding/Wind/Table_A2_Impact_Function_Slope.csv b/notebooks/vulnerability_onboarding/Wind/Table_A2_Impact_Function_Slope.csv index c6ff7ec6..aab5404b 100644 --- a/notebooks/vulnerability_onboarding/Wind/Table_A2_Impact_Function_Slope.csv +++ b/notebooks/vulnerability_onboarding/Wind/Table_A2_Impact_Function_Slope.csv @@ -9,4 +9,4 @@ WP2,1,83,74.7,84.7,188.4,38.2,36.7,104.9,25.89,16.44,1 WP3,1,69,74.7,80.2,112.8,15.2,14.8,20.5,5.32,3.83,1 WP4,5,64,74.7,135.6,190.5,73.8,35.9,43.8,35.56,3.35,1 Combined,53,473,74.7,–,–,22.2,16.8,24.4,4.69,2.15,1 -Global calibration,53,473,74.7,73.4,110.1,22.2,22.2,33.1,4.69,4.84,1 \ No newline at end of file +Global calibration,53,473,74.7,73.4,110.1,22.2,22.2,33.1,4.69,4.84,1 diff --git a/notebooks/vulnerability_onboarding/Wind/Table_S2_V_half_individual_fitting_per_event.csv b/notebooks/vulnerability_onboarding/Wind/Table_S2_V_half_individual_fitting_per_event.csv index 36399467..10022dd6 100644 --- a/notebooks/vulnerability_onboarding/Wind/Table_S2_V_half_individual_fitting_per_event.csv +++ b/notebooks/vulnerability_onboarding/Wind/Table_S2_V_half_individual_fitting_per_event.csv @@ -471,4 +471,4 @@ EM_ID,ibtracsID,v_half_fitted [m/s],country,country_id,region,year,Reported_Dama 2017-0432,2017288N09138,270,JPN,392,WP4,2017,1000000000,2014,995484463.5,995126307.3,-0.000359846,2017-0432JPN 2017-0468,2017252N14147,325.7,JPN,392,WP4,2017,500000000,2014,497742231.7,622698955.4,0.223980848,2017-0468JPN 2017-0485,2017236N15129,285.9,CHN,156,WP3,2017,56000000,2014,47967576.85,47983654.85,0.000335128,2017-0485CHN -2017-0508,2017333N06082,44.1,LKA,144,NI,2017,346000000,2014,314311010.2,316529153.6,0.007032376,2017-0508LKA \ No newline at end of file +2017-0508,2017333N06082,44.1,LKA,144,NI,2017,346000000,2014,314311010.2,316529153.6,0.007032376,2017-0508LKA diff --git a/notebooks/vulnerability_onboarding/Wind/onboard.ipynb b/notebooks/vulnerability_onboarding/Wind/onboard.ipynb index 82a7d285..c5d57dfb 100644 --- a/notebooks/vulnerability_onboarding/Wind/onboard.ipynb +++ b/notebooks/vulnerability_onboarding/Wind/onboard.ipynb @@ -38,17 +38,17 @@ "import numpy as np\n", "import pandas as pd\n", "\n", - "df = pd.read_csv('Table_A2_Impact_Function_Slope.csv')\n", + "df = pd.read_csv(\"Table_A2_Impact_Function_Slope.csv\")\n", "region = df[\"region\"].to_numpy()\n", "vhalf = df[\"vhalf_b\"].to_numpy()\n", "\n", "\n", "print(region)\n", "print(vhalf)\n", - "#df = pd.read_csv('Table_S2_V_half_individual_fitting_per_event.csv')\n", - "#vhalf = df.where(df.region == \"WP2\").vhalf_fitted\n", - "#region = df[\"region\"].to_numpy()\n", - "#vhalf = df[\"vhalf_fitted\"].to_numpy()\n" + "# df = pd.read_csv('Table_S2_V_half_individual_fitting_per_event.csv')\n", + "# vhalf = df.where(df.region == \"WP2\").vhalf_fitted\n", + "# region = df[\"region\"].to_numpy()\n", + "# vhalf = df[\"vhalf_fitted\"].to_numpy()" ] }, { @@ -83,9 +83,10 @@ } ], "source": [ - "v_half = df[\"v_half_fitted [m/s]\"] #df[df.region == \"WP2\"][\"v_half_fitted [m/s]\"]\n", + "v_half = df[\"v_half_fitted [m/s]\"] # df[df.region == \"WP2\"][\"v_half_fitted [m/s]\"]\n", "\n", "import matplotlib.pyplot as plot\n", + "\n", "plot.hist(v_half)" ] }, @@ -106,6 +107,7 @@ "source": [ "print(v_half.mean())\n", "import numpy as np\n", + "\n", "print(np.quantile(v_half, [0.25, 0.75]))" ] }, @@ -148,22 +150,24 @@ "import numpy as np\n", "import matplotlib.pyplot as plt\n", "\n", + "\n", "def vul(v, v_half):\n", " v_thresh = 25.7\n", - " #v_half = 135.6 # wp4 74.7 135.6 190.5\n", + " # v_half = 135.6 # wp4 74.7 135.6 190.5\n", " vn = np.where(v > v_thresh, v - v_thresh, 0) / (v_half - v_thresh)\n", " f = vn**3 / (1 + vn**3)\n", " return f\n", "\n", + "\n", "v = np.arange(0, 90, 10)\n", - "fig, ax = plt.subplots() \n", - "#for item in v_half.to_numpy():\n", + "fig, ax = plt.subplots()\n", + "# for item in v_half.to_numpy():\n", "# ax.plot(v, vul(v, item))\n", "ax.plot(v, vul(v, 74.7))\n", "ax.plot(v, vul(v, 190.5))\n", "ax.plot(v, vul(v, 135.6))\n", - "#ax.plot(v, vul(v, 100))\n", - "#ax.plot(v, vul(v, 220))" + "# ax.plot(v, vul(v, 100))\n", + "# ax.plot(v, vul(v, 220))" ] }, { diff --git a/setup.cfg b/setup.cfg index 45bdad45..a95c4f52 100644 --- a/setup.cfg +++ b/setup.cfg @@ -30,7 +30,7 @@ install_requires = scipy==1.7.3 s3fs==2022.1.0 zarr==2.10.3 - + [options.packages.find] where = src include = physrisk* diff --git a/src/physrisk/data/static/example_portfolios/industrial_activity_small.json b/src/physrisk/data/static/example_portfolios/industrial_activity_small.json index 589e6aa6..5a937be9 100644 --- a/src/physrisk/data/static/example_portfolios/industrial_activity_small.json +++ b/src/physrisk/data/static/example_portfolios/industrial_activity_small.json @@ -64,4 +64,4 @@ "longitude": 138.5572 } ] -} \ No newline at end of file +} diff --git a/src/physrisk/data/static/example_portfolios/mixed_small.json b/src/physrisk/data/static/example_portfolios/mixed_small.json index 7e4aae00..35fb6049 100644 --- a/src/physrisk/data/static/example_portfolios/mixed_small.json +++ b/src/physrisk/data/static/example_portfolios/mixed_small.json @@ -22,4 +22,4 @@ "longitude": 90.5314 } ] -} \ No newline at end of file +} diff --git a/src/physrisk/data/static/example_portfolios/power_generating_small.json b/src/physrisk/data/static/example_portfolios/power_generating_small.json index 4875e8c1..2de7cf3c 100644 --- a/src/physrisk/data/static/example_portfolios/power_generating_small.json +++ b/src/physrisk/data/static/example_portfolios/power_generating_small.json @@ -71,4 +71,4 @@ "longitude": -68.9814 } ] -} \ No newline at end of file +} diff --git a/src/physrisk/data/static/example_portfolios/real_estate_small.json b/src/physrisk/data/static/example_portfolios/real_estate_small.json index abe8de81..03a90bbf 100644 --- a/src/physrisk/data/static/example_portfolios/real_estate_small.json +++ b/src/physrisk/data/static/example_portfolios/real_estate_small.json @@ -71,4 +71,4 @@ "longitude": 90.3429 } ] -} \ No newline at end of file +} diff --git a/src/physrisk/data/static/hazard/inventory.json b/src/physrisk/data/static/hazard/inventory.json index be59ff87..2cd0ffae 100644 --- a/src/physrisk/data/static/hazard/inventory.json +++ b/src/physrisk/data/static/hazard/inventory.json @@ -1660,4 +1660,4 @@ "units": "m/s" } ] -} \ No newline at end of file +} diff --git a/src/physrisk/data/static/vulnerability/EU JRC global flood depth-damage functions.json b/src/physrisk/data/static/vulnerability/EU JRC global flood depth-damage functions.json index 490c7228..6618bed7 100644 --- a/src/physrisk/data/static/vulnerability/EU JRC global flood depth-damage functions.json +++ b/src/physrisk/data/static/vulnerability/EU JRC global flood depth-damage functions.json @@ -708,4 +708,4 @@ "location": "Global" } ] -} \ No newline at end of file +} diff --git a/src/physrisk/data/static/world.json b/src/physrisk/data/static/world.json index 3a01ced6..3e923901 100644 --- a/src/physrisk/data/static/world.json +++ b/src/physrisk/data/static/world.json @@ -886,4 +886,4 @@ "country_iso_a3": "SSD" } ] -} \ No newline at end of file +} diff --git a/src/test/data/hazard_model_store.py b/src/test/data/hazard_model_store.py index 0e253fc6..6f2aa5c6 100644 --- a/src/test/data/hazard_model_store.py +++ b/src/test/data/hazard_model_store.py @@ -10,43 +10,13 @@ class TestData: - longitudes = [ - 69.4787, - 68.71, - 20.1047, - 19.8936, - 19.6359, - 0.5407, - 6.9366, - 6.935, - 13.7319, - 13.7319, - 14.4809, - -68.3556, - -68.3556, - -68.9892, - -70.9157, - ] - latitudes = [ - 34.556, - 35.9416, - 39.9116, - 41.6796, - 42.0137, - 35.7835, - 36.8789, - 36.88, - -12.4706, - -12.4706, - -9.7523, - -38.9368, - -38.9368, - -34.5792, - -39.2145, - ] + # fmt: off + longitudes = [69.4787, 68.71, 20.1047, 19.8936, 19.6359, 0.5407, 6.9366, 6.935, 13.7319, 13.7319, 14.4809, -68.3556, -68.3556, -68.9892, -70.9157] # noqa + latitudes = [34.556, 35.9416, 39.9116, 41.6796, 42.0137, 35.7835, 36.8789, 36.88, -12.4706, -12.4706, -9.7523, -38.9368, -38.9368, -34.5792, -39.2145] # noqa coastal_longitudes = [12.2, 50.5919, 90.3473, 90.4295, 90.4804, 90.3429, 90.5153, 90.6007] coastal_latitudes = [-5.55, 26.1981, 23.6473, 23.6783, 23.5699, 23.9904, 23.59, 23.6112] + # fmt: on def get_mock_hazard_model_store_single_curve(): diff --git a/src/test/kernel/test_hazard_models.py b/src/test/kernel/test_hazard_models.py new file mode 100644 index 00000000..38bad53e --- /dev/null +++ b/src/test/kernel/test_hazard_models.py @@ -0,0 +1,95 @@ +import test.data.hazard_model_store as hms +from dataclasses import dataclass +from typing import Dict, List, Mapping, NamedTuple, Sequence, Tuple + +import numpy as np + +from physrisk.kernel.assets import RealEstateAsset +from physrisk.kernel.hazard_model import ( + HazardDataRequest, + HazardDataResponse, + HazardEventDataResponse, + HazardModel, + HazardParameterDataResponse, +) +from physrisk.kernel.hazards import ChronicHeat, Wind +from physrisk.kernel.impact import calculate_impacts +from physrisk.vulnerability_models.real_estate_models import GenericTropicalCycloneModel + + +@dataclass +class SinglePointData: + latitude: float + longitude: float + scenario: str + year: int + wind_return_periods: np.ndarray # years + wind_intensities: np.ndarray # m/s + chronic_heat_intensity: float # days over 35C + # etc + + +class PointsKey(NamedTuple): + latitude: float + longitude: float + scenario: str + year: int + + +class PointBasedHazardModel(HazardModel): + def __init__(self, points: Sequence[SinglePointData]): + """HazardModel suitable for storing relatively small number (<~ million say) of individual hazard + data points. + + Args: + points (Sequence[SinglePointData]): List of points. + """ + self.points: Dict[Tuple[PointsKey, float, float], SinglePointData] = { + self._get_key(p.latitude, p.longitude, p.scenario, p.year): p for p in points + } + + def _get_key(self, latitude: float, longitude: float, scenario: str, year: int): + return PointsKey(latitude=round(latitude, 3), longitude=round(longitude, 3), scenario=scenario, year=year) + + def get_hazard_events(self, requests: List[HazardDataRequest]) -> Mapping[HazardDataRequest, HazardDataResponse]: + response: Dict[HazardDataRequest, HazardDataResponse] = {} + for request in requests: + point = self.points[self._get_key(request.latitude, request.longitude, request.scenario, request.year)] + if request.hazard_type == Wind and request.indicator_id == "max_speed": + response[request] = HazardEventDataResponse( + return_periods=point.wind_return_periods, intensities=point.wind_intensities + ) + elif request.hazard_type == ChronicHeat and request.indicator_id == "days/above/35c": + response[request] = HazardParameterDataResponse(np.array(point.chronic_heat_intensity)) + # etc + return response + + +def test_using_point_based_hazard_model(): + # test that shows how data already present for a number of points can be used in a HazardModel + scenario = "rcp8p5" + year = 2080 + assets = [ + RealEstateAsset(lat, lon, location="Asia", type="Buildings/Industrial") + for lon, lat in zip(hms.TestData.longitudes[0:1], hms.TestData.latitudes[0:1]) + ] + # fmt: off + wind_return_periods = np.array([10.0, 20.0, 30.0, 40.0, 50.0, 60.0, 70.0, 80.0, 90.0, 100.0, 200.0, 300.0, 400.0, 500.0, 600.0, 700.0, 800.0, 900.0, 1000.0]) # noqa + wind_intensities = np.array([37.279999, 44.756248, 48.712502, 51.685001, 53.520000, 55.230000, 56.302502, 57.336250, 58.452499, 59.283749, 63.312500, 65.482498, 66.352501, 67.220001, 67.767502, 68.117500, 68.372498, 69.127502, 70.897499 ]) # noqa + # fmt: on + point = SinglePointData( + hms.TestData.latitudes[0], + hms.TestData.longitudes[0], + scenario=scenario, + year=year, + wind_return_periods=wind_return_periods, + wind_intensities=wind_intensities, + chronic_heat_intensity=0, + ) + + hazard_model = PointBasedHazardModel([point]) + vulnerability_models = {RealEstateAsset: [GenericTropicalCycloneModel()]} + results = calculate_impacts(assets, hazard_model, vulnerability_models, scenario=scenario, year=year) + impact_distrib = results[(assets[0], Wind)].impact + mean_impact = impact_distrib.mean_impact() + np.testing.assert_almost_equal(mean_impact, 0.009909858317497338) diff --git a/src/test/models/test_wind_models.py b/src/test/models/test_wind_models.py index 4909331a..abc470a0 100644 --- a/src/test/models/test_wind_models.py +++ b/src/test/models/test_wind_models.py @@ -15,50 +15,10 @@ def test_wind_real_estate_model(): year = 2080 # mock some IRIS data for the calculation: store, root = hms.zarr_memory_store() - return_periods = [ - 10.0, - 20.0, - 30.0, - 40.0, - 50.0, - 60.0, - 70.0, - 80.0, - 90.0, - 100.0, - 200.0, - 300.0, - 400.0, - 500.0, - 600.0, - 700.0, - 800.0, - 900.0, - 1000.0, - ] - intensity = np.array( - [ - 37.279999, - 44.756248, - 48.712502, - 51.685001, - 53.520000, - 55.230000, - 56.302502, - 57.336250, - 58.452499, - 59.283749, - 63.312500, - 65.482498, - 66.352501, - 67.220001, - 67.767502, - 68.117500, - 68.372498, - 69.127502, - 70.897499, - ] - ) + # fmt: off + return_periods = [10.0, 20.0, 30.0, 40.0, 50.0, 60.0, 70.0, 80.0, 90.0, 100.0, 200.0, 300.0, 400.0, 500.0, 600.0, 700.0, 800.0, 900.0, 1000.0] # noqa + intensity = np.array([37.279999, 44.756248, 48.712502, 51.685001, 53.520000, 55.230000, 56.302502, 57.336250, 58.452499, 59.283749, 63.312500, 65.482498, 66.352501, 67.220001, 67.767502, 68.117500, 68.372498, 69.127502, 70.897499 ]) # noqa + # fmt: on shape, transform = hms.shape_transform_21600_43200(return_periods=return_periods) path = f"wind/iris/v1/max_speed_{scenario}_{year}".format(scenario=scenario, year=year) hms.add_curves(