<?xml version="1.0"?>
<!DOCTYPE rfc SYSTEM "rfc2629.dtd" [
<!ENTITY RFC2119 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.2119.xml'>
<!ENTITY RFC2234 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.2234.xml'>
<!ENTITY RFC3588 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.3588.xml'>
<!ENTITY RFC4005 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.4005.xml'>
<!ENTITY RFC4072 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.4072.xml'>
<!ENTITY RFC3748 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.3748.xml'>
<!ENTITY RFC4282 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.4282.xml'>
<!ENTITY RFC4284 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.4284.xml'>
<!ENTITY RFC4283 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.4283.xml'>
<!ENTITY RFC2486 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.2486.xml'>
<!ENTITY RFC2865 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.2865.xml'>
<!ENTITY RFC5113 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.5113.xml'>
<!ENTITY RFC1034 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.1034.xml'>
<!ENTITY RFC1035 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.1035.xml'>
<!ENTITY RFC3490 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.3490.xml'>
<!ENTITY RFC6408 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.6408.xml'>
<!ENTITY RFC6733 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.6733.xml'>
<!ENTITY RFC5226 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.5226.xml'>
<!ENTITY RFC4006 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.4006.xml'>
<!ENTITY RFC7068 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.7068.xml'>
<!ENTITY RFC7415 PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml/reference.RFC.7415.xml'>
<!ENTITY I-D.ietf-dime-ovli PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml3/reference.I-D.draft-ietf-dime-ovli-08.xml'>
<!ENTITY I-D.ietf-dime-agent-overload PUBLIC ''
'http://xml.resource.org/public/rfc/bibxml3/reference.I-D.draft-ietf-dime-agent-overload-00.xml'>



]>
<?xml-stylesheet type='text/xsl' href='rfc2629.xslt' ?>
<?rfc toc="yes" ?>
<?rfc symrefs="yes" ?>
<?rfc sortrefs="yes" ?>
<?rfc iprnotified="no" ?>
<?rfc strict="no" ?>
<?rfc compact="yes" ?>
<?rfc subcompact="no" ?>
<rfc ipr="trust200902"

    category="std"
     docName="draft-ietf-dime-doic-rate-control-01.txt">
  <front>
    <title abbrev="Diameter Overload Rate Control">Diameter Overload Rate Control</title>
    <author role="editor" initials="S" surname="Donovan" fullname="Steve Donovan">
      <organization>Oracle</organization>
      <address>
        <postal>
          <street>17210 Campbell Road</street>
          <city>Dallas</city>
          <region>Texas</region>
          <code>75254</code>
          <country>United States</country>
        </postal>
        <email>srdonovan@usdonovans.com</email>
      </address>
    </author>
    <author initials="E" surname="Noel" fullname="Eric Noel">
     <organization>AT&amp;T Labs</organization>
     <address>
       <postal>
         <street>200s Laurel Avenue</street>
         <city>Middletown</city>
         <region>NJ</region>
         <code>07747</code>
         <country>United States</country>
       </postal>
       <email>ecnoel@research.att.com</email>
     </address>
    </author>
    <date month="March" year="2015"/>
    <area>Operations and Management</area>
    <workgroup>Diameter Maintenance and Extensions (DIME)</workgroup>
    <keyword>Internet-Draft</keyword>
    <keyword>Diameter</keyword>
    <keyword>Overload</keyword>
    <abstract>
      <t>
       This specification documents an extension to the Diameter Overload
       Indication Conveyance (DOIC) base solution.  This extension adds a new
       overload control abatement algorithm.  This abatement algorithm
       allows for a DOIC reporting node to specify a maximum rate at which
       a DOIC reacting node sends Diameter requests to the DOIC reporting node.
      </t>
    </abstract>
    <note title="Requirements">
      <t>
       The key words "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT",
       "SHOULD", "SHOULD NOT", "RECOMMENDED", "MAY", and "OPTIONAL" in this
       document are to be interpreted as described in
       <xref target="RFC2119">RFC 2119</xref>.
      </t>
    </note>
  </front>

  <middle>

    <section title="Introduction" anchor="intro">
      <t>
        This document defines a new Diameter overload control abatement algorithm.
      </t>
      <t>
        The base Diameter overload specification <xref target="I-D.ietf-dime-ovli"/>
        defines the loss algorithm as the
        default Diameter overload abatement algorithm.  The loss algorithm allows
        a reporting node to instruct a reacting node to
        reduce the amount of traffic sent to the reporting node by abating (diverting
        or throttling) a percentage
        of requests sent to the
        server.  While this can effectively decrease the load handled by the
        server, it does not directly address cases where the rate of arrival
        of service requests increase quickly.

        If the service
        requests that result in Diameter transactions increases quickly then
        the loss algorithm cannot guarantee the load presented to the server
        remains below a specific rate level. The loss algorithm can be slow to
        protect the stability of reporting
        nodes when subject with rapidly changing loads.
      </t>
      <t>
        Consider the case where a reacting node is handling 100 service requests per
        second, where each of these service requests
        results in one Diameter transaction being sent to a reacting node.
        If the reacting node is approaching an
        overload state, or is already in an overload state, it will send a Diameter
        overload report requesting a percentage
        reduction in traffic sent.  Assume for this discussion that the reporting node
        requests a 10% reduction.  The reacting node will
        then abate (diverting or throttling) ten Diameter transactions a second, sending the remaining
        90 transactions per second to the reacting node.
      </t>
      <t>
        Now assume that the reacting node's service requests spikes to 1000 requests per
        second. The reacting node will continue to honor the
        reporting nodes request for a 10% reduction in traffic.  This results, in this
        example, in the reacting node sending
        900 Diameter transactions per second, abating the remaining 100 transactions
        per second.  This spike in traffic is significantly
        higher than the reporting node is expecting
        to handle and can result in negative impacts to the stability of the
        reporting node.
      </t>
      <t>
        The reporting node can, and likely would, send another overload report requesting that
        the reacting node abate 91% of requests to get
        back to the desired 90 transactions per second.  However, once the spike has abated
        and the reacting node handled service requests
        returns to 100 per second, this will result in just 9 transactions per
        second being sent to the reporting node, requiring a new overload report
        setting the reduction percentage back to 10%.  This control feedback loop
        has the potential to make the situation worse.
      </t>
      <t>
        One of the benefits of a rate based algorithm is that it better handles
        spikes in traffic.  Instead of sending
        a request to reduce traffic by a percentage, the rate approach allows
        the reporting node to specify the maximum
        number of Diameter requests per second that can be sent to the
        reporting node.  For instance, in this example, the reporting node could
        send a rate based request specifying the maximum transactions per second
        to be 90.  The reacting node will send the 90
        regardless of whether it is receiving 100 or 1000 service requests per second.
      </t>
      <t>
        This document extends the base DOIC solution <xref target="I-D.ietf-dime-ovli"/>
        to add support for the rate based overload abatement algorithm.
      </t>
      <t>
        This document draws heavily on work in the RIA SIP Overload Control working group.
        The definition of the rate abatement algorithm is copied almost verbatim
        from the SOC document <xref target="RFC7415"/>, with
        changes focused on making the wording consistent with the DOIC solution
        and the Diameter protocol.
      </t>
      <t><list><t>
        Editor's Note: Need to verify that the latest text from the SOC document
        is currently being used.
      </t></list></t>
    </section>

    <section title="Terminology and Abbreviations" anchor="abbrev">
      <t>
        <list style="hanging">
          <t hangText="Diameter Node">
          <vspace blankLines="1"/>
          A RFC6733 Diameter Client, RFC6733 Diameter Server, or RFC6733
          Diameter Agent.
          </t>
          <t hangText="Diameter Endpoint">
          <vspace blankLines="1"/>
          An RFC6733 Diameter Client or RFC6733 Diameter Server.
          </t>
          <t hangText="DOIC Node">
          <vspace blankLines="1"/>
          A Diameter Node that supports the DOIC solution
          defined in <xref target="I-D.ietf-dime-ovli"/>.
          </t>
          <t hangText="Reporting Node">
          <vspace blankLines="1"/>
          A DOIC Node that sends a DOIC overload report.
          </t>
          <t hangText="Reacting Node">
          <vspace blankLines="1"/>
          A DOIC Node that receives and acts on a DOIC overload report.
          </t>
        </list>
      </t>
    </section>
    <section title="Interaction with DOIC report types">
      <t>
        As of the publication of this specification there are two DOIC report
        types defined with the specification of a third in progress:
      </t>
      <t><list style="numbers">
        <t>
          Host - Overload of a specific Diameter Application at a specific Diameter Node
          as defined in <xref target="I-D.ietf-dime-ovli"/>.
        </t>
        <t>
          Realm - Overload of a specific Diameter Application at a specific Diameter Realm
          as defined in <xref target="I-D.ietf-dime-ovli"/>.
        </t>
        <t>
          Peer - Overload of a specific Diameter peer as defined in
          <xref target="I-D.ietf-dime-agent-overload"/>.
        </t>
      </list></t>
      <t>
        The rate algorithm MAY be selected by reporting nodes for any of these report types.
      </t>
      <t><list><t>
        Editor's note: It needs to be validated that use of the rate algorithm
        applies to the host and realm report types.
      </t></list></t>
      <t>
        It is expected that all report types defined in the future will indicate
        whether or not the rate algorithm can be used with that report type.
      </t>
    </section>
    <section title="Capability Announcement">
<!--
      <t>
        Editors Note: This section depends upon the completion of the base Diameter
        Overload specification.
        As such, it cannot be complete until the data model and extension
        mechanism are finalized in the base DOC
        specification.  Details for any new AVPs or modifications to existing
        AVPs will be finalized in a future version of the draft after the base DOC
        specification has stabilized.
      </t>
-->
      <t>
        This extension defines the rate abatement algorithm (referred to as rate
        in this document) feature.  Support for
        the rate feature will
        be reflected by use of a new value, as defined in <xref target="fvector"/>,
        in the OC-Feature-Vector AVP per the rules defined in
        <xref target="I-D.ietf-dime-ovli"/>.
      </t>
      <t>
        Note that Diameter nodes that support the rate feature will, by definition,
        support both the loss and
        rate based abatement algorithms.  DOIC reacting nodes SHOULD indicate
        support for both the loss and rate algorithms in the OC-Feature-Vector AVP.
      </t>
      <t><list><t>
        There may be local policy reasons that cause a DOIC node that supports
        the rate abatement algorithm to not include it in the OC-Feature-Vector.
        All reacting nodes,
        however, must continue to include loss in the OC-Feature-Vector in order
        to remain compliant with <xref target="I-D.ietf-dime-ovli"/>.
      </t></list></t>
<!--
      <t>
        A reporting nodes MUST select either the rate or the loss algorithm when
        receiving a request that contains an OC-Supported-Features AVP.
      </t>
-->
      <t>
        A reporting node MAY select one abatement algorithm to apply to
        host and realm reports and a different algorithm to apply to peer
        reports.
      </t>
      <t><list>
        <t>
          For host or realm reports the selected algorithm is
          reflected in the OC-Feature-Vector AVP sent as part of the
          OC-Selected-Features AVP included in answer messages for transaction
          where the request contained
          an OC-Supported-Features AVP.  This is per
          the procedures defined in <xref target="I-D.ietf-dime-ovli"/>.
        </t>
        <t>
          For peer reports the selected algorithm is reflected
          in the OC-Peer-Algo AVP sent as part of the OC-Supported-Features
          AVP included answer messages for transaction where the request contained
          an OC-Supported-Features AVP.  This is per the procedures defined in
          <xref target="I-D.ietf-dime-agent-overload"/>.
        </t>
      </list></t>
      <t><list><t>
        Editor's Node: The peer report specification is still under development and,
        as such, the above paragraph is subject to change.
      </t></list></t>
    </section>
    <section title="Overload Report Handling">
      <t>
        This section describes any changes to the behavior
        defined in <xref target="I-D.ietf-dime-ovli"/> for handling of overload
        reports when the rate overload abatement algorithm is used.
      </t>
      <section title="Reporting Node Overload Control State">
        <t>
          A reporting node that uses the rate abatement algorithm SHOULD maintain
          reporting node OCS for each reacting node to which it sends a rate OLR.
        </t>
        <t><list><t>
          This is different from the behavior defines in <xref target="I-D.ietf-dime-ovli"/>
          where a single loss percentage sent to all reacting nodes.
        </t></list></t>
        <t>
          A reporting node SHOULD maintain OCS entries when using the rate
          abatement algorithm per supported Diameter
          application, per targeted reacting node and per report-type.
        </t>
        <t>
          A rate OCS entry is identified by the tuple of Application-Id, report-type and
          DiameterID of the target of the rate OLR.
        </t>
<!--
        <t>
          A reporting node that supports the rate abatement algorithm
          MUST be able to include rate as the selected abatement algorithm
          in the reporting node OCS.
        </t>
-->
        <t>
          A reporting node that supports the rate abatement algorithm
          MUST be able to include the specified rate in the abatement algorithm specific
          portion of the reporting node rate OCS.
        </t>
        <t>
          All other elements for the OCS defined in <xref target="I-D.ietf-dime-ovli"/>
          and <xref target="I-D.ietf-dime-agent-overload"/>
          also apply to the reporting nodes OCS when using the rate abatement
          algorithm.
        </t>
      </section>
      <section title="Reacting Node Overload Control State">
        <t>
          A reacting node that supports the rate abatement algorithm
          MUST be able to include rate as the selected abatement algorithm
          in the reacting node OCS.
        </t>
        <t>
          A reacting node that supports the rate abatement algorithm
          MUST be able to include the rate specified in the OC-Maximum-Rate AVP included
          in the OC-OLR AVP as an element of the abatement algorithm specific
          portion of reacting node OCS entries.
        </t>
        <t>
          All other elements for the OCS defined in <xref target="I-D.ietf-dime-ovli"/>
          and <xref target="I-D.ietf-dime-agent-overload"/>
          also apply to the reporting nodes OCS when using the rate abatement
          algorithm.
        </t>
      </section>
      <section title="Reporting Node Maintenance of Overload Control State">
        <t>
          A reporting node that has selected the rate overload abatement algorithm
          and enters an overload condition MUST indicate rate as the abatement
          algorithm in the resulting reporting node OCS entries.
        </t>
        <t>
          A reporting node that has selected the rate abatement algorithm
          and enters an overload condition MUST indicate the selected
          rate in the resulting reporting node OCS entries.
        </t>
        <t>
          When selecting the rate algorithm in the response to
          a request that contained an OC-Supporting-Features
          AVP with an OC-Feature-Vector AVP indicating support for the rate feature,
          a reporting node MUST ensure that a reporting node OCS entry exists
          for the target of the overload report.  The target is defined as
          follows:
        </t>
        <t><list style="symbols">
          <t>
            For Host reports the target is the DiameterID contained in the
            Origin-Host AVP received in the request.
          </t>
          <t>
            For Realm reports the target is the DiameterID contained in the
            Origin-Realm AVP received in the request.
          </t>
          <t>
            For Peer reports the target is the DiameterID of the Diameter Peer from
            which the request was received.
          </t>
        </list></t>
      </section>
      <section title="Reacting Node Maintenance of Overload Control State">
        <t>
          When receiving an answer message indicating that the reacting node
          has selected the rate algorithm, a reaction node MUST indicate the
          rate abatement algorithm in the reacting node OCS entry for the
          reporting node.
        </t>
        <t>
          A reacting node receiving an overload report for the rate abatement
          algorithm MUST save the rate received in the OC-Maximum-Rate AVP contained in
          the OC-OLR AVP in the reacting node OCS entry.
        </t>
      </section>
      <section title="Reporting Node Behavior for Rate Abatement Algorithm">
        <t>
          When in an overload condition with rate selected as the overload
          abatement algorithm and when handling a request that contained
          an OC-Supported-Features AVP that indicated support for the rate
          abatement algorithm,
          a reporting node SHOULD include an
          OC-OLR AVP for the rate algorithm using the parameters stored in the
          reporting node OCS for the target of the overload report.
        </t>
        <t><list><t>
          Editor's Note: The above is a pretty complicated way of saying that
          the reporting node should include an OC-OLR in the appropriate answer
          messages.  The basic requirement isn't rate feature specific but
          rather that in all cases the reporting node generates an OC-OLR according
          to the parameters of the appropriate OCS entry.  This wording probably
          can be improved based on the generic behavior definition.
        </t></list></t>
        <t>
          When sending an overload report for the Rate algorithm, the OC-Maximum-Rate AVP
          is included and the OC-Reduction-Percentage AVP is not included.
        </t>
      </section>
      <section title="Reacting Node Behavior for Rate Abatement Algorithm">
        <t>
          When determining if abatement treatment should be applied to a request
          being sent to a reporting node that has selected the rate overload
          abatement algorithm, the reacting node MAY use the algorithm
          detailed in <xref target="rate"/>.
        </t>
        <t><list><t>
          Note: Other algorithms for controlling the rate can be implemented by
          the reacting node as long as they result in the correct rate of traffic
          being sent to the reporting node.
        </t></list></t>
        <t>
          Once a determination is made by the reacting node that an individual
          Diameter request is to be subjected to abatement treatment then the
          procedures for throttling and diversion defined  in <xref target="I-D.ietf-dime-ovli"/>
          and <xref target="I-D.ietf-dime-agent-overload"/> apply.
        </t>
      </section>
    </section>
    <section title="Rate Abatement Algorithm AVPs" anchor="rate">
      <t>
        Editors Note: This section depends upon the completion of the base
        DOIC specification.
        As such, it cannot be complete until the data model and extension mechanism
        are finalized.  Details for any new AVPs or modifications to existing
        AVPs will be finalized in a future version of the draft after the base
        DOC specification has stabilized.
      </t>
      <section title="OC-Supported-Features AVP">
        <t>
          The rate algorithm does not add any AVPs to the OC-Supported-Features AVP.
        </t>
        <t>
          The rate algorithm does add a new feature bit to be carried in the
          OC-Feature-Vector AVP.
        </t>
        <section title="OC-Feature-Vector AVP" anchor="fvector">
          <t>
            This extension adds the following capabilities to the OC-Feature-Vector AVP.
          </t>
          <t>
            <list style="hanging">
                 <t hangText="OLR_RATE_ALGORITHM (0x0000000000000004)">
                  <vspace blankLines="1"/>
                  When this flag is set by the overload control endpoint it indicates that
                  the DOIC Node supports the rate overload control algorithm.
                 </t>
            </list>
          </t>
        </section>
      </section>
      <section title="OC-OLR AVP">
        <t>
          This extension defines the OC-Maximum-Rate AVP to be an optional part of the OC-OLR AVP.
        </t>
        <figure>
        <artwork><![CDATA[
   OC-OLR ::= < AVP Header: TBD2 >
              < OC-Sequence-Number >
              < OC-Report-Type >
              [ OC-Reduction-Percentage ]
              [ OC-Validity-Duration ]
              [ OC-Source-ID ]
              [ OC-Abatement-Algorithm ]
              [ OC-Maximum-Rate ]
            * [ AVP ]
  ]]>
        </artwork>
        </figure>
        <t>
          This extension makes no changes to the other AVPs that are part of the
          OC-OLR AVP.
        </t>
        <t>
          This extension does not define new overload report types.  The existing
          report types of host and realm defined in
          <xref target="I-D.ietf-dime-ovli"/> apply to the rate control algorithm.
          The peer report type defined in
          <xref target="I-D.ietf-dime-agent-overload"/> also applies to the rate control algorithm.
        </t>
        <section title="OC-Maximum-Rate AVP">
          <t>
            The OC-Maximum-Rate AVP (AVP code TBD1) is type of Unsigned32 and describes
            the maximum rate that
            that the sender is requested to send traffic.  This is specified in terms
            of requests per second.
          </t>
          <t><list><t>
            Editor's note: Do we need to specify a maximum value?
          </t></list></t>
          <t>
            A value of zero indicates that no traffic is to be sent.
          </t>
        </section>
      </section>
      <section title="Attribute Value Pair flag rules">
        <t>
          <figure>
          <artwork>
          <![CDATA[
                                                            +---------+
                                                            |AVP flag |
                                                            |rules    |
                                                            +----+----+
                            AVP   Section                   |    |MUST|
    Attribute Name          Code  Defined Value Type        |MUST| NOT|
   +--------------------------------------------------------+----+----+
   |OC-Maximum-Rate                 TBD1    x.x   Unsigned64        |    | V  |
   +--------------------------------------------------------+----+----+
   ]]>
          </artwork>
          </figure>
        </t>

      </section>
    </section>

    <section title="Rate Based Abatement Algorithm">
      <t>
        This section is pulled from <xref target="RFC7415"/>,
        with minor changes needed to
        make it apply to the Diameter protocol.
      </t>
      <section title="Overview">
      <t>
        The reporting node is the one protected by the overload control algorithm
        defined here.  The reacting node is the one
        that abates traffic towards the server.
      </t>
      <t>
        Following the procedures defined in [draft-ietf-dime-doic], the reacting node and
        reporting node signal one another support for rate-based overload control.
      </t>
      <t>
   Then periodically, the reporting node relies on internal measurements (e.g.
   CPU utilization or queuing delay) to evaluate its overload state
   and estimate a target maximum Diameter request rate in number of requests per
   second (as opposed to target percent reduction in the case of loss-based
   abatement).
      </t>
      <t>
   When in an overloaded state, the reporting node uses the OC-OLR AVP to
   inform reacting nodes of its overload state and of the target Diameter
   request rate.
      </t>
      <t>
   Upon receiving the overload report with a target maximum Diameter request rate,
   each reacting node applies abatement treatment for
    new Diameter requests towards the reporting node.
      </t>
      </section>

      <section title="Reporting Node Behavior">
      <t>
   The actual algorithm used by the reporting node to determine its overload
   state and estimate a target maximum Diameter request rate is beyond the scope of
   this document.
      </t>
      <t>
   However, the reporting node MUST periodically evaluate its overload state
   and estimate a target Diameter request rate beyond which it would become
   overloaded. The reporting node must allocate a portion of the target Diameter
   request rate to each of its reacting nodes. The reporting node may set the same rate
   for every reacting node, or may set different rates for different reacting node.
      </t>
      <t>
   The maximum rate determined by the reporting node for a reacting node applies to the
   entire stream of Diameter requests, even though abatement may only
   affect a particular subset of the requests, since the reacting node might apply
   priority as part of its decision of which requests to abate.
      </t>
      <t>
   When setting the maximum rate for a particular reacting node, the reporting node
   may need take into account the workload (e.g. cpu load per request)
   of the distribution of message types from that reacting node.  Furthermore,
   because the reacting node may prioritize the specific types of messages it
   sends while under overload restriction, this distribution of message
   types may be different from
   the message distribution for that reacting node under non-overload
   conditions (e.g., either higher or lower cpu load).
      </t>
      <t>
   Note that the AVP for the rate algorithm is an upper bound
   (in request messages per second) on the traffic sent by the reacting node to the
   reporting node. The reacting node may send traffic at a rate significantly lower
   than the upper bound, for a variety of reasons.
      </t>
      <t>
   In other words, when multiple reacting nodes are being controlled by an
   overloaded reporting node, at any given time some reacting nodes may receive
   requests at a rate below its target maximum Diameter request rate while others
   above that target rate. But the resulting request rate presented to
   the overloaded reporting node will converge towards the target Diameter request
   rate.
      </t>
      <t>
   Upon detection of overload, and the determination to invoke overload
   controls, the reporting node MUST follow the specifications in
   [draft-ietf-dime-ovli] to notify its clients of the allocated
   target maximum Diameter request rate and to notify them that the rate
   overload abatement is in effect.
      </t>
      <t>
   The reporting node MUST use the OC-Maximum-Rate AVP defined in this specification
   to communicate a target maximum Diameter request rate to each of its clients.
      </t>
      </section>
      <section title="Reacting Node Behavior">
        <section title="Default algorithm">
        <t>
   In determining whether or not to transmit a specific message, the
   reacting node can use any algorithm that limits the message rate to
   the OC-Maximum-Rate AVP value in units of messages per second.
   For ease of discussion,
   we define T = 1/[OC-Maximum-Rate] as the target inter-Diameter request
   interval.
    It may be strictly deterministic, or it may be
   probabilistic. It may, or may not, have a tolerance factor, to allow
   for short bursts, as long as the long term rate remains below 1/T.
         </t>
         <t>
   The algorithm may have provisions for prioritizing traffic.
        </t>
        <t>
   If the algorithm requires other parameters (in addition to "T",
   which is 1/OC-Maximum-Rate), they may be set autonomously by the reacting node, or they
   may be negotiated independently between reacting node and reporting node.
        </t>
        <t>
   In either case, the coordination is out of scope for this document.
   The default algorithms presented here (one with and one without provisions for
   prioritizing traffic) are only examples.
        </t>
        <t>
   To apply abatement treatment to
    new Diameter requests at the rate specified in the OC-Maximum-Rate AVP value
   sent by the reporting node to its reacting nodes, the reacting node MAY use the proposed
   default algorithm for rate-based control or any other
   equivalent algorithm that forward messages in conformance with the
   upper bound of 1/T messages per second.
        </t>
        <t>
   The default Leaky Bucket algorithm presented here is based on [ITU-T
   Rec. I.371] Appendix A.2.  The algorithm makes it possible for
   reacting nodes to deliver Diameter requests at a rate specified in the OC-Maximum-Rate value
   with tolerance parameter TAU (preferably configurable).
        </t>
        <t>
   Conceptually, the Leaky Bucket algorithm can be viewed as a finite
   capacity bucket whose real-valued content drains out at a continuous
   rate of 1 unit of content per time unit and whose content increases
   by the increment T for each forwarded Diameter request. T is computed as
   the inverse of the rate specified in the OC-Maximum-Rate AVP value, namely T = 1 /
   OC-Maximum-Rate.
        </t>
        <t>
   Note that when the OC-Maximum-Rate value is 0 with a non-zero OC-Validity-Duration, then
   the reacting node should apply abatement treatment to 100% of Diameter requests destined to the
   overloaded reporting node. However, when the OC-Validity-Duration value is 0, the
   reacting node should stop applying abatement treatment.
        </t>
        <t>
   If, at a new Diameter request arrival, the content of the bucket is less
   than or equal to the limit value TAU, then the Diameter request is
   forwarded to the server; otherwise, the abatement treatment is applied to the
   Diameter request.
        </t>
        <t>
   Note that the capacity of the bucket (the upper bound of the
   counter) is (T + TAU).
        </t>
        <t>
   The tolerance parameter TAU determines how close the long-term
   admitted rate is to an ideal control that would admit all Diameter
   requests for arrival rates less than 1/T and then admit Diameter requests
   precisely at the rate of 1/T for arrival rates above 1/T. In
   particular at mean arrival rates close to 1/T, it determines the
   tolerance to deviation of the inter-arrival time from T (the larger
   TAU the more tolerance to deviations from the inter-departure
   interval T).
        </t>
        <t>
   This deviation from the inter-departure interval influences the
   admitted rate burstyness, or the number of consecutive Diameter requests
   forwarded to the reporting node (burst size proportional to TAU over the
   difference between 1/T and the arrival rate).
        </t>
        <t>
          In situations where reacting nodes are configured with some knowledge about
the reporting node (e.g., operator pre-provisioning), it can be beneficial to
choose a value of TAU based on how many reacting nodes will be sending
requests to the reporting node.

        </t>
        <t>
   Reporting nodes with a very large number of reacting nodes, each with a relatively
   small arrival rate, will generally benefit from a smaller value for
   TAU in order to limit queuing (and hence response times) at the
   reporting node when subjected to a sudden surge of traffic from all reacting nodes.
   Conversely, a reporting node with a relatively small number of reacting nodes, each
   with proportionally larger arrival rate, will benefit from a larger
   value of TAU.
        </t>
        <t>
   Once the control has been activated, at the arrival time of the k-th
   new Diameter request, ta(k), the content of the bucket is provisionally
   updated to the value
        </t>
        <t>
   X' = X - (ta(k) - LCT)
        </t>
        <t>
   where X is the value of the leaky bucket counter after arrival of
   the last forwarded Diameter request, and LCT is the time at which the
   last Diameter request was forwarded.
        </t>
        <t>
   If X' is less than or equal to the limit value TAU, then the new Diameter
   request is forwarded and the leaky bucket counter X is set to X' (or
   to 0 if X' is negative) plus the increment T, and LCT is set to the
   current time ta(k). If X' is greater than the limit value TAU, then
   the abatement treatment is applied to the new Diameter request
    and the values of X and LCT are
   unchanged.
        </t>
        <t>
   When the first response from the reporting node has been received indicating
   control activation (OC-Validity-Duration>0), LCT is set to the time of
   activation, and the leaky bucket counter is initialized to the
   parameter TAU0 (preferably configurable) which is 0 or larger but
   less than or equal to TAU.
        </t>
        <t>
   TAU can assume any positive real number value and is not necessarily
   bounded by T.
        </t>
        <t>
   TAU=4*T is a reasonable compromise between burst size and abatement
   rate adaptation at low offered rate.
        </t>
        <t>
   Note that specification of a value for TAU, and any communication or
   coordination between servers, is beyond the scope of this document.
        </t>
        <t>
   A reference algorithm is shown below.
        </t>
        <t>
   No priority case:
        </t>
        <t>
        <figure>
        <artwork>

   // T: inter-transmission interval, set to 1 / OC-Maximum-Rate
   // TAU: tolerance parameter
   // ta: arrival time of the most recent arrival
   // LCT: arrival time of last SIP request that was sent to the server
   //      (initialized to the first arrival time)
   // X: current value of the leaky bucket counter (initialized to
   //    TAU0)

   // After most recent arrival, calculate auxiliary variable Xp
   Xp = X - (ta - LCT);

   if (Xp &lt;= TAU) {
     // Transmit SIP request
     // Update X and LCT
     X = max (0, Xp) + T;
     LCT = ta;
   } else {
     // Reject SIP request
     // Do not update X and LCT
   }
        </artwork>
        </figure>
        </t>
        </section>

        <section title="Priority treatment">
        <t>
   The reacting node is
   responsible for applying message priority and for maintaining two categories
   of requests: Request candidates for reduction, requests not subject
   to reduction (except under extenuating circumstances when there
   aren't any messages in the first category that can be reduced).
        </t>
        <t>
   Accordingly, the proposed Leaky bucket implementation is modified to
   support priority using two thresholds for Diameter requests in the set of
   request candidates for reduction. With two priorities, the proposed
   Leaky bucket requires two thresholds TAU1 &lt; TAU2:
        </t>
        <t>
        <list style="symbols">
        <t>All new requests would be admitted when the leaky bucket
        counter is at or below TAU1,
        </t>
        <t>Only higher priority requests would be admitted when the leaky
        bucket counter is between TAU1 and TAU2,
        </t>
        <t>All requests would be rejected when the bucket counter is above
        TAU2.
        </t>
        </list>
        </t>
        <t>
   This can be generalized to n priorities using n thresholds for n>2
   in the obvious way.
        </t>
        <t>
   With a priority scheme that relies on two tolerance parameters (TAU2
   influences the priority traffic, TAU1 influences the non-priority
   traffic), always set TAU1 &lt;= TAU2 (TAU is replaced by TAU1 and
   TAU2).  Setting both tolerance parameters to the same value is
   equivalent to having no priority. TAU1 influences the admitted rate
   the same way as TAU does when no priority is set. And the larger the
   difference between TAU1 and TAU2, the closer the control is to
   strict priority queuing.
        </t>
        <t>
   TAU1 and TAU2 can assume any positive real number value and is not
   necessarily bounded by T.
        </t>
        <t>
   Reasonable values for TAU0, TAU1 &amp; TAU2 are:
        </t>
        <t><list style="symbols">
          <t>
           TAU0 = 0,
           </t>
           <t>
             TAU1 = 1/2 * TAU2, and
           </t>
           <t>
             TAU2 = 10 * T.
           </t>
          </list></t>
        <t>
   Note that specification of a value for TAU1 and TAU2, and any
   communication or coordination between servers, is beyond the scope
   of this document.
        </t>
        <t>
   A reference algorithm is shown below.
        </t>
        <t>
   Priority case:
        </t>
        <t>
        <figure>
        <artwork>

   // T: inter-transmission interval, set to 1 / OC-Maximum-Rate
   // TAU1: tolerance parameter of no priority Diameter requests
   // TAU2: tolerance parameter of priority Diameter requests
   // ta: arrival time of the most recent arrival
   // LCT: arrival time of last Diameter request that was sent to the server
   //      (initialized to the first arrival time)
   // X: current value of the leaky bucket counter (initialized to
   //    TAU0)

   // After most recent arrival, calculate auxiliary variable Xp
   Xp = X - (ta - LCT);

   if (AnyRequestReceived &amp;&amp; Xp &lt;= TAU1) || (PriorityRequestReceived &amp;&amp;
   Xp &lt;= TAU2 &amp;&amp; Xp > TAU1) {
     // Transmit Diameter request
     // Update X and LCT
     X = max (0, Xp) + T;
     LCT = ta;
   } else {
     // Apply abatement treatment to Diameter request
     // Do not update X and LCT
   }
        </artwork>
        </figure>
        </t>
        </section>
        <section title="Optional enhancement: avoidance of resonance">
        <t>
   As the number of reacting node sources of traffic increases and the
   throughput of the reporting node decreases, the maximum rate admitted by
   each reacting node needs to decrease, and therefore the value of T becomes
   larger. Under some circumstances, e.g. if the traffic arises very
   quickly simultaneously at many sources, the occupancies of each
   bucket can become synchronized, resulting in the admissions from
   each source being close in time and batched or very 'peaky' arrivals
   at the reporting node, which not only gives rise to control instability, but
   also very poor delays and even lost messages. An appropriate term
   for this is 'resonance' [Erramilli].
        </t>
        <t>
          If the network topology is such that resonance can occur, then a
          simple way to avoid resonance is to randomize the bucket occupancy at
          two appropriate points -- at the activation of control and whenever
          the bucket empties -- as described below.
        </t>
        <t>
   After updating the value of the leaky bucket to X', generate a value
   u as follows:
        </t>
        <t>
     if X' > 0, then u=0
        </t>
        <t>
          else if X' &lt;= 0, then let u be set to a random value uniformly
                              distributed between -1/2 and +1/2
        </t>
        <t>
   Then (only) if the arrival is admitted, increase the bucket by an
   amount T + uT, which will therefore be just T if the bucket hadn't
   emptied, or lie between T/2 and 3T/2 if it had.
        </t>
        <t>
   This randomization should also be done when control is activated,
   i.e. instead of simply initializing the leaky bucket counter to
   TAU0, initialize it to TAU0 + uT, where u is uniformly distributed
   as above. Since activation would have been a result of response to a
   request sent by the reacting node, the second term in this expression can
   be interpreted as being the bucket increment following that
   admission.
        </t>
        <t>
   This method has the following characteristics:
        </t>
        <t>
        <list style="symbols">
        <t>
        If TAU0 is chosen to be equal to TAU and all sources
        activate control at the same time due to an extremely high
        request rate, then the time until the first request admitted by
        each reacting node would be uniformly distributed over [0,T];
        </t>
        <t>
        The maximum occupancy is TAU + (3/2)T, rather than TAU + T
        without randomization;
        </t>
        <t>
        For the special case of 'classic gapping' where TAU=0, then the
        minimum time between admissions is uniformly distributed over
        [T/2, 3T/2], and the mean time between admissions is the same,
        i.e. T+1/R where R is the request arrival rate.
        </t>
        <t>
        At high load randomization rarely occurs, so there is no loss
        of precision of the admitted rate, even though the randomized
        'phasing' of the buckets remains.
        </t>
        </list>
        </t>
        </section>
        </section>
        </section>

    <section title="IANA Consideration">
    <t>
    TBD
    </t>
    </section>
    <section title="Security Considerations">
    <t>Agent overload is an extension to the based Diameter overload mechanism.  As such, all of the
    security considerations outlined in <xref target="I-D.ietf-dime-ovli"/> apply to the agent overload scenarios.
    </t>
    </section>
    <section title="Acknowledgements">
    <t>
    </t>
    </section>


  </middle>

  <back>

  <references title="Normative References">
  &RFC2119;
  &RFC6733;
  &RFC5226;

  &I-D.ietf-dime-ovli;
  &I-D.ietf-dime-agent-overload;

<!--
  <reference anchor='I-D.ietf-dime-ovli'>
        <front>
            <title>Diameter Overload Indication Conveyance</title>
            <author initials='J.' surname='Korhonen'>
                <organization abbrev='Broadcom Communications'>
                Broadcom Communications
                </organization>
            </author>

            <date month='October' year='2013' />
        </front>
        <format type='TXT' octets='94506'
                target='http://xml.resource.org/public/rfc/bibxml3/reference.I-D.draft-ietf-dime-ovli-00.xml' />
  </reference>
  <reference anchor="I-D.SOC-overload-rate-control">
    <front>
      <title>SIP Overload Rate Control</title>
      <author initials="E." surname="Noel">
      <organization>AT&amp;t</organization>
      </author>
      <date month="February" year="2014"/>
    </front>
  </reference>
-->
  </references>

  <references title="Informative References">

  &RFC7415;
<!--
  <reference anchor="I-D.donovan-agent-overload">
    <front>
      <title>Diameter Agent Overload</title>
      <author initials="S." surname="Donovan">
      <organization>Oracle</organization>
      </author>
      <date month="February" year="2014"/>
    </front>
  </reference>
-->
  </references>

  </back>
 </rfc>
