One document matched: draft-ietf-rmcat-coupled-cc-00.xml


<?xml version="1.0" encoding="US-ASCII"?>
<!-- This template is for creating an Internet Draft using xml2rfc,
     which is available here: http://xml.resource.org. -->
<!DOCTYPE rfc SYSTEM "rfc2629.dtd" [
<!-- One method to get references from the online citation libraries.
     There has to be one entity for each item to be referenced. 
     An alternate method (rfc include) is described in the references. -->

<!ENTITY RFC2119 SYSTEM "http://xml2rfc.ietf.org/public/rfc/bibxml/reference.RFC.2119.xml">
<!ENTITY RFC3124 SYSTEM "http://xml2rfc.ietf.org/public/rfc/bibxml/reference.RFC.3124.xml">
<!ENTITY RFC5348 SYSTEM "http://xml2rfc.ietf.org/public/rfc/bibxml/reference.RFC.5348.xml">
<!ENTITY I-D.narten-iana-considerations-rfc2434bis SYSTEM "http://xml2rfc.ietf.org/public/rfc/bibxml3/reference.I-D.narten-iana-considerations-rfc2434bis.xml">
]>
<?xml-stylesheet type='text/xsl' href='rfc2629.xslt' ?>
<!-- used by XSLT processors -->
<!-- For a complete list and description of processing instructions (PIs), 
     please see http://xml.resource.org/authoring/README.html. -->
<!-- Below are generally applicable Processing Instructions (PIs) that most I-Ds might want to use.
     (Here they are set differently than their defaults in xml2rfc v1.32) -->
<?rfc strict="yes" ?>
<!-- give errors regarding ID-nits and DTD validation -->
<!-- control the table of contents (ToC) -->
<?rfc toc="yes"?>
<!-- generate a ToC -->
<?rfc tocdepth="3"?>
<!-- the number of levels of subsections in ToC. default: 3 -->
<!-- control references -->
<?rfc symrefs="yes"?>
<!-- use symbolic references tags, i.e, [RFC2119] instead of [1] -->
<?rfc sortrefs="yes" ?>
<!-- sort the reference entries alphabetically -->
<!-- control vertical white space 
     (using these PIs as follows is recommended by the RFC Editor) -->
<?rfc compact="yes" ?>
<!-- do not start each main section on a new page -->
<?rfc subcompact="no" ?>
<!-- keep one blank line between list items -->
<!-- end of list of popular I-D processing instructions -->
<?xml-stylesheet type="text/xsl" href="rfc2629.xslt"?>
<rfc category="exp" docName="draft-ietf-rmcat-coupled-cc-00" ipr="trust200902">
	<!--	noModificationTrust200902 noDerivativesTrust200902 pre5378Trust200902">-->
	<!-- updates="6298"> -->
	<!-- ipr="full3978"> -->
  <!-- category values: std, bcp, info, exp, and historic
     ipr values: full3667, noModification3667, noDerivatives3667
     you can add the attributes updates="NNNN" and obsoletes="NNNN" 
     they will automatically be output with "(if approved)" -->

  <!-- ***** FRONT MATTER ***** -->

  <front>
    <!-- The abbreviated title is used in the page header - it is only necessary if the 
         full title is longer than 39 characters -->

    <!-- <title abbrev="Abbreviated Title">Coupled congestion control</title> -->
    <title>Coupled congestion control for RTP media</title>

    <!-- add 'role="editor"' below for the editors if appropriate -->

    <!-- Another author who claims to be an editor -->


    <author fullname="Safiqul Islam" initials="S.I." surname="Islam">
      <organization>University of Oslo</organization>
      <address>
        <postal>
          <street>PO Box 1080 Blindern</street>
          <!-- Reorder these if your country does things differently -->
          <code>N-0316</code>
          <city>Oslo</city>
          <region></region>
          <country>Norway</country>
        </postal>
        <phone>+47 22 84 08 37</phone>
        <email>safiquli@ifi.uio.no</email>
        <!-- uri and facsimile elements may also be added -->
      </address>
    </author>

    <author fullname="Michael Welzl" initials="M.W." surname="Welzl">
      <organization>University of Oslo</organization>
      <address>
        <postal>
          <street>PO Box 1080 Blindern</street>
          <!-- Reorder these if your country does things differently -->
          <code>N-0316</code>
          <city>Oslo</city>
          <region></region>
          <country>Norway</country>
        </postal>
        <phone>+47 22 85 24 20</phone>
        <email>michawe@ifi.uio.no</email>
        <!-- uri and facsimile elements may also be added -->
      </address>
    </author>


      <author fullname="Stein Gjessing" initials="S.G." surname="Gjessing">
          <organization>University of Oslo</organization>
          <address>
              <postal>
                  <street>PO Box 1080 Blindern</street>
                  <!-- Reorder these if your country does things differently -->
                  <code>N-0316</code>
                  <city>Oslo</city>
                  <region></region>
                  <country>Norway</country>
              </postal>
              <phone>+47 22 85 24 44</phone>
              <email>steing@ifi.uio.no</email>
              <!-- uri and facsimile elements may also be added -->
          </address>
      </author>
      
      

    <date year="2015" />

    <!-- If the month and year are both specified and are the current ones, xml2rfc will fill 
         in the current day for you. If only the current year is specified, xml2rfc will fill 
	 in the current day and month for you. If the year is not the current one, it is 
	 necessary to specify at least a month (xml2rfc assumes day="1" if not specified for the 
	 purpose of calculating the expiry date).  With drafts it is normally sufficient to 
	 specify just the year. -->

    <!-- Meta-data Declarations -->

    <area>Transport</area>

    <workgroup>RTP Media Congestion Avoidance Techniques (rmcat)</workgroup>

    <!-- WG name at the upperleft corner of the doc,
         IETF is fine for individual submissions.  
	 If this element is not present, the default is "Network Working Group",
         which is used by the RFC Editor as a nod to the history of the IETF. -->

    <keyword>tcp</keyword>

    <!-- Keywords will be incorporated into HTML output
         files in a meta tag but they have no effect on text or nroff
         output. If you submit your draft to the RFC Editor, the
         keywords will be used for the search engine. -->

    <abstract>
	    <t>When multiple congestion controlled RTP sessions traverse the same network bottleneck, it can be beneficial to combine their controls such that the total on-the-wire behavior is improved. This document describes such a method for flows that have the same sender, in a way that is as flexible and simple as possible while minimizing the amount of changes needed to existing RTP applications. It specifies how to apply the method for the NADA congestion control algorithm.</t>
    </abstract>
  </front>

  <middle>
    <section title="Introduction" anchor='sec-intro'>
	    <t><!--For interactive applications, RTP media congestion control mechanisms should minimize the amount of self-inflicted queuing delay.--> When there is enough data to send, a congestion controller must increase its sending rate until the path's capacity has been reached; depending on the controller, sometimes the rate is increased further, until packets are ECN-marked or dropped. <!--In the public Internet, increasing beyond the capacity limit is currently the only way to get any feedback from the network that can be used as an indication of congestion.--> This process inevitably creates undesirable queuing delay -- an effect that is amplified when multiple congestion controlled connections traverse the same network bottleneck. </t>

<t>The Congestion Manager (CM) <xref target="RFC3124"/> couples flows by providing a single congestion controller. It is hard to implement because it requires an additional congestion controller and removes all per-connection congestion control functionality, which is quite a significant change to existing RTP based applications. <!--, and 2) it aggregates connections by destination address, thereby implicitly assuming that all packets that share the same destination address are routed across the same bottleneck in the network. This assumption can be wrong when, e.g., NATs or Equal-Cost Multi-Path (ECMP) routing are used.--> This document presents a method to combine the behavior of congestion control mechanisms that is easier to implement than the Congestion Manager <xref target="RFC3124"/> and also requires less significant changes to existing RTP based applications. It attempts to roughly approximate the CM behavior by sharing information between existing congestion controllers. It is able to honor user-specified priorities, which is required by rtcweb <xref target="rtcweb-usecases"/>.</t>
    </section>


    <section title="Definitions" anchor='sec-def'>
        <t>The key words "MUST", "MUST NOT", "REQUIRED", "SHALL", "SHALL NOT",
        "SHOULD", "SHOULD NOT", "RECOMMENDED", "MAY", and "OPTIONAL" in this
        document are to be interpreted as described in <xref
        target="RFC2119">RFC 2119</xref>.</t>

	<t><list style="hanging" hangIndent="6">
	  <t hangText="Available Bandwidth:">
	    <vspace />
	    The available bandwidth is the nominal link capacity minus the amount of traffic that traversed the link during a certain time interval, divided by that time interval.</t>
	  <t hangText="Bottleneck:">
	    <vspace />
	    The first link with the smallest available bandwidth along the path between a sender and receiver.</t>
	  <t hangText="Flow:">
	    <vspace />
	    A flow is the entity that congestion control is operating on. It could, for example, be a transport layer connection, an RTP session, or a subsession that is multiplexed onto a single RTP session together with other subsessions.</t>
	  <t hangText="Flow Group Identifier (FGI):">
	    <vspace />
	    A unique identifier for each subset of flows that is limited by a common bottleneck.</t>
	  <t hangText="Flow State Exchange (FSE):">
	    <vspace />
	    The entity that maintains information that is exchanged between flows.</t>
	  <t hangText="Flow Group (FG):">
	    <vspace />
	    A group of flows having the same FGI.</t>
	  <t hangText="Shared Bottleneck Detection (SBD):">
	    <vspace />
	    The entity that determines which flows traverse the same bottleneck in the network, or the process of doing so.</t>
	</list></t>

    </section>

    <section title="Limitations" anchor='sec-limits'>
      <t><list style="hanging" hangIndent="6">
	<t hangText="Sender-side only:">
	    <vspace />
	    Coupled congestion control as described here only operates inside a single host on the sender side. This is because, irrespective of where the major decisions for congestion control are taken, the sender of a flow needs to eventually decide the transmission rate. Additionally, the necessary information about how much data an application can currently send on a flow is often only available at the sender side, making the sender an obvious choice for placement of the elements and mechanisms described here.</t>
<!-- This doesn't play a role, does it?
     <t hangText="Only one congested link:">As per the definition above, only one bottleneck can exist between one sender and receiver. However, in the context of this document, the point of defining a bottleneck is to define a point of congestion, i.e. a link where a queue grows and flows begin to influence each other. Due to cross traffic, there can be several such congestion points between a sender and receiver. For simplicity, this fact is ignored here.</t> -->
     <t hangText="Shared bottlenecks do not change quickly:">
    <vspace />
     As per the definition above, a bottleneck depends on cross traffic, and since such traffic can heavily fluctuate, bottlenecks can change at a high frequency (e.g., there can be oscillation between two or more links). This means that, when flows are partially routed along different paths, they may quickly change between sharing and not sharing a bottleneck. For simplicity, here it is assumed that a shared bottleneck is valid for a time interval that is significantly longer than the interval at which congestion controllers operate. Note that, for the only SBD mechanism defined in this document (multiplexing on the same five-tuple), the notion of a shared bottleneck stays correct even in the presence of fast traffic fluctuations: since all flows that are assumed to share a bottleneck are routed in the same way, if the bottleneck changes, it will still be shared.</t>
      </list></t>
  </section>

    <section title="Architectural overview" anchor='sec-arch'>
      <t>Figure 1 shows the elements of the architecture for coupled congestion control: the Flow State Exchange (FSE), Shared Bottleneck Detection (SBD) and Flows. The FSE is a storage element that can be implemented in two ways: active and passive. In the active version, it initiates communication with flows and SBD. However, in the passive version, it does not actively initiate communication with flows and SBD; its only active role is internal state maintenance (e.g., an implementation could use soft state to remove a flow's data after long periods of inactivity). Every time a flow's congestion control mechanism would normally update its sending rate, the flow instead updates information in the FSE and performs a query on the FSE, leading to a sending rate that can be different from what the congestion controller originally determined. Using information about/from the currently active flows, SBD updates the FSE with the correct Flow State Identifiers (FSIs).
      </t>
	<figure align="center">
		<!--<preamble>Preamble</preamble>-->
		<artwork align="center">
		  <![CDATA[

-------  <---  Flow 1
| FSE |  <---  Flow 2 ..
-------  <---  .. Flow N
   ^
   |             |
-------          |
| SBD |  <-------|
-------
]]>
		</artwork>
		<postamble>Figure 1: Coupled congestion control architecture</postamble>
	</figure>
<t>Since everything shown in Figure 1 is assumed to operate on a single host (the sender) only, this document only describes aspects that have an influence on the resulting on-the-wire behavior. It does, for instance, not define how many bits must be used to represent FSIs, or in which way the entities communicate. Implementations can take various forms: for instance, all the elements in the figure could be implemented within a single application, thereby operating on flows generated by that application only. Another alternative could be to implement both the FSE and SBD together in a separate process which different applications communicate with via some form of Inter-Process Communication (IPC). Such an implementation would extend the scope to flows generated by multiple applications. The FSE and SBD could also be included in the Operating System kernel.</t>
    </section>

    <section title="Roles" anchor='roles'>
      <t>This section gives an overview of the roles of the elements of coupled congestion control, and provides an example of how coupled congestion control can operate.</t>
      <section title="SBD">
	<t>SBD uses knowledge about the flows to determine which flows belong in the same Flow Group (FG), and assigns FGIs accordingly.
	This knowledge can be derived in three basic ways:

    <list style="numbers">
        <t>From multiplexing: it can be based on the simple assumption that packets sharing the same five-tuple (IP source
        and destination address, protocol, and transport layer port number pair) and having the same
        Differentiated Services Code Point (DSCP) in the IP header are typically treated in the same way along the path.
        The latter method is the only one specified in this document: SBD MAY consider all flows that use the same
        five-tuple and DSCP to belong to the same FG. This classification applies to certain tunnels, or RTP flows
        that are multiplexed over one transport (cf. <xref target="transport-multiplex"/>). In one way or another,
        such multiplexing will probably be recommended for use with rtcweb <xref target="rtcweb-rtp-usage"/>.</t>
        <t>Via configuration: e.g. by assuming that a common wireless uplink is also a shared bottleneck.</t>
        <t>From measurements: e.g. by considering correlations among measured delay and loss as an indication of a shared bottleneck.</t>
    </list>
    </t>
    <t>The methods above have some essential trade-offs: e.g., multiplexing is a completely reliable measure, however it
    is limited in scope to two end points (i.e., it cannot be applied to couple congestion controllers of one sender
    talking to multiple receivers). A measurement-based SBD mechanism is described in <xref target="sbd"/>. Measurements can never be
    100% reliable, in particular because they are based on the past but applying coupled congestion control means to
    make an assumption about the future; it is therefore recommended to implement cautionary measures, e.g. by
    disabling coupled congestion control if enabling it causes a significant increase in delay and/or packet loss.
    Measurements also take time, which entails a certain delay for turning on coupling (refer to <xref target="sbd"/> for details).</t>
    
      </section>
      <section title="FSE" anchor="fse-variables">
	<t>The FSE contains a list of all flows that have registered with it. For each flow, it stores the following:
	<list style="symbols">
	  <t>a unique flow number to identify the flow</t>
	  <t>the FGI of the FG that it belongs to (based on the definitions in this document, a flow has only one bottleneck, and can therefore be in only one FG)</t>
	  <t>a priority P, which here is assumed to be represented as a floating point number in the range from 0.1 (unimportant) to 1 (very important). A negative value is used to indicate that a flow has terminated</t>
	  <t>The rate used by the flow in bits per second, FSE_R. </t>

     <!-- <t> A flag G is used to describe whether the flow is greedy or not. A value 1 is used to represent the greedy flows and 0 to represent the non-greedy flows. NOTE TO SELF: don't use the word "greedy" in this draft</t> -->
	</list>
   </t>
    <t>The FSE can operate on window-based as well as rate-based congestion controllers (TEMPORARY NOTE: and probably -- not yet tested --
    combinations thereof, with calculations to convert from one to the other). In case of a
    window-based controller, FSE_R is a window, and all the text below should be considered to
    refer to window, not rates.</t>
    
    <t>In the FSE, each FG contains one static variable S_CR which is meant to be the sum of the calculated rates of all flows in the same FG (including the flow itself). This value is used to calculate the sending rate. </t>

	<t>The information listed here is enough to implement the sample flow algorithm given below. FSE implementations could easily be extended to store, e.g., a flow's current sending rate for statistics gathering or future potential optimizations.</t>
      </section>
      <section title="Flows" anchor='flows'>
	<t>Flows register themselves with SBD and FSE when they start, deregister from the FSE when they stop, and carry out an UPDATE function call every time their congestion controller calculates a new sending rate. Via UPDATE, they provide the newly calculated rate and optionally (if the algorithm supports it) the desired rate. The desired rate is less than the calculated rate in case of application-limited flows; otherwise, it is the same as the calculated rate.</t>
          
<t>Below, two example algorithms are described. While other algorithms could be used instead, the same algorithm must be applied to all flows.</t>
          <!--Text from a previous version, only applies to the passive variant:
           The way the algorithm is described here, the operations are carried out by the flows, but they are the same for all flows. This means that the algorithm could, for example, be implemented in a library that provides registration, deregistration functions and the UPDATE function. To minimize the number of changes to existing applications, one could, however, also embed this functionality in the FSE element.</t> -->

 <section title="Example algorithm 1 - Active FSE" anchor='example-alg-act'>
  <t>This algorithm was designed to be the simplest possible method to assign rates according to the priorities of flows. Simulations results in <xref target="fse"></xref> indicate that it does however not significantly reduce queuing delay and packet loss.</t>
  <t><list style="format (%d)">
    <t>When a flow f starts, it registers itself with SBD and the FSE. FSE_R is initialized with the congestion controller's initial rate. SBD will assign the correct FGI. When a flow is assigned an FGI, it adds its FSE_R to S_CR.</t>
    <t>When a flow f stops, its entry is removed from the list.</t>  
      <t>Every time the congestion controller of the flow f determines a new sending rate CC_R, the flow calls UPDATE, which carries out the tasks listed below to derive the new sending rates for all the flows in the FG. A flow's UPDATE function uses a local (i.e. per-flow) temporary variable S_P, which is the sum of all the priorities.
    <list style="format (%c)">  

    <t> It updates S_CR.
        <figure align="left">
            <artwork align="left">
              <![CDATA[
            S_CR = S_CR + CC_R - FSE_R(f)]]>
            </artwork>
        </figure>
    </t> 

    <t> It calculates the sum of all the priorities, S_P.
        <figure align="left">
            <artwork align="left">
              <![CDATA[
            S_P = 0
            for all flows i in FG do
                S_P = S_P + P(i)
            end for]]>
            </artwork>
        </figure>

    </t>         


    <t> It calculates the sending rates for all the flows in an FG and distributes them.
        <figure align="left">
            <artwork align="left">
              <![CDATA[
            for all flows i in FG do
                FSE_R(i) = (P(i)*S_CR)/S_P
                send FSE_R(i) to the flow i
            end for]]>
            </artwork>
        </figure>

    </t> 


    </list></t>

  </list></t>


 </section>


 <section title="Example algorithm 2 - Conservative Active FSE" anchor='example-alg-act-cons'>
     <t>This algorithm extends algorithm 1 to conservatively emulate the behavior of a single flow by proportionally reducing the aggregate rate on congestion. Simulations results in <xref target="fse"></xref> indicate that it can significantly reduce queuing delay and packet loss. <!--It misses some features that we would like to incorporate in future versions of this document (e.g. letting bulk transfers immediately use the bandwidth that is not used by application-limited flows); if these features make the algorithm significantly more complex, this will be included as a third variant of the algorithm.--></t>
  <t><list style="format (%d)">
    <t>When a flow f starts, it registers itself with SBD and the FSE. FSE_R is initialized with the congestion controller's initial rate. SBD will assign the correct FGI. When a flow is assigned an FGI, it adds its FSE_R to S_CR.</t>
    <t>When a flow f stops, its entry is removed from the list.</t>  
      <t>Every time the congestion controller of the flow f determines a new sending rate CC_R, the flow calls UPDATE, which carries out the tasks listed below to derive the new sending rates for all the flows in the FG. A flow's UPDATE function uses a local (i.e. per-flow) temporary variable S_P, which is the sum of all the priorities, and a local variable DELTA, which is used to calculate the difference between CC_R and the previously stored FSE_R. To prevent flows from either ignoring congestion or overreacting, a timer keeps them from changing their rates immediately after the common rate reduction that follows a congestion event. This timer is set to 2 RTTs of the flow that experienced congestion because it is assumed that a congestion event can persist for up to one RTT of that flow, with another RTT added to compensate for fluctuations in the measured RTT value.
    <list style="format (%c)">  

 
    <t> It updates S_CR based on DELTA.
        <figure align="left">
            <artwork align="left">
              <![CDATA[
            if Timer has expired or not set then 
              DELTA = CC_R - FSE_R(f)
              if DELTA < 0 then  // Reduce S_CR proportionally 
                S_CR = S_CR * CC_R / FSE_R(f)
                Set Timer for 2 RTTs
              else    
                S_CR = S_CR + DELTA
              end if
             end if ]]>
            </artwork>
        </figure>
    </t> 

    <t> It calculates the sum of all the priorities, S_P.
        <figure align="left">
            <artwork align="left">
              <![CDATA[
            S_P = 0
            for all flows i in FG do
                S_P = S_P + P(i)
            end for]]>
            </artwork>
        </figure>

    </t>         


    <t> It calculates the sending rates for all the flows in an FG and distributes them.
        <figure align="left">
            <artwork align="left">
              <![CDATA[
            for all flows i in FG do
                FSE_R(i) = (P(i)*S_CR)/S_P
                send FSE_R(i) to the flow i
            end for]]>
            </artwork>
        </figure>

    </t> 


    </list></t>

  </list></t>

 </section>




  </section>
 
    </section>
    
    <section anchor="Application" title="Application">

     <t>This section specifies how the FSE can be applied to specific congestion control mechanisms and makes general recommendations that facilitate applying the FSE to future congestion controls.</t>

    <section anchor="app-NADA" title="NADA">
     <t>Network-Assisted Dynamic Adapation (NADA) <xref target="nada"></xref> is a congestion control scheme for rtcweb. It calculates a reference rate R_n upon receiving an acknowledgment, and then, based on the reference rate, it calculates a video target rate R_v and a sending rate for the flows, R_s.</t>
     
     <t>When applying the FSE to NADA, the UPDATE function call described in <xref target="flows"></xref> gives the FSE NADA's reference rate R_n. The recommended algorithm for NADA is the Active FSE in <xref target="example-alg-act"></xref>. In step 3 (c), when the FSE_R(i) is "sent" to the flow i, this means updating R_v and R_s of flow i with the value of FSE_R(i).</t>

     <t>NADA simulation results are available from
     http://heim.ifi.uio.no/safiquli/coupled-cc/. The next version of this document will refer to a technical report that will be made available at the same URL.</t>
    </section>

    <section anchor="app-general" title="General recommendations">
    <t>This section will provides general advice for applying the FSE to congestion control mechanisms. TEMPORARY NOTE: Future versions of this document will contain a longer list.</t>
          <t><list style="hanging" hangIndent="6">
	<t hangText="Receiver-side calculations:">
	    <vspace />
When receiver-side calculations make assumptions about the rate of the sender, the calculations need to be synchronized or the receiver needs to be updated accordingly. This applies to TFRC <xref target="RFC5348"/>, for example, where simulations showed somewhat less favorable results when using the FSE without a receiver-side change <xref target="fse" />.</t>
      </list></t>
          
    </section>

    </section>

    <section anchor="Acknowledgements" title="Acknowledgements">
       <t>This document has benefitted from discussions with and feedback from David Hayes, Mirja Kuehlewind, Andreas Petlund, David Ros (who also gave the FSE its name), Zaheduzzaman Sarker and Varun Singh. The authors would like to thank Xiaoqing Zhu for helping with NADA.</t>
<t>This work was partially funded by the European Community under its Seventh Framework Programme through the Reducing Internet Transport Latency (RITE) project (ICT-317700).</t>
    </section>


    <!-- Possibly a 'Contributors' section ... -->

    <section anchor="IANA" title="IANA Considerations">
      <t>This memo includes no request to IANA.</t>
    </section>

    <section anchor="Security" title="Security Considerations">
      <t>In scenarios where the architecture described in this document is applied across applications, various cheating possibilities arise: e.g., supporting wrong values for the calculated rate, the desired rate, or the priority of a flow. In the worst case, such cheating could either prevent other flows from sending or make them send at a rate that is unreasonably large. The end result would be unfair behavior at the network bottleneck, akin to what could be achieved with any UDP based application. Hence, since this is no worse than UDP in general, there seems to be no significant harm in using this in the absence of UDP rate limiters.</t>

<t>In the case of a single-user system, it should also be in the interest of any application programmer to give the user the best possible experience by using reasonable flow priorities or even letting the user choose them. In a multi-user system, this interest may not be given, and one could imagine the worst case of an "arms race" situation, where applications end up setting their priorities to the maximum value. If all applications do this, the end result is a fair allocation in which the priority mechanism is implicitly eliminated, and no major harm is done.</t>
    </section>
  </middle>

  <!--  *****BACK MATTER ***** -->

  <back>
    <!-- References split into informative and normative -->

    <!-- There are 2 ways to insert reference entries from the citation libraries:
     1. define an ENTITY at the top, and use "ampersand character"RFC2629; here (as shown)
     2. simply use a PI "less than character"?rfc include="reference.RFC.2119.xml"?> here
        (for I-Ds: include="reference.I-D.narten-iana-considerations-rfc2434bis.xml")

     Both are cited textually in the same manner: by using xref elements.
     If you use the PI option, xml2rfc will, by default, try to find included files in the same
     directory as the including file. You can also define the XML_LIBRARY environment variable
     with a value containing a set of directories to search.  These can be either in the local
     filing system or remote ones accessed by http (http://domain/dir/... ).-->

    <references title="Normative References">
      <!--?rfc include="http://xml.resource.org/public/rfc/bibxml/reference.RFC.2119.xml"?-->
      &RFC2119;
      &RFC3124;
      &RFC5348;
    </references>

    <references title="Informative References">
	  <reference anchor="rtcweb-usecases" target="">
		  <front>
	  		<title>Web Real-Time Communication Use-cases and Requirements</title>
			<author initials="C." surname="Holmberg" fullname="C. Holmberg"></author>
			<author initials="S." surname="Hakansson" fullname="S. Hakansson"></author>
			<author initials="G." surname="Eriksson" fullname="G. Eriksson"></author>
			<date month="February" year="2014"/>
		</front>
			<seriesInfo name="Internet-draft" value="draft-ietf-rtcweb-use-cases-and-requirements-14.txt"/>
	</reference>

	  <reference anchor="transport-multiplex" target="">
		  <front>
	  		<title>Multiple RTP Sessions on a Single Lower-Layer Transport</title>
			<author initials="M." surname="Westerlund" fullname="M. Westerlund"></author>
			<author initials="C." surname="Perkins" fullname="C. Perkins"></author>
			<date month="October" year="2013"/>
		</front>
			<seriesInfo name="Internet-draft" value="draft-westerlund-avtcore-transport-multiplexing-07.txt"/>
	</reference>

	  <reference anchor="rtcweb-rtp-usage" target="">
		  <front>
	  		<title>Web Real-Time Communication (WebRTC): Media Transport and Use of RTP</title>
			<author initials="C." surname="Perkins" fullname="C. Perkins"></author>
			<author initials="M." surname="Westerlund" fullname="M. Westerlund"></author>
			<author initials="J." surname="Ott" fullname="J. Ott"></author>
			<date month="October" year="2014"/>
		</front>
			<seriesInfo name="Internet-draft" value="draft-ietf-rtcweb-rtp-usage-18.txt"/>
	</reference>

    <reference anchor="fse">
      <front>
        <title>Coupled Congestion Control for RTP Media</title>
      <author initials="S.I." surname="Islam" fullname="S. Islam"> </author>
      <author initials="M.W." surname="Welzl" fullname="M. Welzl" > </author>
      <author initials="S.G." surname="Gjessing" fullname="S Gjessing" > </author>
      <author initials="N.K." surname="Khademi" fullname="N Khademi" > </author>
      <date year="2014" />
    </front>
    <seriesInfo name="ACM SIGCOMM Capacity Sharing Workshop (CSWS 2014); extended version available as a technical report from http://safiquli.at.ifi.uio.no/paper/fse-tech-report.pdf" value="" />
    </reference>


	  <reference anchor="sbd" target="">
		  <front>
	  		<title>Shared Bottleneck Detection for Coupled Congestion Control for RTP Media</title>
			<author initials="D." surname="Hayes" fullname="D. Hayes"></author>
			<author initials="S." surname="Ferlin" fullname="S. Ferlin"></author>
			<author initials="M." surname="Welzl" fullname="M. Welzl"></author>
			<date month="May" year="2015"/>
		</front>
			<seriesInfo name="Internet-draft" value="draft-ietf-rmcat-sbd-00.txt"/>
	</reference>

      <reference anchor="nada" target="">
      <front>
        <title>NADA: A Unified Congestion Control Scheme for Real-Time Media</title>
      <author initials="X." surname="Zhu" fullname="X. Zhu"></author>
      <author initials="R." surname="Pan" fullname="R. Pan"></author>
      <author initials="M. A." surname="Ramalho" fullname="M.A. Ramalho"></author>
      <author initials="S." surname="Mena" fullname="S. Mena"></author>
      <author initials="C." surname="Ganzhorn" fullname="C. Ganzhorn"></author>
      <author initials="P. E." surname="Jones" fullname="P. E. Jones"></author>
      <author initials="S." surname="De Aronco" fullname="S. De Aronco"></author>
      <date month="April" year="2015"/>
    </front>
      <seriesInfo name="Internet-draft" value="draft-ietf-rmcat-nada-00"/>
  </reference>
	
    </references>


    <section title="Scheduling" anchor='scheduling'>

    <t> When connections originate from the same host, it would be possible to use only one single sender-side congestion controller which determines the overall allowed sending rate, and then use a local scheduler to assign a proportion of this rate to each RTP session. This way, priorities could also be implemented as a function of the scheduler. The Congestion Manager (CM) <xref target="RFC3124"/> also uses such a scheduling function.</t>        

     </section> 

    <section title="Example algorithm - Passive FSE" anchor='example-alg-pas'>

    

  <t>Active algorithms calculate the rates for all the flows in the FG and actively distribute them. In a passive algorithm, UPDATE returns a rate that should be used instead of the rate that the congestion controller has determined. This can make a passive algorithm easier to implement; however, when round-trip times of flows are unequal,
shorter-RTT flows will update and react to the overall FSE state more often than longer-RTT flows, which can produce unwanted side effects. This problem is more significant when the congestion control convergence depends on the RTT. While the passive algorithm works better for congestion controls with RTT-independent convergence, it can still produce oscillations on short time scales. The algorithm described below is therefore considered as highly experimental.</t>
  
  <t>This passive version of the FSE stores the following information in addition to the variables described in <xref target="fse-variables"></xref>: 

   <list style="symbols">

      <t>The desired rate DR. This can be smaller than the calculated rate if the application feeding into the flow has less data to send than the congestion controller would allow. In case of a bulk transfer, DR must be set to CC_R received from the flow's congestion module.</t>
    </list>  
<!--    <t>A continuously growing flow number per FGI. The first flow to register itself with the FSE is assigned number 1, the second flow is assigned number 2, etc.</t> -->
  </t>
  
  <t>The passive version of the FSE contains one static variable per FG called TLO (Total Leftover Rate -- used to let a flow 'take' bandwidth from application-limited or terminated flows) which is initialized to 0. For the passive version, S_CR is limited to increase or decrease as conservatively as a flow's congestion controller decides in order to prohibit sudden rate jumps.<!--At most, it can be the sum of these calculated rates, as seen by the flow during its last rate update.--></t>


  <t><list style="format (%d)">
    <t>When a flow f starts, it registers itself with SBD and the FSE. FSE_R and DR are initialized with the congestion controller's initial rate. SBD will assign the correct FGI. When a flow is assigned an FGI, it adds its FSE_R to S_CR.</t>
    <t>When a flow f stops, it sets its DR to 0 and sets P to -1.</t>  
    <t>Every time the congestion controller of the flow f determines a new sending rate CC_R, assuming the flow's new desired rate new_DR to be "infinity" in case of a bulk data transfer with an unknown maximum rate, the flow calls UPDATE, which carries out the tasks listed below to derive the flow's new sending rate, Rate. A flow's UPDATE function uses a few local (i.e. per-flow) temporary variables, which are all initialized to 0: DELTA, new_S_CR and S_P.
    <list style="format (%c)">
          <t>For all the flows in its FG (including itself), it calculates the sum of all the calculated rates, new_S_CR. Then it calculates the difference between FSE_R(f) and CC_R, DELTA.
              <figure align="left">
                  <artwork align="left">
                      <![CDATA[
            for all flows i in FG do
                new_S_CR = new_S_CR + FSE_R(i)
            end for
            DELTA =  CC_R - FSE_R(f)]]>
                  </artwork>
              </figure>
        </t>
          
        <t>It updates S_CR, FSE_R(f) and DR(f).
              <figure align="left">
                  <artwork align="left">
                      <![CDATA[
            FSE_R(f) = CC_R
            if DELTA > 0 then  // the flow's rate has increased
                S_CR = S_CR + DELTA
            else if DELTA < 0 then
                S_CR = new_S_CR + DELTA
            end if 
            DR(f) = min(new_DR,FSE_R(f))]]>
                  </artwork>
              </figure>
        </t>
          
        <t>It calculates the leftover rate TLO, removes the terminated flows from the FSE and calculates the sum of all the priorities, S_P.
              <figure align="left">
                  <artwork align="left">
                      <![CDATA[
            for all flows i in FG do
               if P(i)<0 then
                  delete flow
               else
                  S_P = S_P + P(i)
               end if
            end for
            if DR(f) < FSE_R(f) then
               TLO = TLO + (P(f)/S_P) * S_CR - DR(f))
            end if]]>
                  </artwork>
              </figure>
        </t>
          
        <t>It calculates the sending rate, Rate.
              <figure align="left">
                  <artwork align="left">
                      <![CDATA[
            Rate = min(new_DR, (P(f)*S_CR)/S_P + TLO)
                          
            if Rate != new_DR and TLO > 0 then
                TLO = 0  // f has 'taken' TLO
            end if]]>
                  </artwork>
              </figure>
        </t>
          
        <t>It updates DR(f) and FSE_R(f) with Rate.
            <figure align="left">
                <artwork align="left">
                    <![CDATA[
            if Rate > DR(f) then
                DR(f) = Rate
            end if
            FSE_R(f)  = Rate]]>
                </artwork>
            </figure>
        </t>
          
    </list></t>

  </list></t>
        <t>The goals of the flow algorithm are to achieve prioritization, improve network utilization in the face of application-limited flows, and impose limits on the increase behavior such that the negative impact of multiple flows trying to increase their rate together is minimized. It does that by assigning a flow a sending rate that may not be what the flow's congestion controller expected. It therefore builds on the assumption that no significant inefficiencies arise from temporary application-limited behavior or from quickly jumping to a rate that is higher than the congestion controller intended. How problematic these issues really are depends on the controllers in use and requires careful per-controller experimentation. The coupled congestion control mechanism described here also does not require all controllers to be equal; effects of heterogeneous controllers, or homogeneous controllers being in different states, are also subject to experimentation.</t>
     
            <t>This algorithm gives all the leftover rate of application-limited flows to the first
            flow that updates its sending rate, provided that this flow needs it all (otherwise, its own leftover rate can be taken by the next flow   that updates its rate).  Other policies could be applied, e.g. to divide the leftover rate of a flow
            equally among all other flows in the FGI.</t>

    <section anchor="example-op" title="Example operation (passive)">
       <t>In order to illustrate the operation of the passive coupled congestion control algorithm, this section presents a toy example of two flows that use it. Let us assume that both flows traverse a common 10 Mbit/s bottleneck and use a simplistic congestion controller that starts out with 1 Mbit/s, increases its rate by 1 Mbit/s in the absence of congestion and decreases it by 2 Mbit/s in the presence of congestion. For simplicity, flows are assumed to always operate in a round-robin fashion. Rate numbers below without units are assumed to be in Mbit/s. For illustration purposes, the actual sending rate is also shown for every flow in FSE diagrams even though it is not really stored in the FSE.</t>

<t>Flow #1 begins. It is a bulk data transfer and considers itself to have top priority.  This is the FSE after the flow algorithm's step 1:</t>
  <figure align="left">
        <artwork align="left">
      <![CDATA[
----------------------------------------
| # | FGI |  P  | FSE_R  |  DR  | Rate |
|   |     |     |        |      |      |
| 1 |  1  |  1  |   1    |   1  |   1  |
----------------------------------------
S_CR = 1, TLO = 0
              
]]>
    </artwork>
  </figure>
<t>Its congestion controller gradually increases its rate. Eventually, at some point, the FSE should look like this:</t>
  <figure align="left">
    <artwork align="left">
      <![CDATA[
--------------------------------------
| # | FGI |  P  |  FSE_R  |  DR  | Rate |
|   |     |     |         |      |      |
| 1 |  1  |  1  |   10    |  10  |  10  |
-----------------------------------------
S_CR = 10, TLO = 0

]]>
    </artwork>
  </figure>
<t>Now another flow joins. It is also a bulk data transfer, and has a lower priority (0.5):</t>
  <figure align="left">
    <artwork align="left">
      <![CDATA[
----------------------------------------
| # | FGI |   P   | FSE_R  |  DR  | Rate |
|   |     |       |        |      |      |
| 1 |  1  |   1   |   10   |  10  |  10  |
| 2 |  1  |  0.5  |    1   |   1  |   1  |
------------------------------------------
S_CR = 11, TLO = 0

]]>
    </artwork>
  </figure>
<t>Now assume that the first flow updates its rate to 8, because the total sending rate of 11 exceeds the total capacity.
Let us take a closer look at what happens in step 3 of the flow algorithm.</t>
  <figure align="left">
    <artwork align="left">
      <![CDATA[
CC_R = 8. new_DR = infinity.
3 a) new_S_CR = 11; DELTA = 8 - 10 = -2.
3 b) FSE_Rf) = 8. DELTA is negative, hence S_CR = 9;
     DR(f) = 8.
3 c) S_P = 1.5.
3 d) new sending rate = min(infinity, 1/1.5 * 9 + 0) = 6.
3 e) FSE_R(f) = 6.

The resulting FSE looks as follows:
----------------------------------------
| # | FGI |   P   |  FSE_R  |  DR  | Rate |
|   |     |       |         |      |      |
| 1 |  1  |   1   |    6    |   8  |   6  |
| 2 |  1  |  0.5  |    1    |   1  |   1  |
-------------------------------------------
S_CR = 9, TLO = 0

]]>
    </artwork>
  </figure>
<t>The effect is that flow #1 is sending with 6 Mbit/s instead of the 8 Mbit/s that the congestion controller derived. Let us now assume that flow #2 updates its rate. Its congestion controller detects that the network is not fully saturated (the actual total sending rate is 6+1=7) and increases its rate.</t>
  <figure align="left">
    <artwork align="left">
      <![CDATA[
CC_R=2. new_DR = infinity.
3 a) new_S_CR = 7; DELTA = 2 - 1 = 1.
3 b) FSE_R(f) = 2. DELTA is positive, hence S_CR = 9 + 1 = 10;
     DR(f) = 2.
3 c) S_P = 1.5.
3 d) new sending rate = min(infinity, 0.5/1.5 * 10 + 0) = 3.33.
3 e) DR(f) = FSE_R(f) = 3.33.

The resulting FSE looks as follows:
-------------------------------------------
| # | FGI |   P   |  FSE_R  |  DR  | Rate |
|   |     |       |         |      |      |
| 1 |  1  |   1   |    6    |   8  |   6  |
| 2 |  1  |  0.5  |   3.33  | 3.33 | 3.33 |
-------------------------------------------
S_CR = 10, TLO = 0

]]>
    </artwork>
  </figure>
        <t>The effect is that flow #2 is now sending with 3.33 Mbit/s, which is close to half of the rate of flow #1 and leads to a total utilization of 6(#1) + 3.33(#2) = 9.33 Mbit/s. Flow #2's congestion controller has increased its rate faster than the controller actually expected. Now, flow #1 updates its rate. Its congestion controller detects that the network is not fully saturated and increases its rate. Additionally, the application feeding into flow #1 limits the flow's sending rate to at most 2 Mbit/s.</t>
  <figure align="left">
    <artwork align="left">
      <![CDATA[
CC_R=7. new_DR=2.
3 a) new_S_CR = 9.33; DELTA = 1.
3 b) FSE_R(f) = 7, DELTA is positive, hence S_CR = 10 + 1 = 11;
     DR = min(2, 7) = 2.
3 c) S_P = 1.5; DR(f) < FSE_R(f), hence TLO = 1/1.5 * 11 - 2 = 5.33.
3 d) new sending rate = min(2, 1/1.5 * 11 + 5.33) = 2.
3 e) FSE_R(f) = 2.

The resulting FSE looks as follows:
-------------------------------------------
| # | FGI |   P   |  FSE_R  |  DR  | Rate |
|   |     |       |         |      |      |
| 1 |  1  |   1   |    2    |   2  |   2  |
| 2 |  1  |  0.5  |   3.33  | 3.33 | 3.33 |
-------------------------------------------
S_CR = 11, TLO = 5.33

              
]]>
    </artwork>
  </figure>
<t>Now, the total rate of the two flows is 2 + 3.33 = 5.33 Mbit/s, i.e. the network is significantly underutilized due to the limitation of flow #1. Flow #2 updates its rate. Its congestion controller detects that the network is not fully saturated and increases its rate.</t>
  <figure align="left">
    <artwork align="left">
      <![CDATA[
CC_R=4.33. new_DR = infinity.
3 a) new_S_CR = 5.33; DELTA = 1.
3 b) FSE_R(f) = 4.33. DELTA is positive, hence S_CR = 12;
     DR(f) = 4.33.
3 c) S_P = 1.5.
3 d) new sending rate: min(infinity, 0.5/1.5 * 12 + 5.33 ) = 9.33.
3 e) FSE_R(f) = 9.33, DR(f) = 9.33.

The resulting FSE looks as follows:
-------------------------------------------
| # | FGI |   P   |  FSE_R  |  DR  | Rate |
|   |     |       |         |      |      |
| 1 |  1  |   1   |    2    |   2  |   2  |
| 2 |  1  |  0.5  |   9.33  | 9.33 | 9.33 |
-------------------------------------------
S_CR = 12, TLO = 0

]]>
    </artwork>
  </figure>
<t>Now, the total rate of the two flows is 2 + 9.33 = 11.33 Mbit/s. Finally, flow #1 terminates. It sets P to -1 and DR to 0. Let us assume that it terminated late enough for flow #2 to still experience the network in a congested state, i.e. flow #2 decreases its rate in the next iteration.</t>

    <figure align="left">
    <artwork align="left">
      <![CDATA[
CC_R = 7.33. new_DR = infinity.
3 a) new_S_CR = 11.33; DELTA = -2.
3 b) FSE_R(f) = 7.33. DELTA is negative, hence S_CR = 9.33;
     DR(f) = 7.33.
3 c) Flow 1 has P = -1, hence it is deleted from the FSE.
     S_P = 0.5.
3 d) new sending rate: min(infinity, 0.5/0.5*9.33 + 0) = 9.33.
3 e) FSE_R(f) = DR(f) = 9.33.

The resulting FSE looks as follows:
-------------------------------------------
| # | FGI |   P   |  FSE_R  |  DR  | Rate |
|   |     |       |         |      |      |
| 2 |  1  |  0.5  |   9.33  | 9.33 | 9.33 |
-------------------------------------------
S_CR = 9.33, TLO = 0

]]>
        </artwork>
    </figure>
        
    </section>
 </section>



<!--
    
 <section title="Change log">
    <section anchor="-00-01" title="Changes from -00 to -01">
      <t>
      <list style="symbols">
        <t> Added change log. </t>
        <t> Updated the example algorithm and its operation.</t>
      </list>
    </t>

    </section>
      <section anchor="-01-02" title="Changes from -01 to -02">
          <t>
          <list style="symbols">
              <t>Included an active version of the algorithm which is simpler.</t>
              <t>Replaced "greedy flow" with "bulk data transfer" and "non-greedy" with "application-limited".</t>
              <t>Updated new_CR to CC_R, and CR to FSE_R for better understanding.  </t>
          </list>
          </t>
      </section>
      <section anchor="-02-03" title="Changes from -02 to -03">
          <t>
          <list style="symbols">
              <t>Included an active conservative version of the algorithm which reduces queue growth and packet loss; added a reference to a technical report that shows these benefits with simulations.</t>
              <t>Moved the passive variant of the algorithm to appendix.</t>
          </list>
          </t>
      </section>
      <section anchor="-03-04" title="Changes from -03 to -04">
          <t>
          <list style="symbols">
              <t>Extended SBD section.</t>
              <t>Added a note about window-based controllers.</t>
          </list>
          </t>
      </section>

      <section anchor="-04-05" title="Changes from -04 to -05">
          <t>
          <list style="symbols">
              <t>Added a section about applying the FSE to specific congestion control algorithms, with a subsection specifying its use with NADA.</t>
          </list>
          </t>
      </section>

  </section>    -->

      
      <!-- <section anchor="-00-01" title="Changes from -00 to -01">
       <t>Updated the example algorithm and its operation to let flows fairly take the leftover rate from other non-greedy and/or terminated flows.</t>
       </section> -->

    <!-- Change Log
v00 2006-03-15  EBD   Initial version

v01 2006-04-03  EBD   Moved PI location back to position 1 -
                      v3.1 of XMLmind is better with them at this location.
v02 2007-03-07  AH    removed extraneous nested_list attribute,
                      other minor corrections
v03 2007-03-09  EBD   Added comments on null IANA sections and fixed heading capitalization.
                      Modified comments around figure to reflect non-implementation of
                      figure indent control.  Put in reference using anchor="DOMINATION".
                      Fixed up the date specification comments to reflect current truth.
v04 2007-03-09 AH     Major changes: shortened discussion of PIs,
                      added discussion of rfc include.
v05 2007-03-10 EBD    Added preamble to C program example to tell about ABNF and alternative 
                      images. Removed meta-characters from comments (causes problems).  -->
  </back>
</rfc>

PAFTECH AB 2003-20262026-04-23 03:13:55