<?xml version="1.0" encoding="utf-8"?>
<!-- 
     draft-rfcxml-general-template-standard-00
  
     This template includes examples of the most commonly used features of RFCXML with comments 
     explaining how to customise them. This template can be quickly turned into an I-D by editing 
     the examples provided. Look for [REPLACE], [REPLACE/DELETE], [CHECK] and edit accordingly.
     Note - 'DELETE' means delete the element or attribute, not just the contents.
     
     Documentation is at https://authors.ietf.org/en/templates-and-schemas
-->
<?xml-model href="rfc7991bis.rnc"?>  <!-- Required for schema validation and schema-aware editing -->
<!-- <?xml-stylesheet type="text/xsl" href="rfc2629.xslt" ?> -->
<!-- This third-party XSLT can be enabled for direct transformations in XML processors, including most browsers -->


<!DOCTYPE rfc [
  <!ENTITY nbsp    "&#160;">
  <!ENTITY zwsp   "&#8203;">
  <!ENTITY nbhy   "&#8209;">
  <!ENTITY wj     "&#8288;">
]>
<!-- If further character entities are required then they should be added to the DOCTYPE above.
     Use of an external entity file is not recommended. -->

<rfc
  xmlns:xi="http://www.w3.org/2001/XInclude"
  category="info"
  docName="draft-hu-ccamp-uonaco-control-framework-01"
  ipr="trust200902"
  obsoletes=""
  updates=""
  submissionType="IETF"
  xml:lang="en"
  version="3">
<!-- [REPLACE] 
       * docName with name of your draft
     [CHECK] 
       * category should be one of std, bcp, info, exp, historic
       * ipr should be one of trust200902, noModificationTrust200902, noDerivativesTrust200902, pre5378Trust200902
       * updates can be an RFC number as NNNN
       * obsoletes can be an RFC number as NNNN 
-->

  <front>
    <title abbrev="UONACO Control Framework">A Control Framework for Unified Optical Networks and AI Computing Orchestration (UONACO)</title>
    <!--  [REPLACE/DELETE] abbrev. The abbreviated title is required if the full title is longer than 39 characters -->

    <seriesInfo name="Internet-Draft" value="draft-hu-ccamp-uonaco-control-framework-01"/>
   
    <author fullname="Qiaojun Hu" initials="Q" role="editor" surname="Hu">
    <!-- <author fullname="Yanxia Tan" initials="China Unicom" role="editor" surname="Tan"> -->
      <!-- [CHECK]
             * initials should not include an initial for the surname
             * role="editor" is optional -->
    <!-- Can have more than one author -->
      
    <!-- all of the following elements are optional -->
      <organization>Beijing University of Posts and Telecommunications</organization>
      <address>
        <!-- <postal> -->
          <!-- Reorder these if your country does things differently -->
          <!-- <street>Street [REPLACE/DELETE]</street>
          <city>City [REPLACE/DELETE]</city>
          <region>Region [REPLACE/DELETE]</region>
          <code>Postal code [REPLACE/DELETE]</code>
          <country>Country [REPLACE/DELETE]</country> -->
          <!-- Uses two letter country code -->
        <!-- </postal>         -->
        <!-- <phone>Phone [REPLACE/DELETE]</phone> -->
        <email>qiaoj475@bupt.edu.cn</email>  
        <!-- Can have more than one <email> element -->
        <!-- <uri>URI [REPLACE/DELETE]</uri> -->
      </address>
    </author>

    <author fullname="Zheng Han" initials="Z" surname="Han">
      <organization>Beijing University of Posts and Telecommunications</organization>
      <address>
        <email>2025010255@bupt.cn</email>
      </address>
    </author>
    
    <author fullname="Wei Wang" initials="W" surname="Wang">
    <!-- <author fullname="Yanxia Tan" initials="China Unicom" role="editor" surname="Tan"> -->
      <!-- [CHECK]
             * initials should not include an initial for the surname
             * role="editor" is optional -->
    <!-- Can have more than one author -->
      
    <!-- all of the following elements are optional -->
      <organization>Beijing University of Posts and Telecommunications</organization>
      <address>
        <!-- <postal> -->
          <!-- Reorder these if your country does things differently -->
          <!-- <street>Street [REPLACE/DELETE]</street>
          <city>City [REPLACE/DELETE]</city>
          <region>Region [REPLACE/DELETE]</region>
          <code>Postal code [REPLACE/DELETE]</code>
          <country>Country [REPLACE/DELETE]</country> -->
          <!-- Uses two letter country code -->
        <!-- </postal>         -->
        <!-- <phone>Phone [REPLACE/DELETE]</phone> -->
        <email>weiw@bupt.edu.cn</email>  
        <!-- Can have more than one <email> element -->
        <!-- <uri>URI [REPLACE/DELETE]</uri> -->
      </address>
    </author>

    <author fullname="Jie Zhang" initials="J" surname="Zhang">
    <!-- <author fullname="Yanxia Tan" initials="China Unicom" role="editor" surname="Tan"> -->
      <!-- [CHECK]
             * initials should not include an initial for the surname
             * role="editor" is optional -->
    <!-- Can have more than one author -->
      
    <!-- all of the following elements are optional -->
      <organization>Beijing University of Posts and Telecommunications</organization>
      <address>
        <!-- <postal> -->
          <!-- Reorder these if your country does things differently -->
          <!-- <street>Street [REPLACE/DELETE]</street>
          <city>City [REPLACE/DELETE]</city>
          <region>Region [REPLACE/DELETE]</region>
          <code>Postal code [REPLACE/DELETE]</code>
          <country>Country [REPLACE/DELETE]</country> -->
          <!-- Uses two letter country code -->
        <!-- </postal>         -->
        <!-- <phone>Phone [REPLACE/DELETE]</phone> -->
        <email>jie.zhang@bupt.edu.cn</email>  
        <!-- Can have more than one <email> element -->
        <!-- <uri>URI [REPLACE/DELETE]</uri> -->
      </address>
    </author>

    <author fullname="Yongli Zhao" initials="Y" surname="Zhao">
    <!-- <author fullname="Yanxia Tan" initials="China Unicom" role="editor" surname="Tan"> -->
      <!-- [CHECK]
             * initials should not include an initial for the surname
             * role="editor" is optional -->
    <!-- Can have more than one author -->
      
    <!-- all of the following elements are optional -->
      <organization>Beijing University of Posts and Telecommunications</organization>
      <address>
        <!-- <postal> -->
          <!-- Reorder these if your country does things differently -->
          <!-- <street>Street [REPLACE/DELETE]</street>
          <city>City [REPLACE/DELETE]</city>
          <region>Region [REPLACE/DELETE]</region>
          <code>Postal code [REPLACE/DELETE]</code>
          <country>Country [REPLACE/DELETE]</country> -->
          <!-- Uses two letter country code -->
        <!-- </postal>         -->
        <!-- <phone>Phone [REPLACE/DELETE]</phone> -->
        <email>yonglizhao@bupt.edu.cn</email>  
        <!-- Can have more than one <email> element -->
        <!-- <uri>URI [REPLACE/DELETE]</uri> -->
      </address>
    </author>

    <author fullname="Yanxia Tan" initials="Y" role="editor" surname="Tan">
    <!-- <author fullname="Yanxia Tan" initials="China Unicom" role="editor" surname="Tan"> -->
      <!-- [CHECK]
             * initials should not include an initial for the surname
             * role="editor" is optional -->
    <!-- Can have more than one author -->
      
    <!-- all of the following elements are optional -->
      <organization>China Unicom</organization>
      <address>
        <!-- <postal> -->
          <!-- Reorder these if your country does things differently -->
          <!-- <street>Street [REPLACE/DELETE]</street>
          <city>City [REPLACE/DELETE]</city>
          <region>Region [REPLACE/DELETE]</region>
          <code>Postal code [REPLACE/DELETE]</code>
          <country>Country [REPLACE/DELETE]</country> -->
          <!-- Uses two letter country code -->
        <!-- </postal>         -->
        <!-- <phone>Phone [REPLACE/DELETE]</phone> -->
        <email>tanyx11@chinaunicom.cn</email>  
        <!-- Can have more than one <email> element -->
        <!-- <uri>URI [REPLACE/DELETE]</uri> -->
      </address>
    </author>
   
    <author fullname="Yanlei Zheng" initials="Y" surname="Zheng">
      <!-- [CHECK]
             * initials should not include an initial for the surname
             * role="editor" is optional -->
    <!-- Can have more than one author -->
      
    <!-- all of the following elements are optional -->
      <organization>China Unicom</organization>
      <address>
        <!-- <postal> -->
          <!-- Reorder these if your country does things differently -->
          <!-- <street>Street [REPLACE/DELETE]</street>
          <city>City [REPLACE/DELETE]</city>
          <region>Region [REPLACE/DELETE]</region>
          <code>Postal code [REPLACE/DELETE]</code>
          <country>Country [REPLACE/DELETE]</country> -->
          <!-- Uses two letter country code -->
        <!-- </postal>         -->
        <!-- <phone>Phone [REPLACE/DELETE]</phone> -->
        <email>zhengyanlei@chinaunicom.cn</email>  
        <!-- Can have more than one <email> element -->
        <!-- <uri>URI [REPLACE/DELETE]</uri> -->
      </address>
    </author>

    <date year="2026"/>
    <!-- On draft subbmission:
         * If only the current year is specified, the current day and month will be used.
         * If the month and year are both specified and are the current ones, the current day will
           be used
         * If the year is not the current one, it is necessary to specify at least a month and day="1" will be used.
    -->

    <area>General</area>
    <workgroup>ccamp</workgroup>
    <!-- "Internet Engineering Task Force" is fine for individual submissions.  If this element is 
          not present, the default is "Network Working Group", which is used by the RFC Editor as 
          a nod to the history of the RFC Series. -->

    <!-- <keyword>keyword</keyword> -->
    <!-- [REPLACE/DELETE]. Multiple allowed.  Keywords are incorporated into HTML output files for 
         use by search engines. -->

    <abstract>
      <t>This document presents the control framework for Unified Optical Networks and AI Computing Orchestration (UONACO). Specifically, it defines the AI computing service model over wide-area networks, outlines the UONACO control architecture, identifies a set of UONACO components and interfaces, and describes their interactions. </t>
    </abstract>
 
  </front>

  <middle>
    
    <section>
      <name>Introduction</name>
      <t>Distributed AI computing has become a dominant paradigm for delivering large-scale AI services, enabling providers to meet stringent performance and scalability requirements by leveraging geographically dispersed AI data centers (AIDCs). In such environments, the efficiency of distributed training, inference, and remote service access depends critically on tight coordination between optical transport networks and compute orchestration systems.</t>
      <t>However, today's infrastructure operates with fundamentally isolated control planes: the optical transport layer, despite providing the high-bandwidth, low-latency, and deterministic backbone for wide-area AI collaboration, remains blind to the dynamic, heterogeneous demands of AI workloads.  It cannot discern whether a traffic flow stems from a bandwidth-intensive distributed training job requiring synchronized all-reduce operations across thousands of GPUs, or from a latency-critical inference request demanding sub-10ms end-to-end response.  Consequently, optical networks provision static or best-effort lightpaths without adapting to the real-time compute intent, leading to underutilized spectral resources or, worse, congestion-induced stalls during critical gradient synchronization phases.</t>
      <t>Conversely, AI compute schedulers (e.g., Kubernetes-based orchestrators in AIDCs) make placement decisions based solely on local GPU/CPU availability and memory capacity, with no awareness of the underlying optical fabric's state, such as available wavelength continuity, end-to-end propagation delay, per-link bandwidth headroom, or even the presence of OXC-based reconfigurable paths. As a result, a training job may be split across geographically distant AIDCs with abundant but poorly interconnected GPU pools, causing prolonged communication phases and severe “compute efficiency loss.” Similarly, a low-latency inference service might be deployed in a remote AIDC simply because it has idle GPUs, even though the optical path violates the application's SLA due to high round-trip delay or lack of dedicated wavelength isolation.</t>
      <t>To address these challenges, this document introduces the Unified Optical Networks and AI Computing Orchestration (UONACO) framework. UONACO establishes a unified control architecture that enables bidirectional signaling, joint resource modeling, and synchronized orchestration between the compute and optical domains. The framework supports three representative service models: AI training, AI inference, and accessing remote AI inference services. By aligning network provisioning with compute intent—and vice versa—UONACO aims to improve the efficiency of wide-area collaborative AI computing.</t>
      <section>
        <name>Requirements Language</name>
        <t>The key words "MUST", "MUST NOT", "REQUIRED", "SHALL",
          "SHALL NOT", "SHOULD", "SHOULD NOT", "RECOMMENDED", "NOT
          RECOMMENDED", "MAY", and "OPTIONAL" in this document are to be
          interpreted as described in BCP 14 <xref target="RFC2119"/>
          <xref target="RFC8174"/> when, and only when, they appear in
          all capitals, as shown here.</t>
      </section>
      <!-- [CHECK] The 'Requirements Language' section is optional -->

    </section>
    
    <section>
      <name>Service Model for AI Computing over Optical Network</name>
      <t>The deployment of wide-area AI services over optical infrastructure involves multiple stakeholders, each playing a distinct role in the end-to-end service delivery chain. To clarify responsibilities and interactions, this document defines a service model comprising the Customer, Service Provider, Network Provider, and Computing Power Provider.</t>


      <section>
        <name>Customer</name>
        <t>The Customer is the end user or enterprise that consumes AI capabilities. Three primary service patterns are observed:</t>
        <t>•	In AI training, the customer delegates the training of large-scale AI models to service providers, typically specifying performance, scale, and data privacy requirements.</t>
        <t>•	In AI inference, the customer leases computing resources to deploy and operate inference models, often serving downstream internet users with real-time or batch inference services.</t>
        <t>•	In accessing remote AI inference service, the customer invokes pre-deployed inference APIs offered by third parties, expecting deterministic latency, reliability, and quality of service without managing underlying infrastructure.</t>
      </section>

      <section>
        <name>Service Provider</name>
        <t>The Service Provider acts as the business orchestrator, interfacing directly with the Customer to translate high-level service intents—such as SLAs, geographic constraints, or performance targets—into concrete resource demands. It coordinates with both the Network Provider and the Computing Power Provider to fulfill these demands, and is responsible for service lifecycle management, billing, and customer support.</t>
      </section>

      <section>
        <name>Network Provider</name>
        <t>The Network Provider operates and manages the underlying optical transport infrastructure. It delivers high-bandwidth, low-latency, and deterministic connectivity services, including inter-AIDC backbone links and user-to-AIDC dedicated access circuits. The Network Provider exposes network capabilities—such as available bandwidth, path latency, and reliability—through standardized control interfaces to enable coordinated service provisioning.</t>
      </section>

      <section>
        <name>Computing Power Provider</name>
        <t>The Computing Power Provider owns and operates one or more Artificial Intelligence Data Centers (AIDCs). It offers compute, memory, and accelerator resources (e.g., GPUs, TPUs) for AI training and inference workloads. The Computing Power Provider reports real-time resource availability and performance metrics to the Service Provider and supports dynamic task placement and scaling based on orchestration instructions.</t>
      </section>

    </section>   
    
    <section>
      <name>UONACO Control and Management Architecture</name>
      <figure>
        <name>UONACO Control and Management Architecture</name>
        <artset>
        <!-- This <artset> includes two <artwork> elements, each of a different type -->
        <!-- SVG reference removed due to RFC 7996 compliance issues -->
          <artwork type="ascii-art" name="problem.txt">
            <![CDATA[
              +----------------------+
              |       Customer       |
              +---------+-^----------+
                        | |
              +---------v-+----------+
              | Service Orchestrator |
              +---------+-^----------+
                        | | SUI
        +---------------v-+------------------+
        |Unified Compute-Optical Orchestrator|
        +-----+-^-------------------+-^------+
              | | UCI               | | UOI
+-------------v-+-------+ +---------v-+----------------+
|Compute Power Scheduler| |Transport Network Controller|
+-----------+-^---------+ +------+-^-------------------+
            | |                  | |
            | |                  | |    +------------+
      +-----v-+-----+            | |    |User Access |
      |Compute Power|            | |    |   Point #1 |
      |    Pool     |            | |    +------+-----+
      |  +-------+  |            | |           |
      |  |AIDC #1|+-+-+   +------v-+------+    |
      |  +-------+  |  \+-|               |----+
      |             |     |Optical Network|
      |  +-------+  |   +-|               |----+
      |  |AIDC #2|+-+-+/  +---------------+    |
      |  +-------+  |                          |
      |             |                   +------+-----+
      +-------------+                   |User Access |
                                        |   Point #2 |
                                        +------------+

            ]]>
          </artwork>
        </artset>
      </figure>
      
      <section>
        <name>Overview</name>
        <t>As shown in Figure 1, the UONACO framework establishes a layered control architecture that enables end-to-end coordination between service intent, compute resources, and optical transport infrastructure. This architecture comprises five core functional components—Customer, Service Orchestrator (SO), Unified Compute-Optical Orchestrator (UCOO), Transport Network Controller (TNC), and Computing Power Scheduler (CPS)—interconnected through three standardized interfaces.</t>
      </section>



      <section>
        <name>Service Orchestrator</name>
        <t>The SO serves as the business-facing interface of the UONACO framework. It is responsible for accepting AI service requests from customers—such as “deploy a distributed training job across multiple AIDCs with end-to-end latency under X ms” or “provision an inference service with Y GPU instances and guaranteed bandwidth”—and translating these intent-based specifications into structured resource requirements. The SO also handles service lifecycle management, including billing, SLA enforcement, and user authentication. It does not manage physical resources directly but instead communicates abstracted demands to the UCOO via the SUI interface.</t>
      </section>

      <section>
        <name>Unified Compute-Optical Orchestrator</name>
        <t>The UCOO is the central coordination engine of the UONACO architecture. It receives service intents from the SO and continuously collects real-time telemetry from both the optical network (via TNC) and compute infrastructure (via CPS). Based on this global view, the UCOO executes joint optimization algorithms that consider both compute capabilities (e.g., GPU availability, memory) and network conditions (e.g., path latency, available bandwidth, congestion). The output of this decision process is a pair of synchronized instructions: one for optical path provisioning and another for compute task placement. The UCOO thus bridges the semantic and operational gap between the service layer and the infrastructure layer.</t>
      </section>    

      <section>
        <name>Transport Network Controller</name>
        <t>The TNC represents the control plane of the underlying optical transport infrastructure. It may encompass a hierarchy of controllers, including intra-domain optical controllers and inter-domain coordinators (e.g., multi-domain WSON or OXC orchestrators). The TNC is responsible for managing physical and virtual optical resources—such as wavelengths, time slots, fgOTN/OSU slices, and OXC cross-connects—and for executing path computation, signaling, and protection mechanisms. In the UONACO framework, the TNC exposes network topology, available capacity, and performance metrics to the UCOO through the UOI interface, and applies provisioning commands issued by the UCOO to establish, adjust, or release optical connections in response to compute workload dynamics.</t>
      </section> 

      <section>
        <name>Computing Power Scheduler</name>
        <t>The CPS acts as the controller for the AI compute pool, typically spanning one or more Artificial Intelligence Data Centers (AIDCs). It manages heterogeneous compute resources—including CPUs, GPUs, TPUs, memory, and storage—and reports their real-time availability, utilization, and performance characteristics (e.g., FLOPS, VRAM usage) to the UCOO. Upon receiving placement instructions from the UCOO via the UCI interface, the CPS schedules AI workloads (e.g., training jobs or inference containers) onto appropriate nodes, configures runtime environments, and ensures that compute tasks are aligned with the concurrently provisioned optical connectivity.</t>
      </section> 

      <section>
        <name>UONACO Interfaces</name>
        <t>The UONACO framework defines three key interfaces which have been shown in Figure 1, to enable interoperability and decoupled evolution of its components.</t>
        <t>SUI (SO-UCOO Interface): SUI connects SO and UCOO. Through this northbound interface, the SO conveys high-level service intent, including abstracted SLA requirements (e.g., maximum end-to-end latency, minimum bandwidth, geographic constraints), service type (e.g., AI training, inference, or remote access), and lifecycle events (e.g., service activation, modification, or termination). The UCOO interprets these intents as concrete resource demands and initiates joint optimization. The SUI thus serves as the bridge between business-oriented service definitions and infrastructure-aware orchestration. </t>
        <t>UOI (UCOO-TNC Interface): UOI links UCOO with TNC. This interface enables bidirectional communication: the UCOO sends optical resource requests specifying required connectivity attributes such as bandwidth, end-to-end latency bounds, path isolation level, and resilience requirements; in return, the TNC provides real-time network state updates, including topology, available wavelengths or time slots, link utilization, propagation delay, and fault status. By exposing network capabilities and constraints to the orchestration layer, the UOI allows the UCOO to make network-feasible decisions and enables the TNC to provision optical paths that are aligned with compute workload dynamics. </t>
        <t>UCI (UCOO-CPS Interface): UCI connects UCOO and CPS. Through this interface, the UCOO issues compute resource demands and task placement directives—such as the number and type of accelerators required, memory footprint, and preferred deployment topology—based on the outcome of joint compute-optical optimization. Conversely, the CPS reports real-time compute resource availability, node load, energy efficiency metrics, and task execution status (e.g., job progress, failure alerts). This feedback loop ensures that compute allocation respects both application requirements and the quality of the concurrently provisioned optical connectivity, thereby avoiding placements that would violate network SLAs. </t>
        <t>These interfaces are designed to be protocol-agnostic but are expected to leverage standardized, model-driven approaches (e.g., YANG/NETCONF or RESTCONF) to ensure vendor neutrality and scalability.</t>
      </section> 
    </section>


    <section anchor="IANA">
    <!-- All drafts are required to have an IANA considerations section. See RFC 8126 for a guide.-->
      <name>IANA Considerations</name>
      <t>TBD</t>
    </section>
    
    <section anchor="Security">
      <!-- All drafts are required to have a security considerations section. See RFC 3552 for a guide. -->
      <name>Security Considerations</name>
      <t>TBD</t>
    </section>
    
    <!-- NOTE: The Acknowledgements and Contributors sections are at the end of this template -->
  </middle>

  <back>
    <references>
      <name>References</name>
      <references>
        <name>Normative References</name>
        
        <xi:include href="https://bib.ietf.org/public/rfc/bibxml/reference.RFC.2119.xml"/>
        <xi:include href="https://bib.ietf.org/public/rfc/bibxml/reference.RFC.8174.xml"/>
        <!-- The recommended and simplest way to include a well known reference -->
        
      </references>
 

    </references>
  
    
 </back>
</rfc>