<?xml version="1.0"?>
<!DOCTYPE rfc SYSTEM "rfc2629.dtd">
<?rfc toc="yes"?>

<!--
     ASCII to XML transformation by Invisible Worlds, Inc.
     http://invisible.net/
     Last transformation: 03-Feb-1999, 02:01:07

     Cannonical version of this document is at:
     http://info.internet.isi.edu/in-notes/rfc/files/rfc2253.txt

     Implementors should verify all content with
     cannonical version.  Failure to do so may result in
     protocol failures.
-->

<rfc number="2253"
     category="std"
     obsoletes="1779">
<front>
<title abbrev="LADPv3 Distinguished Names">Lightweight Directory Access Protocol (v3): UTF-8 String Representation of Distinguished Names</title>
<author initials="M." surname="Wahl" fullname="Mark Wahl">
<organization>Critical Angle Inc.</organization>
<address>
<postal>
<street>4815 W. Braker Lane #502-385</street>
<street>Austin</street>
<street>TX 78759</street>
<country>USA</country>
</postal>
<email>M.Wahl@critical-angle.com</email>
</address>
</author>
<author initials="S." surname="Kille" fullname="Steve Kille">
<organization>Isode Ltd.</organization>
<address>
<postal>
<street>The Dome</street>
<street>The Square</street>
<street>Richmond</street>
<street>Surrey</street>
<street>TW9 1DT</street>
<street>England</street>
</postal>
<phone>+44-181-332-9091</phone>
<email>S.Kille@ISODE.COM</email>
</address>
</author>
<author initials="T." surname="Howes" fullname="Tim Howes">
<organization>Netscape Communications Corp.</organization>
<address>
<postal>
<street>501 E. Middlefield Rd</street>
<street>MS MV068</street>
<street>Mountain View</street>
<street>CA 94043</street>
<country>USA</country>
</postal>
<phone>+1 650 937-3419</phone>
<email>howes@netscape.com</email>
</address>
</author>
<date month="December" year="1997"/>
<area>Applications</area>
<keyword>LDAP</keyword>
<keyword>ITU abstract syntax notation one</keyword>
<keyword>ITU directory service protocol</keyword>
<keyword>UCS transformation format</keyword>
<keyword>directory</keyword>
<keyword>lightweight directory access protocol</keyword>
<abstract>
<t>
   This document describes a directory access protocol that provides
   both read and update access.  Update access requires secure
   authentication, but this document does not mandate implementation of
   any satisfactory authentication mechanisms.
</t>
<t>
   In accordance with RFC 2026, section 4.4.1, this specification is
   being approved by IESG as a Proposed Standard despite this
   limitation, for the following reasons:
<list>
<t>
   a. to encourage implementation and interoperability testing of
      these protocols (with or without update access) before they
      are deployed, and
</t>
<t>
   b. to encourage deployment and use of these protocols in read-only
      applications.  (e.g. applications where LDAPv3 is used as
      a query language for directories which are updated by some
      secure mechanism other than LDAP), and
</t>
<t>
   c. to avoid delaying the advancement and deployment of other Internet
      standards-track protocols which require the ability to query, but
      not update, LDAPv3 directory servers.
</t></list>
</t>
<t>
   Readers are hereby warned that until mandatory authentication
   mechanisms are standardized, clients and servers written according to
   this specification which make use of update functionality are
   UNLIKELY TO INTEROPERATE, or MAY INTEROPERATE ONLY IF AUTHENTICATION
   IS REDUCED TO AN UNACCEPTABLY WEAK LEVEL.
</t>
<t>
   Implementors are hereby discouraged from deploying LDAPv3 clients or
   servers which implement the update functionality, until a Proposed
   Standard for mandatory authentication in LDAPv3 has been approved and
   published as an RFC.
</t>
<t>
   The X.500 Directory uses distinguished names as the primary keys to
   entries in the directory.  Distinguished Names are encoded in ASN.1
   in the X.500 Directory protocols.  In the Lightweight Directory
   Access Protocol, a string representation of distinguished names is
   transferred.  This specification defines the string format for
   representing names, which is designed to give a clean representation
   of commonly used distinguished names, while being able to represent
   any distinguished name.
</t>
<t>
   The key words &quot;MUST&quot;, &quot;MUST NOT&quot;, &quot;REQUIRED&quot;, &quot;SHALL&quot;, &quot;SHALL NOT&quot;,
   &quot;SHOULD&quot;, &quot;SHOULD NOT&quot;, &quot;RECOMMENDED&quot;,  &quot;MAY&quot;, and &quot;OPTIONAL&quot; in this
   document are to be interpreted as described in RFC 2119 <xref target="_XREF_6"/>.
</t>
</abstract>
<note title="IESG Note">
<t>
   This document describes a directory access protocol that provides
   both read and update access.  Update access requires secure
   authentication, but this document does not mandate implementation of
   any satisfactory authentication mechanisms.
</t>
<t>
   In accordance with RFC 2026, section 4.4.1, this specification is
   being approved by IESG as a Proposed Standard despite this
   limitation, for the following reasons:
</t>
<t>
   a. to encourage implementation and interoperability testing of
      these protocols (with or without update access) before they
      are deployed, and
<list>
<t>
   b. to encourage deployment and use of these protocols in read-only
      applications.  (e.g. applications where LDAPv3 is used as
      a query language for directories which are updated by some
      secure mechanism other than LDAP), and
</t>
<t>
   c. to avoid delaying the advancement and deployment of other Internet
      standards-track protocols which require the ability to query, but
      not update, LDAPv3 directory servers.
</t></list>
</t>
<t>
   Readers are hereby warned that until mandatory authentication
   mechanisms are standardized, clients and servers written according to
   this specification which make use of update functionality are
   UNLIKELY TO INTEROPERATE, or MAY INTEROPERATE ONLY IF AUTHENTICATION
   IS REDUCED TO AN UNACCEPTABLY WEAK LEVEL.
</t>
<t>
   Implementors are hereby discouraged from deploying LDAPv3 clients or
   servers which implement the update functionality, until a Proposed
   Standard for mandatory authentication in LDAPv3 has been approved and
   published as an RFC.
</t>
</note>
</front>
<middle>
<!-- RFC original section: (1.) -->
<section title="Background">
<t>
   This specification assumes familiarity with X.500 <xref target="_XREF_1"/>, and the
   concept of Distinguished Name.  It is important to have a common
   format to be able to unambiguously represent a distinguished name.
   The primary goal of this specification is ease of encoding and
   decoding.  A secondary goal is to have names that are human readable.
   It is not expected that LDAP clients with a human user interface
   would display these strings directly to the user, but would most
   likely be performing translations (such as expressing attribute type
   names in one of the local national languages).
</t>
</section>
<!-- RFC original section: (2.) -->
<section title="Converting DistinguishedName from ASN.1 to a String">
<t>
   In X.501 <xref target="_XREF_2"/> the ASN.1 structure of distinguished name is defined as:
</t>
<figure><artwork>
       DistinguishedName ::= RDNSequence

       RDNSequence ::= SEQUENCE OF RelativeDistinguishedName
       RelativeDistinguishedName ::= SET SIZE (1..MAX) OF
        AttributeTypeAndValue

       AttributeTypeAndValue ::= SEQUENCE {
        type  AttributeType,
        value AttributeValue }
</artwork></figure>
<t>
   The following sections define the algorithm for converting from an
   ASN.1 structured representation to a UTF-8 string representation.
</t>
<!-- RFC original section: (2.1.) -->
<section title="Converting the RDNSequence">
<t>
   If the RDNSequence is an empty sequence, the result is the empty or
   zero length string.
</t>
<t>
   Otherwise, the output consists of the string encodings of each
   RelativeDistinguishedName in the RDNSequence (according to 2.2),
   starting with the last element of the sequence and moving backwards
   toward the first.
</t>
<t>
   The encodings of adjoining RelativeDistinguishedNames are separated
   by a comma character (&apos;,&apos; ASCII 44).
</t>
</section>
<!-- RFC original section: (2.2.) -->
<section title="Converting RelativeDistinguishedName">
<t>
   When converting from an ASN.1 RelativeDistinguishedName to a string,
   the output consists of the string encodings of each
   AttributeTypeAndValue (according to 2.3), in any order.
</t>
<t>
   Where there is a multi-valued RDN, the outputs from adjoining
   AttributeTypeAndValues are separated by a plus (&apos;+&apos; ASCII 43)
   character.
</t>
</section>
<!-- RFC original section: (2.3.) -->
<section title="Converting AttributeTypeAndValue">
<t>
   The AttributeTypeAndValue is encoded as the string representation of
   the AttributeType, followed by an equals character (&apos;=&apos; ASCII 61),
   followed by the string representation of the AttributeValue.  The
   encoding of the AttributeValue is given in section 2.4.
</t>
<t>
   If the AttributeType is in a published table of attribute types
   associated with LDAP <xref target="_XREF_4"/>, then the type name string from that table
   is used, otherwise it is encoded as the dotted-decimal encoding of
   the AttributeType&apos;s OBJECT IDENTIFIER. The dotted-decimal notation is
   described in <xref target="_XREF_3"/>.  As an example, strings for a few of the attribute
   types frequently seen in RDNs include:
</t>
<figure><artwork>
                    String  X.500 AttributeType
                    ------------------------------
                    CN      commonName
                    L       localityName
                    ST      stateOrProvinceName
                    O       organizationName
                    OU      organizationalUnitName
                    C       countryName
                    STREET  streetAddress
                    DC      domainComponent
                    UID     userid
</artwork></figure>
</section>
<!-- RFC original section: (2.4.) -->
<section title="Converting an AttributeValue from ASN.1 to a String">
<t>
   If the AttributeValue is of a type which does not have a string
   representation defined for it, then it is simply encoded as an
   octothorpe character (&apos;#&apos; ASCII 35) followed by the hexadecimal
   representation of each of the bytes of the BER encoding of the X.500
   AttributeValue.  This form SHOULD be used if the AttributeType is of
   the dotted-decimal form.
</t>
<t>
   Otherwise, if the AttributeValue is of a type which has a string
   representation, the value is converted first to a UTF-8 string
   according to its syntax specification (see for example section 6 of
   <xref target="_XREF_4"/>).
</t>
<t>
   If the UTF-8 string does not have any of the following characters
   which need escaping, then that string can be used as the string
   representation of the value.
<list>
<t>
    o   a space or &quot;#&quot; character occurring at the beginning of the
        string
</t>
<t>
    o   a space character occurring at the end of the string
</t>
<t>
    o   one of the characters &quot;,&quot;, &quot;+&quot;, &quot;&quot;&quot;, &quot;\&quot;, &quot;&lt;&quot;, &quot;&gt;&quot; or &quot;;&quot;
</t></list>
</t>
<t>
   Implementations MAY escape other characters.
</t>
<t>
   If a character to be escaped is one of the list shown above, then it
   is prefixed by a backslash (&apos;\&apos; ASCII 92).
</t>
<t>
   Otherwise the character to be escaped is replaced by a backslash and
   two hex digits, which form a single byte in the code of the
   character.
</t>
<t>
   Examples of the escaping mechanism are shown in section 5.
</t>
</section>
</section>
<!-- RFC original section: (3.) -->
<section title="Parsing a String back to a Distinguished Name">
<t>
   The structure of the string is specified in a BNF grammar, based on
   the grammar defined in RFC 822 <xref target="_XREF_5"/>.  Server implementations parsing a
   DN string generated by an LDAPv2 client MUST also accept (and ignore)
   the variants given in section 4 of this document.
</t>
<figure><artwork>
distinguishedName = [name]                    ; may be empty string


name       = name-component *(&quot;,&quot; name-component)


name-component = attributeTypeAndValue *(&quot;+&quot; attributeTypeAndValue)


attributeTypeAndValue = attributeType &quot;=&quot; attributeValue


attributeType = (ALPHA 1*keychar) / oid
keychar    = ALPHA / DIGIT / &quot;-&quot;


oid        = 1*DIGIT *(&quot;.&quot; 1*DIGIT)


attributeValue = string


string     = *( stringchar / pair )
             / &quot;#&quot; hexstring
             / QUOTATION *( quotechar / pair ) QUOTATION ; only from v2


quotechar     = &lt;any character except &quot;\&quot; or QUOTATION &gt;


special    = &quot;,&quot; / &quot;=&quot; / &quot;+&quot; / &quot;&lt;&quot; /  &quot;&gt;&quot; / &quot;#&quot; / &quot;;&quot;


pair       = &quot;\&quot; ( special / &quot;\&quot; / QUOTATION / hexpair )
stringchar = &lt;any character except one of special, &quot;\&quot; or QUOTATION &gt;


hexstring  = 1*hexpair
hexpair    = hexchar hexchar


hexchar    = DIGIT / &quot;A&quot; / &quot;B&quot; / &quot;C&quot; / &quot;D&quot; / &quot;E&quot; / &quot;F&quot;
             / &quot;a&quot; / &quot;b&quot; / &quot;c&quot; / &quot;d&quot; / &quot;e&quot; / &quot;f&quot;


ALPHA      =  &lt;any ASCII alphabetic character&gt;
                                         ; (decimal 65-90 and 97-122)
DIGIT      =  &lt;any ASCII decimal digit&gt;  ; (decimal 48-57)
QUOTATION  =  &lt;the ASCII double quotation mark character &apos;&quot;&apos; decimal 34&gt;
</artwork></figure>
</section>
<!-- RFC original section: (4.) -->
<section title="Relationship with RFC 1779 and LDAPv2">
<t>
   The syntax given in this document is more restrictive than the syntax
   in RFC 1779.  Implementations parsing a string generated by an LDAPv2
   client MUST accept the syntax of RFC 1779.  Implementations MUST NOT,
   however, generate any of the RFC 1779 encodings which are not
   described above in section 2.
</t>
<t>
   Implementations MUST allow a semicolon character to be used instead
   of a comma to separate RDNs in a distinguished name, and MUST also
   allow whitespace characters to be present on either side of the comma
   or semicolon.  The whitespace characters are ignored, and the
   semicolon replaced with a comma.
</t>
<t>
   Implementations MUST allow an oid in the attribute type to be
   prefixed by one of the character strings &quot;oid.&quot; or &quot;OID.&quot;.
</t>
<t>
   Implementations MUST allow for space (&apos; &apos; ASCII 32) characters to be
   present between name-component and &apos;,&apos;, between attributeTypeAndValue
   and &apos;+&apos;, between attributeType and &apos;=&apos;, and between &apos;=&apos; and
   attributeValue.  These space characters are ignored when parsing.
</t>
<t>
   Implementations MUST allow a value to be surrounded by quote (&apos;&quot;&apos;
   ASCII 34) characters, which are not part of the value.  Inside the
   quoted value, the following characters can occur without any
   escaping:
<list>
<t>
                   &quot;,&quot;, &quot;=&quot;, &quot;+&quot;, &quot;&lt;&quot;, &quot;&gt;&quot;, &quot;#&quot; and &quot;;&quot;
</t></list>
</t>
</section>
<!-- RFC original section: (5.) -->
<section title="Examples">
<t>
   This notation is designed to be convenient for common forms of name.
   This section gives a few examples of distinguished names written
   using this notation.  First is a name containing three relative
   distinguished names (RDNs):
</t>
<t>
   CN=Steve Kille,O=Isode Limited,C=GB
</t>
<t>
   Here is an example name containing three RDNs, in which the first RDN
   is multi-valued:
</t>
<t>
   OU=Sales+CN=J. Smith,O=Widget Inc.,C=US
</t>
<t>
   This example shows the method of quoting of a comma in an
   organization name:
</t>
<t>
   CN=L. Eagle,O=Sue\, Grabbit and Runn,C=GB
</t>
<t>
   An example name in which a value contains a carriage return
   character:
</t>
<t>
   CN=Before\0DAfter,O=Test,C=GB
</t>
<t>
   An example name in which an RDN was of an unrecognized type.  The
   value is the BER encoding of an OCTET STRING containing two bytes
   0x48 and 0x69.
</t>
<t>
   1.3.6.1.4.1.1466.0=#04024869,O=Test,C=GB
</t>
<t>
   Finally, an example of an RDN surname value consisting of 5 letters:
</t>
<figure><artwork>
   Unicode Letter Description      10646 code UTF-8  Quoted
   =============================== ========== ====== =======
   LATIN CAPITAL LETTER L          U0000004C  0x4C   L
   LATIN SMALL LETTER U            U00000075  0x75   u
   LATIN SMALL LETTER C WITH CARON U0000010D  0xC48D \C4\8D
   LATIN SMALL LETTER I            U00000069  0x69   i
   LATIN SMALL LETTER C WITH ACUTE U00000107  0xC487 \C4\87
</artwork></figure>
<t>
   Could be written in printable ASCII (useful for debugging purposes):
</t>
<t>
   SN=Lu\C4\8Di\C4\87
</t>
</section>
<!-- RFC original section: (6.) -->
<section title="References (BOILERPLATE)">
<t>
This RFC contained boilerplate in this section which has been moved
to the RFC2223-compliant unnumbered section &quot;References.&quot;
</t>
</section>
<!-- RFC original section: (7.) -->
<section title="Security Considerations">
<!-- 7.1 -->
<section title="Disclosure">
<t>
   Distinguished Names typically consist of descriptive information
   about the entries they name, which can be people, organizations,
   devices or other real-world objects.  This frequently includes some
   of the following kinds of information:
<list>
<t>
   - the common name of the object (i.e. a person&apos;s full name)
</t>
<t>
   - an email or TCP/IP address
</t>
<t>
   - its physical location (country, locality, city, street address)
</t>
<t>
   - organizational attributes (such as department name or affiliation)
</t></list>
</t>
<t>
   Most countries have privacy laws regarding the publication of
   information about people.
</t>
</section>
<!-- 7.2 -->
<section title="Use of Distinguished Names in Security Applications">
<t>
   The transformations of an AttributeValue value from its X.501 form to
   an LDAP string representation are not always reversible back to the
   same BER or DER form.  An example of a situation which requires the
   DER form of a distinguished name is the verification of an X.509
   certificate.
</t>
<t>
   For example, a distinguished name consisting of one RDN with one AVA,
   in which the type is commonName and the value is of the TeletexString
   choice with the letters &apos;Sam&apos; would be represented in LDAP as the
   string CN=Sam.  Another distinguished name in which the value is
   still &apos;Sam&apos; but of the PrintableString choice would have the same
   representation CN=Sam.
</t>
<t>
   Applications which require the reconstruction of the DER form of the
   value SHOULD NOT use the string representation of attribute syntaxes
   when converting a distinguished name to the LDAP format.  Instead,
   they SHOULD use the hexadecimal form prefixed by the octothorpe (&apos;#&apos;)
   as described in the first paragraph of section 2.4.
</t>
</section>
</section>
<!-- RFC original section: (8.) -->
<section title="Authors&apos; Addresses (BOILERPLATE)">
<t>
This RFC contained boilerplate in this section which has been moved
to the RFC2223-compliant unnumbered section &quot;Author&apos;s Address.&quot;
</t>
</section>
<!-- RFC original section: (9.) -->
<section title="Full Copyright Statement (BOILERPLATE)">
<t>
This RFC contained boilerplate in this section which has been moved
to the RFC2223-compliant unnumbered section &quot;Full Copyright Statement.&quot;
</t>
</section>
</middle>
<back>
<references>
<reference anchor="_XREF_1">
<front>
<title>MISSING TITLE</title>
<author>
<organization/>
</author>
<date month="MISSING" year="DATE"/>
</front>
<seriesInfo>The Directory -- overview of concepts</seriesInfo>
<seriesInfo>models and services. ITU-T Rec. X.500(1993).</seriesInfo>
</reference>
<reference anchor="_XREF_2">
<front>
<title>MISSING TITLE</title>
<author>
<organization/>
</author>
<date month="MISSING" year="DATE"/>
</front>
<seriesInfo>The Directory -- Models. ITU-T Rec. X.501(1993).</seriesInfo>
</reference>
<reference anchor="_XREF_3">
<front>
<title abbrev="Lightweight Directory Access  Protocol (v3">Lightweight Directory Access  Protocol (v3)</title>
<author initials="S." surname="Kille" fullname="S. Kille">
<organization/>
</author>
<date month="December" year="1997"/>
</front>
<seriesInfo>RFC 2251</seriesInfo>
</reference>
<reference anchor="_XREF_4">
<front>
<title abbrev="Lightweight Directory Access Protocol (v3">Lightweight Directory Access Protocol (v3): Attribute Syntax Definitions</title>
<author initials="S." surname="Kille" fullname="S. Kille">
<organization/>
</author>
<date month="December" year="1997"/>
</front>
<seriesInfo>RFC 2252</seriesInfo>
</reference>
<reference anchor="_XREF_5">
<front>
<title abbrev="Standard of the Format of ARPA-Internet">Standard of the Format of ARPA-Internet Text Messages</title>
<author initials="D." fullname="D. ">
<organization/>
</author>
<date month="August" year="1982"/>
</front>
<seriesInfo>STD 11</seriesInfo>
<seriesInfo>RFC 822</seriesInfo>
</reference>
<reference anchor="_XREF_6">
<front>
<title abbrev="Key words for use in RFCs to Indicate">Key words for use in RFCs to Indicate Requirement Levels</title>
<author initials="S." fullname="S. ">
<organization/>
</author>
<date month="MISSING" year="DATE"/>
</front>
<seriesInfo>RFC 2119</seriesInfo>
</reference>
</references>
</back>
</rfc>
