% -*- coding: utf-8; -*-
% ISO/IEC 14651-conformant delta for DIN 5007-1:2004 (sample)

% Declare a dedicated collating symbol <UMLAUT> and insert it immediately
% after <BASE> in the order of collating symbols.
reorder-after <BASE> % The umlaut is the diacritic with the highest priority
collating-symbol <UMLAUT> % Specifically for the weight of the umlaut (distinct from the trema in DIN 5007)
<UMLAUT> % Used below as the second-level weight of the a/o/u-with-diaeresis entries
reorder-end


%Digits must follow letters 

%Treating Roman numerals and sequences of digits as numbers requires
%preprocessing that is outside the scope of this profile

% Move the collating symbols <S0030>..<S0039> (the digits 0-9) so that they
% follow <TFFFF>, keeping them in ascending numeric order.
reorder-after <TFFFF> % After the Han ideographs, but before <SFFFF>
<S0030>  % 0
<S0031>  % 1
<S0032>  % 2
<S0033>  % 3
<S0034>  % 4
<S0035>  % 5
<S0036>  % 6
<S0037>  % 7
<S0038>  % 8
<S0039>  % 9
reorder-end

% Weight assignments for individual characters, placed after <SFFFF>.
% Each entry has the form
%   <Uxxxx> level1;level2;level3;level4
% where a quoted string such as "<BASE><UMLAUT>" is a sequence of several
% weights on the same level. In the entries below, level 1 carries the letter
% symbol (<Sxxxx>), level 2 the diacritic/variant symbols (<BASE>, <UMLAUT>,
% <VRNTn>), level 3 the case symbols (<MIN>, <CAP>), and level 4 the code
% point itself.
% NOTE(review): no order_end matching the order_start below is visible in
% this section -- confirm that this is intended.
reorder-after <SFFFF>

order_start forward;forward;forward;forward % All four levels are compared in the forward direction

%According to 6.2.1, whitespace precedes all other characters on the
%first level. Whitespace characters thus get a non-ignorable weight

<U0009> <S0009>;<BASE>;<MIN>;<U0009> % HORIZONTAL TABULATION (in 6429)
<U000A> <S000A>;<BASE>;<MIN>;<U000A> % LINE FEED (in 6429)
<U000B> <S000B>;<BASE>;<MIN>;<U000B> % VERTICAL TABULATION (in 6429)
<U000C> <S000C>;<BASE>;<MIN>;<U000C> % FORM FEED (in 6429)
<U000D> <S000D>;<BASE>;<MIN>;<U000D> % CARRIAGE RETURN (in 6429)
<U0020> <S0020>;<BASE>;<MIN>;<U0020> % SPACE


%Ligatures and the sharp S are already treated in the EOR delta in the sense of DIN 5007

%Umlauts: same first-level weight as the base letter (a, o, u); the
%second level distinguishes them from the base letter via <UMLAUT>
<U00E4> <S0061>;"<BASE><UMLAUT>";"<MIN><MIN>";<U00E4> % LATIN SMALL LETTER A WITH DIAERESIS
<U00C4> <S0061>;"<BASE><UMLAUT>";"<CAP><MIN>";<U00C4> % LATIN CAPITAL LETTER A WITH DIAERESIS
<U00F6> <S006F>;"<BASE><UMLAUT>";"<MIN><MIN>";<U00F6> % LATIN SMALL LETTER O WITH DIAERESIS
<U00D6> <S006F>;"<BASE><UMLAUT>";"<CAP><MIN>";<U00D6> % LATIN CAPITAL LETTER O WITH DIAERESIS
<U00FC> <S0075>;"<BASE><UMLAUT>";"<MIN><MIN>";<U00FC> % LATIN SMALL LETTER U WITH DIAERESIS
<U00DC> <S0075>;"<BASE><UMLAUT>";"<CAP><MIN>";<U00DC> % LATIN CAPITAL LETTER U WITH DIAERESIS

%For an ordering according to 6.1.1.4.2, where umlauts are treated as
%base letter + e, replace the six weight assignments above with these lines:
%<U00E4> "<S0061><S0065>";"<BASE><BASE><UMLAUT>";"<MIN><MIN><MIN>";<U00E4> % LATIN SMALL LETTER A WITH DIAERESIS
%<U00C4> "<S0061><S0065>";"<BASE><BASE><UMLAUT>";"<CAP><MIN><MIN>";<U00C4> % LATIN CAPITAL LETTER A WITH DIAERESIS
%<U00F6> "<S006F><S0065>";"<BASE><BASE><UMLAUT>";"<MIN><MIN><MIN>";<U00F6> % LATIN SMALL LETTER O WITH DIAERESIS
%<U00D6> "<S006F><S0065>";"<BASE><BASE><UMLAUT>";"<CAP><MIN><MIN>";<U00D6> % LATIN CAPITAL LETTER O WITH DIAERESIS
%<U00FC> "<S0075><S0065>";"<BASE><BASE><UMLAUT>";"<MIN><MIN><MIN>";<U00FC> % LATIN SMALL LETTER U WITH DIAERESIS
%<U00DC> "<S0075><S0065>";"<BASE><BASE><UMLAUT>";"<CAP><MIN><MIN>";<U00DC> % LATIN CAPITAL LETTER U WITH DIAERESIS

%Treatment of other Latin characters according to DIN 31638, 7.3.4.1
%Thorn expands to the two first-level weights t + h; <VRNT1> on the
%second level keeps it distinct from a literal "th"
<U00FE> "<S0074><S0068>";"<BASE><BASE><VRNT1>";"<MIN><MIN><MIN>";<U00FE> % LATIN SMALL LETTER THORN (as th on the first level)
<U00DE> "<S0074><S0068>";"<BASE><BASE><VRNT1>";"<CAP><CAP><MIN>";<U00DE> % LATIN CAPITAL LETTER THORN

%NOTE(review): wynn is given the first-level weight of y (<S0079>) here --
%confirm against DIN 31638, 7.3.4.1 that y (and not w) is intended
<U01BF> <S0079>;"<BASE><VRNT3>";"<MIN><MIN>";<U01BF> % LATIN LETTER WYNN (as y on the first level)
<U01F7> <S0079>;"<BASE><VRNT3>";"<CAP><MIN>";<U01F7> % LATIN CAPITAL LETTER WYNN
<U0292> <S0079>;"<BASE><VRNT4>";"<MIN><MIN>";<U0292> % LATIN SMALL LETTER EZH (as y on the first level; yogh and ezh are equated in ISO/IEC 10646)
<U01B7> <S0079>;"<BASE><VRNT4>";"<CAP><MIN>";<U01B7> % LATIN CAPITAL LETTER EZH

reorder-end

% DIN5007Delta (last edited 2008-10-03 10:05:51 by MKuester)