You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@commons.apache.org by gg...@apache.org on 2013/12/11 05:34:52 UTC

svn commit: r889932 [12/33] - in /websites/production/commons/content/proper/commons-codec: ./ apidocs/ apidocs/org/apache/commons/codec/ apidocs/org/apache/commons/codec/binary/ apidocs/org/apache/commons/codec/binary/class-use/ apidocs/org/apache/com...

Modified: websites/production/commons/content/proper/commons-codec/apidocs/src-html/org/apache/commons/codec/language/bm/Rule.html
==============================================================================
--- websites/production/commons/content/proper/commons-codec/apidocs/src-html/org/apache/commons/codec/language/bm/Rule.html (original)
+++ websites/production/commons/content/proper/commons-codec/apidocs/src-html/org/apache/commons/codec/language/bm/Rule.html Wed Dec 11 04:34:40 2013
@@ -40,607 +40,669 @@
 <span class="sourceLineNo">032</span>import java.util.regex.Matcher;<a name="line.32"></a>
 <span class="sourceLineNo">033</span>import java.util.regex.Pattern;<a name="line.33"></a>
 <span class="sourceLineNo">034</span><a name="line.34"></a>
-<span class="sourceLineNo">035</span>/**<a name="line.35"></a>
-<span class="sourceLineNo">036</span> * A phoneme rule.<a name="line.36"></a>
-<span class="sourceLineNo">037</span> * &lt;p&gt;<a name="line.37"></a>
-<span class="sourceLineNo">038</span> * Rules have a pattern, left context, right context, output phoneme, set of languages for which they apply<a name="line.38"></a>
-<span class="sourceLineNo">039</span> * and a logical flag indicating if all languages must be in play. A rule matches if:<a name="line.39"></a>
-<span class="sourceLineNo">040</span> * &lt;ul&gt;<a name="line.40"></a>
-<span class="sourceLineNo">041</span> * &lt;li&gt;the pattern matches at the current position&lt;/li&gt;<a name="line.41"></a>
-<span class="sourceLineNo">042</span> * &lt;li&gt;the string up until the beginning of the pattern matches the left context&lt;/li&gt;<a name="line.42"></a>
-<span class="sourceLineNo">043</span> * &lt;li&gt;the string from the end of the pattern matches the right context&lt;/li&gt;<a name="line.43"></a>
-<span class="sourceLineNo">044</span> * &lt;li&gt;logical is ALL and all languages are in scope; or&lt;/li&gt;<a name="line.44"></a>
-<span class="sourceLineNo">045</span> * &lt;li&gt;logical is any other value and at least one language is in scope&lt;/li&gt;<a name="line.45"></a>
-<span class="sourceLineNo">046</span> * &lt;/ul&gt;<a name="line.46"></a>
-<span class="sourceLineNo">047</span> * &lt;p&gt;<a name="line.47"></a>
-<span class="sourceLineNo">048</span> * Rules are typically generated by parsing rules resources. In normal use, there will be no need for the user<a name="line.48"></a>
-<span class="sourceLineNo">049</span> * to explicitly construct their own.<a name="line.49"></a>
-<span class="sourceLineNo">050</span> * &lt;p&gt;<a name="line.50"></a>
-<span class="sourceLineNo">051</span> * Rules are immutable and thread-safe.<a name="line.51"></a>
+<span class="sourceLineNo">035</span>import org.apache.commons.codec.language.bm.Languages.LanguageSet;<a name="line.35"></a>
+<span class="sourceLineNo">036</span><a name="line.36"></a>
+<span class="sourceLineNo">037</span>/**<a name="line.37"></a>
+<span class="sourceLineNo">038</span> * A phoneme rule.<a name="line.38"></a>
+<span class="sourceLineNo">039</span> * &lt;p&gt;<a name="line.39"></a>
+<span class="sourceLineNo">040</span> * Rules have a pattern, left context, right context, output phoneme, set of languages for which they apply<a name="line.40"></a>
+<span class="sourceLineNo">041</span> * and a logical flag indicating if all languages must be in play. A rule matches if:<a name="line.41"></a>
+<span class="sourceLineNo">042</span> * &lt;ul&gt;<a name="line.42"></a>
+<span class="sourceLineNo">043</span> * &lt;li&gt;the pattern matches at the current position&lt;/li&gt;<a name="line.43"></a>
+<span class="sourceLineNo">044</span> * &lt;li&gt;the string up until the beginning of the pattern matches the left context&lt;/li&gt;<a name="line.44"></a>
+<span class="sourceLineNo">045</span> * &lt;li&gt;the string from the end of the pattern matches the right context&lt;/li&gt;<a name="line.45"></a>
+<span class="sourceLineNo">046</span> * &lt;li&gt;logical is ALL and all languages are in scope; or&lt;/li&gt;<a name="line.46"></a>
+<span class="sourceLineNo">047</span> * &lt;li&gt;logical is any other value and at least one language is in scope&lt;/li&gt;<a name="line.47"></a>
+<span class="sourceLineNo">048</span> * &lt;/ul&gt;<a name="line.48"></a>
+<span class="sourceLineNo">049</span> * &lt;p&gt;<a name="line.49"></a>
+<span class="sourceLineNo">050</span> * Rules are typically generated by parsing rules resources. In normal use, there will be no need for the user<a name="line.50"></a>
+<span class="sourceLineNo">051</span> * to explicitly construct their own.<a name="line.51"></a>
 <span class="sourceLineNo">052</span> * &lt;p&gt;<a name="line.52"></a>
-<span class="sourceLineNo">053</span> * &lt;b&gt;Rules resources&lt;/b&gt;<a name="line.53"></a>
+<span class="sourceLineNo">053</span> * Rules are immutable and thread-safe.<a name="line.53"></a>
 <span class="sourceLineNo">054</span> * &lt;p&gt;<a name="line.54"></a>
-<span class="sourceLineNo">055</span> * Rules are typically loaded from resource files. These are UTF-8 encoded text files. They are systematically<a name="line.55"></a>
-<span class="sourceLineNo">056</span> * named following the pattern:<a name="line.56"></a>
-<span class="sourceLineNo">057</span> * &lt;blockquote&gt;org/apache/commons/codec/language/bm/${NameType#getName}_${RuleType#getName}_${language}.txt&lt;/blockquote&gt;<a name="line.57"></a>
-<span class="sourceLineNo">058</span> * &lt;p&gt;<a name="line.58"></a>
-<span class="sourceLineNo">059</span> * The format of these resources is the following:<a name="line.59"></a>
-<span class="sourceLineNo">060</span> * &lt;ul&gt;<a name="line.60"></a>
-<span class="sourceLineNo">061</span> * &lt;li&gt;&lt;b&gt;Rules:&lt;/b&gt; whitespace separated, double-quoted strings. There should be 4 columns to each row, and these<a name="line.61"></a>
-<span class="sourceLineNo">062</span> * will be interpreted as:<a name="line.62"></a>
-<span class="sourceLineNo">063</span> * &lt;ol&gt;<a name="line.63"></a>
-<span class="sourceLineNo">064</span> * &lt;li&gt;pattern&lt;/li&gt;<a name="line.64"></a>
-<span class="sourceLineNo">065</span> * &lt;li&gt;left context&lt;/li&gt;<a name="line.65"></a>
-<span class="sourceLineNo">066</span> * &lt;li&gt;right context&lt;/li&gt;<a name="line.66"></a>
-<span class="sourceLineNo">067</span> * &lt;li&gt;phoneme&lt;/li&gt;<a name="line.67"></a>
-<span class="sourceLineNo">068</span> * &lt;/ol&gt;<a name="line.68"></a>
-<span class="sourceLineNo">069</span> * &lt;/li&gt;<a name="line.69"></a>
-<span class="sourceLineNo">070</span> * &lt;li&gt;&lt;b&gt;End-of-line comments:&lt;/b&gt; Any occurrence of '//' will cause all text following on that line to be discarded<a name="line.70"></a>
-<span class="sourceLineNo">071</span> * as a comment.&lt;/li&gt;<a name="line.71"></a>
-<span class="sourceLineNo">072</span> * &lt;li&gt;&lt;b&gt;Multi-line comments:&lt;/b&gt; Any line starting with '/*' will start multi-line commenting mode. This will skip<a name="line.72"></a>
-<span class="sourceLineNo">073</span> * all content until a line ending in '*' and '/' is found.&lt;/li&gt;<a name="line.73"></a>
-<span class="sourceLineNo">074</span> * &lt;li&gt;&lt;b&gt;Blank lines:&lt;/b&gt; All blank lines will be skipped.&lt;/li&gt;<a name="line.74"></a>
-<span class="sourceLineNo">075</span> * &lt;/ul&gt;<a name="line.75"></a>
-<span class="sourceLineNo">076</span> *<a name="line.76"></a>
-<span class="sourceLineNo">077</span> * @since 1.6<a name="line.77"></a>
-<span class="sourceLineNo">078</span> * @version $Id: Rule.java 1435550 2013-01-19 14:09:52Z tn $<a name="line.78"></a>
-<span class="sourceLineNo">079</span> */<a name="line.79"></a>
-<span class="sourceLineNo">080</span>public class Rule {<a name="line.80"></a>
-<span class="sourceLineNo">081</span><a name="line.81"></a>
-<span class="sourceLineNo">082</span>    public static final class Phoneme implements PhonemeExpr {<a name="line.82"></a>
-<span class="sourceLineNo">083</span>        public static final Comparator&lt;Phoneme&gt; COMPARATOR = new Comparator&lt;Phoneme&gt;() {<a name="line.83"></a>
-<span class="sourceLineNo">084</span>            @Override<a name="line.84"></a>
-<span class="sourceLineNo">085</span>            public int compare(final Phoneme o1, final Phoneme o2) {<a name="line.85"></a>
-<span class="sourceLineNo">086</span>                for (int i = 0; i &lt; o1.phonemeText.length(); i++) {<a name="line.86"></a>
-<span class="sourceLineNo">087</span>                    if (i &gt;= o2.phonemeText.length()) {<a name="line.87"></a>
-<span class="sourceLineNo">088</span>                        return +1;<a name="line.88"></a>
-<span class="sourceLineNo">089</span>                    }<a name="line.89"></a>
-<span class="sourceLineNo">090</span>                    final int c = o1.phonemeText.charAt(i) - o2.phonemeText.charAt(i);<a name="line.90"></a>
-<span class="sourceLineNo">091</span>                    if (c != 0) {<a name="line.91"></a>
-<span class="sourceLineNo">092</span>                        return c;<a name="line.92"></a>
-<span class="sourceLineNo">093</span>                    }<a name="line.93"></a>
-<span class="sourceLineNo">094</span>                }<a name="line.94"></a>
-<span class="sourceLineNo">095</span><a name="line.95"></a>
-<span class="sourceLineNo">096</span>                if (o1.phonemeText.length() &lt; o2.phonemeText.length()) {<a name="line.96"></a>
-<span class="sourceLineNo">097</span>                    return -1;<a name="line.97"></a>
-<span class="sourceLineNo">098</span>                }<a name="line.98"></a>
-<span class="sourceLineNo">099</span><a name="line.99"></a>
-<span class="sourceLineNo">100</span>                return 0;<a name="line.100"></a>
-<span class="sourceLineNo">101</span>            }<a name="line.101"></a>
-<span class="sourceLineNo">102</span>        };<a name="line.102"></a>
-<span class="sourceLineNo">103</span><a name="line.103"></a>
-<span class="sourceLineNo">104</span>        private final CharSequence phonemeText;<a name="line.104"></a>
-<span class="sourceLineNo">105</span>        private final Languages.LanguageSet languages;<a name="line.105"></a>
-<span class="sourceLineNo">106</span><a name="line.106"></a>
-<span class="sourceLineNo">107</span>        public Phoneme(final CharSequence phonemeText, final Languages.LanguageSet languages) {<a name="line.107"></a>
-<span class="sourceLineNo">108</span>            this.phonemeText = phonemeText;<a name="line.108"></a>
-<span class="sourceLineNo">109</span>            this.languages = languages;<a name="line.109"></a>
-<span class="sourceLineNo">110</span>        }<a name="line.110"></a>
-<span class="sourceLineNo">111</span><a name="line.111"></a>
-<span class="sourceLineNo">112</span>        public Phoneme append(final CharSequence str) {<a name="line.112"></a>
-<span class="sourceLineNo">113</span>            return new Phoneme(this.phonemeText.toString() + str.toString(), this.languages);<a name="line.113"></a>
-<span class="sourceLineNo">114</span>        }<a name="line.114"></a>
-<span class="sourceLineNo">115</span><a name="line.115"></a>
-<span class="sourceLineNo">116</span>        public Languages.LanguageSet getLanguages() {<a name="line.116"></a>
-<span class="sourceLineNo">117</span>            return this.languages;<a name="line.117"></a>
-<span class="sourceLineNo">118</span>        }<a name="line.118"></a>
-<span class="sourceLineNo">119</span><a name="line.119"></a>
-<span class="sourceLineNo">120</span>        @Override<a name="line.120"></a>
-<span class="sourceLineNo">121</span>        public Iterable&lt;Phoneme&gt; getPhonemes() {<a name="line.121"></a>
-<span class="sourceLineNo">122</span>            return Collections.singleton(this);<a name="line.122"></a>
-<span class="sourceLineNo">123</span>        }<a name="line.123"></a>
-<span class="sourceLineNo">124</span><a name="line.124"></a>
-<span class="sourceLineNo">125</span>        public CharSequence getPhonemeText() {<a name="line.125"></a>
-<span class="sourceLineNo">126</span>            return this.phonemeText;<a name="line.126"></a>
+<span class="sourceLineNo">055</span> * &lt;b&gt;Rules resources&lt;/b&gt;<a name="line.55"></a>
+<span class="sourceLineNo">056</span> * &lt;p&gt;<a name="line.56"></a>
+<span class="sourceLineNo">057</span> * Rules are typically loaded from resource files. These are UTF-8 encoded text files. They are systematically<a name="line.57"></a>
+<span class="sourceLineNo">058</span> * named following the pattern:<a name="line.58"></a>
+<span class="sourceLineNo">059</span> * &lt;blockquote&gt;org/apache/commons/codec/language/bm/${NameType#getName}_${RuleType#getName}_${language}.txt&lt;/blockquote&gt;<a name="line.59"></a>
+<span class="sourceLineNo">060</span> * &lt;p&gt;<a name="line.60"></a>
+<span class="sourceLineNo">061</span> * The format of these resources is the following:<a name="line.61"></a>
+<span class="sourceLineNo">062</span> * &lt;ul&gt;<a name="line.62"></a>
+<span class="sourceLineNo">063</span> * &lt;li&gt;&lt;b&gt;Rules:&lt;/b&gt; whitespace separated, double-quoted strings. There should be 4 columns to each row, and these<a name="line.63"></a>
+<span class="sourceLineNo">064</span> * will be interpreted as:<a name="line.64"></a>
+<span class="sourceLineNo">065</span> * &lt;ol&gt;<a name="line.65"></a>
+<span class="sourceLineNo">066</span> * &lt;li&gt;pattern&lt;/li&gt;<a name="line.66"></a>
+<span class="sourceLineNo">067</span> * &lt;li&gt;left context&lt;/li&gt;<a name="line.67"></a>
+<span class="sourceLineNo">068</span> * &lt;li&gt;right context&lt;/li&gt;<a name="line.68"></a>
+<span class="sourceLineNo">069</span> * &lt;li&gt;phoneme&lt;/li&gt;<a name="line.69"></a>
+<span class="sourceLineNo">070</span> * &lt;/ol&gt;<a name="line.70"></a>
+<span class="sourceLineNo">071</span> * &lt;/li&gt;<a name="line.71"></a>
+<span class="sourceLineNo">072</span> * &lt;li&gt;&lt;b&gt;End-of-line comments:&lt;/b&gt; Any occurrence of '//' will cause all text following on that line to be discarded<a name="line.72"></a>
+<span class="sourceLineNo">073</span> * as a comment.&lt;/li&gt;<a name="line.73"></a>
+<span class="sourceLineNo">074</span> * &lt;li&gt;&lt;b&gt;Multi-line comments:&lt;/b&gt; Any line starting with '/*' will start multi-line commenting mode. This will skip<a name="line.74"></a>
+<span class="sourceLineNo">075</span> * all content until a line ending in '*' and '/' is found.&lt;/li&gt;<a name="line.75"></a>
+<span class="sourceLineNo">076</span> * &lt;li&gt;&lt;b&gt;Blank lines:&lt;/b&gt; All blank lines will be skipped.&lt;/li&gt;<a name="line.76"></a>
+<span class="sourceLineNo">077</span> * &lt;/ul&gt;<a name="line.77"></a>
+<span class="sourceLineNo">078</span> *<a name="line.78"></a>
+<span class="sourceLineNo">079</span> * @since 1.6<a name="line.79"></a>
+<span class="sourceLineNo">080</span> * @version $Id: Rule.java 1544532 2013-11-22 13:38:35Z ggregory $<a name="line.80"></a>
+<span class="sourceLineNo">081</span> */<a name="line.81"></a>
+<span class="sourceLineNo">082</span>public class Rule {<a name="line.82"></a>
+<span class="sourceLineNo">083</span><a name="line.83"></a>
+<span class="sourceLineNo">084</span>    public static final class Phoneme implements PhonemeExpr {<a name="line.84"></a>
+<span class="sourceLineNo">085</span>        public static final Comparator&lt;Phoneme&gt; COMPARATOR = new Comparator&lt;Phoneme&gt;() {<a name="line.85"></a>
+<span class="sourceLineNo">086</span>            @Override<a name="line.86"></a>
+<span class="sourceLineNo">087</span>            public int compare(final Phoneme o1, final Phoneme o2) {<a name="line.87"></a>
+<span class="sourceLineNo">088</span>                for (int i = 0; i &lt; o1.phonemeText.length(); i++) {<a name="line.88"></a>
+<span class="sourceLineNo">089</span>                    if (i &gt;= o2.phonemeText.length()) {<a name="line.89"></a>
+<span class="sourceLineNo">090</span>                        return +1;<a name="line.90"></a>
+<span class="sourceLineNo">091</span>                    }<a name="line.91"></a>
+<span class="sourceLineNo">092</span>                    final int c = o1.phonemeText.charAt(i) - o2.phonemeText.charAt(i);<a name="line.92"></a>
+<span class="sourceLineNo">093</span>                    if (c != 0) {<a name="line.93"></a>
+<span class="sourceLineNo">094</span>                        return c;<a name="line.94"></a>
+<span class="sourceLineNo">095</span>                    }<a name="line.95"></a>
+<span class="sourceLineNo">096</span>                }<a name="line.96"></a>
+<span class="sourceLineNo">097</span><a name="line.97"></a>
+<span class="sourceLineNo">098</span>                if (o1.phonemeText.length() &lt; o2.phonemeText.length()) {<a name="line.98"></a>
+<span class="sourceLineNo">099</span>                    return -1;<a name="line.99"></a>
+<span class="sourceLineNo">100</span>                }<a name="line.100"></a>
+<span class="sourceLineNo">101</span><a name="line.101"></a>
+<span class="sourceLineNo">102</span>                return 0;<a name="line.102"></a>
+<span class="sourceLineNo">103</span>            }<a name="line.103"></a>
+<span class="sourceLineNo">104</span>        };<a name="line.104"></a>
+<span class="sourceLineNo">105</span><a name="line.105"></a>
+<span class="sourceLineNo">106</span>        private final StringBuilder phonemeText;<a name="line.106"></a>
+<span class="sourceLineNo">107</span>        private final Languages.LanguageSet languages;<a name="line.107"></a>
+<span class="sourceLineNo">108</span><a name="line.108"></a>
+<span class="sourceLineNo">109</span>        public Phoneme(final CharSequence phonemeText, final Languages.LanguageSet languages) {<a name="line.109"></a>
+<span class="sourceLineNo">110</span>            this.phonemeText = new StringBuilder(phonemeText);<a name="line.110"></a>
+<span class="sourceLineNo">111</span>            this.languages = languages;<a name="line.111"></a>
+<span class="sourceLineNo">112</span>        }<a name="line.112"></a>
+<span class="sourceLineNo">113</span><a name="line.113"></a>
+<span class="sourceLineNo">114</span>        public Phoneme(final Phoneme phonemeLeft, final Phoneme phonemeRight) {<a name="line.114"></a>
+<span class="sourceLineNo">115</span>            this(phonemeLeft.phonemeText, phonemeLeft.languages);<a name="line.115"></a>
+<span class="sourceLineNo">116</span>            this.phonemeText.append(phonemeRight.phonemeText);<a name="line.116"></a>
+<span class="sourceLineNo">117</span>        }<a name="line.117"></a>
+<span class="sourceLineNo">118</span><a name="line.118"></a>
+<span class="sourceLineNo">119</span>        public Phoneme(final Phoneme phonemeLeft, final Phoneme phonemeRight, final Languages.LanguageSet languages) {<a name="line.119"></a>
+<span class="sourceLineNo">120</span>            this(phonemeLeft.phonemeText, languages);<a name="line.120"></a>
+<span class="sourceLineNo">121</span>            this.phonemeText.append(phonemeRight.phonemeText);<a name="line.121"></a>
+<span class="sourceLineNo">122</span>        }<a name="line.122"></a>
+<span class="sourceLineNo">123</span><a name="line.123"></a>
+<span class="sourceLineNo">124</span>        public Phoneme append(final CharSequence str) {<a name="line.124"></a>
+<span class="sourceLineNo">125</span>            this.phonemeText.append(str);<a name="line.125"></a>
+<span class="sourceLineNo">126</span>            return this;<a name="line.126"></a>
 <span class="sourceLineNo">127</span>        }<a name="line.127"></a>
 <span class="sourceLineNo">128</span><a name="line.128"></a>
-<span class="sourceLineNo">129</span>        public Phoneme join(final Phoneme right) {<a name="line.129"></a>
-<span class="sourceLineNo">130</span>            return new Phoneme(this.phonemeText.toString() + right.phonemeText.toString(),<a name="line.130"></a>
-<span class="sourceLineNo">131</span>                               this.languages.restrictTo(right.languages));<a name="line.131"></a>
-<span class="sourceLineNo">132</span>        }<a name="line.132"></a>
-<span class="sourceLineNo">133</span>    }<a name="line.133"></a>
-<span class="sourceLineNo">134</span><a name="line.134"></a>
-<span class="sourceLineNo">135</span>    public interface PhonemeExpr {<a name="line.135"></a>
-<span class="sourceLineNo">136</span>        Iterable&lt;Phoneme&gt; getPhonemes();<a name="line.136"></a>
-<span class="sourceLineNo">137</span>    }<a name="line.137"></a>
-<span class="sourceLineNo">138</span><a name="line.138"></a>
-<span class="sourceLineNo">139</span>    public static final class PhonemeList implements PhonemeExpr {<a name="line.139"></a>
-<span class="sourceLineNo">140</span>        private final List&lt;Phoneme&gt; phonemes;<a name="line.140"></a>
+<span class="sourceLineNo">129</span>        public Languages.LanguageSet getLanguages() {<a name="line.129"></a>
+<span class="sourceLineNo">130</span>            return this.languages;<a name="line.130"></a>
+<span class="sourceLineNo">131</span>        }<a name="line.131"></a>
+<span class="sourceLineNo">132</span><a name="line.132"></a>
+<span class="sourceLineNo">133</span>        @Override<a name="line.133"></a>
+<span class="sourceLineNo">134</span>        public Iterable&lt;Phoneme&gt; getPhonemes() {<a name="line.134"></a>
+<span class="sourceLineNo">135</span>            return Collections.singleton(this);<a name="line.135"></a>
+<span class="sourceLineNo">136</span>        }<a name="line.136"></a>
+<span class="sourceLineNo">137</span><a name="line.137"></a>
+<span class="sourceLineNo">138</span>        public CharSequence getPhonemeText() {<a name="line.138"></a>
+<span class="sourceLineNo">139</span>            return this.phonemeText;<a name="line.139"></a>
+<span class="sourceLineNo">140</span>        }<a name="line.140"></a>
 <span class="sourceLineNo">141</span><a name="line.141"></a>
-<span class="sourceLineNo">142</span>        public PhonemeList(final List&lt;Phoneme&gt; phonemes) {<a name="line.142"></a>
-<span class="sourceLineNo">143</span>            this.phonemes = phonemes;<a name="line.143"></a>
-<span class="sourceLineNo">144</span>        }<a name="line.144"></a>
-<span class="sourceLineNo">145</span><a name="line.145"></a>
-<span class="sourceLineNo">146</span>        @Override<a name="line.146"></a>
-<span class="sourceLineNo">147</span>        public List&lt;Phoneme&gt; getPhonemes() {<a name="line.147"></a>
-<span class="sourceLineNo">148</span>            return this.phonemes;<a name="line.148"></a>
+<span class="sourceLineNo">142</span>        /**<a name="line.142"></a>
+<span class="sourceLineNo">143</span>         * @deprecated since 1.9<a name="line.143"></a>
+<span class="sourceLineNo">144</span>         */<a name="line.144"></a>
+<span class="sourceLineNo">145</span>        @Deprecated<a name="line.145"></a>
+<span class="sourceLineNo">146</span>        public Phoneme join(final Phoneme right) {<a name="line.146"></a>
+<span class="sourceLineNo">147</span>            return new Phoneme(this.phonemeText.toString() + right.phonemeText.toString(),<a name="line.147"></a>
+<span class="sourceLineNo">148</span>                               this.languages.restrictTo(right.languages));<a name="line.148"></a>
 <span class="sourceLineNo">149</span>        }<a name="line.149"></a>
 <span class="sourceLineNo">150</span>    }<a name="line.150"></a>
 <span class="sourceLineNo">151</span><a name="line.151"></a>
-<span class="sourceLineNo">152</span>    /**<a name="line.152"></a>
-<span class="sourceLineNo">153</span>     * A minimal wrapper around the functionality of Pattern that we use, to allow for alternate implementations.<a name="line.153"></a>
-<span class="sourceLineNo">154</span>     */<a name="line.154"></a>
-<span class="sourceLineNo">155</span>    public static interface RPattern {<a name="line.155"></a>
-<span class="sourceLineNo">156</span>        boolean isMatch(CharSequence input);<a name="line.156"></a>
-<span class="sourceLineNo">157</span>    }<a name="line.157"></a>
+<span class="sourceLineNo">152</span>    public interface PhonemeExpr {<a name="line.152"></a>
+<span class="sourceLineNo">153</span>        Iterable&lt;Phoneme&gt; getPhonemes();<a name="line.153"></a>
+<span class="sourceLineNo">154</span>    }<a name="line.154"></a>
+<span class="sourceLineNo">155</span><a name="line.155"></a>
+<span class="sourceLineNo">156</span>    public static final class PhonemeList implements PhonemeExpr {<a name="line.156"></a>
+<span class="sourceLineNo">157</span>        private final List&lt;Phoneme&gt; phonemes;<a name="line.157"></a>
 <span class="sourceLineNo">158</span><a name="line.158"></a>
-<span class="sourceLineNo">159</span>    public static final RPattern ALL_STRINGS_RMATCHER = new RPattern() {<a name="line.159"></a>
-<span class="sourceLineNo">160</span>        @Override<a name="line.160"></a>
-<span class="sourceLineNo">161</span>        public boolean isMatch(final CharSequence input) {<a name="line.161"></a>
-<span class="sourceLineNo">162</span>            return true;<a name="line.162"></a>
-<span class="sourceLineNo">163</span>        }<a name="line.163"></a>
-<span class="sourceLineNo">164</span>    };<a name="line.164"></a>
-<span class="sourceLineNo">165</span><a name="line.165"></a>
-<span class="sourceLineNo">166</span>    public static final String ALL = "ALL";<a name="line.166"></a>
-<span class="sourceLineNo">167</span><a name="line.167"></a>
-<span class="sourceLineNo">168</span>    private static final String DOUBLE_QUOTE = "\"";<a name="line.168"></a>
-<span class="sourceLineNo">169</span><a name="line.169"></a>
-<span class="sourceLineNo">170</span>    private static final String HASH_INCLUDE = "#include";<a name="line.170"></a>
-<span class="sourceLineNo">171</span><a name="line.171"></a>
-<span class="sourceLineNo">172</span>    private static final Map&lt;NameType, Map&lt;RuleType, Map&lt;String, List&lt;Rule&gt;&gt;&gt;&gt; RULES =<a name="line.172"></a>
-<span class="sourceLineNo">173</span>            new EnumMap&lt;NameType, Map&lt;RuleType, Map&lt;String, List&lt;Rule&gt;&gt;&gt;&gt;(NameType.class);<a name="line.173"></a>
-<span class="sourceLineNo">174</span><a name="line.174"></a>
-<span class="sourceLineNo">175</span>    static {<a name="line.175"></a>
-<span class="sourceLineNo">176</span>        for (final NameType s : NameType.values()) {<a name="line.176"></a>
-<span class="sourceLineNo">177</span>            final Map&lt;RuleType, Map&lt;String, List&lt;Rule&gt;&gt;&gt; rts =<a name="line.177"></a>
-<span class="sourceLineNo">178</span>                    new EnumMap&lt;RuleType, Map&lt;String, List&lt;Rule&gt;&gt;&gt;(RuleType.class);<a name="line.178"></a>
-<span class="sourceLineNo">179</span><a name="line.179"></a>
-<span class="sourceLineNo">180</span>            for (final RuleType rt : RuleType.values()) {<a name="line.180"></a>
-<span class="sourceLineNo">181</span>                final Map&lt;String, List&lt;Rule&gt;&gt; rs = new HashMap&lt;String, List&lt;Rule&gt;&gt;();<a name="line.181"></a>
+<span class="sourceLineNo">159</span>        public PhonemeList(final List&lt;Phoneme&gt; phonemes) {<a name="line.159"></a>
+<span class="sourceLineNo">160</span>            this.phonemes = phonemes;<a name="line.160"></a>
+<span class="sourceLineNo">161</span>        }<a name="line.161"></a>
+<span class="sourceLineNo">162</span><a name="line.162"></a>
+<span class="sourceLineNo">163</span>        @Override<a name="line.163"></a>
+<span class="sourceLineNo">164</span>        public List&lt;Phoneme&gt; getPhonemes() {<a name="line.164"></a>
+<span class="sourceLineNo">165</span>            return this.phonemes;<a name="line.165"></a>
+<span class="sourceLineNo">166</span>        }<a name="line.166"></a>
+<span class="sourceLineNo">167</span>    }<a name="line.167"></a>
+<span class="sourceLineNo">168</span><a name="line.168"></a>
+<span class="sourceLineNo">169</span>    /**<a name="line.169"></a>
+<span class="sourceLineNo">170</span>     * A minimal wrapper around the functionality of Pattern that we use, to allow for alternate implementations.<a name="line.170"></a>
+<span class="sourceLineNo">171</span>     */<a name="line.171"></a>
+<span class="sourceLineNo">172</span>    public interface RPattern {<a name="line.172"></a>
+<span class="sourceLineNo">173</span>        boolean isMatch(CharSequence input);<a name="line.173"></a>
+<span class="sourceLineNo">174</span>    }<a name="line.174"></a>
+<span class="sourceLineNo">175</span><a name="line.175"></a>
+<span class="sourceLineNo">176</span>    public static final RPattern ALL_STRINGS_RMATCHER = new RPattern() {<a name="line.176"></a>
+<span class="sourceLineNo">177</span>        @Override<a name="line.177"></a>
+<span class="sourceLineNo">178</span>        public boolean isMatch(final CharSequence input) {<a name="line.178"></a>
+<span class="sourceLineNo">179</span>            return true;<a name="line.179"></a>
+<span class="sourceLineNo">180</span>        }<a name="line.180"></a>
+<span class="sourceLineNo">181</span>    };<a name="line.181"></a>
 <span class="sourceLineNo">182</span><a name="line.182"></a>
-<span class="sourceLineNo">183</span>                final Languages ls = Languages.getInstance(s);<a name="line.183"></a>
-<span class="sourceLineNo">184</span>                for (final String l : ls.getLanguages()) {<a name="line.184"></a>
-<span class="sourceLineNo">185</span>                    try {<a name="line.185"></a>
-<span class="sourceLineNo">186</span>                        rs.put(l, parseRules(createScanner(s, rt, l), createResourceName(s, rt, l)));<a name="line.186"></a>
-<span class="sourceLineNo">187</span>                    } catch (final IllegalStateException e) {<a name="line.187"></a>
-<span class="sourceLineNo">188</span>                        throw new IllegalStateException("Problem processing " + createResourceName(s, rt, l), e);<a name="line.188"></a>
-<span class="sourceLineNo">189</span>                    }<a name="line.189"></a>
-<span class="sourceLineNo">190</span>                }<a name="line.190"></a>
-<span class="sourceLineNo">191</span>                if (!rt.equals(RuleType.RULES)) {<a name="line.191"></a>
-<span class="sourceLineNo">192</span>                    rs.put("common", parseRules(createScanner(s, rt, "common"), createResourceName(s, rt, "common")));<a name="line.192"></a>
-<span class="sourceLineNo">193</span>                }<a name="line.193"></a>
-<span class="sourceLineNo">194</span><a name="line.194"></a>
-<span class="sourceLineNo">195</span>                rts.put(rt, Collections.unmodifiableMap(rs));<a name="line.195"></a>
-<span class="sourceLineNo">196</span>            }<a name="line.196"></a>
-<span class="sourceLineNo">197</span><a name="line.197"></a>
-<span class="sourceLineNo">198</span>            RULES.put(s, Collections.unmodifiableMap(rts));<a name="line.198"></a>
-<span class="sourceLineNo">199</span>        }<a name="line.199"></a>
-<span class="sourceLineNo">200</span>    }<a name="line.200"></a>
-<span class="sourceLineNo">201</span><a name="line.201"></a>
-<span class="sourceLineNo">202</span>    private static boolean contains(final CharSequence chars, final char input) {<a name="line.202"></a>
-<span class="sourceLineNo">203</span>        for (int i = 0; i &lt; chars.length(); i++) {<a name="line.203"></a>
-<span class="sourceLineNo">204</span>            if (chars.charAt(i) == input) {<a name="line.204"></a>
-<span class="sourceLineNo">205</span>                return true;<a name="line.205"></a>
-<span class="sourceLineNo">206</span>            }<a name="line.206"></a>
-<span class="sourceLineNo">207</span>        }<a name="line.207"></a>
-<span class="sourceLineNo">208</span>        return false;<a name="line.208"></a>
-<span class="sourceLineNo">209</span>    }<a name="line.209"></a>
-<span class="sourceLineNo">210</span><a name="line.210"></a>
-<span class="sourceLineNo">211</span>    private static String createResourceName(final NameType nameType, final RuleType rt, final String lang) {<a name="line.211"></a>
-<span class="sourceLineNo">212</span>        return String.format("org/apache/commons/codec/language/bm/%s_%s_%s.txt",<a name="line.212"></a>
-<span class="sourceLineNo">213</span>                             nameType.getName(), rt.getName(), lang);<a name="line.213"></a>
-<span class="sourceLineNo">214</span>    }<a name="line.214"></a>
-<span class="sourceLineNo">215</span><a name="line.215"></a>
-<span class="sourceLineNo">216</span>    private static Scanner createScanner(final NameType nameType, final RuleType rt, final String lang) {<a name="line.216"></a>
-<span class="sourceLineNo">217</span>        final String resName = createResourceName(nameType, rt, lang);<a name="line.217"></a>
-<span class="sourceLineNo">218</span>        final InputStream rulesIS = Languages.class.getClassLoader().getResourceAsStream(resName);<a name="line.218"></a>
-<span class="sourceLineNo">219</span><a name="line.219"></a>
-<span class="sourceLineNo">220</span>        if (rulesIS == null) {<a name="line.220"></a>
-<span class="sourceLineNo">221</span>            throw new IllegalArgumentException("Unable to load resource: " + resName);<a name="line.221"></a>
-<span class="sourceLineNo">222</span>        }<a name="line.222"></a>
-<span class="sourceLineNo">223</span><a name="line.223"></a>
-<span class="sourceLineNo">224</span>        return new Scanner(rulesIS, ResourceConstants.ENCODING);<a name="line.224"></a>
-<span class="sourceLineNo">225</span>    }<a name="line.225"></a>
-<span class="sourceLineNo">226</span><a name="line.226"></a>
-<span class="sourceLineNo">227</span>    private static Scanner createScanner(final String lang) {<a name="line.227"></a>
-<span class="sourceLineNo">228</span>        final String resName = String.format("org/apache/commons/codec/language/bm/%s.txt", lang);<a name="line.228"></a>
-<span class="sourceLineNo">229</span>        final InputStream rulesIS = Languages.class.getClassLoader().getResourceAsStream(resName);<a name="line.229"></a>
-<span class="sourceLineNo">230</span><a name="line.230"></a>
-<span class="sourceLineNo">231</span>        if (rulesIS == null) {<a name="line.231"></a>
-<span class="sourceLineNo">232</span>            throw new IllegalArgumentException("Unable to load resource: " + resName);<a name="line.232"></a>
-<span class="sourceLineNo">233</span>        }<a name="line.233"></a>
-<span class="sourceLineNo">234</span><a name="line.234"></a>
-<span class="sourceLineNo">235</span>        return new Scanner(rulesIS, ResourceConstants.ENCODING);<a name="line.235"></a>
-<span class="sourceLineNo">236</span>    }<a name="line.236"></a>
-<span class="sourceLineNo">237</span><a name="line.237"></a>
-<span class="sourceLineNo">238</span>    private static boolean endsWith(final CharSequence input, final CharSequence suffix) {<a name="line.238"></a>
-<span class="sourceLineNo">239</span>        if (suffix.length() &gt; input.length()) {<a name="line.239"></a>
-<span class="sourceLineNo">240</span>            return false;<a name="line.240"></a>
-<span class="sourceLineNo">241</span>        }<a name="line.241"></a>
-<span class="sourceLineNo">242</span>        for (int i = input.length() - 1, j = suffix.length() - 1; j &gt;= 0; i--, j--) {<a name="line.242"></a>
-<span class="sourceLineNo">243</span>            if (input.charAt(i) != suffix.charAt(j)) {<a name="line.243"></a>
-<span class="sourceLineNo">244</span>                return false;<a name="line.244"></a>
-<span class="sourceLineNo">245</span>            }<a name="line.245"></a>
-<span class="sourceLineNo">246</span>        }<a name="line.246"></a>
-<span class="sourceLineNo">247</span>        return true;<a name="line.247"></a>
-<span class="sourceLineNo">248</span>    }<a name="line.248"></a>
-<span class="sourceLineNo">249</span><a name="line.249"></a>
-<span class="sourceLineNo">250</span>    /**<a name="line.250"></a>
-<span class="sourceLineNo">251</span>     * Gets rules for a combination of name type, rule type and languages.<a name="line.251"></a>
-<span class="sourceLineNo">252</span>     *<a name="line.252"></a>
-<span class="sourceLineNo">253</span>     * @param nameType<a name="line.253"></a>
-<span class="sourceLineNo">254</span>     *            the NameType to consider<a name="line.254"></a>
-<span class="sourceLineNo">255</span>     * @param rt<a name="line.255"></a>
-<span class="sourceLineNo">256</span>     *            the RuleType to consider<a name="line.256"></a>
-<span class="sourceLineNo">257</span>     * @param langs<a name="line.257"></a>
-<span class="sourceLineNo">258</span>     *            the set of languages to consider<a name="line.258"></a>
-<span class="sourceLineNo">259</span>     * @return a list of Rules that apply<a name="line.259"></a>
-<span class="sourceLineNo">260</span>     */<a name="line.260"></a>
-<span class="sourceLineNo">261</span>    public static List&lt;Rule&gt; getInstance(final NameType nameType, final RuleType rt,<a name="line.261"></a>
-<span class="sourceLineNo">262</span>                                         final Languages.LanguageSet langs) {<a name="line.262"></a>
-<span class="sourceLineNo">263</span>        return langs.isSingleton() ? getInstance(nameType, rt, langs.getAny()) :<a name="line.263"></a>
-<span class="sourceLineNo">264</span>                                     getInstance(nameType, rt, Languages.ANY);<a name="line.264"></a>
+<span class="sourceLineNo">183</span>    public static final String ALL = "ALL";<a name="line.183"></a>
+<span class="sourceLineNo">184</span><a name="line.184"></a>
+<span class="sourceLineNo">185</span>    private static final String DOUBLE_QUOTE = "\"";<a name="line.185"></a>
+<span class="sourceLineNo">186</span><a name="line.186"></a>
+<span class="sourceLineNo">187</span>    private static final String HASH_INCLUDE = "#include";<a name="line.187"></a>
+<span class="sourceLineNo">188</span><a name="line.188"></a>
+<span class="sourceLineNo">189</span>    private static final Map&lt;NameType, Map&lt;RuleType, Map&lt;String, Map&lt;String, List&lt;Rule&gt;&gt;&gt;&gt;&gt; RULES =<a name="line.189"></a>
+<span class="sourceLineNo">190</span>            new EnumMap&lt;NameType, Map&lt;RuleType, Map&lt;String, Map&lt;String, List&lt;Rule&gt;&gt;&gt;&gt;&gt;(NameType.class);<a name="line.190"></a>
+<span class="sourceLineNo">191</span><a name="line.191"></a>
+<span class="sourceLineNo">192</span>    static {<a name="line.192"></a>
+<span class="sourceLineNo">193</span>        for (final NameType s : NameType.values()) {<a name="line.193"></a>
+<span class="sourceLineNo">194</span>            final Map&lt;RuleType, Map&lt;String, Map&lt;String, List&lt;Rule&gt;&gt;&gt;&gt; rts =<a name="line.194"></a>
+<span class="sourceLineNo">195</span>                    new EnumMap&lt;RuleType, Map&lt;String, Map&lt;String, List&lt;Rule&gt;&gt;&gt;&gt;(RuleType.class);<a name="line.195"></a>
+<span class="sourceLineNo">196</span><a name="line.196"></a>
+<span class="sourceLineNo">197</span>            for (final RuleType rt : RuleType.values()) {<a name="line.197"></a>
+<span class="sourceLineNo">198</span>                final Map&lt;String, Map&lt;String, List&lt;Rule&gt;&gt;&gt; rs = new HashMap&lt;String, Map&lt;String, List&lt;Rule&gt;&gt;&gt;();<a name="line.198"></a>
+<span class="sourceLineNo">199</span><a name="line.199"></a>
+<span class="sourceLineNo">200</span>                final Languages ls = Languages.getInstance(s);<a name="line.200"></a>
+<span class="sourceLineNo">201</span>                for (final String l : ls.getLanguages()) {<a name="line.201"></a>
+<span class="sourceLineNo">202</span>                    try {<a name="line.202"></a>
+<span class="sourceLineNo">203</span>                        rs.put(l, parseRules(createScanner(s, rt, l), createResourceName(s, rt, l)));<a name="line.203"></a>
+<span class="sourceLineNo">204</span>                    } catch (final IllegalStateException e) {<a name="line.204"></a>
+<span class="sourceLineNo">205</span>                        throw new IllegalStateException("Problem processing " + createResourceName(s, rt, l), e);<a name="line.205"></a>
+<span class="sourceLineNo">206</span>                    }<a name="line.206"></a>
+<span class="sourceLineNo">207</span>                }<a name="line.207"></a>
+<span class="sourceLineNo">208</span>                if (!rt.equals(RuleType.RULES)) {<a name="line.208"></a>
+<span class="sourceLineNo">209</span>                    rs.put("common", parseRules(createScanner(s, rt, "common"), createResourceName(s, rt, "common")));<a name="line.209"></a>
+<span class="sourceLineNo">210</span>                }<a name="line.210"></a>
+<span class="sourceLineNo">211</span><a name="line.211"></a>
+<span class="sourceLineNo">212</span>                rts.put(rt, Collections.unmodifiableMap(rs));<a name="line.212"></a>
+<span class="sourceLineNo">213</span>            }<a name="line.213"></a>
+<span class="sourceLineNo">214</span><a name="line.214"></a>
+<span class="sourceLineNo">215</span>            RULES.put(s, Collections.unmodifiableMap(rts));<a name="line.215"></a>
+<span class="sourceLineNo">216</span>        }<a name="line.216"></a>
+<span class="sourceLineNo">217</span>    }<a name="line.217"></a>
+<span class="sourceLineNo">218</span><a name="line.218"></a>
+<span class="sourceLineNo">219</span>    private static boolean contains(final CharSequence chars, final char input) {<a name="line.219"></a>
+<span class="sourceLineNo">220</span>        for (int i = 0; i &lt; chars.length(); i++) {<a name="line.220"></a>
+<span class="sourceLineNo">221</span>            if (chars.charAt(i) == input) {<a name="line.221"></a>
+<span class="sourceLineNo">222</span>                return true;<a name="line.222"></a>
+<span class="sourceLineNo">223</span>            }<a name="line.223"></a>
+<span class="sourceLineNo">224</span>        }<a name="line.224"></a>
+<span class="sourceLineNo">225</span>        return false;<a name="line.225"></a>
+<span class="sourceLineNo">226</span>    }<a name="line.226"></a>
+<span class="sourceLineNo">227</span><a name="line.227"></a>
+<span class="sourceLineNo">228</span>    private static String createResourceName(final NameType nameType, final RuleType rt, final String lang) {<a name="line.228"></a>
+<span class="sourceLineNo">229</span>        return String.format("org/apache/commons/codec/language/bm/%s_%s_%s.txt",<a name="line.229"></a>
+<span class="sourceLineNo">230</span>                             nameType.getName(), rt.getName(), lang);<a name="line.230"></a>
+<span class="sourceLineNo">231</span>    }<a name="line.231"></a>
+<span class="sourceLineNo">232</span><a name="line.232"></a>
+<span class="sourceLineNo">233</span>    private static Scanner createScanner(final NameType nameType, final RuleType rt, final String lang) {<a name="line.233"></a>
+<span class="sourceLineNo">234</span>        final String resName = createResourceName(nameType, rt, lang);<a name="line.234"></a>
+<span class="sourceLineNo">235</span>        final InputStream rulesIS = Languages.class.getClassLoader().getResourceAsStream(resName);<a name="line.235"></a>
+<span class="sourceLineNo">236</span><a name="line.236"></a>
+<span class="sourceLineNo">237</span>        if (rulesIS == null) {<a name="line.237"></a>
+<span class="sourceLineNo">238</span>            throw new IllegalArgumentException("Unable to load resource: " + resName);<a name="line.238"></a>
+<span class="sourceLineNo">239</span>        }<a name="line.239"></a>
+<span class="sourceLineNo">240</span><a name="line.240"></a>
+<span class="sourceLineNo">241</span>        return new Scanner(rulesIS, ResourceConstants.ENCODING);<a name="line.241"></a>
+<span class="sourceLineNo">242</span>    }<a name="line.242"></a>
+<span class="sourceLineNo">243</span><a name="line.243"></a>
+<span class="sourceLineNo">244</span>    private static Scanner createScanner(final String lang) {<a name="line.244"></a>
+<span class="sourceLineNo">245</span>        final String resName = String.format("org/apache/commons/codec/language/bm/%s.txt", lang);<a name="line.245"></a>
+<span class="sourceLineNo">246</span>        final InputStream rulesIS = Languages.class.getClassLoader().getResourceAsStream(resName);<a name="line.246"></a>
+<span class="sourceLineNo">247</span><a name="line.247"></a>
+<span class="sourceLineNo">248</span>        if (rulesIS == null) {<a name="line.248"></a>
+<span class="sourceLineNo">249</span>            throw new IllegalArgumentException("Unable to load resource: " + resName);<a name="line.249"></a>
+<span class="sourceLineNo">250</span>        }<a name="line.250"></a>
+<span class="sourceLineNo">251</span><a name="line.251"></a>
+<span class="sourceLineNo">252</span>        return new Scanner(rulesIS, ResourceConstants.ENCODING);<a name="line.252"></a>
+<span class="sourceLineNo">253</span>    }<a name="line.253"></a>
+<span class="sourceLineNo">254</span><a name="line.254"></a>
+<span class="sourceLineNo">255</span>    private static boolean endsWith(final CharSequence input, final CharSequence suffix) {<a name="line.255"></a>
+<span class="sourceLineNo">256</span>        if (suffix.length() &gt; input.length()) {<a name="line.256"></a>
+<span class="sourceLineNo">257</span>            return false;<a name="line.257"></a>
+<span class="sourceLineNo">258</span>        }<a name="line.258"></a>
+<span class="sourceLineNo">259</span>        for (int i = input.length() - 1, j = suffix.length() - 1; j &gt;= 0; i--, j--) {<a name="line.259"></a>
+<span class="sourceLineNo">260</span>            if (input.charAt(i) != suffix.charAt(j)) {<a name="line.260"></a>
+<span class="sourceLineNo">261</span>                return false;<a name="line.261"></a>
+<span class="sourceLineNo">262</span>            }<a name="line.262"></a>
+<span class="sourceLineNo">263</span>        }<a name="line.263"></a>
+<span class="sourceLineNo">264</span>        return true;<a name="line.264"></a>
 <span class="sourceLineNo">265</span>    }<a name="line.265"></a>
 <span class="sourceLineNo">266</span><a name="line.266"></a>
 <span class="sourceLineNo">267</span>    /**<a name="line.267"></a>
-<span class="sourceLineNo">268</span>     * Gets rules for a combination of name type, rule type and a single language.<a name="line.268"></a>
+<span class="sourceLineNo">268</span>     * Gets rules for a combination of name type, rule type and languages.<a name="line.268"></a>
 <span class="sourceLineNo">269</span>     *<a name="line.269"></a>
 <span class="sourceLineNo">270</span>     * @param nameType<a name="line.270"></a>
 <span class="sourceLineNo">271</span>     *            the NameType to consider<a name="line.271"></a>
 <span class="sourceLineNo">272</span>     * @param rt<a name="line.272"></a>
 <span class="sourceLineNo">273</span>     *            the RuleType to consider<a name="line.273"></a>
-<span class="sourceLineNo">274</span>     * @param lang<a name="line.274"></a>
-<span class="sourceLineNo">275</span>     *            the language to consider<a name="line.275"></a>
-<span class="sourceLineNo">276</span>     * @return a list rules for a combination of name type, rule type and a single language.<a name="line.276"></a>
+<span class="sourceLineNo">274</span>     * @param langs<a name="line.274"></a>
+<span class="sourceLineNo">275</span>     *            the set of languages to consider<a name="line.275"></a>
+<span class="sourceLineNo">276</span>     * @return a list of Rules that apply<a name="line.276"></a>
 <span class="sourceLineNo">277</span>     */<a name="line.277"></a>
-<span class="sourceLineNo">278</span>    public static List&lt;Rule&gt; getInstance(final NameType nameType, final RuleType rt, final String lang) {<a name="line.278"></a>
-<span class="sourceLineNo">279</span>        final List&lt;Rule&gt; rules = RULES.get(nameType).get(rt).get(lang);<a name="line.279"></a>
-<span class="sourceLineNo">280</span><a name="line.280"></a>
-<span class="sourceLineNo">281</span>        if (rules == null) {<a name="line.281"></a>
-<span class="sourceLineNo">282</span>            throw new IllegalArgumentException(String.format("No rules found for %s, %s, %s.",<a name="line.282"></a>
-<span class="sourceLineNo">283</span>                                               nameType.getName(), rt.getName(), lang));<a name="line.283"></a>
+<span class="sourceLineNo">278</span>    public static List&lt;Rule&gt; getInstance(final NameType nameType, final RuleType rt,<a name="line.278"></a>
+<span class="sourceLineNo">279</span>                                         final Languages.LanguageSet langs) {<a name="line.279"></a>
+<span class="sourceLineNo">280</span>        final Map&lt;String, List&lt;Rule&gt;&gt; ruleMap = getInstanceMap(nameType, rt, langs);<a name="line.280"></a>
+<span class="sourceLineNo">281</span>        final List&lt;Rule&gt; allRules = new ArrayList&lt;Rule&gt;();<a name="line.281"></a>
+<span class="sourceLineNo">282</span>        for (final List&lt;Rule&gt; rules : ruleMap.values()) {<a name="line.282"></a>
+<span class="sourceLineNo">283</span>            allRules.addAll(rules);<a name="line.283"></a>
 <span class="sourceLineNo">284</span>        }<a name="line.284"></a>
-<span class="sourceLineNo">285</span><a name="line.285"></a>
-<span class="sourceLineNo">286</span>        return rules;<a name="line.286"></a>
-<span class="sourceLineNo">287</span>    }<a name="line.287"></a>
-<span class="sourceLineNo">288</span><a name="line.288"></a>
-<span class="sourceLineNo">289</span>    private static Phoneme parsePhoneme(final String ph) {<a name="line.289"></a>
-<span class="sourceLineNo">290</span>        final int open = ph.indexOf("[");<a name="line.290"></a>
-<span class="sourceLineNo">291</span>        if (open &gt;= 0) {<a name="line.291"></a>
-<span class="sourceLineNo">292</span>            if (!ph.endsWith("]")) {<a name="line.292"></a>
-<span class="sourceLineNo">293</span>                throw new IllegalArgumentException("Phoneme expression contains a '[' but does not end in ']'");<a name="line.293"></a>
-<span class="sourceLineNo">294</span>            }<a name="line.294"></a>
-<span class="sourceLineNo">295</span>            final String before = ph.substring(0, open);<a name="line.295"></a>
-<span class="sourceLineNo">296</span>            final String in = ph.substring(open + 1, ph.length() - 1);<a name="line.296"></a>
-<span class="sourceLineNo">297</span>            final Set&lt;String&gt; langs = new HashSet&lt;String&gt;(Arrays.asList(in.split("[+]")));<a name="line.297"></a>
-<span class="sourceLineNo">298</span><a name="line.298"></a>
-<span class="sourceLineNo">299</span>            return new Phoneme(before, Languages.LanguageSet.from(langs));<a name="line.299"></a>
-<span class="sourceLineNo">300</span>        } else {<a name="line.300"></a>
-<span class="sourceLineNo">301</span>            return new Phoneme(ph, Languages.ANY_LANGUAGE);<a name="line.301"></a>
-<span class="sourceLineNo">302</span>        }<a name="line.302"></a>
-<span class="sourceLineNo">303</span>    }<a name="line.303"></a>
-<span class="sourceLineNo">304</span><a name="line.304"></a>
-<span class="sourceLineNo">305</span>    private static PhonemeExpr parsePhonemeExpr(final String ph) {<a name="line.305"></a>
-<span class="sourceLineNo">306</span>        if (ph.startsWith("(")) { // we have a bracketed list of options<a name="line.306"></a>
-<span class="sourceLineNo">307</span>            if (!ph.endsWith(")")) {<a name="line.307"></a>
-<span class="sourceLineNo">308</span>                throw new IllegalArgumentException("Phoneme starts with '(' so must end with ')'");<a name="line.308"></a>
-<span class="sourceLineNo">309</span>            }<a name="line.309"></a>
-<span class="sourceLineNo">310</span><a name="line.310"></a>
-<span class="sourceLineNo">311</span>            final List&lt;Phoneme&gt; phs = new ArrayList&lt;Phoneme&gt;();<a name="line.311"></a>
-<span class="sourceLineNo">312</span>            final String body = ph.substring(1, ph.length() - 1);<a name="line.312"></a>
-<span class="sourceLineNo">313</span>            for (final String part : body.split("[|]")) {<a name="line.313"></a>
-<span class="sourceLineNo">314</span>                phs.add(parsePhoneme(part));<a name="line.314"></a>
-<span class="sourceLineNo">315</span>            }<a name="line.315"></a>
-<span class="sourceLineNo">316</span>            if (body.startsWith("|") || body.endsWith("|")) {<a name="line.316"></a>
-<span class="sourceLineNo">317</span>                phs.add(new Phoneme("", Languages.ANY_LANGUAGE));<a name="line.317"></a>
-<span class="sourceLineNo">318</span>            }<a name="line.318"></a>
-<span class="sourceLineNo">319</span><a name="line.319"></a>
-<span class="sourceLineNo">320</span>            return new PhonemeList(phs);<a name="line.320"></a>
-<span class="sourceLineNo">321</span>        } else {<a name="line.321"></a>
-<span class="sourceLineNo">322</span>            return parsePhoneme(ph);<a name="line.322"></a>
-<span class="sourceLineNo">323</span>        }<a name="line.323"></a>
-<span class="sourceLineNo">324</span>    }<a name="line.324"></a>
-<span class="sourceLineNo">325</span><a name="line.325"></a>
-<span class="sourceLineNo">326</span>    private static List&lt;Rule&gt; parseRules(final Scanner scanner, final String location) {<a name="line.326"></a>
-<span class="sourceLineNo">327</span>        final List&lt;Rule&gt; lines = new ArrayList&lt;Rule&gt;();<a name="line.327"></a>
-<span class="sourceLineNo">328</span>        int currentLine = 0;<a name="line.328"></a>
-<span class="sourceLineNo">329</span><a name="line.329"></a>
-<span class="sourceLineNo">330</span>        boolean inMultilineComment = false;<a name="line.330"></a>
-<span class="sourceLineNo">331</span>        while (scanner.hasNextLine()) {<a name="line.331"></a>
-<span class="sourceLineNo">332</span>            currentLine++;<a name="line.332"></a>
-<span class="sourceLineNo">333</span>            final String rawLine = scanner.nextLine();<a name="line.333"></a>
-<span class="sourceLineNo">334</span>            String line = rawLine;<a name="line.334"></a>
-<span class="sourceLineNo">335</span><a name="line.335"></a>
-<span class="sourceLineNo">336</span>            if (inMultilineComment) {<a name="line.336"></a>
-<span class="sourceLineNo">337</span>                if (line.endsWith(ResourceConstants.EXT_CMT_END)) {<a name="line.337"></a>
-<span class="sourceLineNo">338</span>                    inMultilineComment = false;<a name="line.338"></a>
-<span class="sourceLineNo">339</span>                }<a name="line.339"></a>
-<span class="sourceLineNo">340</span>            } else {<a name="line.340"></a>
-<span class="sourceLineNo">341</span>                if (line.startsWith(ResourceConstants.EXT_CMT_START)) {<a name="line.341"></a>
-<span class="sourceLineNo">342</span>                    inMultilineComment = true;<a name="line.342"></a>
-<span class="sourceLineNo">343</span>                } else {<a name="line.343"></a>
-<span class="sourceLineNo">344</span>                    // discard comments<a name="line.344"></a>
-<span class="sourceLineNo">345</span>                    final int cmtI = line.indexOf(ResourceConstants.CMT);<a name="line.345"></a>
-<span class="sourceLineNo">346</span>                    if (cmtI &gt;= 0) {<a name="line.346"></a>
-<span class="sourceLineNo">347</span>                        line = line.substring(0, cmtI);<a name="line.347"></a>
-<span class="sourceLineNo">348</span>                    }<a name="line.348"></a>
-<span class="sourceLineNo">349</span><a name="line.349"></a>
-<span class="sourceLineNo">350</span>                    // trim leading-trailing whitespace<a name="line.350"></a>
-<span class="sourceLineNo">351</span>                    line = line.trim();<a name="line.351"></a>
-<span class="sourceLineNo">352</span><a name="line.352"></a>
-<span class="sourceLineNo">353</span>                    if (line.length() == 0) {<a name="line.353"></a>
-<span class="sourceLineNo">354</span>                        continue; // empty lines can be safely skipped<a name="line.354"></a>
-<span class="sourceLineNo">355</span>                    }<a name="line.355"></a>
-<span class="sourceLineNo">356</span><a name="line.356"></a>
-<span class="sourceLineNo">357</span>                    if (line.startsWith(HASH_INCLUDE)) {<a name="line.357"></a>
-<span class="sourceLineNo">358</span>                        // include statement<a name="line.358"></a>
-<span class="sourceLineNo">359</span>                        final String incl = line.substring(HASH_INCLUDE.length()).trim();<a name="line.359"></a>
-<span class="sourceLineNo">360</span>                        if (incl.contains(" ")) {<a name="line.360"></a>
-<span class="sourceLineNo">361</span>                            throw new IllegalArgumentException("Malformed import statement '" + rawLine + "' in " +<a name="line.361"></a>
-<span class="sourceLineNo">362</span>                                                               location);<a name="line.362"></a>
-<span class="sourceLineNo">363</span>                        } else {<a name="line.363"></a>
-<span class="sourceLineNo">364</span>                            lines.addAll(parseRules(createScanner(incl), location + "-&gt;" + incl));<a name="line.364"></a>
-<span class="sourceLineNo">365</span>                        }<a name="line.365"></a>
-<span class="sourceLineNo">366</span>                    } else {<a name="line.366"></a>
-<span class="sourceLineNo">367</span>                        // rule<a name="line.367"></a>
-<span class="sourceLineNo">368</span>                        final String[] parts = line.split("\\s+");<a name="line.368"></a>
-<span class="sourceLineNo">369</span>                        if (parts.length != 4) {<a name="line.369"></a>
-<span class="sourceLineNo">370</span>                            throw new IllegalArgumentException("Malformed rule statement split into " + parts.length +<a name="line.370"></a>
-<span class="sourceLineNo">371</span>                                                               " parts: " + rawLine + " in " + location);<a name="line.371"></a>
-<span class="sourceLineNo">372</span>                        } else {<a name="line.372"></a>
-<span class="sourceLineNo">373</span>                            try {<a name="line.373"></a>
-<span class="sourceLineNo">374</span>                                final String pat = stripQuotes(parts[0]);<a name="line.374"></a>
-<span class="sourceLineNo">375</span>                                final String lCon = stripQuotes(parts[1]);<a name="line.375"></a>
-<span class="sourceLineNo">376</span>                                final String rCon = stripQuotes(parts[2]);<a name="line.376"></a>
-<span class="sourceLineNo">377</span>                                final PhonemeExpr ph = parsePhonemeExpr(stripQuotes(parts[3]));<a name="line.377"></a>
-<span class="sourceLineNo">378</span>                                final int cLine = currentLine;<a name="line.378"></a>
-<span class="sourceLineNo">379</span>                                final Rule r = new Rule(pat, lCon, rCon, ph) {<a name="line.379"></a>
-<span class="sourceLineNo">380</span>                                    private final int myLine = cLine;<a name="line.380"></a>
-<span class="sourceLineNo">381</span>                                    private final String loc = location;<a name="line.381"></a>
-<span class="sourceLineNo">382</span><a name="line.382"></a>
-<span class="sourceLineNo">383</span>                                    @Override<a name="line.383"></a>
-<span class="sourceLineNo">384</span>                                    public String toString() {<a name="line.384"></a>
-<span class="sourceLineNo">385</span>                                        final StringBuilder sb = new StringBuilder();<a name="line.385"></a>
-<span class="sourceLineNo">386</span>                                        sb.append("Rule");<a name="line.386"></a>
-<span class="sourceLineNo">387</span>                                        sb.append("{line=").append(myLine);<a name="line.387"></a>
-<span class="sourceLineNo">388</span>                                        sb.append(", loc='").append(loc).append('\'');<a name="line.388"></a>
-<span class="sourceLineNo">389</span>                                        sb.append('}');<a name="line.389"></a>
-<span class="sourceLineNo">390</span>                                        return sb.toString();<a name="line.390"></a>
-<span class="sourceLineNo">391</span>                                    }<a name="line.391"></a>
-<span class="sourceLineNo">392</span>                                };<a name="line.392"></a>
-<span class="sourceLineNo">393</span>                                lines.add(r);<a name="line.393"></a>
-<span class="sourceLineNo">394</span>                            } catch (final IllegalArgumentException e) {<a name="line.394"></a>
-<span class="sourceLineNo">395</span>                                throw new IllegalStateException("Problem parsing line '" + currentLine + "' in " +<a name="line.395"></a>
-<span class="sourceLineNo">396</span>                                                                location, e);<a name="line.396"></a>
-<span class="sourceLineNo">397</span>                            }<a name="line.397"></a>
-<span class="sourceLineNo">398</span>                        }<a name="line.398"></a>
-<span class="sourceLineNo">399</span>                    }<a name="line.399"></a>
-<span class="sourceLineNo">400</span>                }<a name="line.400"></a>
-<span class="sourceLineNo">401</span>            }<a name="line.401"></a>
-<span class="sourceLineNo">402</span>        }<a name="line.402"></a>
-<span class="sourceLineNo">403</span><a name="line.403"></a>
-<span class="sourceLineNo">404</span>        return lines;<a name="line.404"></a>
-<span class="sourceLineNo">405</span>    }<a name="line.405"></a>
-<span class="sourceLineNo">406</span><a name="line.406"></a>
-<span class="sourceLineNo">407</span>    /**<a name="line.407"></a>
-<span class="sourceLineNo">408</span>     * Attempts to compile the regex into direct string ops, falling back to Pattern and Matcher in the worst case.<a name="line.408"></a>
-<span class="sourceLineNo">409</span>     *<a name="line.409"></a>
-<span class="sourceLineNo">410</span>     * @param regex<a name="line.410"></a>
-<span class="sourceLineNo">411</span>     *            the regular expression to compile<a name="line.411"></a>
-<span class="sourceLineNo">412</span>     * @return an RPattern that will match this regex<a name="line.412"></a>
-<span class="sourceLineNo">413</span>     */<a name="line.413"></a>
-<span class="sourceLineNo">414</span>    private static RPattern pattern(final String regex) {<a name="line.414"></a>
-<span class="sourceLineNo">415</span>        final boolean startsWith = regex.startsWith("^");<a name="line.415"></a>
-<span class="sourceLineNo">416</span>        final boolean endsWith = regex.endsWith("$");<a name="line.416"></a>
-<span class="sourceLineNo">417</span>        final String content = regex.substring(startsWith ? 1 : 0, endsWith ? regex.length() - 1 : regex.length());<a name="line.417"></a>
-<span class="sourceLineNo">418</span>        final boolean boxes = content.contains("[");<a name="line.418"></a>
-<span class="sourceLineNo">419</span><a name="line.419"></a>
-<span class="sourceLineNo">420</span>        if (!boxes) {<a name="line.420"></a>
-<span class="sourceLineNo">421</span>            if (startsWith &amp;&amp; endsWith) {<a name="line.421"></a>
-<span class="sourceLineNo">422</span>                // exact match<a name="line.422"></a>
-<span class="sourceLineNo">423</span>                if (content.length() == 0) {<a name="line.423"></a>
-<span class="sourceLineNo">424</span>                    // empty<a name="line.424"></a>
-<span class="sourceLineNo">425</span>                    return new RPattern() {<a name="line.425"></a>
-<span class="sourceLineNo">426</span>                        @Override<a name="line.426"></a>
-<span class="sourceLineNo">427</span>                        public boolean isMatch(final CharSequence input) {<a name="line.427"></a>
-<span class="sourceLineNo">428</span>                            return input.length() == 0;<a name="line.428"></a>
-<span class="sourceLineNo">429</span>                        }<a name="line.429"></a>
-<span class="sourceLineNo">430</span>                    };<a name="line.430"></a>
-<span class="sourceLineNo">431</span>                } else {<a name="line.431"></a>
-<span class="sourceLineNo">432</span>                    return new RPattern() {<a name="line.432"></a>
-<span class="sourceLineNo">433</span>                        @Override<a name="line.433"></a>
-<span class="sourceLineNo">434</span>                        public boolean isMatch(final CharSequence input) {<a name="line.434"></a>
-<span class="sourceLineNo">435</span>                            return input.equals(content);<a name="line.435"></a>
-<span class="sourceLineNo">436</span>                        }<a name="line.436"></a>
-<span class="sourceLineNo">437</span>                    };<a name="line.437"></a>
-<span class="sourceLineNo">438</span>                }<a name="line.438"></a>
-<span class="sourceLineNo">439</span>            } else if ((startsWith || endsWith) &amp;&amp; content.length() == 0) {<a name="line.439"></a>
-<span class="sourceLineNo">440</span>                // matches every string<a name="line.440"></a>
-<span class="sourceLineNo">441</span>                return ALL_STRINGS_RMATCHER;<a name="line.441"></a>
-<span class="sourceLineNo">442</span>            } else if (startsWith) {<a name="line.442"></a>
-<span class="sourceLineNo">443</span>                // matches from start<a name="line.443"></a>
-<span class="sourceLineNo">444</span>                return new RPattern() {<a name="line.444"></a>
-<span class="sourceLineNo">445</span>                    @Override<a name="line.445"></a>
-<span class="sourceLineNo">446</span>                    public boolean isMatch(final CharSequence input) {<a name="line.446"></a>
-<span class="sourceLineNo">447</span>                        return startsWith(input, content);<a name="line.447"></a>
-<span class="sourceLineNo">448</span>                    }<a name="line.448"></a>
-<span class="sourceLineNo">449</span>                };<a name="line.449"></a>
-<span class="sourceLineNo">450</span>            } else if (endsWith) {<a name="line.450"></a>
-<span class="sourceLineNo">451</span>                // matches from start<a name="line.451"></a>
-<span class="sourceLineNo">452</span>                return new RPattern() {<a name="line.452"></a>
-<span class="sourceLineNo">453</span>                    @Override<a name="line.453"></a>
-<span class="sourceLineNo">454</span>                    public boolean isMatch(final CharSequence input) {<a name="line.454"></a>
-<span class="sourceLineNo">455</span>                        return endsWith(input, content);<a name="line.455"></a>
-<span class="sourceLineNo">456</span>                    }<a name="line.456"></a>
-<span class="sourceLineNo">457</span>                };<a name="line.457"></a>
-<span class="sourceLineNo">458</span>            }<a name="line.458"></a>
-<span class="sourceLineNo">459</span>        } else {<a name="line.459"></a>
-<span class="sourceLineNo">460</span>            final boolean startsWithBox = content.startsWith("[");<a name="line.460"></a>
-<span class="sourceLineNo">461</span>            final boolean endsWithBox = content.endsWith("]");<a name="line.461"></a>
-<span class="sourceLineNo">462</span><a name="line.462"></a>
-<span class="sourceLineNo">463</span>            if (startsWithBox &amp;&amp; endsWithBox) {<a name="line.463"></a>
-<span class="sourceLineNo">464</span>                String boxContent = content.substring(1, content.length() - 1);<a name="line.464"></a>
-<span class="sourceLineNo">465</span>                if (!boxContent.contains("[")) {<a name="line.465"></a>
-<span class="sourceLineNo">466</span>                    // box containing alternatives<a name="line.466"></a>
-<span class="sourceLineNo">467</span>                    final boolean negate = boxContent.startsWith("^");<a name="line.467"></a>
-<span class="sourceLineNo">468</span>                    if (negate) {<a name="line.468"></a>
-<span class="sourceLineNo">469</span>                        boxContent = boxContent.substring(1);<a name="line.469"></a>
-<span class="sourceLineNo">470</span>                    }<a name="line.470"></a>
-<span class="sourceLineNo">471</span>                    final String bContent = boxContent;<a name="line.471"></a>
-<span class="sourceLineNo">472</span>                    final boolean shouldMatch = !negate;<a name="line.472"></a>
-<span class="sourceLineNo">473</span><a name="line.473"></a>
-<span class="sourceLineNo">474</span>                    if (startsWith &amp;&amp; endsWith) {<a name="line.474"></a>
-<span class="sourceLineNo">475</span>                        // exact match<a name="line.475"></a>
-<span class="sourceLineNo">476</span>                        return new RPattern() {<a name="line.476"></a>
-<span class="sourceLineNo">477</span>                            @Override<a name="line.477"></a>
-<span class="sourceLineNo">478</span>                            public boolean isMatch(final CharSequence input) {<a name="line.478"></a>
-<span class="sourceLineNo">479</span>                                return input.length() == 1 &amp;&amp; contains(bContent, input.charAt(0)) == shouldMatch;<a name="line.479"></a>
-<span class="sourceLineNo">480</span>                            }<a name="line.480"></a>
-<span class="sourceLineNo">481</span>                        };<a name="line.481"></a>
-<span class="sourceLineNo">482</span>                    } else if (startsWith) {<a name="line.482"></a>
-<span class="sourceLineNo">483</span>                        // first char<a name="line.483"></a>
-<span class="sourceLineNo">484</span>                        return new RPattern() {<a name="line.484"></a>
-<span class="sourceLineNo">485</span>                            @Override<a name="line.485"></a>
-<span class="sourceLineNo">486</span>                            public boolean isMatch(final CharSequence input) {<a name="line.486"></a>
-<span class="sourceLineNo">487</span>                                return input.length() &gt; 0 &amp;&amp; contains(bContent, input.charAt(0)) == shouldMatch;<a name="line.487"></a>
-<span class="sourceLineNo">488</span>                            }<a name="line.488"></a>
-<span class="sourceLineNo">489</span>                        };<a name="line.489"></a>
-<span class="sourceLineNo">490</span>                    } else if (endsWith) {<a name="line.490"></a>
-<span class="sourceLineNo">491</span>                        // last char<a name="line.491"></a>
-<span class="sourceLineNo">492</span>                        return new RPattern() {<a name="line.492"></a>
-<span class="sourceLineNo">493</span>                            @Override<a name="line.493"></a>
-<span class="sourceLineNo">494</span>                            public boolean isMatch(final CharSequence input) {<a name="line.494"></a>
-<span class="sourceLineNo">495</span>                                return input.length() &gt; 0 &amp;&amp;<a name="line.495"></a>
-<span class="sourceLineNo">496</span>                                       contains(bContent, input.charAt(input.length() - 1)) == shouldMatch;<a name="line.496"></a>
-<span class="sourceLineNo">497</span>                            }<a name="line.497"></a>
-<span class="sourceLineNo">498</span>                        };<a name="line.498"></a>
-<span class="sourceLineNo">499</span>                    }<a name="line.499"></a>
+<span class="sourceLineNo">285</span>        return allRules;<a name="line.285"></a>
+<span class="sourceLineNo">286</span>    }<a name="line.286"></a>
+<span class="sourceLineNo">287</span><a name="line.287"></a>
+<span class="sourceLineNo">288</span>    /**<a name="line.288"></a>
+<span class="sourceLineNo">289</span>     * Gets rules for a combination of name type, rule type and a single language.<a name="line.289"></a>
+<span class="sourceLineNo">290</span>     *<a name="line.290"></a>
+<span class="sourceLineNo">291</span>     * @param nameType<a name="line.291"></a>
+<span class="sourceLineNo">292</span>     *            the NameType to consider<a name="line.292"></a>
+<span class="sourceLineNo">293</span>     * @param rt<a name="line.293"></a>
+<span class="sourceLineNo">294</span>     *            the RuleType to consider<a name="line.294"></a>
+<span class="sourceLineNo">295</span>     * @param lang<a name="line.295"></a>
+<span class="sourceLineNo">296</span>     *            the language to consider<a name="line.296"></a>
+<span class="sourceLineNo">297</span>     * @return a list of Rules that apply<a name="line.297"></a>
+<span class="sourceLineNo">298</span>     */<a name="line.298"></a>
+<span class="sourceLineNo">299</span>    public static List&lt;Rule&gt; getInstance(final NameType nameType, final RuleType rt, final String lang) {<a name="line.299"></a>
+<span class="sourceLineNo">300</span>        return getInstance(nameType, rt, LanguageSet.from(new HashSet&lt;String&gt;(Arrays.asList(lang))));<a name="line.300"></a>
+<span class="sourceLineNo">301</span>    }<a name="line.301"></a>
+<span class="sourceLineNo">302</span><a name="line.302"></a>
+<span class="sourceLineNo">303</span>    /**<a name="line.303"></a>
+<span class="sourceLineNo">304</span>     * Gets rules for a combination of name type, rule type and languages.<a name="line.304"></a>
+<span class="sourceLineNo">305</span>     *<a name="line.305"></a>
+<span class="sourceLineNo">306</span>     * @param nameType<a name="line.306"></a>
+<span class="sourceLineNo">307</span>     *            the NameType to consider<a name="line.307"></a>
+<span class="sourceLineNo">308</span>     * @param rt<a name="line.308"></a>
+<span class="sourceLineNo">309</span>     *            the RuleType to consider<a name="line.309"></a>
+<span class="sourceLineNo">310</span>     * @param langs<a name="line.310"></a>
+<span class="sourceLineNo">311</span>     *            the set of languages to consider<a name="line.311"></a>
+<span class="sourceLineNo">312</span>     * @return a map containing all Rules that apply, grouped by the first character of the rule pattern<a name="line.312"></a>
+<span class="sourceLineNo">313</span>     * @since 1.9<a name="line.313"></a>
+<span class="sourceLineNo">314</span>     */<a name="line.314"></a>
+<span class="sourceLineNo">315</span>    public static Map&lt;String, List&lt;Rule&gt;&gt; getInstanceMap(final NameType nameType, final RuleType rt,<a name="line.315"></a>
+<span class="sourceLineNo">316</span>                                                         final Languages.LanguageSet langs) {<a name="line.316"></a>
+<span class="sourceLineNo">317</span>        return langs.isSingleton() ? getInstanceMap(nameType, rt, langs.getAny()) :<a name="line.317"></a>
+<span class="sourceLineNo">318</span>                                     getInstanceMap(nameType, rt, Languages.ANY);<a name="line.318"></a>
+<span class="sourceLineNo">319</span>    }<a name="line.319"></a>
+<span class="sourceLineNo">320</span><a name="line.320"></a>
+<span class="sourceLineNo">321</span>    /**<a name="line.321"></a>
+<span class="sourceLineNo">322</span>     * Gets rules for a combination of name type, rule type and a single language.<a name="line.322"></a>
+<span class="sourceLineNo">323</span>     *<a name="line.323"></a>
+<span class="sourceLineNo">324</span>     * @param nameType<a name="line.324"></a>
+<span class="sourceLineNo">325</span>     *            the NameType to consider<a name="line.325"></a>
+<span class="sourceLineNo">326</span>     * @param rt<a name="line.326"></a>
+<span class="sourceLineNo">327</span>     *            the RuleType to consider<a name="line.327"></a>
+<span class="sourceLineNo">328</span>     * @param lang<a name="line.328"></a>
+<span class="sourceLineNo">329</span>     *            the language to consider<a name="line.329"></a>
+<span class="sourceLineNo">330</span>     * @return a map containing all Rules that apply, grouped by the first character of the rule pattern<a name="line.330"></a>
+<span class="sourceLineNo">331</span>     * @since 1.9<a name="line.331"></a>
+<span class="sourceLineNo">332</span>     */<a name="line.332"></a>
+<span class="sourceLineNo">333</span>    public static Map&lt;String, List&lt;Rule&gt;&gt; getInstanceMap(final NameType nameType, final RuleType rt,<a name="line.333"></a>
+<span class="sourceLineNo">334</span>                                                         final String lang) {<a name="line.334"></a>
+<span class="sourceLineNo">335</span>        final Map&lt;String, List&lt;Rule&gt;&gt; rules = RULES.get(nameType).get(rt).get(lang);<a name="line.335"></a>
+<span class="sourceLineNo">336</span><a name="line.336"></a>
+<span class="sourceLineNo">337</span>        if (rules == null) {<a name="line.337"></a>
+<span class="sourceLineNo">338</span>            throw new IllegalArgumentException(String.format("No rules found for %s, %s, %s.",<a name="line.338"></a>
+<span class="sourceLineNo">339</span>                                               nameType.getName(), rt.getName(), lang));<a name="line.339"></a>
+<span class="sourceLineNo">340</span>        }<a name="line.340"></a>
+<span class="sourceLineNo">341</span><a name="line.341"></a>
+<span class="sourceLineNo">342</span>        return rules;<a name="line.342"></a>
+<span class="sourceLineNo">343</span>    }<a name="line.343"></a>
+<span class="sourceLineNo">344</span><a name="line.344"></a>
+<span class="sourceLineNo">345</span>    private static Phoneme parsePhoneme(final String ph) {<a name="line.345"></a>
+<span class="sourceLineNo">346</span>        final int open = ph.indexOf("[");<a name="line.346"></a>
+<span class="sourceLineNo">347</span>        if (open &gt;= 0) {<a name="line.347"></a>
+<span class="sourceLineNo">348</span>            if (!ph.endsWith("]")) {<a name="line.348"></a>
+<span class="sourceLineNo">349</span>                throw new IllegalArgumentException("Phoneme expression contains a '[' but does not end in ']'");<a name="line.349"></a>
+<span class="sourceLineNo">350</span>            }<a name="line.350"></a>
+<span class="sourceLineNo">351</span>            final String before = ph.substring(0, open);<a name="line.351"></a>
+<span class="sourceLineNo">352</span>            final String in = ph.substring(open + 1, ph.length() - 1);<a name="line.352"></a>
+<span class="sourceLineNo">353</span>            final Set&lt;String&gt; langs = new HashSet&lt;String&gt;(Arrays.asList(in.split("[+]")));<a name="line.353"></a>
+<span class="sourceLineNo">354</span><a name="line.354"></a>
+<span class="sourceLineNo">355</span>            return new Phoneme(before, Languages.LanguageSet.from(langs));<a name="line.355"></a>
+<span class="sourceLineNo">356</span>        } else {<a name="line.356"></a>
+<span class="sourceLineNo">357</span>            return new Phoneme(ph, Languages.ANY_LANGUAGE);<a name="line.357"></a>
+<span class="sourceLineNo">358</span>        }<a name="line.358"></a>
+<span class="sourceLineNo">359</span>    }<a name="line.359"></a>
+<span class="sourceLineNo">360</span><a name="line.360"></a>
+<span class="sourceLineNo">361</span>    private static PhonemeExpr parsePhonemeExpr(final String ph) {<a name="line.361"></a>
+<span class="sourceLineNo">362</span>        if (ph.startsWith("(")) { // we have a bracketed list of options<a name="line.362"></a>
+<span class="sourceLineNo">363</span>            if (!ph.endsWith(")")) {<a name="line.363"></a>
+<span class="sourceLineNo">364</span>                throw new IllegalArgumentException("Phoneme starts with '(' so must end with ')'");<a name="line.364"></a>
+<span class="sourceLineNo">365</span>            }<a name="line.365"></a>
+<span class="sourceLineNo">366</span><a name="line.366"></a>
+<span class="sourceLineNo">367</span>            final List&lt;Phoneme&gt; phs = new ArrayList&lt;Phoneme&gt;();<a name="line.367"></a>
+<span class="sourceLineNo">368</span>            final String body = ph.substring(1, ph.length() - 1);<a name="line.368"></a>
+<span class="sourceLineNo">369</span>            for (final String part : body.split("[|]")) {<a name="line.369"></a>
+<span class="sourceLineNo">370</span>                phs.add(parsePhoneme(part));<a name="line.370"></a>
+<span class="sourceLineNo">371</span>            }<a name="line.371"></a>
+<span class="sourceLineNo">372</span>            if (body.startsWith("|") || body.endsWith("|")) {<a name="line.372"></a>
+<span class="sourceLineNo">373</span>                phs.add(new Phoneme("", Languages.ANY_LANGUAGE));<a name="line.373"></a>
+<span class="sourceLineNo">374</span>            }<a name="line.374"></a>
+<span class="sourceLineNo">375</span><a name="line.375"></a>
+<span class="sourceLineNo">376</span>            return new PhonemeList(phs);<a name="line.376"></a>
+<span class="sourceLineNo">377</span>        } else {<a name="line.377"></a>
+<span class="sourceLineNo">378</span>            return parsePhoneme(ph);<a name="line.378"></a>
+<span class="sourceLineNo">379</span>        }<a name="line.379"></a>
+<span class="sourceLineNo">380</span>    }<a name="line.380"></a>
+<span class="sourceLineNo">381</span><a name="line.381"></a>
+<span class="sourceLineNo">382</span>    private static Map&lt;String, List&lt;Rule&gt;&gt; parseRules(final Scanner scanner, final String location) {<a name="line.382"></a>
+<span class="sourceLineNo">383</span>        final Map&lt;String, List&lt;Rule&gt;&gt; lines = new HashMap&lt;String, List&lt;Rule&gt;&gt;();<a name="line.383"></a>
+<span class="sourceLineNo">384</span>        int currentLine = 0;<a name="line.384"></a>
+<span class="sourceLineNo">385</span><a name="line.385"></a>
+<span class="sourceLineNo">386</span>        boolean inMultilineComment = false;<a name="line.386"></a>
+<span class="sourceLineNo">387</span>        while (scanner.hasNextLine()) {<a name="line.387"></a>
+<span class="sourceLineNo">388</span>            currentLine++;<a name="line.388"></a>
+<span class="sourceLineNo">389</span>            final String rawLine = scanner.nextLine();<a name="line.389"></a>
+<span class="sourceLineNo">390</span>            String line = rawLine;<a name="line.390"></a>
+<span class="sourceLineNo">391</span><a name="line.391"></a>
+<span class="sourceLineNo">392</span>            if (inMultilineComment) {<a name="line.392"></a>
+<span class="sourceLineNo">393</span>                if (line.endsWith(ResourceConstants.EXT_CMT_END)) {<a name="line.393"></a>
+<span class="sourceLineNo">394</span>                    inMultilineComment = false;<a name="line.394"></a>
+<span class="sourceLineNo">395</span>                }<a name="line.395"></a>
+<span class="sourceLineNo">396</span>            } else {<a name="line.396"></a>
+<span class="sourceLineNo">397</span>                if (line.startsWith(ResourceConstants.EXT_CMT_START)) {<a name="line.397"></a>
+<span class="sourceLineNo">398</span>                    inMultilineComment = true;<a name="line.398"></a>
+<span class="sourceLineNo">399</span>                } else {<a name="line.399"></a>
+<span class="sourceLineNo">400</span>                    // discard comments<a name="line.400"></a>
+<span class="sourceLineNo">401</span>                    final int cmtI = line.indexOf(ResourceConstants.CMT);<a name="line.401"></a>
+<span class="sourceLineNo">402</span>                    if (cmtI &gt;= 0) {<a name="line.402"></a>
+<span class="sourceLineNo">403</span>                        line = line.substring(0, cmtI);<a name="line.403"></a>
+<span class="sourceLineNo">404</span>                    }<a name="line.404"></a>
+<span class="sourceLineNo">405</span><a name="line.405"></a>
+<span class="sourceLineNo">406</span>                    // trim leading-trailing whitespace<a name="line.406"></a>
+<span class="sourceLineNo">407</span>                    line = line.trim();<a name="line.407"></a>
+<span class="sourceLineNo">408</span><a name="line.408"></a>
+<span class="sourceLineNo">409</span>                    if (line.length() == 0) {<a name="line.409"></a>
+<span class="sourceLineNo">410</span>                        continue; // empty lines can be safely skipped<a name="line.410"></a>
+<span class="sourceLineNo">411</span>                    }<a name="line.411"></a>
+<span class="sourceLineNo">412</span><a name="line.412"></a>
+<span class="sourceLineNo">413</span>                    if (line.startsWith(HASH_INCLUDE)) {<a name="line.413"></a>
+<span class="sourceLineNo">414</span>                        // include statement<a name="line.414"></a>
+<span class="sourceLineNo">415</span>                        final String incl = line.substring(HASH_INCLUDE.length()).trim();<a name="line.415"></a>
+<span class="sourceLineNo">416</span>                        if (incl.contains(" ")) {<a name="line.416"></a>
+<span class="sourceLineNo">417</span>                            throw new IllegalArgumentException("Malformed import statement '" + rawLine + "' in " +<a name="line.417"></a>
+<span class="sourceLineNo">418</span>                                                               location);<a name="line.418"></a>
+<span class="sourceLineNo">419</span>                        } else {<a name="line.419"></a>
+<span class="sourceLineNo">420</span>                            lines.putAll(parseRules(createScanner(incl), location + "-&gt;" + incl));<a name="line.420"></a>
+<span class="sourceLineNo">421</span>                        }<a name="line.421"></a>
+<span class="sourceLineNo">422</span>                    } else {<a name="line.422"></a>
+<span class="sourceLineNo">423</span>                        // rule<a name="line.423"></a>
+<span class="sourceLineNo">424</span>                        final String[] parts = line.split("\\s+");<a name="line.424"></a>
+<span class="sourceLineNo">425</span>                        if (parts.length != 4) {<a name="line.425"></a>
+<span class="sourceLineNo">426</span>                            throw new IllegalArgumentException("Malformed rule statement split into " + parts.length +<a name="line.426"></a>
+<span class="sourceLineNo">427</span>                                                               " parts: " + rawLine + " in " + location);<a name="line.427"></a>
+<span class="sourceLineNo">428</span>                        } else {<a name="line.428"></a>
+<span class="sourceLineNo">429</span>                            try {<a name="line.429"></a>
+<span class="sourceLineNo">430</span>                                final String pat = stripQuotes(parts[0]);<a name="line.430"></a>
+<span class="sourceLineNo">431</span>                                final String lCon = stripQuotes(parts[1]);<a name="line.431"></a>
+<span class="sourceLineNo">432</span>                                final String rCon = stripQuotes(parts[2]);<a name="line.432"></a>
+<span class="sourceLineNo">433</span>                                final PhonemeExpr ph = parsePhonemeExpr(stripQuotes(parts[3]));<a name="line.433"></a>
+<span class="sourceLineNo">434</span>                                final int cLine = currentLine;<a name="line.434"></a>
+<span class="sourceLineNo">435</span>                                final Rule r = new Rule(pat, lCon, rCon, ph) {<a name="line.435"></a>
+<span class="sourceLineNo">436</span>                                    private final int myLine = cLine;<a name="line.436"></a>
+<span class="sourceLineNo">437</span>                                    private final String loc = location;<a name="line.437"></a>
+<span class="sourceLineNo">438</span><a name="line.438"></a>
+<span class="sourceLineNo">439</span>                                    @Override<a name="line.439"></a>
+<span class="sourceLineNo">440</span>                                    public String toString() {<a name="line.440"></a>
+<span class="sourceLineNo">441</span>                                        final StringBuilder sb = new StringBuilder();<a name="line.441"></a>
+<span class="sourceLineNo">442</span>                                        sb.append("Rule");<a name="line.442"></a>
+<span class="sourceLineNo">443</span>                                        sb.append("{line=").append(myLine);<a name="line.443"></a>

[... 391 lines stripped ...]