summaryrefslogtreecommitdiff
path: root/doc/api/morfologik/tools/MorphEncoder.html
diff options
context:
space:
mode:
Diffstat (limited to 'doc/api/morfologik/tools/MorphEncoder.html')
-rw-r--r--doc/api/morfologik/tools/MorphEncoder.html584
1 files changed, 584 insertions, 0 deletions
diff --git a/doc/api/morfologik/tools/MorphEncoder.html b/doc/api/morfologik/tools/MorphEncoder.html
new file mode 100644
index 0000000..fc9fd18
--- /dev/null
+++ b/doc/api/morfologik/tools/MorphEncoder.html
@@ -0,0 +1,584 @@
+<!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01 Transitional//EN" "http://www.w3.org/TR/html4/loose.dtd">
+<!--NewPage-->
+<HTML>
+<HEAD>
+<!-- Generated by javadoc (build 1.6.0_14) on Wed Jan 26 18:49:38 CET 2011 -->
+<TITLE>
+MorphEncoder
+</TITLE>
+
+<META NAME="date" CONTENT="2011-01-26">
+
+<LINK REL ="stylesheet" TYPE="text/css" HREF="../../stylesheet.css" TITLE="Style">
+
+<SCRIPT type="text/javascript">
+function windowTitle()
+{
+ if (location.href.indexOf('is-external=true') == -1) {
+ parent.document.title="MorphEncoder";
+ }
+}
+</SCRIPT>
+<NOSCRIPT>
+</NOSCRIPT>
+
+</HEAD>
+
+<BODY BGCOLOR="white" onload="windowTitle();">
+<HR>
+
+
+<!-- ========= START OF TOP NAVBAR ======= -->
+<A NAME="navbar_top"><!-- --></A>
+<A HREF="#skip-navbar_top" title="Skip navigation links"></A>
+<TABLE BORDER="0" WIDTH="100%" CELLPADDING="1" CELLSPACING="0" SUMMARY="">
+<TR>
+<TD COLSPAN=2 BGCOLOR="#EEEEFF" CLASS="NavBarCell1">
+<A NAME="navbar_top_firstrow"><!-- --></A>
+<TABLE BORDER="0" CELLPADDING="0" CELLSPACING="3" SUMMARY="">
+ <TR ALIGN="center" VALIGN="top">
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="../../overview-summary.html"><FONT CLASS="NavBarFont1"><B>Overview</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="package-summary.html"><FONT CLASS="NavBarFont1"><B>Package</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#FFFFFF" CLASS="NavBarCell1Rev"> &nbsp;<FONT CLASS="NavBarFont1Rev"><B>Class</B></FONT>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="package-tree.html"><FONT CLASS="NavBarFont1"><B>Tree</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="../../deprecated-list.html"><FONT CLASS="NavBarFont1"><B>Deprecated</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="../../index-all.html"><FONT CLASS="NavBarFont1"><B>Index</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="../../help-doc.html"><FONT CLASS="NavBarFont1"><B>Help</B></FONT></A>&nbsp;</TD>
+ </TR>
+</TABLE>
+</TD>
+<TD ALIGN="right" VALIGN="top" ROWSPAN=3><EM>
+</EM>
+</TD>
+</TR>
+
+<TR>
+<TD BGCOLOR="white" CLASS="NavBarCell2"><FONT SIZE="-2">
+&nbsp;<A HREF="../../morfologik/tools/Launcher.html" title="class in morfologik.tools"><B>PREV CLASS</B></A>&nbsp;
+&nbsp;<A HREF="../../morfologik/tools/WriterMessageLogger.html" title="class in morfologik.tools"><B>NEXT CLASS</B></A></FONT></TD>
+<TD BGCOLOR="white" CLASS="NavBarCell2"><FONT SIZE="-2">
+ <A HREF="../../index.html?morfologik/tools/MorphEncoder.html" target="_top"><B>FRAMES</B></A> &nbsp;
+&nbsp;<A HREF="MorphEncoder.html" target="_top"><B>NO FRAMES</B></A> &nbsp;
+&nbsp;<SCRIPT type="text/javascript">
+ <!--
+ if(window==top) {
+ document.writeln('<A HREF="../../allclasses-noframe.html"><B>All Classes</B></A>');
+ }
+ //-->
+</SCRIPT>
+<NOSCRIPT>
+ <A HREF="../../allclasses-noframe.html"><B>All Classes</B></A>
+</NOSCRIPT>
+
+
+</FONT></TD>
+</TR>
+<TR>
+<TD VALIGN="top" CLASS="NavBarCell3"><FONT SIZE="-2">
+ SUMMARY:&nbsp;NESTED&nbsp;|&nbsp;FIELD&nbsp;|&nbsp;<A HREF="#constructor_summary">CONSTR</A>&nbsp;|&nbsp;<A HREF="#method_summary">METHOD</A></FONT></TD>
+<TD VALIGN="top" CLASS="NavBarCell3"><FONT SIZE="-2">
+DETAIL:&nbsp;FIELD&nbsp;|&nbsp;<A HREF="#constructor_detail">CONSTR</A>&nbsp;|&nbsp;<A HREF="#method_detail">METHOD</A></FONT></TD>
+</TR>
+</TABLE>
+<A NAME="skip-navbar_top"></A>
+<!-- ========= END OF TOP NAVBAR ========= -->
+
+<HR>
+<!-- ======== START OF CLASS DATA ======== -->
+<H2>
+<FONT SIZE="-1">
+morfologik.tools</FONT>
+<BR>
+Class MorphEncoder</H2>
+<PRE>
+java.lang.Object
+ <IMG SRC="../../resources/inherit.gif" ALT="extended by "><B>morfologik.tools.MorphEncoder</B>
+</PRE>
+<HR>
+<DL>
+<DT><PRE>public final class <B>MorphEncoder</B><DT>extends java.lang.Object</DL>
+</PRE>
+
+<P>
+A class that converts tabular data to fsa morphological format. Three formats
+ are supported:
+ <ul>
+ <li><b>standard</b>, see <A HREF="../../morfologik/tools/MorphEncoder.html#standardEncode(byte[], byte[], byte[])"><CODE>standardEncode(byte[], byte[], byte[])</CODE></A></li>
+ <li><b>prefix</b>, see <A HREF="../../morfologik/tools/MorphEncoder.html#prefixEncode(byte[], byte[], byte[])"><CODE>prefixEncode(byte[], byte[], byte[])</CODE></A></li>
+ <li><b>infix</b>, see <A HREF="../../morfologik/tools/MorphEncoder.html#infixEncode(byte[], byte[], byte[])"><CODE>infixEncode(byte[], byte[], byte[])</CODE></A></li>
+ </ul>
+<P>
+
+<P>
+<HR>
+
+<P>
+
+<!-- ======== CONSTRUCTOR SUMMARY ======== -->
+
+<A NAME="constructor_summary"><!-- --></A>
+<TABLE BORDER="1" WIDTH="100%" CELLPADDING="3" CELLSPACING="0" SUMMARY="">
+<TR BGCOLOR="#CCCCFF" CLASS="TableHeadingColor">
+<TH ALIGN="left" COLSPAN="2"><FONT SIZE="+2">
+<B>Constructor Summary</B></FONT></TH>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#MorphEncoder()">MorphEncoder</A></B>()</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;</TD>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#MorphEncoder(byte)">MorphEncoder</A></B>(byte&nbsp;annotationSeparator)</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;</TD>
+</TR>
+</TABLE>
+&nbsp;
+<!-- ========== METHOD SUMMARY =========== -->
+
+<A NAME="method_summary"><!-- --></A>
+<TABLE BORDER="1" WIDTH="100%" CELLPADDING="3" CELLSPACING="0" SUMMARY="">
+<TR BGCOLOR="#CCCCFF" CLASS="TableHeadingColor">
+<TH ALIGN="left" COLSPAN="2"><FONT SIZE="+2">
+<B>Method Summary</B></FONT></TH>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD ALIGN="right" VALIGN="top" WIDTH="1%"><FONT SIZE="-1">
+<CODE>protected static&nbsp;java.lang.String</CODE></FONT></TD>
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#asString(byte[], java.lang.String)">asString</A></B>(byte[]&nbsp;str,
+ java.lang.String&nbsp;encoding)</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;Converts a byte array to a Java String using the given encoding.</TD>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD ALIGN="right" VALIGN="top" WIDTH="1%"><FONT SIZE="-1">
+<CODE>static&nbsp;int</CODE></FONT></TD>
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#commonPrefix(byte[], byte[])">commonPrefix</A></B>(byte[]&nbsp;s1,
+ byte[]&nbsp;s2)</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;</TD>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD ALIGN="right" VALIGN="top" WIDTH="1%"><FONT SIZE="-1">
+<CODE>&nbsp;byte[]</CODE></FONT></TD>
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#infixEncode(byte[], byte[], byte[])">infixEncode</A></B>(byte[]&nbsp;wordForm,
+ byte[]&nbsp;wordLemma,
+ byte[]&nbsp;wordTag)</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;This method converts wordForm, wordLemma and the tag to the form:
+
+ inflected_form + MLKending + tags
+
+
+ where '+' is a separator, M is the position of characters to be deleted
+ towards the beginning of the inflected form ("A" means from the
+ beginning, "B" from the second character, "C" - from the third one, and
+ so on), L is the number of characters to be deleted from the position
+ specified by M ("A" means none, "B" means one, "C" - 2, etc.), K is a
+ character that specifies how many characters should be deleted from the
+ end of the inflected form to produce the lexeme by concatenating the
+ stripped string with the ending ("A" means none, "B" - 1, "C" - 2, and so
+ on).</TD>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD ALIGN="right" VALIGN="top" WIDTH="1%"><FONT SIZE="-1">
+<CODE>&nbsp;java.lang.String</CODE></FONT></TD>
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#infixEncodeUTF8(java.lang.String, java.lang.String, java.lang.String)">infixEncodeUTF8</A></B>(java.lang.String&nbsp;wordForm,
+ java.lang.String&nbsp;wordLemma,
+ java.lang.String&nbsp;wordTag)</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;A UTF-8 variant of <A HREF="../../morfologik/tools/MorphEncoder.html#infixEncode(byte[], byte[], byte[])"><CODE>infixEncode(byte[], byte[], byte[])</CODE></A>.</TD>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD ALIGN="right" VALIGN="top" WIDTH="1%"><FONT SIZE="-1">
+<CODE>&nbsp;byte[]</CODE></FONT></TD>
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#prefixEncode(byte[], byte[], byte[])">prefixEncode</A></B>(byte[]&nbsp;wordForm,
+ byte[]&nbsp;wordLemma,
+ byte[]&nbsp;wordTag)</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;This method converts wordForm, wordLemma and the tag to the form:
+
+
+
+ inflected_form + LKending + tags
+
+
+ where '+' is a separator, L is the number of characters to be deleted
+ from the beginning of the word ("A" means none, "B" means one, "C" - 2,
+ etc.), K is a character that specifies how many characters should be
+ deleted from the end of the inflected form to produce the lexeme by
+ concatenating the stripped string with the ending ("A" means none,
+ "B" - 1, "C" - 2, and so on).</TD>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD ALIGN="right" VALIGN="top" WIDTH="1%"><FONT SIZE="-1">
+<CODE>&nbsp;java.lang.String</CODE></FONT></TD>
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#prefixEncodeUTF8(java.lang.String, java.lang.String, java.lang.String)">prefixEncodeUTF8</A></B>(java.lang.String&nbsp;wordForm,
+ java.lang.String&nbsp;wordLemma,
+ java.lang.String&nbsp;wordTag)</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;A UTF-8 variant of <A HREF="../../morfologik/tools/MorphEncoder.html#prefixEncode(byte[], byte[], byte[])"><CODE>prefixEncode(byte[], byte[], byte[])</CODE></A>. This
+ method converts wordForm, wordLemma and the tag to the form:
+
+ inflected_form + LKending + tags
+
+
+ where '+' is a separator, L is the number of characters to be deleted
+ from the beginning of the word ("A" means none, "B" means one, "C" - 2,
+ etc.), K is a character that specifies how many characters should be
+ deleted from the end of the inflected form to produce the lexeme by
+ concatenating the stripped string with the ending ("A" means none,
+ "B" - 1, "C" - 2, and so on).</TD>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD ALIGN="right" VALIGN="top" WIDTH="1%"><FONT SIZE="-1">
+<CODE>&nbsp;byte[]</CODE></FONT></TD>
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#standardEncode(byte[], byte[], byte[])">standardEncode</A></B>(byte[]&nbsp;wordForm,
+ byte[]&nbsp;wordLemma,
+ byte[]&nbsp;wordTag)</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;This method converts the wordForm, wordLemma and tag to the form:
+
+
+ wordForm + Kending + tags
+
+
+ where '+' is a separator, K is a character that specifies how many
+ characters should be deleted from the end of the inflected form to
+ produce the lexeme by concatenating the stripped string with the ending.</TD>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD ALIGN="right" VALIGN="top" WIDTH="1%"><FONT SIZE="-1">
+<CODE>&nbsp;java.lang.String</CODE></FONT></TD>
+<TD><CODE><B><A HREF="../../morfologik/tools/MorphEncoder.html#standardEncodeUTF8(java.lang.String, java.lang.String, java.lang.String)">standardEncodeUTF8</A></B>(java.lang.String&nbsp;wordForm,
+ java.lang.String&nbsp;wordLemma,
+ java.lang.String&nbsp;wordTag)</CODE>
+
+<BR>
+&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;&nbsp;A UTF-8 variant of <A HREF="../../morfologik/tools/MorphEncoder.html#standardEncode(byte[], byte[], byte[])"><CODE>standardEncode(byte[], byte[], byte[])</CODE></A>. This
+ method converts the wordForm, wordLemma and tag to the form:
+
+
+ wordForm + Kending + tags
+
+
+ where '+' is a separator, K is a character that specifies how many
+ characters should be deleted from the end of the inflected form to
+ produce the lexeme by concatenating the stripped string with the ending.</TD>
+</TR>
+</TABLE>
+&nbsp;<A NAME="methods_inherited_from_class_java.lang.Object"><!-- --></A>
+<TABLE BORDER="1" WIDTH="100%" CELLPADDING="3" CELLSPACING="0" SUMMARY="">
+<TR BGCOLOR="#EEEEFF" CLASS="TableSubHeadingColor">
+<TH ALIGN="left"><B>Methods inherited from class java.lang.Object</B></TH>
+</TR>
+<TR BGCOLOR="white" CLASS="TableRowColor">
+<TD><CODE>clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait</CODE></TD>
+</TR>
+</TABLE>
+&nbsp;
+<P>
+
+<!-- ========= CONSTRUCTOR DETAIL ======== -->
+
+<A NAME="constructor_detail"><!-- --></A>
+<TABLE BORDER="1" WIDTH="100%" CELLPADDING="3" CELLSPACING="0" SUMMARY="">
+<TR BGCOLOR="#CCCCFF" CLASS="TableHeadingColor">
+<TH ALIGN="left" COLSPAN="1"><FONT SIZE="+2">
+<B>Constructor Detail</B></FONT></TH>
+</TR>
+</TABLE>
+
+<A NAME="MorphEncoder()"><!-- --></A><H3>
+MorphEncoder</H3>
+<PRE>
+public <B>MorphEncoder</B>()</PRE>
+<DL>
+</DL>
+<HR>
+
+<A NAME="MorphEncoder(byte)"><!-- --></A><H3>
+MorphEncoder</H3>
+<PRE>
+public <B>MorphEncoder</B>(byte&nbsp;annotationSeparator)</PRE>
+<DL>
+</DL>
+
+<!-- ============ METHOD DETAIL ========== -->
+
+<A NAME="method_detail"><!-- --></A>
+<TABLE BORDER="1" WIDTH="100%" CELLPADDING="3" CELLSPACING="0" SUMMARY="">
+<TR BGCOLOR="#CCCCFF" CLASS="TableHeadingColor">
+<TH ALIGN="left" COLSPAN="1"><FONT SIZE="+2">
+<B>Method Detail</B></FONT></TH>
+</TR>
+</TABLE>
+
+<A NAME="commonPrefix(byte[], byte[])"><!-- --></A><H3>
+commonPrefix</H3>
+<PRE>
+public static int <B>commonPrefix</B>(byte[]&nbsp;s1,
+ byte[]&nbsp;s2)</PRE>
+<DL>
+<DD><DL>
+</DL>
+</DD>
+</DL>
+<HR>
+
+<A NAME="standardEncode(byte[], byte[], byte[])"><!-- --></A><H3>
+standardEncode</H3>
+<PRE>
+public byte[] <B>standardEncode</B>(byte[]&nbsp;wordForm,
+ byte[]&nbsp;wordLemma,
+ byte[]&nbsp;wordTag)</PRE>
+<DL>
+<DD>This method converts the wordForm, wordLemma and tag to the form:
+
+ <pre>
+ wordForm + Kending + tags
+ </pre>
+
+ where '+' is a separator, K is a character that specifies how many
+ characters should be deleted from the end of the inflected form to
+ produce the lexeme by concatenating the stripped string with the ending.
+<P>
+<DD><DL>
+</DL>
+</DD>
+</DL>
+<HR>
+
+<A NAME="prefixEncode(byte[], byte[], byte[])"><!-- --></A><H3>
+prefixEncode</H3>
+<PRE>
+public byte[] <B>prefixEncode</B>(byte[]&nbsp;wordForm,
+ byte[]&nbsp;wordLemma,
+ byte[]&nbsp;wordTag)</PRE>
+<DL>
+<DD>This method converts wordForm, wordLemma and the tag to the form:
+ <p>
+
+ <pre>
+ inflected_form + LKending + tags
+ </pre>
+ <p>
+ where '+' is a separator, L is the number of characters to be deleted
+ from the beginning of the word ("A" means none, "B" means one, "C" - 2,
+ etc.), K is a character that specifies how many characters should be
+ deleted from the end of the inflected form to produce the lexeme by
+ concatenating the stripped string with the ending ("A" means none,
+ "B" - 1, "C" - 2, and so on).
+<P>
+<DD><DL>
+<DT><B>Parameters:</B><DD><CODE>wordForm</CODE> - inflected word form<DD><CODE>wordLemma</CODE> - canonical form<DD><CODE>wordTag</CODE> - tag
+<DT><B>Returns:</B><DD>the encoded string</DL>
+</DD>
+</DL>
+<HR>
+
+<A NAME="infixEncode(byte[], byte[], byte[])"><!-- --></A><H3>
+infixEncode</H3>
+<PRE>
+public byte[] <B>infixEncode</B>(byte[]&nbsp;wordForm,
+ byte[]&nbsp;wordLemma,
+ byte[]&nbsp;wordTag)</PRE>
+<DL>
+<DD>This method converts wordForm, wordLemma and the tag to the form:
+ <pre>
+ inflected_form + MLKending + tags
+ </pre>
+ <p>
+ where '+' is a separator, M is the position of characters to be deleted
+ towards the beginning of the inflected form ("A" means from the
+ beginning, "B" from the second character, "C" - from the third one, and
+ so on), L is the number of characters to be deleted from the position
+ specified by M ("A" means none, "B" means one, "C" - 2, etc.), K is a
+ character that specifies how many characters should be deleted from the
+ end of the inflected form to produce the lexeme by concatenating the
+ stripped string with the ending ("A" means none, "B" - 1, "C" - 2, and so
+ on).
+<P>
+<DD><DL>
+<DT><B>Parameters:</B><DD><CODE>wordForm</CODE> - inflected word form<DD><CODE>wordLemma</CODE> - canonical form<DD><CODE>wordTag</CODE> - tag
+<DT><B>Returns:</B><DD>the encoded string</DL>
+</DD>
+</DL>
+<HR>
+
+<A NAME="asString(byte[], java.lang.String)"><!-- --></A><H3>
+asString</H3>
+<PRE>
+protected static java.lang.String <B>asString</B>(byte[]&nbsp;str,
+ java.lang.String&nbsp;encoding)</PRE>
+<DL>
+<DD>Converts a byte array to a Java String using the given encoding.
+<P>
+<DD><DL>
+<DT><B>Parameters:</B><DD><CODE>str</CODE> - Byte-array to be converted.<DD><CODE>encoding</CODE> - Name of the character encoding used to decode the byte array.
+<DT><B>Returns:</B><DD>Java String. If decoding is unsuccessful, the string is empty.</DL>
+</DD>
+</DL>
+<HR>
+
+<A NAME="standardEncodeUTF8(java.lang.String, java.lang.String, java.lang.String)"><!-- --></A><H3>
+standardEncodeUTF8</H3>
+<PRE>
+public java.lang.String <B>standardEncodeUTF8</B>(java.lang.String&nbsp;wordForm,
+ java.lang.String&nbsp;wordLemma,
+ java.lang.String&nbsp;wordTag)
+ throws java.io.UnsupportedEncodingException</PRE>
+<DL>
+<DD>A UTF-8 variant of <A HREF="../../morfologik/tools/MorphEncoder.html#standardEncode(byte[], byte[], byte[])"><CODE>standardEncode(byte[], byte[], byte[])</CODE></A>. This
+ method converts the wordForm, wordLemma and tag to the form:
+
+ <pre>
+ wordForm + Kending + tags
+ </pre>
+
+ where '+' is a separator, K is a character that specifies how many
+ characters should be deleted from the end of the inflected form to
+ produce the lexeme by concatenating the stripped string with the ending.
+<P>
+<DD><DL>
+
+<DT><B>Throws:</B>
+<DD><CODE>java.io.UnsupportedEncodingException</CODE></DL>
+</DD>
+</DL>
+<HR>
+
+<A NAME="prefixEncodeUTF8(java.lang.String, java.lang.String, java.lang.String)"><!-- --></A><H3>
+prefixEncodeUTF8</H3>
+<PRE>
+public java.lang.String <B>prefixEncodeUTF8</B>(java.lang.String&nbsp;wordForm,
+ java.lang.String&nbsp;wordLemma,
+ java.lang.String&nbsp;wordTag)
+ throws java.io.UnsupportedEncodingException</PRE>
+<DL>
+<DD>A UTF-8 variant of <A HREF="../../morfologik/tools/MorphEncoder.html#prefixEncode(byte[], byte[], byte[])"><CODE>prefixEncode(byte[], byte[], byte[])</CODE></A>. This
+ method converts wordForm, wordLemma and the tag to the form:
+ <pre>
+ inflected_form + LKending + tags
+ </pre>
+ <p>
+ where '+' is a separator, L is the number of characters to be deleted
+ from the beginning of the word ("A" means none, "B" means one, "C" - 2,
+ etc.), K is a character that specifies how many characters should be
+ deleted from the end of the inflected form to produce the lexeme by
+ concatenating the stripped string with the ending ("A" means none,
+ "B" - 1, "C" - 2, and so on).
+<P>
+<DD><DL>
+<DT><B>Parameters:</B><DD><CODE>wordForm</CODE> - inflected word form<DD><CODE>wordLemma</CODE> - canonical form<DD><CODE>wordTag</CODE> - tag
+<DT><B>Returns:</B><DD>the encoded string
+<DT><B>Throws:</B>
+<DD><CODE>java.io.UnsupportedEncodingException</CODE></DL>
+</DD>
+</DL>
+<HR>
+
+<A NAME="infixEncodeUTF8(java.lang.String, java.lang.String, java.lang.String)"><!-- --></A><H3>
+infixEncodeUTF8</H3>
+<PRE>
+public java.lang.String <B>infixEncodeUTF8</B>(java.lang.String&nbsp;wordForm,
+ java.lang.String&nbsp;wordLemma,
+ java.lang.String&nbsp;wordTag)
+ throws java.io.UnsupportedEncodingException</PRE>
+<DL>
+<DD>A UTF-8 variant of <A HREF="../../morfologik/tools/MorphEncoder.html#infixEncode(byte[], byte[], byte[])"><CODE>infixEncode(byte[], byte[], byte[])</CODE></A>.
+
+ This method converts wordForm, wordLemma and the tag to the form:
+ <pre>
+ inflected_form + MLKending + tags
+ </pre>
+ <p>
+ where '+' is a separator, M is the position of characters to be deleted
+ towards the beginning of the inflected form ("A" means from the
+ beginning, "B" from the second character, "C" - from the third one, and
+ so on), L is the number of characters to be deleted from the position
+ specified by M ("A" means none, "B" means one, "C" - 2, etc.), K is a
+ character that specifies how many characters should be deleted from the
+ end of the inflected form to produce the lexeme by concatenating the
+ stripped string with the ending ("A" means none, "B" - 1, "C" - 2, and so
+ on).
+<P>
+<DD><DL>
+<DT><B>Parameters:</B><DD><CODE>wordForm</CODE> - inflected word form<DD><CODE>wordLemma</CODE> - canonical form<DD><CODE>wordTag</CODE> - tag
+<DT><B>Returns:</B><DD>the encoded string
+<DT><B>Throws:</B>
+<DD><CODE>java.io.UnsupportedEncodingException</CODE></DL>
+</DD>
+</DL>
+<!-- ========= END OF CLASS DATA ========= -->
+<HR>
+
+
+<!-- ======= START OF BOTTOM NAVBAR ====== -->
+<A NAME="navbar_bottom"><!-- --></A>
+<A HREF="#skip-navbar_bottom" title="Skip navigation links"></A>
+<TABLE BORDER="0" WIDTH="100%" CELLPADDING="1" CELLSPACING="0" SUMMARY="">
+<TR>
+<TD COLSPAN=2 BGCOLOR="#EEEEFF" CLASS="NavBarCell1">
+<A NAME="navbar_bottom_firstrow"><!-- --></A>
+<TABLE BORDER="0" CELLPADDING="0" CELLSPACING="3" SUMMARY="">
+ <TR ALIGN="center" VALIGN="top">
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="../../overview-summary.html"><FONT CLASS="NavBarFont1"><B>Overview</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="package-summary.html"><FONT CLASS="NavBarFont1"><B>Package</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#FFFFFF" CLASS="NavBarCell1Rev"> &nbsp;<FONT CLASS="NavBarFont1Rev"><B>Class</B></FONT>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="package-tree.html"><FONT CLASS="NavBarFont1"><B>Tree</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="../../deprecated-list.html"><FONT CLASS="NavBarFont1"><B>Deprecated</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="../../index-all.html"><FONT CLASS="NavBarFont1"><B>Index</B></FONT></A>&nbsp;</TD>
+ <TD BGCOLOR="#EEEEFF" CLASS="NavBarCell1"> <A HREF="../../help-doc.html"><FONT CLASS="NavBarFont1"><B>Help</B></FONT></A>&nbsp;</TD>
+ </TR>
+</TABLE>
+</TD>
+<TD ALIGN="right" VALIGN="top" ROWSPAN=3><EM>
+</EM>
+</TD>
+</TR>
+
+<TR>
+<TD BGCOLOR="white" CLASS="NavBarCell2"><FONT SIZE="-2">
+&nbsp;<A HREF="../../morfologik/tools/Launcher.html" title="class in morfologik.tools"><B>PREV CLASS</B></A>&nbsp;
+&nbsp;<A HREF="../../morfologik/tools/WriterMessageLogger.html" title="class in morfologik.tools"><B>NEXT CLASS</B></A></FONT></TD>
+<TD BGCOLOR="white" CLASS="NavBarCell2"><FONT SIZE="-2">
+ <A HREF="../../index.html?morfologik/tools/MorphEncoder.html" target="_top"><B>FRAMES</B></A> &nbsp;
+&nbsp;<A HREF="MorphEncoder.html" target="_top"><B>NO FRAMES</B></A> &nbsp;
+&nbsp;<SCRIPT type="text/javascript">
+ <!--
+ if(window==top) {
+ document.writeln('<A HREF="../../allclasses-noframe.html"><B>All Classes</B></A>');
+ }
+ //-->
+</SCRIPT>
+<NOSCRIPT>
+ <A HREF="../../allclasses-noframe.html"><B>All Classes</B></A>
+</NOSCRIPT>
+
+
+</FONT></TD>
+</TR>
+<TR>
+<TD VALIGN="top" CLASS="NavBarCell3"><FONT SIZE="-2">
+ SUMMARY:&nbsp;NESTED&nbsp;|&nbsp;FIELD&nbsp;|&nbsp;<A HREF="#constructor_summary">CONSTR</A>&nbsp;|&nbsp;<A HREF="#method_summary">METHOD</A></FONT></TD>
+<TD VALIGN="top" CLASS="NavBarCell3"><FONT SIZE="-2">
+DETAIL:&nbsp;FIELD&nbsp;|&nbsp;<A HREF="#constructor_detail">CONSTR</A>&nbsp;|&nbsp;<A HREF="#method_detail">METHOD</A></FONT></TD>
+</TR>
+</TABLE>
+<A NAME="skip-navbar_bottom"></A>
+<!-- ======== END OF BOTTOM NAVBAR ======= -->
+
+<HR>
+
+</BODY>
+</HTML>