diff options
Diffstat (limited to 'morfologik-stemming/src/test/resources')
11 files changed, 52 insertions, 0 deletions
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.dict
Binary files differ
new file mode 100644
index 0000000..2a62f21
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.dict
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.info
new file mode 100644
index 0000000..058aed2
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.info
@@ -0,0 +1,9 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=UTF-8
+
+fsa.dict.uses-prefixes=false
+fsa.dict.uses-infixes=false
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.dict
Binary files differ
new file mode 100644
index 0000000..cc91f70
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.dict
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.info
new file mode 100644
index 0000000..535fac3
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.info
@@ -0,0 +1,8 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=iso-8859-2
+
+fsa.dict.uses-infixes=true
\ No newline at end of file
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.dict
Binary files differ
new file mode 100644
index 0000000..d0bed4c
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.dict
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.info
new file mode 100644
index 0000000..520739e
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.info
@@ -0,0 +1,11 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=iso-8859-2
+
+fsa.dict.uses-prefixes=true
+fsa.dict.uses-infixes=false
+
+fsa.dict.input-conversion=\\a ą, krowa Rzecz
\ No newline at end of file
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.dict
Binary files differ
new file mode 100644
index 0000000..a71b9e7
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.dict
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.info
new file mode 100644
index 0000000..8ec14c3
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.info
@@ -0,0 +1,10 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=iso8859-1
+
+fsa.dict.uses-prefixes=false
+fsa.dict.uses-infixes=false
+fsa.dict.uses-suffixes=false
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.txt b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.txt
new file mode 100644
index 0000000..cd77945
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.txt
@@ -0,0 +1,8 @@
+token1+
+token2++
+token3+++
+token4+token2
+token5+token2+
+token6+token2++
+token7+token2+token3+
+token8+token2+token3++
\ No newline at end of file
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.dict
Binary files differ
new file mode 100644
index 0000000..6890253
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.dict
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.info
new file mode 100644
index 0000000..ffce33e
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.info
@@ -0,0 +1,6 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=iso-8859-2
\ No newline at end of file