summary | refs | log | tree | commit | diff
path: root/morfologik-stemming/src/test/resources
diff options
context:
space:
mode:
Diffstat (limited to 'morfologik-stemming/src/test/resources')
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.dict  bin  0 -> 136 bytes
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.info  9
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.dict  bin  0 -> 1859 bytes
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.info  8
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.dict  bin  0 -> 1776 bytes
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.info  11
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.dict  bin  0 -> 155 bytes
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.info  10
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.txt  8
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.dict  bin  0 -> 1354192 bytes
-rw-r--r--  morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.info  6
11 files changed, 52 insertions, 0 deletions
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.dict
new file mode 100644
index 0000000..2a62f21
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.dict
Binary files differ
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.info
new file mode 100644
index 0000000..058aed2
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-diacritics-utf8.info
@@ -0,0 +1,9 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=UTF-8
+
+fsa.dict.uses-prefixes=false
+fsa.dict.uses-infixes=false
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.dict
new file mode 100644
index 0000000..cc91f70
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.dict
Binary files differ
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.info
new file mode 100644
index 0000000..535fac3
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-infix.info
@@ -0,0 +1,8 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=iso-8859-2
+
+fsa.dict.uses-infixes=true
\ No newline at end of file
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.dict
new file mode 100644
index 0000000..d0bed4c
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.dict
Binary files differ
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.info
new file mode 100644
index 0000000..520739e
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-prefix.info
@@ -0,0 +1,11 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=iso-8859-2
+
+fsa.dict.uses-prefixes=true
+fsa.dict.uses-infixes=false
+
+fsa.dict.input-conversion=\\a ą, krowa Rzecz
\ No newline at end of file
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.dict
new file mode 100644
index 0000000..a71b9e7
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.dict
Binary files differ
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.info
new file mode 100644
index 0000000..8ec14c3
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.info
@@ -0,0 +1,10 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=iso8859-1
+
+fsa.dict.uses-prefixes=false
+fsa.dict.uses-infixes=false
+fsa.dict.uses-suffixes=false
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.txt b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.txt
new file mode 100644
index 0000000..cd77945
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-separators.txt
@@ -0,0 +1,8 @@
+token1+
+token2++
+token3+++
+token4+token2
+token5+token2+
+token6+token2++
+token7+token2+token3+
+token8+token2+token3++
\ No newline at end of file
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.dict b/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.dict
new file mode 100644
index 0000000..6890253
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.dict
Binary files differ
diff --git a/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.info b/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.info
new file mode 100644
index 0000000..ffce33e
--- /dev/null
+++ b/morfologik-stemming/src/test/resources/morfologik/stemming/test-synth.info
@@ -0,0 +1,6 @@
+#
+# Dictionary properties.
+#
+
+fsa.dict.separator=+
+fsa.dict.encoding=iso-8859-2
\ No newline at end of file