[Groonga-commit] groonga/groonga at e10ae1c [master] test: add trigram tokenizer

Back to archive index

naoa null+****@clear*****
Thu May 21 21:20:02 JST 2015


naoa	2015-05-21 21:20:02 +0900 (Thu, 21 May 2015)

  New Revision: e10ae1cf5e0bf3022fc0f29a38ff4c6cb147e183
  https://github.com/groonga/groonga/commit/e10ae1cf5e0bf3022fc0f29a38ff4c6cb147e183

  Merged 6c4e87d: Merge pull request #339 from naoa/add-force_prefix-to-tokenize

  Message:
    test: add trigram tokenizer

  Added files:
    test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/matured.expected
    test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/matured.test
    test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_one_character.expected
    test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_one_character.test
    test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_two_characters.expected
    test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_two_characters.test
    test/command/suite/tokenizers/trigram/force_prefix/single_token/matured.expected
    test/command/suite/tokenizers/trigram/force_prefix/single_token/matured.test
    test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_one_character.expected
    test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_one_character.test
    test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_two_characters.expected
    test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_two_characters.test

  Added: test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/matured.expected (+20 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/matured.expected    2015-05-21 21:20:02 +0900 (143bd31)
@@ -0,0 +1,20 @@
+tokenize TokenTrigram "ABCだよね" NormalizerAuto --mode GET
+[
+  [
+    0,
+    0.0,
+    0.0
+  ],
+  [
+    {
+      "value": "abc",
+      "position": 0,
+      "force_prefix": false
+    },
+    {
+      "value": "だよね",
+      "position": 1,
+      "force_prefix": false
+    }
+  ]
+]

  Added: test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/matured.test (+1 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/matured.test    2015-05-21 21:20:02 +0900 (82f6eb5)
@@ -0,0 +1 @@
+tokenize TokenTrigram "ABCだよね" NormalizerAuto --mode GET

  Added: test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_one_character.expected (+20 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_one_character.expected    2015-05-21 21:20:02 +0900 (ec3e13e)
@@ -0,0 +1,20 @@
+tokenize TokenTrigram "ABCだ" NormalizerAuto --mode GET
+[
+  [
+    0,
+    0.0,
+    0.0
+  ],
+  [
+    {
+      "value": "abc",
+      "position": 0,
+      "force_prefix": false
+    },
+    {
+      "value": "だ",
+      "position": 1,
+      "force_prefix": true
+    }
+  ]
+]

  Added: test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_one_character.test (+1 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_one_character.test    2015-05-21 21:20:02 +0900 (369d9cb)
@@ -0,0 +1 @@
+tokenize TokenTrigram "ABCだ" NormalizerAuto --mode GET

  Added: test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_two_characters.expected (+20 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_two_characters.expected    2015-05-21 21:20:02 +0900 (b34c9e9)
@@ -0,0 +1,20 @@
+tokenize TokenTrigram "ABCだよ" NormalizerAuto --mode GET
+[
+  [
+    0,
+    0.0,
+    0.0
+  ],
+  [
+    {
+      "value": "abc",
+      "position": 0,
+      "force_prefix": false
+    },
+    {
+      "value": "だよ",
+      "position": 1,
+      "force_prefix": false
+    }
+  ]
+]

  Added: test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_two_characters.test (+1 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/multiple_tokens/unmatured_two_characters.test    2015-05-21 21:20:02 +0900 (d30b3a9)
@@ -0,0 +1 @@
+tokenize TokenTrigram "ABCだよ" NormalizerAuto --mode GET

  Added: test/command/suite/tokenizers/trigram/force_prefix/single_token/matured.expected (+2 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/single_token/matured.expected    2015-05-21 21:20:02 +0900 (2b6bd9a)
@@ -0,0 +1,2 @@
+tokenize TokenTrigram "だよね" NormalizerAuto --mode GET
+[[0,0.0,0.0],[{"value":"だよね","position":0,"force_prefix":false}]]

  Added: test/command/suite/tokenizers/trigram/force_prefix/single_token/matured.test (+1 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/single_token/matured.test    2015-05-21 21:20:02 +0900 (f4db720)
@@ -0,0 +1 @@
+tokenize TokenTrigram "だよね" NormalizerAuto --mode GET

  Added: test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_one_character.expected (+2 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_one_character.expected    2015-05-21 21:20:02 +0900 (0db9eb1)
@@ -0,0 +1,2 @@
+tokenize TokenTrigram "だ" NormalizerAuto --mode GET
+[[0,0.0,0.0],[{"value":"だ","position":0,"force_prefix":true}]]

  Added: test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_one_character.test (+1 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_one_character.test    2015-05-21 21:20:02 +0900 (80dab12)
@@ -0,0 +1 @@
+tokenize TokenTrigram "だ" NormalizerAuto --mode GET

  Added: test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_two_characters.expected (+2 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_two_characters.expected    2015-05-21 21:20:02 +0900 (b5f1428)
@@ -0,0 +1,2 @@
+tokenize TokenTrigram "だよ" NormalizerAuto --mode GET
+[[0,0.0,0.0],[{"value":"だよ","position":0,"force_prefix":false}]]

  Added: test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_two_characters.test (+1 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/tokenizers/trigram/force_prefix/single_token/unmatured_two_characters.test    2015-05-21 21:20:02 +0900 (8e8e859)
@@ -0,0 +1 @@
+tokenize TokenTrigram "だよ" NormalizerAuto --mode GET
-------------- next part --------------
HTMLの添付ファイルを保管しました...
Download 



More information about the Groonga-commit mailing list
Back to archive index