[Groonga-commit] groonga/groonga [master] test kytea: add tests

アーカイブの一覧に戻る

Kouhei Sutou null+****@clear*****
Tue Nov 13 14:06:31 JST 2012


Kouhei Sutou	2012-11-13 14:06:31 +0900 (Tue, 13 Nov 2012)

  New Revision: 06d493b21b493387838ff05732798ad40e7cfef0
  https://github.com/groonga/groonga/commit/06d493b21b493387838ff05732798ad40e7cfef0

  Log:
    test kytea: add tests

  Added files:
    test/command/suite/table_create/default_tokenizer/kytea/default.expected
    test/command/suite/table_create/default_tokenizer/kytea/default.test
    test/command/suite/table_create/default_tokenizer/kytea/normalize.expected
    test/command/suite/table_create/default_tokenizer/kytea/normalize.test
    test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.expected
    test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.test
    test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.expected
    test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.test

  Added: test/command/suite/table_create/default_tokenizer/kytea/default.expected (+70 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/table_create/default_tokenizer/kytea/default.expected    2012-11-13 14:06:31 +0900 (6d70520)
@@ -0,0 +1,70 @@
+register tokenizers/kytea
+[[0,0.0,0.0],true]
+table_create Memos TABLE_NO_KEY
+[[0,0.0,0.0],true]
+column_create Memos content COLUMN_SCALAR Text
+[[0,0.0,0.0],true]
+table_create Terms TABLE_PAT_KEY ShortText   --default_tokenizer TokenKytea
+[[0,0.0,0.0],true]
+column_create Terms memos_content COLUMN_INDEX Memos content
+[[0,0.0,0.0],true]
+load --table Memos
+[
+{"content": "This is a pen."},
+{"content": "これはペンです。"}
+]
+[[0,0.0,0.0],2]
+select Terms --output_columns _key --limit -1
+[
+  [
+    0,
+    0.0,
+    0.0
+  ],
+  [
+    [
+      [
+        11
+      ],
+      [
+        [
+          "_key",
+          "ShortText"
+        ]
+      ],
+      [
+        "."
+      ],
+      [
+        "This"
+      ],
+      [
+        "a"
+      ],
+      [
+        "is"
+      ],
+      [
+        "pen"
+      ],
+      [
+        "。"
+      ],
+      [
+        "これ"
+      ],
+      [
+        "す"
+      ],
+      [
+        "で"
+      ],
+      [
+        "は"
+      ],
+      [
+        "ペン"
+      ]
+    ]
+  ]
+]

  Added: test/command/suite/table_create/default_tokenizer/kytea/default.test (+16 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/table_create/default_tokenizer/kytea/default.test    2012-11-13 14:06:31 +0900 (9d51c74)
@@ -0,0 +1,16 @@
+register tokenizers/kytea
+
+table_create Memos TABLE_NO_KEY
+column_create Memos content COLUMN_SCALAR Text
+
+table_create Terms TABLE_PAT_KEY ShortText \
+  --default_tokenizer TokenKytea
+column_create Terms memos_content COLUMN_INDEX Memos content
+
+load --table Memos
+[
+{"content": "This is a pen."},
+{"content": "これはペンです。"}
+]
+
+select Terms --output_columns _key --limit -1

  Added: test/command/suite/table_create/default_tokenizer/kytea/normalize.expected (+70 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/table_create/default_tokenizer/kytea/normalize.expected    2012-11-13 14:06:31 +0900 (c2bd72e)
@@ -0,0 +1,70 @@
+register tokenizers/kytea
+[[0,0.0,0.0],true]
+table_create Memos TABLE_NO_KEY
+[[0,0.0,0.0],true]
+column_create Memos content COLUMN_SCALAR Text
+[[0,0.0,0.0],true]
+table_create Terms TABLE_PAT_KEY|KEY_NORMALIZE ShortText   --default_tokenizer TokenKytea
+[[0,0.0,0.0],true]
+column_create Terms memos_content COLUMN_INDEX Memos content
+[[0,0.0,0.0],true]
+load --table Memos
+[
+{"content": "This is a pen."},
+{"content": "これはペンです。"}
+]
+[[0,0.0,0.0],2]
+select Terms --output_columns _key --limit -1
+[
+  [
+    0,
+    0.0,
+    0.0
+  ],
+  [
+    [
+      [
+        11
+      ],
+      [
+        [
+          "_key",
+          "ShortText"
+        ]
+      ],
+      [
+        "."
+      ],
+      [
+        "a"
+      ],
+      [
+        "is"
+      ],
+      [
+        "pen"
+      ],
+      [
+        "this"
+      ],
+      [
+        "。"
+      ],
+      [
+        "これ"
+      ],
+      [
+        "す"
+      ],
+      [
+        "で"
+      ],
+      [
+        "は"
+      ],
+      [
+        "ペン"
+      ]
+    ]
+  ]
+]

  Added: test/command/suite/table_create/default_tokenizer/kytea/normalize.test (+16 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/table_create/default_tokenizer/kytea/normalize.test    2012-11-13 14:06:31 +0900 (9a57696)
@@ -0,0 +1,16 @@
+register tokenizers/kytea
+
+table_create Memos TABLE_NO_KEY
+column_create Memos content COLUMN_SCALAR Text
+
+table_create Terms TABLE_PAT_KEY|KEY_NORMALIZE ShortText \
+  --default_tokenizer TokenKytea
+column_create Terms memos_content COLUMN_INDEX Memos content
+
+load --table Memos
+[
+{"content": "This is a pen."},
+{"content": "これはペンです。"}
+]
+
+select Terms --output_columns _key --limit -1

  Added: test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.expected (+55 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.expected    2012-11-13 14:06:31 +0900 (8639244)
@@ -0,0 +1,55 @@
+register tokenizers/kytea
+[[0,0.0,0.0],true]
+table_create Memos TABLE_NO_KEY
+[[0,0.0,0.0],true]
+column_create Memos content COLUMN_SCALAR Text
+[[0,0.0,0.0],true]
+table_create Terms TABLE_PAT_KEY ShortText   --default_tokenizer TokenKytea
+[[0,0.0,0.0],true]
+column_create Terms memos_content COLUMN_INDEX Memos content
+[[0,0.0,0.0],true]
+load --table Memos
+[
+{"content": "Th\uFFFEis is a p\uFFFEen."},
+{"content": "これは\uFFFEペン\uFFFEです。"}
+]
+[[0,0.0,0.0],2]
+select Terms --output_columns _key --limit -1
+[
+  [
+    0,
+    0.0,
+    0.0
+  ],
+  [
+    [
+      [
+        6
+      ],
+      [
+        [
+          "_key",
+          "ShortText"
+        ]
+      ],
+      [
+        "Th"
+      ],
+      [
+        "en."
+      ],
+      [
+        "is is a p"
+      ],
+      [
+        "これは"
+      ],
+      [
+        "です。"
+      ],
+      [
+        "ペン"
+      ]
+    ]
+  ]
+]

  Added: test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.test (+16 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.test    2012-11-13 14:06:31 +0900 (4ebd72c)
@@ -0,0 +1,16 @@
+register tokenizers/kytea
+
+table_create Memos TABLE_NO_KEY
+column_create Memos content COLUMN_SCALAR Text
+
+table_create Terms TABLE_PAT_KEY ShortText \
+  --default_tokenizer TokenKytea
+column_create Terms memos_content COLUMN_INDEX Memos content
+
+load --table Memos
+[
+{"content": "Th\uFFFEis is a p\uFFFEen."},
+{"content": "これは\uFFFEペン\uFFFEです。"}
+]
+
+select Terms --output_columns _key --limit -1

  Added: test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.expected (+55 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.expected    2012-11-13 14:06:31 +0900 (38b0ec7)
@@ -0,0 +1,55 @@
+register tokenizers/kytea
+[[0,0.0,0.0],true]
+table_create Memos TABLE_NO_KEY
+[[0,0.0,0.0],true]
+column_create Memos content COLUMN_SCALAR Text
+[[0,0.0,0.0],true]
+table_create Terms TABLE_PAT_KEY|KEY_NORMALIZE ShortText   --default_tokenizer TokenKytea
+[[0,0.0,0.0],true]
+column_create Terms memos_content COLUMN_INDEX Memos content
+[[0,0.0,0.0],true]
+load --table Memos
+[
+{"content": "Th\uFFFEis is a p\uFFFEen."},
+{"content": "これは\uFFFEペン\uFFFEです。"}
+]
+[[0,0.0,0.0],2]
+select Terms --output_columns _key --limit -1
+[
+  [
+    0,
+    0.0,
+    0.0
+  ],
+  [
+    [
+      [
+        6
+      ],
+      [
+        [
+          "_key",
+          "ShortText"
+        ]
+      ],
+      [
+        "en."
+      ],
+      [
+        "is is a p"
+      ],
+      [
+        "th"
+      ],
+      [
+        "これは"
+      ],
+      [
+        "です。"
+      ],
+      [
+        "ペン"
+      ]
+    ]
+  ]
+]

  Added: test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.test (+16 -0) 100644
===================================================================
--- /dev/null
+++ test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.test    2012-11-13 14:06:31 +0900 (e9cbae1)
@@ -0,0 +1,16 @@
+register tokenizers/kytea
+
+table_create Memos TABLE_NO_KEY
+column_create Memos content COLUMN_SCALAR Text
+
+table_create Terms TABLE_PAT_KEY|KEY_NORMALIZE ShortText \
+  --default_tokenizer TokenKytea
+column_create Terms memos_content COLUMN_INDEX Memos content
+
+load --table Memos
+[
+{"content": "Th\uFFFEis is a p\uFFFEen."},
+{"content": "これは\uFFFEペン\uFFFEです。"}
+]
+
+select Terms --output_columns _key --limit -1
-------------- next part --------------
HTMLの添付ファイルを保管しました...
ダウンロード 



More information about the Groonga-commit mailing list
アーカイブの一覧に戻る