Kouhei Sutou
null+****@clear*****
Tue Nov 13 14:06:31 JST 2012
Kouhei Sutou 2012-11-13 14:06:31 +0900 (Tue, 13 Nov 2012) New Revision: 06d493b21b493387838ff05732798ad40e7cfef0 https://github.com/groonga/groonga/commit/06d493b21b493387838ff05732798ad40e7cfef0 Log: test kytea: add tests Added files: test/command/suite/table_create/default_tokenizer/kytea/default.expected test/command/suite/table_create/default_tokenizer/kytea/default.test test/command/suite/table_create/default_tokenizer/kytea/normalize.expected test/command/suite/table_create/default_tokenizer/kytea/normalize.test test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.expected test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.test test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.expected test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.test Added: test/command/suite/table_create/default_tokenizer/kytea/default.expected (+70 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/table_create/default_tokenizer/kytea/default.expected 2012-11-13 14:06:31 +0900 (6d70520) @@ -0,0 +1,70 @@ +register tokenizers/kytea +[[0,0.0,0.0],true] +table_create Memos TABLE_NO_KEY +[[0,0.0,0.0],true] +column_create Memos content COLUMN_SCALAR Text +[[0,0.0,0.0],true] +table_create Terms TABLE_PAT_KEY ShortText --default_tokenizer TokenKytea +[[0,0.0,0.0],true] +column_create Terms memos_content COLUMN_INDEX Memos content +[[0,0.0,0.0],true] +load --table Memos +[ +{"content": "This is a pen."}, +{"content": "これはペンです。"} +] +[[0,0.0,0.0],2] +select Terms --output_columns _key --limit -1 +[ + [ + 0, + 0.0, + 0.0 + ], + [ + [ + [ + 11 + ], + [ + [ + "_key", + "ShortText" + ] + ], + [ + "." + ], + [ + "This" + ], + [ + "a" + ], + [ + "is" + ], + [ + "pen" + ], + [ + "。" + ], + [ + "これ" + ], + [ + "す" + ], + [ + "で" + ], + [ + "は" + ], + [ + "ペン" + ] + ] + ] +] Added: test/command/suite/table_create/default_tokenizer/kytea/default.test (+16 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/table_create/default_tokenizer/kytea/default.test 2012-11-13 14:06:31 +0900 (9d51c74) @@ -0,0 +1,16 @@ +register tokenizers/kytea + +table_create Memos TABLE_NO_KEY +column_create Memos content COLUMN_SCALAR Text + +table_create Terms TABLE_PAT_KEY ShortText \ + --default_tokenizer TokenKytea +column_create Terms memos_content COLUMN_INDEX Memos content + +load --table Memos +[ +{"content": "This is a pen."}, +{"content": "これはペンです。"} +] + +select Terms --output_columns _key --limit -1 Added: test/command/suite/table_create/default_tokenizer/kytea/normalize.expected (+70 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/table_create/default_tokenizer/kytea/normalize.expected 2012-11-13 14:06:31 +0900 (c2bd72e) @@ -0,0 +1,70 @@ +register tokenizers/kytea +[[0,0.0,0.0],true] +table_create Memos TABLE_NO_KEY +[[0,0.0,0.0],true] +column_create Memos content COLUMN_SCALAR Text +[[0,0.0,0.0],true] +table_create Terms TABLE_PAT_KEY|KEY_NORMALIZE ShortText --default_tokenizer TokenKytea +[[0,0.0,0.0],true] +column_create Terms memos_content COLUMN_INDEX Memos content +[[0,0.0,0.0],true] +load --table Memos +[ +{"content": "This is a pen."}, +{"content": "これはペンです。"} +] +[[0,0.0,0.0],2] +select Terms --output_columns _key --limit -1 +[ + [ + 0, + 0.0, + 0.0 + ], + [ + [ + [ + 11 + ], + [ + [ + "_key", + "ShortText" + ] + ], + [ + "." + ], + [ + "a" + ], + [ + "is" + ], + [ + "pen" + ], + [ + "this" + ], + [ + "。" + ], + [ + "これ" + ], + [ + "す" + ], + [ + "で" + ], + [ + "は" + ], + [ + "ペン" + ] + ] + ] +] Added: test/command/suite/table_create/default_tokenizer/kytea/normalize.test (+16 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/table_create/default_tokenizer/kytea/normalize.test 2012-11-13 14:06:31 +0900 (9a57696) @@ -0,0 +1,16 @@ +register tokenizers/kytea + +table_create Memos TABLE_NO_KEY +column_create Memos content COLUMN_SCALAR Text + +table_create Terms TABLE_PAT_KEY|KEY_NORMALIZE ShortText \ + --default_tokenizer TokenKytea +column_create Terms memos_content COLUMN_INDEX Memos content + +load --table Memos +[ +{"content": "This is a pen."}, +{"content": "これはペンです。"} +] + +select Terms --output_columns _key --limit -1 Added: test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.expected (+55 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.expected 2012-11-13 14:06:31 +0900 (8639244) @@ -0,0 +1,55 @@ +register tokenizers/kytea +[[0,0.0,0.0],true] +table_create Memos TABLE_NO_KEY +[[0,0.0,0.0],true] +column_create Memos content COLUMN_SCALAR Text +[[0,0.0,0.0],true] +table_create Terms TABLE_PAT_KEY ShortText --default_tokenizer TokenKytea +[[0,0.0,0.0],true] +column_create Terms memos_content COLUMN_INDEX Memos content +[[0,0.0,0.0],true] +load --table Memos +[ +{"content": "Th\uFFFEis is a p\uFFFEen."}, +{"content": "これは\uFFFEペン\uFFFEです。"} +] +[[0,0.0,0.0],2] +select Terms --output_columns _key --limit -1 +[ + [ + 0, + 0.0, + 0.0 + ], + [ + [ + [ + 6 + ], + [ + [ + "_key", + "ShortText" + ] + ], + [ + "Th" + ], + [ + "en." + ], + [ + "is is a p" + ], + [ + "これは" + ], + [ + "です。" + ], + [ + "ペン" + ] + ] + ] +] Added: test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.test (+16 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/default.test 2012-11-13 14:06:31 +0900 (4ebd72c) @@ -0,0 +1,16 @@ +register tokenizers/kytea + +table_create Memos TABLE_NO_KEY +column_create Memos content COLUMN_SCALAR Text + +table_create Terms TABLE_PAT_KEY ShortText \ + --default_tokenizer TokenKytea +column_create Terms memos_content COLUMN_INDEX Memos content + +load --table Memos +[ +{"content": "Th\uFFFEis is a p\uFFFEen."}, +{"content": "これは\uFFFEペン\uFFFEです。"} +] + +select Terms --output_columns _key --limit -1 Added: test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.expected (+55 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.expected 2012-11-13 14:06:31 +0900 (38b0ec7) @@ -0,0 +1,55 @@ +register tokenizers/kytea +[[0,0.0,0.0],true] +table_create Memos TABLE_NO_KEY +[[0,0.0,0.0],true] +column_create Memos content COLUMN_SCALAR Text +[[0,0.0,0.0],true] +table_create Terms TABLE_PAT_KEY|KEY_NORMALIZE ShortText --default_tokenizer TokenKytea +[[0,0.0,0.0],true] +column_create Terms memos_content COLUMN_INDEX Memos content +[[0,0.0,0.0],true] +load --table Memos +[ +{"content": "Th\uFFFEis is a p\uFFFEen."}, +{"content": "これは\uFFFEペン\uFFFEです。"} +] +[[0,0.0,0.0],2] +select Terms --output_columns _key --limit -1 +[ + [ + 0, + 0.0, + 0.0 + ], + [ + [ + [ + 6 + ], + [ + [ + "_key", + "ShortText" + ] + ], + [ + "en." + ], + [ + "is is a p" + ], + [ + "th" + ], + [ + "これは" + ], + [ + "です。" + ], + [ + "ペン" + ] + ] + ] +] Added: test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.test (+16 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/table_create/default_tokenizer/kytea/tokenized_delimiter/normalize.test 2012-11-13 14:06:31 +0900 (e9cbae1) @@ -0,0 +1,16 @@ +register tokenizers/kytea + +table_create Memos TABLE_NO_KEY +column_create Memos content COLUMN_SCALAR Text + +table_create Terms TABLE_PAT_KEY|KEY_NORMALIZE ShortText \ + --default_tokenizer TokenKytea +column_create Terms memos_content COLUMN_INDEX Memos content + +load --table Memos +[ +{"content": "Th\uFFFEis is a p\uFFFEen."}, +{"content": "これは\uFFFEペン\uFFFEです。"} +] + +select Terms --output_columns _key --limit -1 -------------- next part -------------- HTML����������������������������...ダウンロード