Kouhei Sutou
null+****@clear*****
Fri May 11 12:26:32 JST 2018
Kouhei Sutou 2018-05-11 12:26:32 +0900 (Fri, 11 May 2018) New Revision: 0c5d418df84d31af8ed693dc80ccd16cb200eb0d https://github.com/groonga/groonga/commit/0c5d418df84d31af8ed693dc80ccd16cb200eb0d Message: test: split report_source_location test Added files: test/command/suite/tokenizers/ngram/report_source_location/expand.expected test/command/suite/tokenizers/ngram/report_source_location/expand.test test/command/suite/tokenizers/ngram/report_source_location/loose_symbol.expected Removed files: test/command/suite/tokenizers/ngram/report_source_location.expected Renamed files: test/command/suite/tokenizers/ngram/report_source_location/loose_symbol.test (from test/command/suite/tokenizers/ngram/report_source_location.test) Deleted: test/command/suite/tokenizers/ngram/report_source_location.expected (+0 -157) 100644 =================================================================== --- test/command/suite/tokenizers/ngram/report_source_location.expected 2018-05-10 10:04:35 +0900 (085aa799d) +++ /dev/null @@ -1,157 +0,0 @@ -tokenize 'TokenNgram("report_source_location", true, "loose_symbol", true)' "ア㌕090(1234)56−78" NormalizerAuto -[ - [ - 0, - 0.0, - 0.0 - ], - [ - { - "value": "アキ", - "position": 0, - "force_prefix": false, - "source_offset": 0, - "source_length": 6 - }, - { - "value": "キロ", - "position": 1, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "ログ", - "position": 2, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "グラ", - "position": 3, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "ラム", - "position": 4, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "ム", - "position": 5, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "090", - "position": 6, - "force_prefix": false, - "source_offset": 6, - "source_length": 9 - }, - { - "value": "(", - "position": 7, - "force_prefix": false, - "source_offset": 15, - "source_length": 3 - }, - { - "value": "1234", - "position": 8, - "force_prefix": false, - "source_offset": 18, - "source_length": 8 - }, - { - "value": ")", - "position": 9, - "force_prefix": false, - "source_offset": 26, - "source_length": 3 - }, - { - "value": "56", - "position": 10, - "force_prefix": false, - "source_offset": 29, - "source_length": 4 - }, - { - "value": "−", - "position": 11, - "force_prefix": false, - "source_offset": 33, - "source_length": 3 - }, - { - "value": "78", - "position": 12, - "force_prefix": false, - "source_offset": 36, - "source_length": 6 - }, - { - "value": "", - "position": 13, - "force_prefix": false, - "source_offset": 42, - "source_length": 0 - }, - { - "value": "アキ", - "position": 14, - "force_prefix": false, - "source_offset": 0, - "source_length": 6 - }, - { - "value": "キロ", - "position": 15, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "ログ", - "position": 16, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "グラ", - "position": 17, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "ラム", - "position": 18, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "ム", - "position": 19, - "force_prefix": false, - "source_offset": 3, - "source_length": 3 - }, - { - "value": "09012345678", - "position": 20, - "force_prefix": false, - "source_offset": 6, - "source_length": 36 - } - ] -] Added: test/command/suite/tokenizers/ngram/report_source_location/expand.expected (+59 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/tokenizers/ngram/report_source_location/expand.expected 2018-05-11 12:26:32 +0900 (56c2b8d84) @@ -0,0 +1,59 @@ +tokenize 'TokenNgram("report_source_location", true)' "ア㌕Az" NormalizerAuto +[ + [ + 0, + 0.0, + 0.0 + ], + [ + { + "value": "アキ", + "position": 0, + "force_prefix": false, + "source_offset": 0, + "source_length": 6 + }, + { + "value": "キロ", + "position": 1, + "force_prefix": false, + "source_offset": 3, + "source_length": 3 + }, + { + "value": "ログ", + "position": 2, + "force_prefix": false, + "source_offset": 3, + "source_length": 3 + }, + { + "value": "グラ", + "position": 3, + "force_prefix": false, + "source_offset": 3, + "source_length": 3 + }, + { + "value": "ラム", + "position": 4, + "force_prefix": false, + "source_offset": 3, + "source_length": 3 + }, + { + "value": "ム", + "position": 5, + "force_prefix": false, + "source_offset": 3, + "source_length": 3 + }, + { + "value": "az", + "position": 6, + "force_prefix": false, + "source_offset": 6, + "source_length": 4 + } + ] +] Added: test/command/suite/tokenizers/ngram/report_source_location/expand.test (+4 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/tokenizers/ngram/report_source_location/expand.test 2018-05-11 12:26:32 +0900 (f45dd3257) @@ -0,0 +1,4 @@ +tokenize \ + 'TokenNgram("report_source_location", true)' \ + "ア㌕Az" \ + NormalizerAuto Added: test/command/suite/tokenizers/ngram/report_source_location/loose_symbol.expected (+73 -0) 100644 =================================================================== --- /dev/null +++ test/command/suite/tokenizers/ngram/report_source_location/loose_symbol.expected 2018-05-11 12:26:32 +0900 (757c397f0) @@ -0,0 +1,73 @@ +tokenize 'TokenNgram("report_source_location", true, "loose_symbol", true)' "090(1234)56−78" NormalizerAuto +[ + [ + 0, + 0.0, + 0.0 + ], + [ + { + "value": "090", + "position": 0, + "force_prefix": false, + "source_offset": 0, + "source_length": 9 + }, + { + "value": "(", + "position": 1, + "force_prefix": false, + "source_offset": 9, + "source_length": 3 + }, + { + "value": "1234", + "position": 2, + "force_prefix": false, + "source_offset": 12, + "source_length": 8 + }, + { + "value": ")", + "position": 3, + "force_prefix": false, + "source_offset": 20, + "source_length": 3 + }, + { + "value": "56", + "position": 4, + "force_prefix": false, + "source_offset": 23, + "source_length": 4 + }, + { + "value": "−", + "position": 5, + "force_prefix": false, + "source_offset": 27, + "source_length": 3 + }, + { + "value": "78", + "position": 6, + "force_prefix": false, + "source_offset": 30, + "source_length": 6 + }, + { + "value": "", + "position": 7, + "force_prefix": false, + "source_offset": 36, + "source_length": 0 + }, + { + "value": "09012345678", + "position": 8, + "force_prefix": false, + "source_offset": 0, + "source_length": 36 + } + ] +] Renamed: test/command/suite/tokenizers/ngram/report_source_location/loose_symbol.test (+1 -1) 66% =================================================================== --- test/command/suite/tokenizers/ngram/report_source_location.test 2018-05-10 10:04:35 +0900 (e41363c28) +++ test/command/suite/tokenizers/ngram/report_source_location/loose_symbol.test 2018-05-11 12:26:32 +0900 (135a9c270) @@ -1,4 +1,4 @@ tokenize \ 'TokenNgram("report_source_location", true, "loose_symbol", true)' \ - "ア㌕090(1234)56−78" \ + "090(1234)56−78" \ NormalizerAuto -------------- next part -------------- HTML����������������������������... URL: https://lists.osdn.me/mailman/archives/groonga-commit/attachments/20180511/2e4207e7/attachment-0001.htm