pelias · orangejulius · Sep 12, 2019 · Sep 9, 2019
diff --git a/integration/analyzer_peliasIndexOneEdgeGram.js b/integration/analyzer_peliasIndexOneEdgeGram.js
@@ -45,7 +45,7 @@ module.exports.tests.analyze = function(test, common){
     assertAnalysis( 'keyword_street_suffix', 'ctr', ['c', 'ct', 'ctr', 'ce', 'cen', 'cent', 'cente', 'center'] );
 
     assertAnalysis( 'peliasIndexOneEdgeGramFilter', '1 a ab abc abcdefghij', [
-      '1', 'a', 'a', 'ab', 'a', 'ab', 'abc', 'a', 'ab', 'abc', 
+      '1', 'a', 'a', 'ab', 'a', 'ab', 'abc', 'a', 'ab', 'abc',
       'abcd', 'abcde', 'abcdef', 'abcdefg', 'abcdefgh', 'abcdefghi', 'abcdefghij'
     ] );
     assertAnalysis( 'removeAllZeroNumericPrefix', '00001', ['1'] );
@@ -58,7 +58,7 @@ module.exports.tests.analyze = function(test, common){
     assertAnalysis( 'no kstem', 'peoples', ['p', 'pe', 'peo', 'peop', 'peopl', 'people', 'peoples'] );
 
     // remove punctuation (handled by the char_filter)
-    assertAnalysis( 'punctuation', punctuation.all.join(''), ['-','-&'] );
+    assertAnalysis( 'punctuation', punctuation.all.join(''), ['&', 'a', 'an', 'and', 'u', 'un', 'und'] );
     assertAnalysis( 'punctuation', 'Hawai‘i', ['h', 'ha', 'haw', 'hawa', 'hawai', 'hawaii'] );
 
     // ensure that very large grams are created

diff --git a/integration/analyzer_peliasPhrase.js b/integration/analyzer_peliasPhrase.js
@@ -45,7 +45,7 @@ module.exports.tests.analyze = function(test, common){
     assertAnalysis( 'stem direction synonyms', '20 bear road northeast', ['0:20', '1:bear', '2:road', '2:rd', '3:northeast', '3:ne'], true );
 
     // remove punctuation (handled by the char_filter)
-    assertAnalysis( 'punctuation', punctuation.all.join(''), [ '-&' ] );
+    assertAnalysis( 'punctuation', punctuation.all.join(''), ['&', 'and', 'und'] );
     assertAnalysis( 'punctuation', 'Hawai‘i', ['hawaii'] );
 
     suite.run( t.end );

diff --git a/integration/analyzer_peliasQuery.js b/integration/analyzer_peliasQuery.js
@@ -33,7 +33,7 @@ module.exports.tests.analyze = function(test, common){
     assertAnalysis('no kstem', 'peoples', ['peoples']);
 
     // remove punctuation (handled by the char_filter)
-    assertAnalysis( 'punctuation', punctuation.all.join(''), ['-&'] );
+    assertAnalysis( 'punctuation', punctuation.all.join(''), ['&'] );
 
     suite.run( t.end );
   });

diff --git a/integration/analyzer_peliasQueryFullToken.js b/integration/analyzer_peliasQueryFullToken.js
@@ -43,7 +43,7 @@ module.exports.tests.analyze = function(test, common){
     assertAnalysis( 'no kstem', 'peoples', ['peoples'] );
 
     // remove punctuation (handled by the char_filter)
-    assertAnalysis( 'punctuation', punctuation.all.join(''), ['-&'] );
+    assertAnalysis( 'punctuation', punctuation.all.join(''), ['&', 'and', 'und'] );
 
     // ensure that very large tokens are created
     assertAnalysis( 'largeGrams', 'grolmanstrasse', [ 'grolmanstrasse' ]);

diff --git a/integration/analyzer_peliasQueryPartialToken.js b/integration/analyzer_peliasQueryPartialToken.js
@@ -40,7 +40,7 @@ module.exports.tests.analyze = function(test, common){
     assertAnalysis( 'no kstem', 'peoples', ['peoples'] );
 
     // remove punctuation (handled by the char_filter)
-    assertAnalysis( 'punctuation', punctuation.all.join(''), ['-&'] );
+    assertAnalysis( 'punctuation', punctuation.all.join(''), ['&', 'and', 'und'] );
 
     // ensure that very large grams are created
     assertAnalysis( 'largeGrams', 'grolmanstrasse', ['grolmanstrasse']);

diff --git a/integration/analyzer_peliasStreet.js b/integration/analyzer_peliasStreet.js
@@ -15,7 +15,7 @@ module.exports.tests.analyze = function(test, common){
     suite.action( function( done ){ setTimeout( done, 500 ); }); // wait for es to bring some shards up
 
     assertAnalysis( 'lowercase', 'F', ['f']);
-    assertAnalysis( 'asciifolding', 'Max-Beer-Straße', ['max-beer-strasse']);
+    assertAnalysis( 'asciifolding', 'Max-Beer-Straße', ['max', 'beer', 'strasse', 'str']);
     assertAnalysis( 'trim', ' f ', ['f'] );
     assertAnalysis( 'keyword_street_suffix', 'foo Street', ['0:foo', '1:street', '1:st'], true );
     assertAnalysis( 'keyword_street_suffix', 'foo Road', ['0:foo', '1:road', '1:rd'], true );

diff --git a/settings.js b/settings.js
@@ -27,11 +27,11 @@ function generate(){
       "tokenizer": {
         "peliasNameTokenizer": {
           "type": "pattern",
-          "pattern": "[\\s,/\\\\]+"
+          "pattern": "[\\s,/\\\\-]+"
         },
         "peliasStreetTokenizer": {
           "type": "pattern",
-          "pattern": "[\\s,/\\\\]+"
+          "pattern": "[\\s,/\\\\-]+"
         }
       },
       "analyzer": {

diff --git a/test/fixtures/expected.json b/test/fixtures/expected.json
@@ -4,11 +4,11 @@
       "tokenizer": {
         "peliasNameTokenizer": {
           "type": "pattern",
-          "pattern": "[\\s,/\\\\]+"
+          "pattern": "[\\s,/\\\\-]+"
         },
         "peliasStreetTokenizer": {
           "type": "pattern",
-          "pattern": "[\\s,/\\\\]+"
+          "pattern": "[\\s,/\\\\-]+"
         }
       },
       "analyzer": {