Merge pull request from joergreichert/28-stemming

Query "Tafeln" should also find entries with "Tafel"
This commit is contained in:
Jörg Reichert 2017-01-01 15:15:42 +01:00 committed by GitHub
commit 9b7a3da1de
4 changed files with 39 additions and 2 deletions

View file

@ -7,5 +7,6 @@ services:
- docker
# Build steps executed by Travis CI, in order.
script:
# Mark the Elasticsearch entrypoint wrapper as executable before any container is started.
- chmod +x docker-entrypoint-es-plugins.sh
# Run the Rails database setup task inside the `web` service container.
- docker-compose run web rake db:setup
# Run the test suite inside the `web` container. The CI/TRAVIS_* variables are forwarded
# explicitly with -e because `docker-compose run` is given them one by one here.
# NOTE(review): presumably a reporting tool inside the container reads them — confirm.
- docker-compose run -e CI=true -e TRAVIS=true -e TRAVIS_BRANCH=$TRAVIS_BRANCH -e TRAVIS_COMMIT=$TRAVIS_COMMIT -e TRAVIS_JOB_NUMBER=$TRAVIS_JOB_NUMBER -e TRAVIS_PULL_REQUEST=$TRAVIS_PULL_REQUEST -e TRAVIS_JOB_ID=$TRAVIS_JOB_ID -e TRAVIS_REPO_SLUG=$TRAVIS_REPO_SLUG web bin/run-tests

View file

@ -21,8 +21,36 @@ class Paper < ActiveRecord::Base
index_name ['srm', Rails.env, self.base_class.to_s.pluralize.underscore].join('_')
settings index: { number_of_shards: 1 } do
mappings dynamic: false do
settings index: {
number_of_shards: 1,
analysis: {
filter: {
german_stop: {
type: "stop",
stopwords: "_german_"
},
german_stemmer: {
type: "stemmer",
language: "light_german"
},
decomp: {
type: "decompound"
}
},
analyzer: {
german: {
tokenizer: "standard",
filter: [
"lowercase",
"german_stop",
"german_normalization",
"german_stemmer",
"decomp"
]
}
}
}
} do mappings dynamic: false do
indexes :name, type: :string, analyzer: "german"
indexes :content, type: :string, analyzer: "german"
indexes :resolution, type: :string, analyzer: "german"

View file

@ -10,3 +10,6 @@ web:
ELASTICSEARCH_URL: 'http://elasticsearch:9200'
# Elasticsearch service; the `web` service reaches it via ELASTICSEARCH_URL.
elasticsearch:
image: elasticsearch:1.7
# Mount the project directory into the container at /apps so the entrypoint script below is available.
volumes:
- .:/apps
# Replace the image's default entrypoint with the project's wrapper script.
# The script is taken from the mounted directory, so it must be executable on the host.
entrypoint: /apps/docker-entrypoint-es-plugins.sh

View file

@ -0,0 +1,5 @@
#!/bin/bash
# Entrypoint wrapper for the Elasticsearch container.
#
# Installs the decompound analysis plugin from a fixed download URL and then
# hands control to the image's stock entrypoint to start Elasticsearch.
# There is no `set -e`: if the install command fails, the script still goes on
# to start Elasticsearch.

# Name under which the plugin is installed.
plugin_name="elasticsearch-analysis-decompound"
# Download location of the plugin archive (version 1.7.1.3).
plugin_url="http://xbib.org/repository/org/xbib/elasticsearch/plugin/elasticsearch-analysis-decompound/1.7.1.3/elasticsearch-analysis-decompound-1.7.1.3-plugin.zip"

plugin -install "${plugin_name}" --url "${plugin_url}"

# `exec` replaces this shell with the original entrypoint process.
exec /docker-entrypoint.sh elasticsearch