mirror of
https://github.com/sphinx-doc/sphinx.git
synced 2025-02-25 18:55:22 -06:00
make stop word string unicode
This commit is contained in:
parent
6bda4586bd
commit
a130bb9f6f
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
danish_stopwords = parse_stop_word('''
|
||||
danish_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/danish/stop.txt
|
||||
og | and
|
||||
i | in
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
german_stopwords = parse_stop_word('''
|
||||
german_stopwords = parse_stop_word(u'''
|
||||
|source: http://snowball.tartarus.org/algorithms/german/stop.txt
|
||||
aber | but
|
||||
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
spanish_stopwords = parse_stop_word('''
|
||||
spanish_stopwords = parse_stop_word(u'''
|
||||
|source: http://snowball.tartarus.org/algorithms/spanish/stop.txt
|
||||
de | from, of
|
||||
la | the, her
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
finnish_stopwords = parse_stop_word('''
|
||||
finnish_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/finnish/stop.txt
|
||||
| forms of BE
|
||||
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
french_stopwords = parse_stop_word('''
|
||||
french_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/french/stop.txt
|
||||
au | a + le
|
||||
aux | a + les
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
hungarian_stopwords = parse_stop_word('''
|
||||
hungarian_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/hungarian/stop.txt
|
||||
| prepared by Anna Tordai
|
||||
a
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
italian_stopwords = parse_stop_word('''
|
||||
italian_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/italian/stop.txt
|
||||
ad | a (to) before vowel
|
||||
al | a + il
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
danish_stopwords = parse_stop_word('''
|
||||
danish_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/danish/stop.txt
|
||||
og | and
|
||||
i | in
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
norwegian_stopwords = parse_stop_word('''
|
||||
norwegian_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/norwegian/stop.txt
|
||||
og | and
|
||||
i | in
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
portuguese_stopwords = parse_stop_word('''
|
||||
portuguese_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/portuguese/stop.txt
|
||||
de | of, from
|
||||
a | the; to, at; her
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
russian_stopwords = parse_stop_word('''
|
||||
russian_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/russian/stop.txt
|
||||
и | and
|
||||
в | in/into
|
||||
|
@ -13,7 +13,7 @@ from sphinx.search import SearchLanguage, parse_stop_word
|
||||
|
||||
import snowballstemmer
|
||||
|
||||
swedish_stopwords = parse_stop_word('''
|
||||
swedish_stopwords = parse_stop_word(u'''
|
||||
| source: http://snowball.tartarus.org/algorithms/swedish/stop.txt
|
||||
och | and
|
||||
det | it, this/that
|
||||
|
Loading…
Reference in New Issue
Block a user