mirror of
https://bitbucket.org/jsuto/piler.git
synced 2024-12-25 07:50:11 +01:00
Improved charset_table settings for sphinx.conf
Signed-off-by: Janos SUTO <sj@acts.hu>
This commit is contained in:
parent
d84307f2d8
commit
505e5cb568
@ -5,6 +5,14 @@ define('SPHINX_VERSION', 220); // If you have sphinx-3.1.1, then set SPHINX_VERS
|
|||||||
define('LOCALSTATEDIR', '@LOCALSTATEDIR@');
|
define('LOCALSTATEDIR', '@LOCALSTATEDIR@');
|
||||||
define('NGRAM_CONFIG', " #ngram_len = 1\n #ngram_chars = U+3000..U+2FA1F\n");
|
define('NGRAM_CONFIG', " #ngram_len = 1\n #ngram_chars = U+3000..U+2FA1F\n");
|
||||||
|
|
||||||
|
# See http://sphinxsearch.com/wiki/doku.php?id=charset_tables for more on the charset_table settings
|
||||||
|
# The following settings contain English and some Latin extras
|
||||||
|
define('SPHINX_CHARSET_TABLE', "0..9, english, _, \
|
||||||
|
U+C1->U+E1, U+C4->U+E4, U+C5->U+E5, U+C6->U+E6, U+C9->U+E9, U+CD->U+ED, U+D3->U+F3, U+D6->U+F6, U+D8->U+F8, \
|
||||||
|
U+DA->U+FA, U+DC->U+FC, U+0150->U+0151, U+0152->U+0153, U+0170->U+0171, U+01E2->U+E6, U+01E3->U+E6, U+01FC->U+E6, \
|
||||||
|
U+01FD->U+E6, U+1D01->U+E6, U+1D02->U+E6, U+1D2D->U+E6, U+1D46->U+E6, \
|
||||||
|
U+DF, U+E1, U+E4, U+E5, U+E6, U+E9, U+ED, U+00F3, U+F6, U+F8, U+FA, U+FC, U+0151, U+0153, U+0171\n");
|
||||||
|
|
||||||
?>
|
?>
|
||||||
|
|
||||||
#
|
#
|
||||||
@ -96,6 +104,7 @@ index main1
|
|||||||
<?php } ?>
|
<?php } ?>
|
||||||
min_prefix_len = 5
|
min_prefix_len = 5
|
||||||
min_word_len = 1
|
min_word_len = 1
|
||||||
|
charset_table = <?php print SPHINX_CHARSET_TABLE; ?>
|
||||||
<?php print NGRAM_CONFIG; ?>
|
<?php print NGRAM_CONFIG; ?>
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -109,6 +118,7 @@ index main2
|
|||||||
<?php } ?>
|
<?php } ?>
|
||||||
min_prefix_len = 5
|
min_prefix_len = 5
|
||||||
min_word_len = 1
|
min_word_len = 1
|
||||||
|
charset_table = <?php print SPHINX_CHARSET_TABLE; ?>
|
||||||
<?php print NGRAM_CONFIG; ?>
|
<?php print NGRAM_CONFIG; ?>
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -122,6 +132,7 @@ index main3
|
|||||||
<?php } ?>
|
<?php } ?>
|
||||||
min_prefix_len = 5
|
min_prefix_len = 5
|
||||||
min_word_len = 1
|
min_word_len = 1
|
||||||
|
charset_table = <?php print SPHINX_CHARSET_TABLE; ?>
|
||||||
<?php print NGRAM_CONFIG; ?>
|
<?php print NGRAM_CONFIG; ?>
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -135,6 +146,7 @@ index main4
|
|||||||
<?php } ?>
|
<?php } ?>
|
||||||
min_prefix_len = 5
|
min_prefix_len = 5
|
||||||
min_word_len = 1
|
min_word_len = 1
|
||||||
|
charset_table = <?php print SPHINX_CHARSET_TABLE; ?>
|
||||||
<?php print NGRAM_CONFIG; ?>
|
<?php print NGRAM_CONFIG; ?>
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -148,6 +160,7 @@ index dailydelta1
|
|||||||
<?php } ?>
|
<?php } ?>
|
||||||
min_prefix_len = 5
|
min_prefix_len = 5
|
||||||
min_word_len = 1
|
min_word_len = 1
|
||||||
|
charset_table = <?php print SPHINX_CHARSET_TABLE; ?>
|
||||||
<?php print NGRAM_CONFIG; ?>
|
<?php print NGRAM_CONFIG; ?>
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -161,6 +174,7 @@ index delta1
|
|||||||
<?php } ?>
|
<?php } ?>
|
||||||
min_prefix_len = 5
|
min_prefix_len = 5
|
||||||
min_word_len = 1
|
min_word_len = 1
|
||||||
|
charset_table = <?php print SPHINX_CHARSET_TABLE; ?>
|
||||||
<?php print NGRAM_CONFIG; ?>
|
<?php print NGRAM_CONFIG; ?>
|
||||||
<?php if(SPHINX_VERSION >= 310) { ?>
|
<?php if(SPHINX_VERSION >= 310) { ?>
|
||||||
kbatch = main1, main2, main3, main4, dailydelta1
|
kbatch = main1, main2, main3, main4, dailydelta1
|
||||||
@ -178,6 +192,7 @@ index tag1
|
|||||||
<?php } ?>
|
<?php } ?>
|
||||||
min_prefix_len = 5
|
min_prefix_len = 5
|
||||||
min_word_len = 1
|
min_word_len = 1
|
||||||
|
charset_table = <?php print SPHINX_CHARSET_TABLE; ?>
|
||||||
<?php print NGRAM_CONFIG; ?>
|
<?php print NGRAM_CONFIG; ?>
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -192,6 +207,7 @@ index note1
|
|||||||
<?php } ?>
|
<?php } ?>
|
||||||
min_prefix_len = 5
|
min_prefix_len = 5
|
||||||
min_word_len = 1
|
min_word_len = 1
|
||||||
|
charset_table = <?php print SPHINX_CHARSET_TABLE; ?>
|
||||||
<?php print NGRAM_CONFIG; ?>
|
<?php print NGRAM_CONFIG; ?>
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user