new word table layout for icu tokenizer

The table now directly reflects the different token types.
Extra information is saved in a JSON structure that may be
dynamically extended in the future without affecting the
table layout.
This commit is contained in:
Sarah Hoffmann
2021-07-20 10:27:06 +02:00
parent 34dcf02dee
commit 8377528952
2 changed files with 16 additions and 1 deletions

View File

@@ -0,0 +1,15 @@
-- Word table for the ICU tokenizer.
-- Any existing table of that name is discarded and rebuilt empty.
DROP TABLE IF EXISTS word;

-- The table must be created under the name `word`: the index and the grant
-- below refer to `word`, and would fail with "relation does not exist" if the
-- table were created under any other name right after the DROP above.
CREATE TABLE word (
  -- Numeric identifier of the entry (nullable, no uniqueness enforced here).
  word_id INTEGER,
  -- Token string; this is the column covered by the lookup index below.
  word_token text NOT NULL,
  -- Kind of token this row represents.
  type text NOT NULL,
  -- Optional extra data in JSON form, so that further fields can be added
  -- later without changing the table layout.
  info jsonb
) {{db.tablespace.search_data}};

-- B-tree index for lookups by token string.
CREATE INDEX idx_word_word_token ON word
    USING BTREE (word_token) {{db.tablespace.search_index}};

-- The web user only needs read access to the table.
GRANT SELECT ON word TO "{{config.DATABASE_WEBUSER}}";
-- Rebuild the seq_word sequence from scratch so that it starts counting at 1.
-- NOTE(review): presumably the source of word_id values; confirm against the
-- tokenizer code that consumes it.
DROP SEQUENCE IF EXISTS seq_word;

CREATE SEQUENCE seq_word
    START WITH 1;

-- Read-only access for the web user.
GRANT SELECT
    ON seq_word
    TO "{{config.DATABASE_WEBUSER}}";