185 lines
4.3 KiB
Markdown
185 lines
4.3 KiB
Markdown
## 目录结构
|
||
|
||
- pgsql-gis/
|
||
- pgsql-admin/
|
||
- docker-compose.yaml
|
||
|
||
```shell
|
||
mkdir pgsql-gis pgsql-admin
|
||
sudo chown 5050 ./pgsql-admin
|
||
```
|
||
|
||
## docker-compose.yaml
|
||
|
||
```yaml
|
||
version: '3.8'
|
||
services:
|
||
# PGSQL
|
||
pgsql-gis-16:
|
||
# 不支持全文检索
|
||
image: postgis/postgis:16-master
|
||
# 支持全文检索的自编译镜像
|
||
#image: pgsql-gis-fts:latest
|
||
container_name: pgsql-gis-16
|
||
ports:
|
||
- "35430:5432" # 替换
|
||
volumes:
|
||
- ./pgsql-gis:/var/lib/postgresql/data
|
||
environment:
|
||
POSTGRES_USER: # 替换
|
||
POSTGRES_PASSWORD: # 替换
|
||
POSTGRES_DB: # 替换
|
||
POSTGRES_INITDB_ARGS: --encoding=UTF8
|
||
restart: on-failure:3
|
||
# PG Admin(HTTP)
|
||
pgsql-admin:
|
||
image: dpage/pgadmin4:latest # 替换
|
||
container_name: pgsql-admin
|
||
ports:
|
||
- "18906:80" # 替换
|
||
volumes:
|
||
- ./pgsql-admin:/var/lib/pgadmin
|
||
environment:
|
||
PGADMIN_DEFAULT_EMAIL: demo@email.com
|
||
PGADMIN_DEFAULT_PASSWORD: # 替换
|
||
PGADMIN_CONFIG_CHECK_EMAIL_DELIVERABILITY: 'False'
|
||
restart: on-failure:3
|
||
# PG Admin(HTTPS)
|
||
# pgsql-admin:
|
||
# image: dpage/pgadmin4:latest
|
||
# container_name: pgsql-admin
|
||
# ports:
|
||
# - "18907:443"
|
||
# volumes:
|
||
# - ./pgsql-admin:/var/lib/pgadmin
|
||
# - ./certs:/certs
|
||
# environment:
|
||
# PGADMIN_DEFAULT_EMAIL: demo@email.com
|
||
# PGADMIN_DEFAULT_PASSWORD: # 替换
|
||
# PGADMIN_CONFIG_CHECK_EMAIL_DELIVERABILITY: 'False'
|
||
# PGADMIN_ENABLE_TLS: 'True'
|
||
# PGADMIN_SERVER_CERT_FILE: /certs/server.cert
|
||
# PGADMIN_SERVER_KEY_FILE: /certs/server.key
|
||
# restart: on-failure:3
|
||
```
|
||
|
||
## 添加全文索引支持
|
||
|
||
需要从 git 克隆 zhparser 添加中文分词支持,执行 docker build 命令的目录结构长这样:
|
||
|
||
- Dockerfile
|
||
- zhparser/
|
||
|
||
```bash
|
||
git clone https://github.com/amutu/zhparser.git
|
||
```
|
||
|
||
## Dockerfile
|
||
|
||
```bash
|
||
FROM postgis/postgis:16-master
|
||
|
||
ENV DEBIAN_FRONTEND=noninteractive
|
||
|
||
RUN apt-get update && apt-get install -y \
|
||
build-essential \
|
||
git \
|
||
libcurl4-openssl-dev \
|
||
libxml2-dev \
|
||
wget \
|
||
postgresql-server-dev-16 \
|
||
&& rm -rf /var/lib/apt/lists/*
|
||
|
||
RUN pg_config --version
|
||
|
||
WORKDIR /tmp
|
||
|
||
RUN wget http://www.xunsearch.com/scws/down/scws-1.2.3.tar.bz2 \
|
||
&& tar xjf scws-1.2.3.tar.bz2 \
|
||
&& cd scws-1.2.3 \
|
||
&& ./configure \
|
||
&& make && make install \
|
||
&& cd ..
|
||
|
||
COPY zhparser zhparser
|
||
|
||
RUN cd zhparser \
|
||
&& export PG_CONFIG=$(which pg_config) \
|
||
&& echo "Using pg_config: $PG_CONFIG" \
|
||
&& make USE_PGXS=1 \
|
||
&& make USE_PGXS=1 install \
|
||
&& cd ..
|
||
|
||
RUN rm -rf /tmp/*
|
||
|
||
WORKDIR /
|
||
```
|
||
|
||
## 编译
|
||
|
||
```bash
|
||
docker build -t pgsql-gis-fts .
|
||
```
|
||
|
||
## 启用中文分词扩展
|
||
|
||
```sql
|
||
CREATE EXTENSION IF NOT EXISTS zhparser;
|
||
```
|
||
|
||
```sql
|
||
CREATE TEXT SEARCH CONFIGURATION chinese_mix (PARSER = zhparser);
|
||
-- DROP TEXT SEARCH CONFIGURATION IF EXISTS chinese_mix;
|
||
```
|
||
|
||
```sql
|
||
ALTER TEXT SEARCH CONFIGURATION chinese_mix ADD MAPPING FOR n,v,a,i,e,l,d,j,m,q,r,t,u,w,x,z WITH simple;
|
||
```
|
||
|
||
## 测试
|
||
|
||
```sql
|
||
CREATE TABLE articles (
|
||
id SERIAL PRIMARY KEY,
|
||
title TEXT,
|
||
content TEXT,
|
||
-- 生成列:自动维护 tsvector,避免每次查询都计算,提高性能
|
||
content_tsvector TSVECTOR GENERATED ALWAYS AS (to_tsvector('chinese_mix', content)) STORED
|
||
);
|
||
```
|
||
|
||
```sql
|
||
-- 插入一些混合数据
|
||
INSERT INTO articles (title, content) VALUES
|
||
('AI 技术展望', '人工智能 (AI) 正在改变世界,PostgreSQL 是存储这些数据的首选数据库。'),
|
||
('PostgreSQL 16 新特性', 'PostgreSQL 16 带来了更好的性能,支持 JSON 增强和中文分词优化。'),
|
||
('日常开发笔记', 'Today I learned about zhparser. 它让中文搜索变得很简单。');
|
||
```
|
||
|
||
```sql
|
||
-- 搜索包含 "人工智能" 的文章
|
||
SELECT title, content
|
||
FROM articles
|
||
WHERE content_tsvector @@ to_tsquery('chinese_mix', '人工智能');
|
||
```
|
||
|
||
```sql
|
||
-- 搜索包含 "PostgreSQL" 的文章
|
||
SELECT title, content
|
||
FROM articles
|
||
WHERE content_tsvector @@ to_tsquery('chinese_mix', 'PostgreSQL');
|
||
```
|
||
|
||
```sql
|
||
-- 搜索既包含 "数据库" 又包含 "PostgreSQL" 的文章
|
||
SELECT title, content
|
||
FROM articles
|
||
WHERE content_tsvector @@ to_tsquery('chinese_mix', '数据库 & PostgreSQL');
|
||
```
|
||
|
||
```sql
|
||
-- 搜索包含 "AI" 或者 "改变" 的文章
|
||
SELECT title, content
|
||
FROM articles
|
||
WHERE content_tsvector @@ to_tsquery('chinese_mix', 'AI | 改变');
|
||
``` |