- 论坛徽章:
- 0
|
我在数据库插入数据的过程中偶然发现,汉字“太阳”和“天队”在pg里居然作为关键字是相同的...
我的客户端是GBK,服务端是Unicode.
$ pg_config --version
PostgreSQL 7.4.8
$ echo "太阳" >; /tmp/tmp1
$ echo "天队" >; /tmp/tmp2
$ iconv -f GBK -t UTF-8 /tmp/tmp1 | hexdump
0000000 a4e5 e9aa b398 000a
0000007
$ iconv -f GBK -t UTF-8 /tmp/tmp2 | hexdump
0000000 a4e5 e9a9 9f98 000a
0000007
$ psql html
html=>; set client_encoding='GBK';
SET
html=>; show server_encoding;
server_encoding
-----------------
UNICODE
(1 行)
html=>; show client_encoding;
client_encoding
-----------------
GBK
(1 行)
html=>; create table gbk (key varchar(64), value integer);
CREATE TABLE
html=>; insert into gbk values ('太阳', 1);
INSERT 2836917 1
html=>; insert into gbk values ('月亮', 2);
INSERT 2836918 1
html=>; insert into gbk values ('草原', 3);
INSERT 2836919 1
html=>; insert into gbk values ('天队', 4);
INSERT 2836920 1
html=>; select * from gbk;
key | value
------+-------
太阳 | 1
月亮 | 2
草原 | 3
天队 | 4
(4 行)
html=>; select * from gbk where key='草原';
key | value
------+-------
草原 | 3
(1 行)
html=>; select * from gbk where key='太阳';
key | value
------+-------
太阳 | 1
天队 | 4
(2 行)
html=>; \q
-------------------------------------------------------------
为什么会这样? |
|