1.創(chuàng)建常規(guī)的企業(yè)信息表
create table t_centerprises(
objectid bigint not null, /*唯一編號(hào)(6位行政區(qū)號(hào)+6位sn)*/
divid uuid not null, /*行政區(qū)唯一代碼*/
name text not null, /*企業(yè)名稱*/
address text not null, /*企業(yè)地址*/
post text, /*企業(yè)郵編*/
contacts text, /*聯(lián)系人*/
tel text, /*聯(lián)系電話*/
fax text, /*傳真*/
describe text, /*企業(yè)備注*/
date timestamp default now() not null, /*創(chuàng)建日期*/
constraint pk_centerprisess_objectid primary key (objectid),
constraint fk_centerprises_divid foreign key(divid) references ts_divisions(objectid) on delete cascade
);
create index idx_centerprises_divid on t_centerprises(divid);
2.需要使用的函數(shù)
/*轉(zhuǎn)換16進(jìn)制到字符*/
drop function if exists hex_to_string(text);
create or replace function hex_to_string( text)
returns text as
$$
declare
result text;
begin
execute 'select U''\' || $1 || '''' INTO result;
return result;
end;
$$ language plpgsql;
/*隨機(jī)生成漢字
漢字范圍U+4E00..U+9FA5
*/
drop function if exists gen_random_zh(int,int);
create or replace function gen_random_zh(imin int,imax int)
returns text as
$$
declare
vlen integer;
result text;
begin
result := '';
vlen = floor(random()*(imax-imin)+imin);
for i in 1..vlen loop
result := result || hex_to_string(to_hex(floor(random()*(42191-19968)+19968):integer));
end loop;
return result;
end;
$$ language plpgsql;
3.常規(guī)測(cè)試數(shù)據(jù)插入(5000000條)
insert into t_centerprises(objectid,divid,name,address,post,contacts,tel,fax,describe)
select (vdivid|| lpad(id::text,6,'0')):bigint as objectid,'110101',
gen_random_zh(5,25) as name,gen_random_zh(10,50) as address,
floor(random()*(699999-600000)+600000) as post,gen_random_zh(2,8) as contacts,
floor(random()*(69999999-60000000)+60000000) as tel,floor(random()*(69999999-60000000)+60000000) as fax,
gen_random_zh(32,128) as describe
from generate_series(1,5000000) as id;
在普通pc機(jī)上插入,大概完成時(shí)間約8小時(shí),過(guò)程不可監(jiān)控,并且cpu/內(nèi)存占用率高,磁盤(pán)基本滿負(fù)荷動(dòng)作,讀寫(xiě)率基本上都是100%.
4.改進(jìn)后的方法, 插入(10000000條)
do $$
declare vStart bigint;
declare vEnd bigint;
declare MAXVALE bigint;
declare INTERVAL bigint;
declare vprovince integer;
declare vprefecture integer;
declare vcounty integer;
declare vdivid text;
declare vdividex uuid;
begin
vprovince := 10;vprefecture := 1;vcounty := 1;
MAXVALE := 1000000;
INTERVAL := 1000; vStart := 1 ;vEnd := INTERVAL;
vdivid := (lpad(vprovince::text,2,'0') || lpad(vprefecture::text,2,'0') || lpad(vcounty::text,2,'0')):text;
vdividex := (select objectid from ts_divisions where province=vprovince and prefecture=vprefecture and county=vcounty);
loop
insert into t_centerprises(objectid,divid,name,address,post,contacts,tel,fax,describe)
select (vdivid|| lpad(id::text,6,'0')):bigint as objectid,vdividex as divid,
gen_random_zh(5,25) as name,gen_random_zh(10,50) as address,
floor(random()*(699999-600000)+600000) as post,gen_random_zh(2,8) as contacts,
floor(random()*(69999999-60000000)+60000000) as tel,floor(random()*(69999999-60000000)+60000000) as fax,
gen_random_zh(32,128) as describe
from generate_series(vStart,vEnd) as id;
raise notice '%', vEnd;
vStart := vEnd + 1; vEnd := vEnd + INTERVAL;
if( vEnd > MAXVALE ) then
return;
elsif(vEnd = MAXVALE) then
vEnd := vEnd - 1;
end if;
end loop;
end$$;
因?yàn)檫\(yùn)算原因, cpu/內(nèi)存占用率仍然很高, 硬盤(pán)負(fù)荷較小,讀寫(xiě)率也比較低,大概完成時(shí)間約1.5小時(shí).
補(bǔ)充:postgreSQL數(shù)據(jù)庫(kù) 向表中快速插入1000000條數(shù)據(jù)
不用創(chuàng)建函數(shù),直接向表中快速插入1000000條數(shù)據(jù)
create table tbl_test (id int, info text, c_time timestamp);
insert into tbl_test select generate_series(1,100000),md5(random():text),clock_timestamp();
select count(id) from tbl_test; --查看個(gè)數(shù)據(jù)條數(shù)
以上為個(gè)人經(jīng)驗(yàn),希望能給大家一個(gè)參考,也希望大家多多支持腳本之家。如有錯(cuò)誤或未考慮完全的地方,望不吝賜教。
您可能感興趣的文章:- 使用postgresql 模擬批量數(shù)據(jù)插入的案例
- PostgreSQL upsert(插入更新)數(shù)據(jù)的操作詳解
- postgreSQL數(shù)據(jù)庫(kù) 實(shí)現(xiàn)向表中快速插入1000000條數(shù)據(jù)
- Python隨機(jī)生成數(shù)據(jù)后插入到PostgreSQL
- postgres 使用存儲(chǔ)過(guò)程批量插入數(shù)據(jù)的操作