| -- |
| -- COPY |
| -- |
| |
| -- directory paths are passed to us in environment variables |
| \getenv abs_srcdir PG_ABS_SRCDIR |
| \getenv abs_builddir PG_ABS_BUILDDIR |
| |
| --- test copying in CSV mode with various styles |
| --- of embedded line ending characters |
| |
| create temp table copytest ( |
| style text, |
| test text, |
| filler int); |
| |
| insert into copytest values('DOS',E'abc\r\ndef',1); |
| insert into copytest values('Unix',E'abc\ndef',2); |
| insert into copytest values('Mac',E'abc\rdef',3); |
| insert into copytest values(E'esc\\ape',E'a\\r\\\r\\\n\\nb',4); |
| |
| \set filename :abs_builddir '/results/copytest.csv' |
| copy copytest to :'filename' csv; |
| |
| create temp table copytest2 (like copytest); |
| |
| copy copytest2 from :'filename' csv; |
| |
| select * from copytest except select * from copytest2 order by 1,2,3; |
| |
| truncate copytest2; |
| |
| --- same test but with an escape char different from quote char |
| |
| copy copytest to :'filename' csv quote '''' escape E'\\'; |
| |
| copy copytest2 from :'filename' csv quote '''' escape E'\\'; |
| |
| select * from copytest except select * from copytest2 order by 1,2,3; |
| |
| |
| -- test header line feature |
| |
| create temp table copytest3 ( |
| c1 int, |
| "col with , comma" text, |
| "col with "" quote" int) distributed by (c1); |
| |
| copy copytest3 from stdin csv header; |
| this is just a line full of junk that would error out if parsed |
| 1,a,1 |
| 2,b,2 |
| \. |
| |
| copy copytest3 to stdout csv header; |
| |
| create temp table copytest4 ( |
| c1 int, |
| "colname with tab: " text); |
| |
| copy copytest4 from stdin (header); |
| this is just a line full of junk that would error out if parsed |
| 1 a |
| 2 b |
| \. |
| |
| copy copytest4 to stdout (header); |
| |
| -- test copy from with a partitioned table |
| create table parted_copytest ( |
| a int, |
| b int, |
| c text |
| ) partition by list (b); |
| |
| create table parted_copytest_a1 (c text, b int, a int); |
| create table parted_copytest_a2 (a int, c text, b int); |
| |
| alter table parted_copytest_a1 set distributed by (a); |
| |
| alter table parted_copytest attach partition parted_copytest_a1 for values in(1); |
| alter table parted_copytest attach partition parted_copytest_a2 for values in(2); |
| |
| -- We must insert enough rows to trigger multi-inserts. These are only |
| -- enabled adaptively when there are few enough partition changes. |
| insert into parted_copytest select x,1,'One' from generate_series(1,1000) x; |
| insert into parted_copytest select x,2,'Two' from generate_series(1001,1010) x; |
| insert into parted_copytest select x,1,'One' from generate_series(1011,1020) x; |
| |
| \set filename :abs_builddir '/results/parted_copytest.csv' |
| copy (select * from parted_copytest order by a) to :'filename'; |
| |
| truncate parted_copytest; |
| |
| copy parted_copytest from :'filename'; |
| |
| -- Ensure COPY FREEZE errors for partitioned tables. |
| begin; |
| truncate parted_copytest; |
| copy parted_copytest from :'filename' (freeze); |
| rollback; |
| |
| select tableoid::regclass,count(*),sum(a) from parted_copytest |
| group by tableoid order by tableoid::regclass::name; |
| |
| truncate parted_copytest; |
| |
| -- create before insert row trigger on parted_copytest_a2 |
| create function part_ins_func() returns trigger language plpgsql as $$ |
| begin |
| return new; |
| end; |
| $$; |
| |
| create trigger part_ins_trig |
| before insert on parted_copytest_a2 |
| for each row |
| execute procedure part_ins_func(); |
| |
| copy parted_copytest from :'filename'; |
| |
| select tableoid::regclass,count(*),sum(a) from parted_copytest |
| group by tableoid order by tableoid::regclass::name; |
| |
| truncate table parted_copytest; |
| create index on parted_copytest (b); |
| drop trigger part_ins_trig on parted_copytest_a2; |
| |
| copy parted_copytest from stdin; |
| 1 1 str1 |
| 2 2 str2 |
| \. |
| |
| -- Ensure index entries were properly added during the copy. |
| select * from parted_copytest where b = 1; |
| select * from parted_copytest where b = 2; |
| |
| drop table parted_copytest; |
| |
| -- |
| -- Progress reporting for COPY |
| -- |
| create table tab_progress_reporting ( |
| name text, |
| age int4, |
| location point, |
| salary int4, |
| manager name |
| ); |
| |
| -- Add a trigger to catch and print the contents of the catalog view |
| -- pg_stat_progress_copy during data insertion. This allows to test |
| -- the validation of some progress reports for COPY FROM where the trigger |
| -- would fire. |
| create function notice_after_tab_progress_reporting() returns trigger AS |
| $$ |
| declare report record; |
| begin |
| -- The fields ignored here are the ones that may not remain |
| -- consistent across multiple runs. The sizes reported may differ |
| -- across platforms, so just check if these are strictly positive. |
| with progress_data as ( |
| select |
| relid::regclass::text as relname, |
| command, |
| type, |
| bytes_processed > 0 as has_bytes_processed, |
| bytes_total > 0 as has_bytes_total, |
| tuples_processed, |
| tuples_excluded |
| from pg_stat_progress_copy |
| where pid = pg_backend_pid()) |
| select into report (to_jsonb(r)) as value |
| from progress_data r; |
| |
| raise info 'progress: %', report.value::text; |
| return new; |
| end; |
| $$ language plpgsql; |
| |
| create trigger check_after_tab_progress_reporting |
| after insert on tab_progress_reporting |
| for each statement |
| execute function notice_after_tab_progress_reporting(); |
| |
| -- Generate COPY FROM report with PIPE. |
| copy tab_progress_reporting from stdin; |
| sharon 25 (15,12) 1000 sam |
| sam 30 (10,5) 2000 bill |
| bill 20 (11,10) 1000 sharon |
| \. |
| |
| -- Generate COPY FROM report with FILE, with some excluded tuples. |
| truncate tab_progress_reporting; |
| \set filename :abs_srcdir '/data/emp.data' |
| copy tab_progress_reporting from :'filename' |
| where (salary < 2000); |
| |
| drop trigger check_after_tab_progress_reporting on tab_progress_reporting; |
| drop function notice_after_tab_progress_reporting(); |
| drop table tab_progress_reporting; |
| |
| -- Test header matching feature |
| create table header_copytest ( |
| a int, |
| b int, |
| c text |
| ); |
| -- Make sure it works with dropped columns |
| alter table header_copytest drop column c; |
| alter table header_copytest add column c text; |
| copy header_copytest to stdout with (header match); |
| copy header_copytest from stdin with (header wrong_choice); |
| -- works |
| copy header_copytest from stdin with (header match); |
| a b c |
| 1 2 foo |
| \. |
| copy header_copytest (c, a, b) from stdin with (header match); |
| c a b |
| bar 3 4 |
| \. |
| copy header_copytest from stdin with (header match, format csv); |
| a,b,c |
| 5,6,baz |
| \. |
| -- errors |
| copy header_copytest (c, b, a) from stdin with (header match); |
| a b c |
| 1 2 foo |
| \. |
| copy header_copytest from stdin with (header match); |
| a b \N |
| 1 2 foo |
| \. |
| copy header_copytest from stdin with (header match); |
| a b |
| 1 2 |
| \. |
| copy header_copytest from stdin with (header match); |
| a b c d |
| 1 2 foo bar |
| \. |
| copy header_copytest from stdin with (header match); |
| a b d |
| 1 2 foo |
| \. |
| SELECT * FROM header_copytest ORDER BY a; |
| |
| -- Drop an extra column, in the middle of the existing set. |
| alter table header_copytest drop column b; |
| -- works |
| copy header_copytest (c, a) from stdin with (header match); |
| c a |
| foo 7 |
| \. |
| copy header_copytest (a, c) from stdin with (header match); |
| a c |
| 8 foo |
| \. |
| -- errors |
| copy header_copytest from stdin with (header match); |
| a ........pg.dropped.2........ c |
| 1 2 foo |
| \. |
| copy header_copytest (a, c) from stdin with (header match); |
| a c b |
| 1 foo 2 |
| \. |
| |
| SELECT * FROM header_copytest ORDER BY a; |
| drop table header_copytest; |
| |
| -- test COPY with overlong column defaults |
| create temp table oversized_column_default ( |
| col1 varchar(5) DEFAULT 'more than 5 chars', |
| col2 varchar(5)); |
| -- normal COPY should work |
| copy oversized_column_default from stdin; |
| \. |
| -- error if the column is excluded |
| copy oversized_column_default (col2) from stdin; |
| \. |
| -- error if the DEFAULT option is given |
| copy oversized_column_default from stdin (default ''); |
| \. |
| drop table oversized_column_default; |
| |
| |
| -- |
| -- Create partitioned table that does not allow bulk insertions, to test bugs |
| -- related to the reuse of BulkInsertState across partitions (only done when |
| -- not using bulk insert). Switching between partitions often makes it more |
| -- likely to encounter these bugs, so we just switch on roughly every insert |
| -- by having an even/odd number partition and inserting evenly distributed |
| -- data. |
| -- |
| CREATE TABLE parted_si ( |
| id int not null, |
| data text not null, |
| -- prevent use of bulk insert by having a volatile function |
| rand float8 not null default random() |
| ) |
| PARTITION BY LIST((id % 2)); |
| |
| CREATE TABLE parted_si_p_even PARTITION OF parted_si FOR VALUES IN (0); |
| CREATE TABLE parted_si_p_odd PARTITION OF parted_si FOR VALUES IN (1); |
| |
| -- Test that bulk relation extension handles reusing a single BulkInsertState |
| -- across partitions. Without the fix applied, this reliably reproduces |
| -- #18130 unless shared_buffers is extremely small (preventing any use use of |
| -- bulk relation extension). See |
| -- https://postgr.es/m/18130-7a86a7356a75209d%40postgresql.org |
| -- https://postgr.es/m/257696.1695670946%40sss.pgh.pa.us |
| \set filename :abs_srcdir '/data/desc.data' |
| COPY parted_si(id, data) FROM :'filename'; |
| |
| -- An earlier bug (see commit b1ecb9b3fcf) could end up using a buffer from |
| -- the wrong partition. This test is *not* guaranteed to trigger that bug, but |
| -- does so when shared_buffers is small enough. To test if we encountered the |
| -- bug, check that the partition condition isn't violated. |
| SELECT tableoid::regclass, id % 2 = 0 is_even, count(*) from parted_si GROUP BY 1, 2 ORDER BY 1; |
| |
| DROP TABLE parted_si; |