tps/srce.pgsql

DO $$
-- Stages a source's CSV export in the session temp table csv_i.
--   1. Reads the column definitions (key + type) from the source's defn->'schema' array in tps.srce.
--   2. (Re)creates csv_i with those columns plus a SERIAL id that numbers the rows as they are loaded.
--   3. COPYs the CSV file into csv_i using the same column list.
DECLARE
    _srce text := 'PNCC';   -- source code whose definition drives the staging table
    _t    text;             -- "name type" pairs for CREATE TABLE
    _c    text;             -- bare column names for the COPY column list
BEGIN

----------------------------------------------------build the column list of the temp table----------------------------------------------------------------

    SELECT
        -- COPY maps CSV fields to the column list by position, so both lists are
        -- explicitly ordered by the element's position in the schema array
        string_agg(quote_ident(prs.key)||' '||prs.type, ',' ORDER BY prs.ordinality),
        string_agg(quote_ident(prs.key), ',' ORDER BY prs.ordinality)
    INTO
        _t,
        _c
    FROM
        tps.srce
        --unwrap the schema definition array, keeping each element's position
        LEFT JOIN LATERAL jsonb_populate_recordset(null::tps.srce_defn_schema, defn->'schema') WITH ORDINALITY prs ON TRUE
    WHERE
        srce = _srce
    GROUP BY
        srce;

    -- _t is NULL when the source row is missing or its schema array yields no columns;
    -- without this guard the CREATE below would fail with an opaque syntax error
    IF _t IS NULL THEN
        RAISE EXCEPTION 'no schema columns found for source "%" in tps.srce; cannot build csv_i', _srce;
    END IF;

----------------------------------------------------add create table verbiage in front of column list-------------------------------------------------------

    DROP TABLE IF EXISTS csv_i;

    -- NOTE(review): prs.type is interpolated unquoted (a type name cannot go through quote_ident),
    -- so this relies on the definitions stored in tps.srce being trusted
    EXECUTE format('CREATE TEMP TABLE csv_i (%s, id SERIAL)', _t);

----------------------------------------------------do the insert-------------------------------------------------------------------------------------------

    --the column list needs to be dynamic forcing this whole line to be dynamic
    --COPY ... FROM 'file' is read by the server process, so the path must be visible to the database host
    EXECUTE format('COPY csv_i (%s) FROM ''C:\Users\ptrowbridge\downloads\transsearchcsv.csv'' WITH (HEADER TRUE,DELIMITER '','', FORMAT CSV, ENCODING ''SQL_ASCII'',QUOTE ''"'');',_c);

END
$$;

--*******************************************
--this needs to aggregate on id sequence
--*******************************************
-- Single-statement import of the staged csv_i rows into tps.trans:
--   pending_list : one row per staged CSV line, carrying the full JSON record (minus id)
--                  and an object of the source's unique-constraint fields and their values
--   inserted     : pending rows written to tps.trans
--   not_inserted : pending rows that were not written
-- The closing SELECT summarises the rows that were not written, per constraint field.
WITH pending_list AS (
    SELECT
        -- {field name: value} for every path listed in defn->'unique_constraint'->'fields';
        -- the first path element is used as the key name
        jsonb_object_agg(
            (fld.path::text[])[1],
            (row_to_json(i)::jsonb) #> fld.path::text[]
        ) AS json_key,
        -- the complete CSV row as JSON, without the staging sequence number
        row_to_json(i)::JSONB - 'id' AS rec,
        s.srce,
        i.id
    FROM
        csv_i i
        INNER JOIN tps.srce s
            ON s.srce = 'PNCC'
        LEFT JOIN LATERAL JSONB_ARRAY_ELEMENTS_TEXT(s.defn->'unique_constraint'->'fields')
            WITH ORDINALITY fld(path, ord)
            ON TRUE
    -- grouping on the whole staged row (which includes id) yields one output row per CSV line
    GROUP BY
        i.*,
        s.srce,
        i.id
    ORDER BY
        i.id
),
------results of the insert operation--------------
inserted AS (
    INSERT INTO
        tps.trans (srce, rec)
    SELECT
        p.srce,
        p.rec
    FROM
        pending_list p
    -- skip any pending row whose constraint key is already contained in an
    -- existing record of the same source
    WHERE
        NOT EXISTS (
            SELECT
                1
            FROM
                tps.trans t
            WHERE
                t.srce = p.srce
                AND t.rec @> p.json_key
        )
    RETURNING *
),
---------raw list of records not inserted----------
not_inserted AS (
    SELECT
        p.srce,
        p.rec
    FROM
        pending_list p

    EXCEPT ALL

    SELECT
        ins.srce,
        ins.rec
    FROM
        inserted ins
)
--------summarize records not inserted------------------
-- per source and constraint field: smallest and largest rejected value (as text)
-- plus the pretty-printed, sorted list of all rejected values
SELECT
    ni.srce,
    (fld.path::text[])[1] AS unq_constr,
    MIN(ni.rec #>> fld.path::text[]) AS min_text,
    MAX(ni.rec #>> fld.path::text[]) AS max_text,
    JSONB_PRETTY(JSON_AGG(ni.rec #> fld.path::text[] ORDER BY ni.rec #>> fld.path::text[])::JSONB)
FROM
    not_inserted ni
    INNER JOIN tps.srce s
        ON s.srce = ni.srce
    LEFT JOIN LATERAL JSONB_ARRAY_ELEMENTS_TEXT(s.defn->'unique_constraint'->'fields')
        WITH ORDINALITY fld(path, ord)
        ON TRUE
GROUP BY
    ni.srce,
    (fld.path::text[])[1];
unwrap the newly created json arrangement and dynamically create a temp table 2017-10-11 00:17:21 -04:00			`DO $$`

get rid of insert 2017-10-15 13:05:20 -04:00			`DECLARE _t text;`
			`DECLARE _c text;`
unwrap the newly created json arrangement and dynamically create a temp table 2017-10-11 00:17:21 -04:00
get rid of insert 2017-10-15 13:05:20 -04:00			`BEGIN`
unwrap the newly created json arrangement and dynamically create a temp table 2017-10-11 00:17:21 -04:00
formatting 2017-10-11 00:29:38 -04:00			`----------------------------------------------------build the column list of the temp table----------------------------------------------------------------`

unwrap the newly created json arrangement and dynamically create a temp table 2017-10-11 00:17:21 -04:00			`SELECT`
add another variable to collect column list, add a serial column to temp, copy using column list, and then build json object based on json defn 2017-10-14 01:40:26 -04:00			`string_agg(quote_ident(prs.key)\|\|' '\|\|prs.type,','),`
			`string_agg(quote_ident(prs.key),',')`
unwrap the newly created json arrangement and dynamically create a temp table 2017-10-11 00:17:21 -04:00			`INTO`
add another variable to collect column list, add a serial column to temp, copy using column list, and then build json object based on json defn 2017-10-14 01:40:26 -04:00			`_t,`
			`_c`
unwrap the newly created json arrangement and dynamically create a temp table 2017-10-11 00:17:21 -04:00			`FROM`
			`TPS.srce`
			`--unwrap the schema definition array`
			`LEFT JOIN LATERAL jsonb_populate_recordset(null::tps.srce_defn_schema, defn->'schema') prs ON TRUE`
get rid of commented json sample, swap for pt branch files 2017-10-13 02:40:23 -04:00			`WHERE`
switch to PNCC 2017-10-18 14:11:57 -04:00			`srce = 'PNCC'`
unwrap the newly created json arrangement and dynamically create a temp table 2017-10-11 00:17:21 -04:00			`GROUP BY`
			`srce;`

formatting 2017-10-11 00:29:38 -04:00			`----------------------------------------------------add create table verbage in front of column list--------------------------------------------------------`

change COPY command to dynamic due to column list 2017-10-14 01:48:13 -04:00			`_t := format('CREATE TEMP TABLE csv_i (%s, id SERIAL)', _t);`
			`--RAISE NOTICE '%', _t;`
			`--RAISE NOTICE '%', _c;`
formatting 2017-10-11 00:29:38 -04:00
unwrap the newly created json arrangement and dynamically create a temp table 2017-10-11 00:17:21 -04:00			`DROP TABLE IF EXISTS csv_i;`

			`EXECUTE _t;`

change COPY command to dynamic due to column list 2017-10-14 01:48:13 -04:00			`----------------------------------------------------do the insert-------------------------------------------------------------------------------------------`
add another variable to collect column list, add a serial column to temp, copy using column list, and then build json object based on json defn 2017-10-14 01:40:26 -04:00
			`--the column list needs to be dynamic forcing this whole line to be dynamic`
switch to PNCC 2017-10-18 14:11:57 -04:00			`_t := format('COPY csv_i (%s) FROM ''C:\Users\ptrowbridge\downloads\transsearchcsv.csv'' WITH (HEADER TRUE,DELIMITER '','', FORMAT CSV, ENCODING ''SQL_ASCII'',QUOTE ''"'');',_c);`
change COPY command to dynamic due to column list 2017-10-14 01:48:13 -04:00
			`--RAISE NOTICE '%', _t;`

			`EXECUTE _t;`
get rid of commented json sample, swap for pt branch files 2017-10-13 02:40:23 -04:00

get rid of insert 2017-10-15 13:05:20 -04:00			`END`
unwrap the newly created json arrangement and dynamically create a temp table 2017-10-11 00:17:21 -04:00			`$$;`

get rid of insert 2017-10-15 13:05:20 -04:00			`--*******************************************`
change COPY command to dynamic due to column list 2017-10-14 01:48:13 -04:00			`--this needs to aggregate on id sequence`
get rid of insert 2017-10-15 13:05:20 -04:00			`--*******************************************`
add link to tps trans to find any potential import conflicts 2017-10-16 00:14:05 -04:00			`WITH pending_list AS (`
add insert as part of with a return rows not inserted, probably needs modified to show the keys not inserted and sorted 2017-10-18 00:55:00 -04:00			`SELECT`
			`---creates a key value pair and then aggregates rows of key value pairs`
			`jsonb_object_agg(`
			`(ae.e::text[])[1], --the key name`
			`(row_to_json(i)::jsonb) #> ae.e::text[] --get the target value from the key from the csv row that has been converted to json`
			`) json_key,`
get rid of id key in json, remove constraint 2017-10-18 01:40:09 -04:00			`row_to_json(i)::JSONB - 'id' rec,`
add insert as part of with a return rows not inserted, probably needs modified to show the keys not inserted and sorted 2017-10-18 00:55:00 -04:00			`srce,`
			`--ae.rn,`
			`id`
			`FROM`
			`csv_i i`
			`INNER JOIN tps.srce s ON`
switch to PNCC 2017-10-18 14:11:57 -04:00			`s.srce = 'PNCC'`
add insert as part of with a return rows not inserted, probably needs modified to show the keys not inserted and sorted 2017-10-18 00:55:00 -04:00			`LEFT JOIN LATERAL JSONB_ARRAY_ELEMENTS_TEXT(defn->'unique_constraint'->'fields') WITH ORDINALITY ae(e, rn) ON TRUE`
			`GROUP BY`
			`i.*,`
			`srce,`
			`id`
			`ORDER BY`
			`id`
add link to tps trans to find any potential import conflicts 2017-10-16 00:14:05 -04:00			`)`
add insert as part of with a return rows not inserted, probably needs modified to show the keys not inserted and sorted 2017-10-18 00:55:00 -04:00			`------results of an insert operation--------------`
			`, inserted AS (`
			`INSERT INTO`
			`tps.trans (srce, rec)`
			`SELECT`
			`pl.srce`
			`,pl.rec`
			`FROM`
			`pending_list pl`
			`LEFT JOIN tps.trans t ON`
			`t.srce = pl.srce`
			`AND t.rec @> pl.json_key`
			`WHERE`
			`t IS NULL`
			`----this conflict is only if an exact duplicate rec json happens, which will be rejected`
			`----therefore, records may not be inserted due to ay matches with certain json fields, or if the entire json is a duplicate, reason is not specified`
			`RETURNING *`
add link to tps trans to find any potential import conflicts 2017-10-16 00:14:05 -04:00			`)`
merge summary of records not inserted from pt branch 2017-10-18 14:10:07 -04:00			`---------raw list of records not inserted----------`
			`, not_inserted AS (`
			`SELECT`
			`srce`
			`,rec`
			`FROM`
			`pending_list`
add link to tps trans to find any potential import conflicts 2017-10-16 00:14:05 -04:00
merge summary of records not inserted from pt branch 2017-10-18 14:10:07 -04:00			`EXCEPT ALL`

			`SELECT`
			`srce`
			`,rec`
			`FROM`
			`inserted`
			`)`
			`--------summarize records not inserted------------------`
add insert as part of with a return rows not inserted, probably needs modified to show the keys not inserted and sorted 2017-10-18 00:55:00 -04:00			`SELECT`
merge summary of records not inserted from pt branch 2017-10-18 14:10:07 -04:00			`t.srce`
			`,(ae.e::text[])[1] unq_constr`
			`,MIN(rec #>> ae.e::text[]) min_text`
			`,MAX(rec #>> ae.e::text[]) max_text`
			`,JSONB_PRETTY(JSON_AGG(rec #> ae.e::text[] ORDER BY rec #>> ae.e::text[])::JSONB)`
add insert as part of with a return rows not inserted, probably needs modified to show the keys not inserted and sorted 2017-10-18 00:55:00 -04:00			`FROM`
merge summary of records not inserted from pt branch 2017-10-18 14:10:07 -04:00			`not_inserted t`
			`INNER JOIN tps.srce s ON`
			`s.srce = t.srce`
			`LEFT JOIN LATERAL JSONB_ARRAY_ELEMENTS_TEXT(defn->'unique_constraint'->'fields') WITH ORDINALITY ae(e, rn) ON TRUE`
			`GROUP BY`
			`t.srce`
			`,(ae.e::text[])[1];`