1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279 280 281 282 283 284 285 286 287 288 289 290 291 292 293 294 295 296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323 324 325 326 327 328 329 330 331 332 333 334 335 336 337 338 339 340 341 342 343 344 345 346 347 348
|
/*
* Updater maker function.
*/
CREATE FUNCTION updater_maker(
p_src_table text
, p_type text
, p_control_field text
, p_dblink_id int
, p_boundary text DEFAULT NULL
, p_dest_table text DEFAULT NULL
, p_index boolean DEFAULT true
, p_filter text[] DEFAULT NULL
, p_condition text DEFAULT NULL
, p_pulldata boolean DEFAULT true
, p_pk_name text[] DEFAULT NULL
, p_pk_type text[] DEFAULT NULL
, p_jobmon boolean DEFAULT NULL
, p_debug boolean DEFAULT false)
RETURNS void
LANGUAGE plpgsql
AS $$
DECLARE
v_boundary_serial int;
v_boundary_time interval;
v_data_source text;
v_dblink_name text;
v_dblink_schema text;
v_dest_schema_name text;
v_dest_table_name text;
v_dst_active boolean;
v_field text;
v_insert_refresh_config text;
v_job_id bigint;
v_job_name text;
v_jobmon boolean;
v_jobmon_schema text;
v_key_type text;
v_link_exists boolean;
v_max_id bigint;
v_max_timestamp timestamptz;
v_old_search_path text;
v_pk_name text[] := p_pk_name;
v_pk_type text[] := p_pk_type;
v_remote_key_sql text;
v_sql text;
v_src_schema_name text;
v_src_table_name text;
v_step_id bigint;
v_table_exists boolean;
v_update_refresh_config text;
BEGIN
v_dblink_name := @extschema@.check_name_length('mimeo_updater_maker_'||p_src_table);
SELECT nspname INTO v_dblink_schema FROM pg_namespace n, pg_extension e WHERE e.extname = 'dblink' AND e.extnamespace = n.oid;
SELECT nspname INTO v_jobmon_schema FROM pg_namespace n, pg_extension e WHERE e.extname = 'pg_jobmon' AND e.extnamespace = n.oid;
SELECT current_setting('search_path') INTO v_old_search_path;
EXECUTE 'SELECT set_config(''search_path'',''@extschema@,'||COALESCE(v_jobmon_schema||',', '')||v_dblink_schema||',public'',''false'')';
IF (p_pk_name IS NULL AND p_pk_type IS NOT NULL) OR (p_pk_name IS NOT NULL AND p_pk_type IS NULL) THEN
RAISE EXCEPTION 'Cannot manually set primary/unique key field(s) without defining type(s) or vice versa';
END IF;
SELECT data_source INTO v_data_source FROM @extschema@.dblink_mapping_mimeo WHERE data_source_id = p_dblink_id;
IF NOT FOUND THEN
RAISE EXCEPTION 'ERROR: database link ID is incorrect %', p_dblink_id;
END IF;
IF p_dest_table IS NULL THEN
p_dest_table := p_src_table;
END IF;
IF position('.' in p_dest_table) > 0 AND position('.' in p_src_table) > 0 THEN
-- Do nothing. Schema & table variable names set below after table is created
ELSE
RAISE EXCEPTION 'Source (and destination) table must be schema qualified';
END IF;
IF p_jobmon IS TRUE AND v_jobmon_schema IS NULL THEN
RAISE EXCEPTION 'p_jobmon parameter set to TRUE, but unable to determine if pg_jobmon extension is installed';
ELSIF (p_jobmon IS TRUE OR p_jobmon IS NULL) AND v_jobmon_schema IS NOT NULL THEN
v_jobmon := true;
ELSE
v_jobmon := false;
END IF;
v_job_name := 'Updater Maker: '||p_src_table;
IF v_jobmon THEN
v_job_id := add_job(v_job_name);
PERFORM gdb(p_debug,'Job ID: '||v_job_id::text);
v_step_id := add_step(v_job_id,'Connecting to remote source');
END IF;
PERFORM dblink_connect(v_dblink_name, @extschema@.auth(p_dblink_id));
SELECT schemaname, tablename INTO v_src_schema_name, v_src_table_name
FROM dblink(v_dblink_name, format('
SELECT schemaname, tablename
FROM (
SELECT schemaname, tablename
FROM pg_catalog.pg_tables
WHERE schemaname ||''.''|| tablename = %L
UNION
SELECT schemaname, viewname AS tablename
FROM pg_catalog.pg_views
WHERE schemaname || ''.'' || viewname = %L
) tables LIMIT 1'
, p_src_table, p_src_table) )
t (schemaname text, tablename text);
IF v_src_table_name IS NULL THEN
RAISE EXCEPTION 'Source table missing (%)', p_src_table;
END IF;
-- Automatically get source primary/unique key if none given
IF p_pk_name IS NULL AND p_pk_type IS NULL THEN
SELECT v_key_type, indkey_names, indkey_types INTO v_key_type, v_pk_name, v_pk_type FROM fetch_replication_key(v_src_schema_name, v_src_table_name, v_dblink_name);
END IF;
IF v_pk_name IS NULL OR v_pk_type IS NULL THEN
RAISE EXCEPTION 'Source table has no valid primary key or unique index';
END IF;
IF p_filter IS NOT NULL THEN
FOREACH v_field IN ARRAY v_pk_name LOOP
IF v_field = ANY(p_filter) THEN
CONTINUE;
ELSE
RAISE EXCEPTION 'ERROR: filter list did not contain all columns that compose primary/unique key for source table %', p_src_table;
END IF;
END LOOP;
END IF;
IF v_jobmon THEN
PERFORM update_step(v_step_id, 'OK','Done');
v_step_id := add_step(v_job_id,'Adding configuration data');
END IF;
IF p_type = 'time' THEN
v_dst_active := @extschema@.dst_utc_check();
IF p_boundary IS NULL THEN
v_boundary_time = '10 minutes'::interval;
ELSE
v_boundary_time = p_boundary::interval;
END IF;
v_insert_refresh_config := 'INSERT INTO @extschema@.refresh_config_updater_time(
source_table
, type
, dest_table
, dblink
, control
, boundary
, pk_name
, pk_type
, last_value
, last_run
, dst_active
, filter
, condition
, jobmon)
VALUES('
||quote_literal(p_src_table)
||', '||quote_literal('updater_time')
||', '||quote_literal(p_dest_table)
||', '||quote_literal(p_dblink_id)
||', '||quote_literal(p_control_field)
||', '||quote_literal(v_boundary_time)
||', '||quote_literal(v_pk_name)
||', '||quote_literal(v_pk_type)
||', '||quote_literal('-infinity')
||', '||quote_literal(CURRENT_TIMESTAMP)
||', '||v_dst_active
||', '||COALESCE(quote_literal(p_filter), 'NULL')
||', '||COALESCE(quote_literal(p_condition), 'NULL')
||', '||v_jobmon||')';
PERFORM gdb(p_debug, 'v_insert_refresh_config: '||v_insert_refresh_config);
EXECUTE v_insert_refresh_config;
ELSIF p_type = 'serial' THEN
IF p_boundary IS NULL THEN
v_boundary_serial = 10;
ELSE
v_boundary_serial = p_boundary::int;
END IF;
v_insert_refresh_config := 'INSERT INTO @extschema@.refresh_config_updater_serial(
source_table
, type
, dest_table
, dblink
, control
, boundary
, pk_name
, pk_type
, last_value
, last_run
, filter
, condition
, jobmon)
VALUES('
||quote_literal(p_src_table)
||', '||quote_literal('updater_serial')
||', '||quote_literal(p_dest_table)
||', '||quote_literal(p_dblink_id)
||', '||quote_literal(p_control_field)
||', '||quote_literal(v_boundary_serial)
||', '||quote_literal(v_pk_name)
||', '||quote_literal(v_pk_type)
||', '||quote_literal(0)
||', '||quote_literal(CURRENT_TIMESTAMP)
||', '||COALESCE(quote_literal(p_filter), 'NULL')
||', '||COALESCE(quote_literal(p_condition), 'NULL')
||', '||v_jobmon||')';
PERFORM gdb(p_debug, 'v_insert_refresh_config: '||v_insert_refresh_config);
EXECUTE v_insert_refresh_config;
END IF;
SELECT p_table_exists FROM @extschema@.manage_dest_table(p_dest_table, NULL, NULL, p_debug) INTO v_table_exists;
SELECT schemaname, tablename
INTO v_dest_schema_name, v_dest_table_name
FROM pg_catalog.pg_tables
WHERE schemaname||'.'||tablename = p_dest_table;
IF v_jobmon THEN
PERFORM update_step(v_step_id, 'OK','Done');
END IF;
IF p_pulldata AND v_table_exists = false THEN
RAISE NOTICE 'Pulling all data from source...';
IF v_jobmon THEN
v_step_id := add_step(v_job_id,'Pulling data from source. Check for new job entry under REFRESH UPDATER for current status if this step has not finished');
END IF;
EXECUTE 'SELECT @extschema@.refresh_updater('||quote_literal(p_dest_table)||', p_repull := true, p_debug := '||p_debug||')';
END IF;
IF p_index AND v_table_exists = false THEN
IF v_jobmon THEN
v_step_id := add_step(v_job_id,'Creating indexes on destination table');
END IF;
PERFORM create_index(p_dest_table, v_src_schema_name, v_src_table_name, NULL, p_debug);
IF v_jobmon THEN
PERFORM update_step(v_step_id, 'OK','Done');
END IF;
ELSIF v_table_exists = false THEN
-- Ensure destination indexes that are needed for efficient replication are created even if p_index is set false
IF v_jobmon THEN
v_step_id := add_step(v_job_id,'Creating indexes needed for replication');
END IF;
PERFORM gdb(p_debug, 'Creating indexes needed for replication');
IF v_key_type = 'primary' THEN
EXECUTE format('ALTER TABLE %I.%I', v_dest_schema_name, v_dest_table_name)||' ADD PRIMARY KEY('||array_to_string(v_pk_name, ',')||')';
ELSE
EXECUTE format('CREATE UNIQUE INDEX ON %I.%I', v_dest_schema_name, v_dest_table_name)||' ('||array_to_string(v_pk_name, ',')||')';
END IF;
IF v_jobmon THEN
PERFORM update_step(v_step_id, 'OK','Done');
END IF;
END IF;
IF v_table_exists THEN
IF v_jobmon THEN
v_step_id := add_step(v_job_id, format('Destination table %s.%s already exists. No data or indexes were pulled from source', v_dest_schema_name, v_dest_table_name));
PERFORM update_step(v_step_id, 'OK','Done');
END IF;
RAISE NOTICE 'Destination table % already exists. No data or indexes was pulled from source', p_dest_table;
END IF;
RAISE NOTICE 'Analyzing destination table...';
IF v_jobmon THEN
v_step_id := add_step(v_job_id, 'Analyzing destination table');
END IF;
EXECUTE format('ANALYZE %I.%I', v_dest_schema_name, v_dest_table_name);
IF v_jobmon THEN
PERFORM update_step(v_step_id, 'OK','Done');
END IF;
PERFORM dblink_disconnect(v_dblink_name);
IF v_jobmon THEN
v_step_id := add_step(v_job_id, 'Obtaining max destination value of control column for config table');
END IF;
v_sql := format('SELECT max(%I) FROM %I.%I', p_control_field, v_dest_schema_name, v_dest_table_name);
PERFORM @extschema@.gdb(p_debug, v_sql);
IF p_type = 'time' THEN
RAISE NOTICE 'Getting the maximum destination timestamp...';
EXECUTE v_sql INTO v_max_timestamp;
v_sql := format('UPDATE %I.refresh_config_updater_time SET last_value = %L WHERE dest_table = %L'
, '@extschema@'
, COALESCE(v_max_timestamp, CURRENT_TIMESTAMP)
, p_dest_table);
PERFORM @extschema@.gdb(p_debug, v_sql);
EXECUTE v_sql;
ELSIF p_type = 'serial' THEN
RAISE NOTICE 'Getting the maximum destination id...';
EXECUTE v_sql INTO v_max_id;
v_sql := format('UPDATE %I.refresh_config_updater_serial SET last_value = %L WHERE dest_table = %L'
, '@extschema@'
, COALESCE(v_max_id, 0)
, p_dest_table);
PERFORM @extschema@.gdb(p_debug, v_sql);
EXECUTE v_sql;
END IF;
IF v_jobmon THEN
PERFORM update_step(v_step_id, 'OK','Done');
PERFORM close_job(v_job_id);
END IF;
EXECUTE 'SELECT set_config(''search_path'','''||v_old_search_path||''',''false'')';
RAISE NOTICE 'Done';
RETURN;
EXCEPTION
WHEN QUERY_CANCELED THEN
SELECT nspname INTO v_dblink_schema FROM pg_namespace n, pg_extension e WHERE e.extname = 'dblink' AND e.extnamespace = n.oid;
EXECUTE format('SELECT %I.dblink_get_connections() @> ARRAY[%L]', v_dblink_schema, v_dblink_name) INTO v_link_exists;
IF v_link_exists THEN
EXECUTE format('SELECT %I.dblink_disconnect(%L)', v_dblink_schema, v_dblink_name);
END IF;
RAISE EXCEPTION '%', SQLERRM;
WHEN OTHERS THEN
SELECT nspname INTO v_dblink_schema FROM pg_namespace n, pg_extension e WHERE e.extname = 'dblink' AND e.extnamespace = n.oid;
SELECT nspname INTO v_jobmon_schema FROM pg_namespace n, pg_extension e WHERE e.extname = 'pg_jobmon' AND e.extnamespace = n.oid;
SELECT jobmon INTO v_jobmon FROM @extschema@.refresh_config_updater WHERE dest_table = p_src_table;
v_jobmon := COALESCE(p_jobmon, v_jobmon);
EXECUTE format('SELECT %I.dblink_get_connections() @> ARRAY[%L]', v_dblink_schema, v_dblink_name) INTO v_link_exists;
IF v_link_exists THEN
EXECUTE format('SELECT %I.dblink_disconnect(%L)', v_dblink_schema, v_dblink_name);
END IF;
IF v_jobmon AND v_jobmon_schema IS NOT NULL THEN
IF v_job_id IS NULL THEN
EXECUTE format('SELECT %I.add_job(%L)', v_jobmon_schema, 'Inserter Maker: '||p_src_table) INTO v_job_id;
EXECUTE format('SELECT %I.add_step(%L, %L)', v_jobmon_schema, v_job_id, 'EXCEPTION before job logging started') INTO v_step_id;
END IF;
IF v_step_id IS NULL THEN
EXECUTE format('SELECT %I.add_step(%L, %L)', v_jobmon_schema, v_job_id, 'EXCEPTION before first step logged') INTO v_step_id;
END IF;
EXECUTE format('SELECT %I.update_step(%L, %L, %L)', v_jobmon_schema, v_step_id, 'CRITICAL', 'ERROR: '||COALESCE(SQLERRM,'unknown'));
EXECUTE format('SELECT %I.fail_job(%L)', v_jobmon_schema, v_job_id);
END IF;
RAISE EXCEPTION '%', SQLERRM;
END
$$;
|