forked from GoogleCloudPlatform/bigquery-utils
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathviews_with_nonoptimal_join_condition.sql
70 lines (65 loc) · 2.12 KB
/
views_with_nonoptimal_join_condition.sql
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
/*
* Copyright 2023 Google LLC
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/*
* This script creates a table named, views_with_nonoptimal_join_condition,
* that contains a list of views with non-optimal join conditions.
*/
DECLARE projects ARRAY<STRING> DEFAULT (
SELECT ARRAY_AGG(DISTINCT project_id)
FROM `region-us.INFORMATION_SCHEMA.TABLE_STORAGE_BY_ORGANIZATION`
WHERE NOT deleted
);
CREATE SCHEMA IF NOT EXISTS optimization_workshop;
CREATE OR REPLACE TABLE optimization_workshop.views_with_nonoptimal_join_condition
(
view_name STRING,
view_url STRING,
view_definition STRING,
join_conditions ARRAY<STRING>
);
CREATE TEMP FUNCTION extract_nonoptimal_join_conditions(view_definition STRING) AS(
ARRAY_CONCAT(
REGEXP_EXTRACT_ALL(
REGEXP_REPLACE(UPPER(view_definition), r"\sON\s", "\nON "),
r"\nON\s+[A-Z_]+?\([^=]*?=[^=]*"
),
REGEXP_EXTRACT_ALL(
REGEXP_REPLACE(UPPER(view_definition), r"\sON\s", "\nON "),
r"\nON\s+[^=]*?=\s*[A-Z_]+?\([^=]*"
)));
FOR p IN (
SELECT project_id
FROM
UNNEST(projects) project_id
)
DO
BEGIN
EXECUTE IMMEDIATE FORMAT(r"""
INSERT INTO optimization_workshop.views_with_nonoptimal_join_condition
SELECT
table_name AS view_name,
bqutil.fn.table_url(table_catalog || '.' || table_schema || '.' || table_name) AS view_url,
view_definition,
extract_nonoptimal_join_conditions(view_definition) AS join_conditions
FROM
`%s.region-us.INFORMATION_SCHEMA.VIEWS`
WHERE
ARRAY_LENGTH(extract_nonoptimal_join_conditions(view_definition)) >= 1
""",
p.project_id);
EXCEPTION WHEN ERROR THEN SELECT @@error.message; --ignore errors
END;
END FOR;