forked from postgrespro/aqo
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathpreprocessing.c
392 lines (354 loc) · 11.5 KB
/
preprocessing.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
/*
*******************************************************************************
*
* QUERY PREPROCESSING HOOKS
*
* The main point of this module is to recognize somehow settings for the query.
* It may be considered as user interface.
*
* The configurable settings are:
* 'query_hash': hash of the type of the given query
* 'use_aqo': whether to use AQO estimations in query optimization
* 'learn_aqo': whether to update AQO data based on query execution
* statistics
* 'fspace_hash': hash of feature space to use with given query
* 'auto_tuning': whether AQO may change use_aqo and learn_aqo values
* for the next execution of such type of query using
* its self-tuning algorithm
*
* Currently the module works as follows:
* 1. Query type determination. We consider that two queries are of the same
* type if and only if they are equal or their difference is only in their
* constants. We use hash function, which returns the same value for all
* queries of the same type. This typing strategy is not the only possible
* one for adaptive query optimization. One can easily implement another
* typing strategy by changing hash function.
* 2. New query type proceeding. The handling policy for new query types is
* contained in variable 'aqo.mode'. It accepts five values:
* "intelligent", "forced", "controlled", "learn" and "disabled".
* Intelligent linking strategy means that for each new query type the new
* separate feature space is created. The hash of new feature space is
* set the same as the hash of new query type. Auto tuning is on by
* default in this mode. AQO also automatically memorizes query hash to
* query text mapping in aqo_query_texts table.
* Forced linking strategy means that every new query type is linked to
* the common feature space with hash 0, but we don't memorize
* the hash and the settings for this query.
* Controlled linking strategy means that new query types do not induce
* new feature spaces neither interact AQO somehow. In this mode the
* configuration of settings for different query types lies completely on
* user.
* Learn linking strategy is the same as intelligent one. The only
* difference is the default settings for the new query type:
* auto tuning is disabled.
* Disabled strategy means that AQO is disabled for all queries.
* 3. For given query type we determine its query_hash, use_aqo, learn_aqo,
* fspace_hash and auto_tuning parameters.
* 4. For given fspace_hash we may use its machine learning settings, but now
* the machine learning setting are fixed for all feature spaces.
*
*******************************************************************************
*
* Copyright (c) 2016-2021, Postgres Professional
*
* IDENTIFICATION
* aqo/preprocessing.c
*
*/
#include "aqo.h"
#include "access/parallel.h"
#include "access/table.h"
#include "commands/extension.h"
static bool isQueryUsingSystemRelation(Query *query);
static bool isQueryUsingSystemRelation_walker(Node *node, void *context);
/*
* Saves query text into query_text variable.
* Query text field in aqo_queries table is for user.
*/
void
get_query_text(ParseState *pstate, Query *query)
{
MemoryContext oldCxt;
/*
* Duplicate query string into private AQO memory context for guard
* from possible memory context switching.
*/
oldCxt = MemoryContextSwitchTo(AQOMemoryContext);
if (pstate)
query_text = pstrdup(pstate->p_sourcetext);
MemoryContextSwitchTo(oldCxt);
if (prev_post_parse_analyze_hook)
prev_post_parse_analyze_hook(pstate, query);
}
/*
* Calls standard query planner or its previous hook.
*/
PlannedStmt *
call_default_planner(Query *parse,
const char *query_string,
int cursorOptions,
ParamListInfo boundParams)
{
if (prev_planner_hook)
return prev_planner_hook(parse,
query_string,
cursorOptions,
boundParams);
else
return standard_planner(parse,
query_string,
cursorOptions,
boundParams);
}
/*
* Before query optimization we determine machine learning settings
* for the query.
* This hook computes query_hash, and sets values of learn_aqo,
* use_aqo and is_common flags for given query.
* Creates an entry in aqo_queries for new type of query if it is
* necessary, i. e. AQO mode is "intelligent".
*/
PlannedStmt *
aqo_planner(Query *parse,
const char *query_string,
int cursorOptions,
ParamListInfo boundParams)
{
bool query_is_stored;
Datum query_params[5];
bool query_nulls[5] = {false, false, false, false, false};
LOCKTAG tag;
selectivity_cache_clear();
/*
* We do not work inside an parallel worker now by reason of insert into
* the heap during planning. Transactions is synchronized between parallel
* sections. See GetCurrentCommandId() comments also.
*/
if ((parse->commandType != CMD_SELECT && parse->commandType != CMD_INSERT &&
parse->commandType != CMD_UPDATE && parse->commandType != CMD_DELETE) ||
strstr(application_name, "postgres_fdw") != NULL || /* Prevent distributed deadlocks */
strstr(application_name, "pgfdw:") != NULL || /* caused by fdw */
get_extension_oid("aqo", true) == InvalidOid ||
creating_extension ||
IsParallelWorker() ||
(aqo_mode == AQO_MODE_DISABLED && !force_collect_stat) ||
isQueryUsingSystemRelation(parse) ||
RecoveryInProgress())
{
disable_aqo_for_query();
return call_default_planner(parse,
query_string,
cursorOptions,
boundParams);
}
INSTR_TIME_SET_CURRENT(query_context.query_starttime);
query_context.query_hash = get_query_hash(parse, query_text);
if (query_is_deactivated(query_context.query_hash))
{
disable_aqo_for_query();
return call_default_planner(parse,
query_string,
cursorOptions,
boundParams);
}
/*
* find-add query and query text must be atomic operation to prevent
* concurrent insertions.
*/
init_lock_tag(&tag, (uint32) query_context.query_hash, (uint32) 0);
LockAcquire(&tag, ExclusiveLock, false, false);
query_is_stored = find_query(query_context.query_hash, &query_params[0],
&query_nulls[0]);
if (!query_is_stored)
{
switch (aqo_mode)
{
case AQO_MODE_INTELLIGENT:
query_context.adding_query = true;
query_context.learn_aqo = true;
query_context.use_aqo = false;
query_context.fspace_hash = query_context.query_hash;
query_context.auto_tuning = true;
query_context.collect_stat = true;
break;
case AQO_MODE_FORCED:
query_context.adding_query = false;
query_context.learn_aqo = true;
query_context.use_aqo = true;
query_context.auto_tuning = false;
query_context.fspace_hash = 0;
query_context.collect_stat = false;
break;
case AQO_MODE_CONTROLLED:
case AQO_MODE_FROZEN:
/*
* if query is not in the AQO knowledge base than disable AQO
* for this query.
*/
query_context.adding_query = false;
query_context.learn_aqo = false;
query_context.use_aqo = false;
query_context.auto_tuning = false;
query_context.collect_stat = false;
break;
case AQO_MODE_LEARN:
query_context.adding_query = true;
query_context.learn_aqo = true;
query_context.use_aqo = true;
query_context.fspace_hash = query_context.query_hash;
query_context.auto_tuning = false;
query_context.collect_stat = true;
break;
case AQO_MODE_DISABLED:
/* Should never happen */
query_context.fspace_hash = query_context.query_hash;
break;
default:
elog(ERROR, "unrecognized mode in AQO: %d", aqo_mode);
break;
}
if (query_context.adding_query || force_collect_stat)
{
/*
* Add query into the AQO knowledge base. To process an error with
* concurrent addition from another backend we will try to restart
* preprocessing routine.
*/
update_query(query_context.query_hash,
query_context.fspace_hash,
query_context.learn_aqo,
query_context.use_aqo,
query_context.auto_tuning);
add_query_text(query_context.query_hash, query_text);
}
}
else
{
query_context.adding_query = false;
query_context.learn_aqo = DatumGetBool(query_params[1]);
query_context.use_aqo = DatumGetBool(query_params[2]);
query_context.fspace_hash = DatumGetInt32(query_params[3]);
query_context.auto_tuning = DatumGetBool(query_params[4]);
query_context.collect_stat = query_context.auto_tuning;
if (!query_context.learn_aqo && !query_context.use_aqo &&
!query_context.auto_tuning)
add_deactivated_query(query_context.query_hash);
/*
* That we can do if query exists in database.
* Additional preference changes, based on AQO mode.
*/
switch (aqo_mode)
{
case AQO_MODE_FROZEN:
/*
* In this mode we will suppress all writings to the knowledge base.
* AQO will be used for all known queries, if it is not suppressed.
*/
query_context.learn_aqo = false;
query_context.auto_tuning = false;
query_context.collect_stat = false;
break;
case AQO_MODE_LEARN:
/*
* In this mode we want to learn with incoming query (if it is not
* suppressed manually) and collect stats.
*/
query_context.collect_stat = true;
query_context.fspace_hash = query_context.query_hash;
break;
case AQO_MODE_INTELLIGENT:
case AQO_MODE_FORCED:
case AQO_MODE_CONTROLLED:
case AQO_MODE_DISABLED:
/* Use preferences as set early. */
break;
default:
elog(ERROR, "Unrecognized aqo mode %d", aqo_mode);
}
}
LockRelease(&tag, ExclusiveLock, false);
/*
* This mode is possible here, because force collect statistics uses AQO
* machinery.
*/
if (aqo_mode == AQO_MODE_DISABLED)
disable_aqo_for_query();
if (force_collect_stat)
{
/*
* If this GUC is set, AQO will analyze query results and collect
* query execution statistics in any mode.
*/
query_context.collect_stat = true;
query_context.fspace_hash = query_context.query_hash;
}
return call_default_planner(parse,
query_string,
cursorOptions,
boundParams);
}
/*
* Turn off all AQO functionality for the current query.
*/
void
disable_aqo_for_query(void)
{
query_context.adding_query = false;
query_context.learn_aqo = false;
query_context.use_aqo = false;
query_context.auto_tuning = false;
query_context.collect_stat = false;
}
/*
* Examine a fully-parsed query, and return TRUE iff any relation underlying
* the query is a system relation.
*/
bool
isQueryUsingSystemRelation(Query *query)
{
return isQueryUsingSystemRelation_walker((Node *) query, NULL);
}
static bool
IsAQORelation(Relation rel)
{
char *relname = NameStr(rel->rd_rel->relname);
if (strcmp(relname, "aqo_data") == 0 ||
strcmp(relname, "aqo_query_texts") == 0 ||
strcmp(relname, "aqo_query_stat") == 0 ||
strcmp(relname, "aqo_queries") == 0 ||
strcmp(relname, "aqo_ignorance") == 0
)
return true;
return false;
}
bool
isQueryUsingSystemRelation_walker(Node *node, void *context)
{
if (node == NULL)
return false;
if (IsA(node, Query))
{
Query *query = (Query *) node;
ListCell *rtable;
foreach(rtable, query->rtable)
{
RangeTblEntry *rte = lfirst(rtable);
if (rte->rtekind == RTE_RELATION)
{
Relation rel = table_open(rte->relid, AccessShareLock);
bool is_catalog = IsCatalogRelation(rel);
bool is_aqo_rel = IsAQORelation(rel);
table_close(rel, AccessShareLock);
if (is_catalog || is_aqo_rel)
return true;
}
}
return query_tree_walker(query,
isQueryUsingSystemRelation_walker,
context,
0);
}
return expression_tree_walker(node,
isQueryUsingSystemRelation_walker,
context);
}