Project

General

Profile

1 3077 aaronmk
# Database import/export
2
3 3431 aaronmk
import operator
4
5 3077 aaronmk
import exc
6
import dicts
7
import sql
8
import sql_gen
9
import strings
10
import util
11
12 3081 aaronmk
##### Data cleanup
13
14
def cleanup_table(db, table, cols):
    '''Cleans up the text values in the given columns of a table, in place.
    Each column is set to its whitespace-trimmed value, or to NULL when the
    trimmed value equals the empty string or the two-character string
    backslash-N (presumably the NULL marker of a text export -- TODO confirm).
    @param table Anything accepted by sql_gen.as_Table()
    @param cols Sequence of anything accepted by sql_gen.as_Col()
    '''
    table = sql_gen.as_Table(table)
    cols = [sql_gen.as_Col(c) for c in cols]

    # SQL template for the cleaned-up value; %s is the column's SQL string
    empty_str = db.esc_value('')
    null_marker = db.esc_value(r'\N')
    cleaned_value = ('nullif(nullif(trim(both from %s), '+empty_str+'), '
        +null_marker+')')

    changes = []
    for col in cols:
        new_value = sql_gen.CustomCode(cleaned_value % col.to_str(db))
        changes.append((col, new_value))

    sql.update(db, table, changes, in_place=True)
24
25 3078 aaronmk
##### Error tracking
26
27
def track_data_error(db, errors_table, cols, value, error_code, error):
    '''Saves a data error in the errors table, one row per source column.
    A row that hits a duplicate key in the errors table is silently skipped.
    @param errors_table If None, does nothing.
    @param cols The columns whose names are stored with the error.
        If (), does nothing.
    '''
    nothing_to_do = errors_table == None or cols == ()
    if nothing_to_do: return

    for src_col in cols:
        error_row = dict(column=src_col.name, value=value,
            error_code=error_code, error=error)
        try:
            sql.insert(db, errors_table, error_row, recover=True,
                cacheable=True, log_level=4)
        except sql.DuplicateKeyException: pass # row already exists
39
40 3506 aaronmk
class ExcToErrorsTable(sql_gen.ExcToWarning):
    '''Exception handler code that saves the exception in an errors table, or
    falls back to sql_gen.ExcToWarning when there is nowhere to save it.
    '''
    def __init__(self, return_, srcs, errors_table):
        '''
        @param return_ See sql_gen.ExcToWarning
        @param srcs The column names for the errors table
        @param errors_table None|sql_gen.Table
        @pre The invalid value must be in a local variable "value" of type text.
        '''
        sql_gen.ExcToWarning.__init__(self, return_)

        self.srcs = srcs
        self.errors_table = errors_table

    def to_str(self, db):
        '''Generates the handler's code.
        Without srcs or without an errors table, this is the inherited
        sql_gen.ExcToWarning code. Otherwise, it is a DECLARE/BEGIN/END block
        that inserts the value and error once per source column, followed by
        the code of self.return_.
        '''
        warning_only = not self.srcs or self.errors_table == None
        if warning_only: return sql_gen.ExcToWarning.to_str(self, db)

        errors_table_cols = [sql_gen.Col(name)
            for name in ['column', 'value', 'error_code', 'error']]

        # One row per source column name
        src_names = sql_gen.NamedValues('c', None,
            [[c.name] for c in self.srcs])
        col_names_query = sql.mk_select(db, src_names, order_by=None)

        # The values inserted are named the same as the errors table's columns
        insert_values = sql_gen.Values(errors_table_cols).to_str(db)
        insert_query = sql.mk_insert_select(db, self.errors_table,
            errors_table_cols, insert_values)+';\n'

        header = ('-- Save error in errors table.\n'
            'DECLARE\n'
            '    error_code text := SQLSTATE;\n'
            '    error text := SQLERRM;\n'
            'BEGIN\n'
            '    -- Insert the value and error for *each* source column.\n')
        insert_loop = sql_gen.RowExcIgnore('text', col_names_query,
            insert_query, row_var=errors_table_cols[0])
        footer = '\nEND;\n\n'

        return (header+strings.indent(insert_loop.to_str(db))+footer
            +self.return_.to_str(db))
77 3459 aaronmk
78 3507 aaronmk
def data_exception_handler(*args, **kw_args):
    '''Creates a data_exception handler that saves the error or converts it to
    a warning.
    For params, see ExcToErrorsTable().
    '''
    exc_handler = ExcToErrorsTable(*args, **kw_args)
    return sql_gen.data_exception_handler(exc_handler)
83
84 3078 aaronmk
def cast(db, type_, col, errors_table=None):
    '''Casts an (unrenamed) column or value to the given type.
    A literal gets a plain sql_gen.Cast, so that its errors are not handled.
    Anything else is passed to a temp plpgsql function which does the cast
    inside a data exception handler whose return statement is RETURN NULL.
    If errors_table is set and col is a sql_gen.Col with srcs, the handler
    saves errors in errors_table (using col's srcs attr as source columns).
    Otherwise, it converts errors to warnings.
    @param col str|sql_gen.Col|sql_gen.Literal
    @param errors_table None|sql_gen.Table|str
    @return The cast expression (sql_gen.Cast or sql_gen.FunctionCall)
    '''
    col = sql_gen.as_Col(col)

    # User-supplied constants should not have their exceptions converted to
    # warnings
    if isinstance(col, sql_gen.Literal): return sql_gen.Cast(type_, col)

    assert not isinstance(col, sql_gen.NamedCol)

    func_name = strings.first_word(type_)
    srcs = col.srcs
    save_errors = False
    if errors_table != None and isinstance(col, sql_gen.Col):
        save_errors = col.srcs != ()

    if save_errors:
        # The source columns become part of the function's name
        srcs = [sql_gen.to_name_only_col(src) for src in col.srcs]
        func_name = str(sql_gen.FunctionCall(func_name, *srcs))
    function = db.TempFunction(func_name)

    # Create function definition
    if save_errors: modifiers = 'STRICT'
    else: modifiers = 'IMMUTABLE STRICT'
    handler = data_exception_handler('RETURN NULL;\n', srcs, errors_table)
    cast_stmt = '''\
/* The explicit cast to the return type is needed to make the cast happen
inside the try block. (Implicit casts to the return type happen at the end
of the function, outside any block.) */
RETURN value::'''+type_+''';
'''
    body = sql_gen.CustomCode(handler.to_str(db, cast_stmt))
    body.lang = 'plpgsql'
    params = [sql_gen.FunctionParam('value', 'text')]
    sql.define_func(db, sql_gen.FunctionDef(function, type_, body, params,
        modifiers))

    return sql_gen.FunctionCall(function, col)
122
123
def cast_temp_col(db, type_, col, errors_table=None):
    '''Like cast(), but if the input has an underlying table column, stores
    the cast values in a new column added to that table.
    @return The new column or cast value
    '''
    def cast_(col_): return cast(db, type_, col_, errors_table)

    try: src_col = sql_gen.underlying_col(col)
    except sql_gen.NoUnderlyingTableException:
        return sql_gen.wrap(cast_, col) # no table to add a column to

    table = src_col.table
    type_name = strings.first_word(type_)
    new_col = sql_gen.suffixed_col(src_col, '::'+type_name)
    cast_expr = cast_(src_col)

    # Add column
    typed_col = sql_gen.TypedCol(new_col.name, type_)
    sql.add_col(db, table, typed_col, comment=repr(src_col)+'::'+type_)
    new_col.name = typed_col.name # propagate any renaming

    # Fill in the new column with the cast values
    sql.update(db, table, [(new_col, cast_expr)], in_place=True, recover=True)

    return new_col
145
146
def errors_table(db, table, if_exists=True):
    '''Gets the errors table of a table, named with the suffix ".errors".
    If the table has srcs, the errors table of its first src is used instead.
    @param if_exists If set, returns None if the errors table doesn't exist
    @return None|sql_gen.Table
    '''
    src_table = sql_gen.as_Table(table)
    if src_table.srcs != (): src_table = src_table.srcs[0]

    candidate = sql_gen.suffixed_table(src_table, '.errors')
    if not if_exists: return candidate # caller doesn't care if it exists
    if sql.table_exists(db, candidate): return candidate
    return None
157
158
##### Import
159
160 3077 aaronmk
def put(db, table, row, pkey_=None, row_ct_ref=None):
    '''Inserts a row and returns the value from the insert's cursor
    (presumably the row's pkey, via RETURNING). Recovers from errors.
    Only works under PostgreSQL (uses INSERT RETURNING).
    @param row The values to insert, as accepted by sql_gen.ColDict()
    @param pkey_ The pkey column. If None, it is looked up with sql.pkey().
    @param row_ct_ref If not None, a one-element list whose item is
        incremented by the cursor's row count (when that is >= 0)
    @return The value for the inserted row; for a duplicate key, the pkey_
        of the row selected using the exception's cols; for a NOT NULL
        violation, None
    '''
    row = sql_gen.ColDict(db, table, row)
    if pkey_ is None: pkey_ = sql.pkey(db, table, recover=True)

    try:
        cur = sql.insert(db, table, row, pkey_, recover=True, log_level=3.5)
        if row_ct_ref is not None and cur.rowcount >= 0:
            row_ct_ref[0] += cur.rowcount
        return sql.value(cur)
    except sql.DuplicateKeyException as e:
        # Look up the existing row, filtering on just the exception's cols
        # (presumably the columns of the violated unique constraint)
        row = sql_gen.ColDict(db, table,
            util.dict_subset_right_join(row, e.cols))
        return sql.value(sql.select(db, table, [pkey_], row, recover=True,
            log_level=3.5))
    except sql.NullValueException: return None
178 3077 aaronmk
179
def get(db, table, row, pkey, row_ct_ref=None, create=False):
    '''Gets the pkey of the first row selected using the given row values.
    Recovers from errors.
    @param create If set, a row that is not found (StopIteration) is inserted
        with put() instead of propagating the exception
    @param row_ct_ref Passed to put() when a row is inserted
    '''
    try:
        matches = sql.select(db, table, [pkey], row, limit=1, recover=True)
        return sql.value(matches)
    except StopIteration:
        if create: return put(db, table, row, pkey, row_ct_ref) # insert new row
        raise
187
188
def is_func_result(col):
    '''Whether a column is named "result" and its table's name contains "("'''
    table_name = col.table.name
    return '(' in table_name and col.name == 'result'
190
191
def into_table_name(out_table, in_tables0, mapping, is_func):
    '''Builds a descriptive name from the output table and the mapping:
    * is_func, mapping has 'value': out_table(in_col)
    * is_func otherwise: out_table(out_col=in_col, ...)
    * not is_func, mapping has 'rank' (hierarchical): out_table[rank=in_col]
    * not is_func otherwise: out_table_pkeys
    @param in_tables0 Columns of this table are shown as name-only columns
    @return str
    '''
    def describe(in_col):
        '''Formats an input column (or other value) for use in the name'''
        in_col = sql_gen.remove_col_rename(in_col)
        if not isinstance(in_col, sql_gen.Col): return str(in_col)

        table = in_col.table
        if table == in_tables0: in_col = sql_gen.to_name_only_col(in_col)
        elif is_func_result(in_col): in_col = table # omit col name
        return str(in_col)

    name = str(out_table)

    if not is_func:
        try: rank_in_col = mapping['rank']
        except KeyError: return name+'_pkeys'
        # has a rank column, so hierarchical
        return name+'[rank='+describe(rank_in_col)+']'

    try: value_in_col = mapping['value']
    except KeyError:
        args_str = ', '.join([str(out_col)+'='+describe(in_col)
            for out_col, in_col in mapping.iteritems()])
    else: args_str = describe(value_in_col)
    return name+'('+args_str+')'
219
220
def put_table(db, out_table, in_tables, mapping, row_ct_ref=None, into=None,
    default=None, is_func=False, on_error=exc.raise_):
    '''Recovers from errors.
    Only works under PostgreSQL (uses INSERT RETURNING).
    IMPORTANT: Must be run at the *beginning* of a transaction.
    @param in_tables The main input table to select from, followed by a list of
        tables to join with it using the main input table's pkey
    @param mapping dict(out_table_col=in_table_col, ...)
        * out_table_col: str (*not* sql_gen.Col)
        * in_table_col: sql_gen.Col|literal-value
    @param row_ct_ref If not None, a one-element list whose item is
        incremented by the row count of the final insert/select cursor (when
        there is one and its row count is >= 0)
    @param into The table to contain the output and input pkeys.
        Defaults to `out_table.name+'_pkeys'`.
    @param default The *output* column to use as the pkey for missing rows.
        If this output column does not exist in the mapping, uses None.
    @param is_func Whether out_table is the name of a SQL function, not a table
    @param on_error Called with the exception when a NOT NULL column has
        neither a mapping nor a default, and when a database error has no
        specific handler. If it returns, all rows are ignored.
    @return sql_gen.Col Where the output pkeys are made available.
        If the mapping contains only literal values, instead returns the
        single resulting value, or None if all rows were ignored.
    '''
    import psycopg2.extensions

    out_table = sql_gen.as_Table(out_table)

    def log_debug(msg): db.log_debug(msg, level=1.5)
    def col_ustr(str_):
        return strings.repr_no_u(sql_gen.remove_col_rename(str_))

    log_debug('********** New iteration **********')
    log_debug('Inserting these input columns into '+strings.as_tt(
        out_table.to_str(db))+':\n'+strings.as_table(mapping, ustr=col_ustr))

    is_function = sql.function_exists(db, out_table)

    if is_function: out_pkey = 'result'
    else: out_pkey = sql.pkey(db, out_table, recover=True)
    out_pkey_col = sql_gen.as_Col(out_pkey, out_table)

    in_tables_ = in_tables[:] # don't modify input!
    try: in_tables0 = in_tables_.pop(0) # first table is separate
    except IndexError: in_tables0 = None
    else:
        in_pkey = sql.pkey(db, in_tables0, recover=True)
        in_pkey_col = sql_gen.as_Col(in_pkey, in_tables0)

    # Determine if can use optimization for only literal values
    is_literals = not any(sql_gen.is_table_col(v) for v in mapping.values())
    is_literals_or_function = is_literals or is_function

    if in_tables0 is None: errors_table_ = None
    else: errors_table_ = errors_table(db, in_tables0)

    # Create input joins from list of input tables
    # (in_pkey is only evaluated if there are tables to join, in which case
    # there was a first table and in_pkey was set above)
    input_joins = [in_tables0]+[sql_gen.Join(v,
        {in_pkey: sql_gen.join_same_not_null}) for v in in_tables_]

    if mapping == {} and not is_function: # need >= one column for INSERT SELECT
        mapping = {out_pkey: None} # ColDict will replace with default value

    if not is_literals:
        if into is None:
            into = into_table_name(out_table, in_tables0, mapping, is_func)
        into = sql_gen.as_Table(into)

        # Set column sources
        # (must be a list because in_cols is used several times)
        in_cols = [v for v in mapping.values() if sql_gen.is_table_col(v)]
        for col in in_cols:
            if col.table == in_tables0: col.set_srcs(sql_gen.src_self)

        log_debug('Joining together input tables into temp table')
        # Place in new table so don't modify input and for speed
        in_table = sql_gen.Table('in')
        mapping = dicts.join(mapping, sql.flatten(db, in_table, input_joins,
            in_cols, preserve=[in_pkey_col]))
        input_joins = [in_table]
        db.log_debug('Temp table: '+strings.as_tt(in_table.to_str(db)), level=2)

    mapping = sql_gen.ColDict(db, out_table, mapping)
        # after applying dicts.join() because that returns a plain dict

    # Resolve default value column
    if default is not None:
        try: default = mapping[default]
        except KeyError:
            db.log_debug('Default value column '
                +strings.as_tt(strings.repr_no_u(default))
                +' does not exist in mapping, falling back to None', level=2.1)
            default = None

    # Save default values for all rows since in_table may have rows deleted
    if is_literals: pass
    elif is_function: full_in_table = in_table
    else:
        full_in_table = sql_gen.suffixed_table(in_table, '_full')
        full_in_table_cols = [in_pkey_col]
        if default is not None:
            full_in_table_cols.append(default)
            default = sql_gen.with_table(default, full_in_table)
        sql.run_query_into(db, sql.mk_select(db, in_table, full_in_table_cols,
            order_by=None), into=full_in_table, add_pkey_=True)

    if not is_literals:
        pkeys_names = [in_pkey, out_pkey]
        pkeys_cols = [in_pkey_col, out_pkey_col]

    # One-element lists are used as mutable refs that nested functions can
    # assign to
    pkeys_table_exists_ref = [False]
    def insert_into_pkeys(joins, cols=None, limit=None, **kw_args):
        '''Adds the selected rows to the pkeys table (`into`), creating the
        table from the query the first time this is called
        '''
        query = sql.mk_select(db, joins, cols, order_by=None, limit=limit)
        if pkeys_table_exists_ref[0]:
            sql.insert_select(db, into, pkeys_names, query, **kw_args)
        else:
            sql.run_query_into(db, query, into=into, add_pkey_=True, **kw_args)
            pkeys_table_exists_ref[0] = True

    limit_ref = [None]
    def mk_main_select(joins, cols):
        return sql.mk_select(db, joins, cols, limit=limit_ref[0], order_by=None)

    if is_literals: insert_in_table = None
    else:
        insert_in_table = in_table
        insert_in_tables = [insert_in_table]
    join_cols = sql_gen.ColDict(db, out_table)

    exc_strs = set()
    def log_exc(e):
        '''Logs an exception, failing if the same exception was already seen'''
        e_str = exc.str_(e, first_line_only=True)
        log_debug('Caught exception: '+e_str)
        assert e_str not in exc_strs # avoid infinite loops
        exc_strs.add(e_str)

    def remove_all_rows():
        log_debug('Ignoring all rows')
        limit_ref[0] = 0 # just create an empty pkeys table

    def ignore_cond(cond, e):
        '''Tracks the error and deletes the input rows that don't satisfy a
        condition
        '''
        out_table_cols = sql_gen.ColDict(db, out_table)
        out_table_cols.update(util.dict_subset_right_join({},
            sql.table_cols(db, out_table)))

        in_cols = []
        cond = sql.map_expr(db, cond, mapping, in_cols)
        cond = sql.map_expr(db, cond, out_table_cols)

        track_data_error(db, errors_table_, sql_gen.cols_srcs(in_cols), None,
            e.cause.pgcode,
            strings.ensure_newl(e.cause.pgerror)+'condition: '+cond)

        not_cond = sql_gen.NotCond(sql_gen.CustomCode(cond))
        log_debug('Ignoring rows where '+strings.as_tt(not_cond.to_str(db)))
        sql.delete(db, insert_in_table, not_cond)

    not_null_cols = set()
    def ignore(in_col, value, e):
        '''Tracks the error and removes a value of an input column, either by
        setting it to NULL or by deleting the rows that have it
        '''
        in_col = sql_gen.with_table(in_col, insert_in_table)

        track_data_error(db, errors_table_, in_col.srcs, value,
            e.cause.pgcode, e.cause.pgerror)
        log_debug('Ignoring rows with '+strings.as_tt(repr(in_col))+' = '
            +strings.as_tt(repr(value)))

        sql.add_index(db, in_col, insert_in_table) # enable fast filtering
        if value is not None and in_col not in not_null_cols:
            # Try just mapping the value to NULL
            sql.update(db, insert_in_table, [(in_col, None)],
                sql_gen.ColValueCond(in_col, value))
        else:
            sql.delete(db, insert_in_table, sql_gen.ColValueCond(in_col, value))
            # A NULL in this column was rejected, so from now on delete rows
            # instead of setting its values to NULL
            if value is None: not_null_cols.add(in_col)

    if not is_literals:
        def insert_pkeys_table(which):
            return sql_gen.Table(sql_gen.concat(in_table.name,
                '_insert_'+which+'_pkeys'))
        insert_out_pkeys = insert_pkeys_table('out')
        insert_in_pkeys = insert_pkeys_table('in')

    # Do inserts and selects
    while True:
        has_joins = join_cols != {}

        if limit_ref[0] == 0: # special case
            assert not has_joins

            if is_literals: return None
            log_debug('Creating an empty output pkeys table')
            cur = sql.run_query_into(db, sql.mk_select(db, out_table,
                [out_pkey], order_by=None, limit=0), into=insert_out_pkeys)
            break # don't do main case

        log_debug('Trying to insert new rows')

        # Prepare to insert new rows
        if is_function:
            log_debug('Calling function on input rows')
            args = dict(((k.name, v) for k, v in mapping.iteritems()))
            func_call = sql_gen.NamedCol(out_pkey,
                sql_gen.FunctionCall(out_table, **args))

            if not is_literals:
                # Create empty pkeys table so its row type can be used
                insert_into_pkeys(input_joins, [in_pkey_col, func_call],
                    limit=0, recover=True)

                # Create error handling wrapper function
                args = dict(((k, sql_gen.with_table(v, sql_gen.Table('row')))
                    for k, v in args.iteritems()))
                func_call = sql_gen.FunctionCall(out_table, **args)
                wrapper = db.TempFunction(sql_gen.concat(into.name, '_wrap'))
                sql.define_func(db, sql_gen.FunctionDef(wrapper,
                    sql_gen.SetOf(into),
                    sql_gen.RowExcIgnore(sql_gen.RowType(in_table),
                        sql.mk_select(db, input_joins, order_by=None),
                        sql_gen.ReturnQuery(sql.mk_select(db,
                            fields=[sql_gen.Col(in_pkey, 'row'), func_call],
                            explain=False)),
                        exc_handler=sql_gen.plpythonu_error_handler)
                    ))
                wrapper_table = sql_gen.FunctionCall(wrapper)
        else:
            insert_args = dict(recover=True, cacheable=False)
            if has_joins:
                insert_args.update(dict(ignore=True))
            else:
                insert_args.update(dict(returning=out_pkey))
                if not is_literals:
                    insert_args.update(dict(into=insert_out_pkeys))
            main_select = mk_main_select([insert_in_table], [sql_gen.with_table(
                c, insert_in_table) for c in mapping.values()])

        try:
            cur = None
            if is_function:
                if is_literals: cur = sql.select(db, fields=[func_call])
                else: insert_into_pkeys(wrapper_table, recover=True)
            else:
                cur = sql.insert_select(db, out_table, mapping.keys(),
                    main_select, **insert_args)
            break # insert successful
        except sql.MissingCastException as e:
            log_exc(e)

            out_col = e.col
            type_ = e.type

            log_debug('Casting '+strings.as_tt(out_col)+' input to '
                +strings.as_tt(type_))
            in_col = mapping[out_col]
            while True:
                try:
                    mapping[out_col] = cast_temp_col(db, type_, in_col,
                        errors_table_)
                    break # cast successful
                except sql.InvalidValueException as e:
                    log_exc(e)

                    ignore(in_col, e.value, e)
        except sql.DuplicateKeyException as e:
            log_exc(e)

            # Different rows violating different unique constraints not
            # supported
            assert not join_cols

            join_cols.update(util.dict_subset_right_join(mapping, e.cols))
            log_debug('Ignoring existing rows, comparing on these columns:\n'
                +strings.as_inline_table(join_cols, ustr=col_ustr))

            if is_literals:
                return sql.value(sql.select(db, out_table, [out_pkey_col],
                    mapping, order_by=None))

            # Uniquify input table to avoid internal duplicate keys
            insert_in_table = sql.distinct_table(db, insert_in_table,
                join_cols.values())
            insert_in_tables.append(insert_in_table)
        except sql.NullValueException as e:
            log_exc(e)

            out_col, = e.cols
            try: in_col = mapping[out_col]
            except KeyError:
                msg = 'Missing mapping for NOT NULL column '+out_col
                log_debug(msg)
                if default is None: on_error(SyntaxError(msg)) # required col
                remove_all_rows()
            else: ignore(in_col, None, e)
        except sql.CheckException as e:
            log_exc(e)

            ignore_cond(e.cond, e)
        except sql.InvalidValueException as e:
            log_exc(e)

            for in_col in mapping.values(): ignore(in_col, e.value, e)
        except psycopg2.extensions.TransactionRollbackError as e:
            log_exc(e)
            # retry
        except sql.DatabaseErrors as e:
            log_exc(e)

            log_debug('No handler for exception')
            on_error(e)
            remove_all_rows()
        # after exception handled, rerun loop with additional constraints

    if cur is not None and row_ct_ref is not None and cur.rowcount >= 0:
        row_ct_ref[0] += cur.rowcount

    if is_literals_or_function: pass # pkeys table already created
    elif has_joins:
        select_joins = input_joins+[sql_gen.Join(out_table, join_cols)]
        log_debug('Getting output table pkeys of existing/inserted rows')
        insert_into_pkeys(select_joins, pkeys_cols)
    else:
        sql.add_row_num(db, insert_out_pkeys) # for joining with input pkeys

        log_debug('Getting input table pkeys of inserted rows')
        # Note that mk_main_select() does not use ORDER BY. Instead, assume that
        # since the SELECT query is identical to the one used in INSERT SELECT,
        # its rows will be retrieved in the same order.
        sql.run_query_into(db, mk_main_select(input_joins, [in_pkey]),
            into=insert_in_pkeys)
        sql.add_row_num(db, insert_in_pkeys) # for joining with output pkeys

        assert sql.table_row_count(db, insert_out_pkeys) == sql.table_row_count(
            db, insert_in_pkeys)

        log_debug('Combining output and input pkeys in inserted order')
        pkey_joins = [insert_in_pkeys, sql_gen.Join(insert_out_pkeys,
            {sql.row_num_col: sql_gen.join_same_not_null})]
        insert_into_pkeys(pkey_joins, pkeys_names)

        sql.empty_temp(db, [insert_out_pkeys, insert_in_pkeys])

    if not is_literals_or_function:
        log_debug('Setting pkeys of missing rows to '
            +strings.as_tt(repr(default)))
        missing_rows_joins = [full_in_table, sql_gen.Join(into,
            {in_pkey: sql_gen.join_same_not_null}, sql_gen.filter_out)]
            # must use join_same_not_null or query will take forever
        insert_into_pkeys(missing_rows_joins,
            [sql_gen.Col(in_pkey, full_in_table),
            sql_gen.NamedCol(out_pkey, default)])
    # otherwise, there is already an entry for every row

    if is_literals: return sql.value(cur)
    else:
        assert (sql.table_row_count(db, into)
            == sql.table_row_count(db, full_in_table))

        sql.empty_temp(db, insert_in_tables+[full_in_table])

        srcs = []
        if is_func: srcs = sql_gen.cols_srcs(in_cols)
        return sql_gen.Col(out_pkey, into, srcs)