Project

General

Profile

1
# SQL code generation
2

    
3
import copy
4
import itertools
5
import operator
6
from ordereddict import OrderedDict
7
import re
8
import UserDict
9
import warnings
10

    
11
import dicts
12
import exc
13
import iters
14
import lists
15
import objects
16
import regexp
17
import strings
18
import util
19

    
20
##### Names
21

    
22
# Length limit that concat() passes to strings.concat() when building names
identifier_max_len = 63 # works for both PostgreSQL and MySQL
23

    
24
def concat(str_, suffix):
    '''Appends suffix to str_ using strings.concat(), with identifier_max_len
    as the length limit.
    Any trailing version/qualifier part of str_ (as matched by the pattern
    below) is first moved into the suffix, so that it won't be truncated off
    the string, leading to collisions.
    @param str_ The base string
    @param suffix The text to append
    '''
    versioned = re.match(
        r'^(.*?)((?:(?:#\d+)?\)?)*(?:\.\w+)+(?:::[\w ]+)*)$', str_)
    if versioned:
        # Preserve version: keep the existing suffix in front of the new one
        str_ = versioned.group(1)
        suffix = versioned.group(2)+suffix
    
    return strings.concat(str_, suffix, identifier_max_len)
34

    
35
def truncate(str_):
    '''Runs str_ through concat() with an empty suffix.'''
    return concat(str_, '')
36

    
37
def is_safe_name(name):
    r'''Checks whether a name is safe *and unambiguous*, i.e. whether it:
    * consists solely of *lowercase* word (\w) characters
    * does not begin with a digit
    * includes a "_", so that it's not a keyword
    @return A match object if the name is safe, otherwise None
    '''
    safe_name_re = r'^(?=.*_)(?!\d)[^\WA-Z]+$'
    return re.match(safe_name_re, name)
44

    
45
def esc_name(name, quote='"'):
    '''Wraps a name in quote characters, escaping any embedded ones.
    @param quote The quote character to use
    '''
    # doubling an embedded quote escapes it in both PostgreSQL and MySQL
    doubled = name.replace(quote, quote*2)
    return quote+doubled+quote
48

    
49
def unesc_name(name, quote='"'):
    '''Reverses esc_name(): strips the surrounding quotes and un-doubles any
    embedded ones.
    If no leading quote was removed, the result of strings.remove_prefix() is
    returned without further processing.
    @param quote The quote character that was used
    '''
    # One-element list that the strings.remove_*() calls report back through
    was_removed = [False]
    unquoted = strings.remove_prefix(quote, name, was_removed)
    if not was_removed[0]: return unquoted # not quoted
    
    unquoted = strings.remove_suffix(quote, unquoted, was_removed)
    assert was_removed[0] # an opening quote requires a closing quote
    return unquoted.replace(quote*2, quote)
57

    
58
def clean_name(name):
    '''Strips all double quotes and backticks from a name.'''
    for quote_char in ('"', '`'): name = name.replace(quote_char, '')
    return name
59

    
60
def esc_comment(comment):
    '''Wraps text in /* */, breaking up any embedded comment terminator so that
    it can't end the comment early.'''
    body = comment.replace('*/', '* /')
    return '/*'+body+'*/'
61

    
62
def lstrip(str_):
    '''Strips leading whitespace. Also removes a comment at the very start.'''
    if str_.startswith('/*'):
        str_ = str_.partition('*/')[2] # keep only what follows the comment
    return str_.lstrip()
66

    
67
##### General SQL code objects
68

    
69
class MockDb:
    '''A stand-in for a database object, providing the methods needed to
    render code objects to strings without a real database.'''
    
    def esc_value(self, value):
        return strings.repr_no_u(value)
    
    def esc_name(self, name):
        return esc_name(name) # the module-level function, default quoting
    
    def col_info(self, col):
        '''Returns placeholder column info, with only the name filled in.'''
        placeholder_default = CustomCode('<default>')
        return TypedCol(col.name, '<type>', placeholder_default, True)
76

    
77
# Shared MockDb instance, used by the __repr__() methods in this module
mockDb = MockDb()
78

    
79
class BasicObject(objects.BasicObject):
    '''Base class for this module's objects. str() yields the
    strings.repr_no_u() form with quote characters removed.'''
    
    def __str__(self):
        repr_ = strings.repr_no_u(self)
        return clean_name(repr_)
81

    
82
##### Unparameterized code objects
83

    
84
class Code(BasicObject):
    '''Base class for objects that can be rendered to code for a database.'''
    
    def __init__(self, lang='sql'):
        '''
        @param lang The language the code is written in
        '''
        self.lang = lang
    
    def to_str(self, db):
        '''Renders this object for the given db. Subclasses must override.'''
        raise NotImplementedError()
    
    def __repr__(self):
        return self.to_str(mockDb) # render without a real database
91

    
92
class CustomCode(Code):
    '''Code that is given verbatim as a string.'''
    
    def __init__(self, str_):
        Code.__init__(self)
        self.str_ = str_
    
    def to_str(self, db):
        return self.str_ # emitted as-is; db is not consulted
99

    
100
def as_Code(value, db=None):
    '''Converts a value to a Code object.
    * Code objects are returned unchanged
    * strings become CustomCode
    * anything else becomes a Literal
    @param db If set, runs db.std_code() on the value (strings only).
    '''
    if isinstance(value, Code): return value
    if not util.is_str(value): return Literal(value)
    
    # Identity test: `db != None` would dispatch to the db object's own
    # comparison methods
    if db is not None: value = db.std_code(value)
    return CustomCode(value)
110

    
111
class Expr(Code):
    '''Wraps another Code object in parentheses.'''
    
    def __init__(self, expr):
        Code.__init__(self)
        self.expr = expr
    
    def to_str(self, db):
        inner = self.expr.to_str(db)
        return '('+inner+')'
118

    
119
##### Names
120

    
121
class Name(Code):
    '''An identifier. It is passed through truncate() on creation and escaped
    by the db on output.'''
    
    def __init__(self, name):
        Code.__init__(self)
        self.name = truncate(name)
    
    def to_str(self, db):
        return db.esc_name(self.name)
130

    
131
def as_Name(value):
    '''Returns Code objects unchanged; wraps anything else in a Name.'''
    if not isinstance(value, Code): value = Name(value)
    return value
134

    
135
##### Literal values
136

    
137
#### Primitives
138

    
139
class Literal(Code):
    '''A plain value, which is escaped by the db when rendered.'''
    
    def __init__(self, value):
        Code.__init__(self)
        self.value = value
    
    def to_str(self, db):
        return db.esc_value(self.value)
146

    
147
def as_Value(value):
    '''Returns Code objects unchanged; wraps anything else in a Literal.'''
    if not isinstance(value, Code): value = Literal(value)
    return value
150

    
151
def is_literal(value):
    '''Whether value is an instance of Literal.'''
    return isinstance(value, Literal)
152

    
153
def is_null(value):
    '''Whether value is a Literal that wraps None.'''
    # Identity test: `== None` would invoke the wrapped value's __eq__(), which
    # need not return a plain bool
    return is_literal(value) and value.value is None
154

    
155
#### Composites
156

    
157
class List(Code):
    '''A comma-separated sequence of Code objects.'''
    
    def __init__(self, values):
        Code.__init__(self)
        self.values = values
    
    def to_str(self, db):
        parts = [value.to_str(db) for value in self.values]
        return ', '.join(parts)
164

    
165
class Tuple(List):
    '''A List that is rendered inside parentheses.'''
    
    def __init__(self, *values):
        List.__init__(self, values)
    
    def to_str(self, db):
        items_str = List.to_str(self, db)
        return '('+items_str+')'
170

    
171
class Row(Tuple):
    '''A Tuple that is rendered with a ROW prefix.'''
    
    def to_str(self, db):
        tuple_str = Tuple.to_str(self, db)
        return 'ROW'+tuple_str
173

    
174
### Arrays
175

    
176
class Array(List):
    '''A List that is rendered as ARRAY[...]. Any column renames on the
    elements are removed.'''
    
    def __init__(self, values):
        unrenamed = [remove_col_rename(value) for value in values]
        List.__init__(self, unrenamed)
    
    def to_str(self, db):
        items_str = List.to_str(self, db)
        return 'ARRAY['+items_str+']'
183

    
184
def to_Array(value):
    '''Returns Arrays unchanged; otherwise builds an Array from
    lists.mk_seq(value).'''
    if not isinstance(value, Array): value = Array(lists.mk_seq(value))
    return value
187

    
188
##### Derived elements
189

    
190
# Sentinel for Derived.set_srcs(): pass it in place of a sequence of sources
src_self = object() # tells Col that it is its own source column
191

    
192
class Derived(Code):
    '''An element which was derived from some other element(s).'''
    
    def __init__(self, srcs):
        '''
        @param srcs See self.set_srcs()
        '''
        Code.__init__(self)
        
        self.set_srcs(srcs)
    
    def set_srcs(self, srcs, overwrite=True):
        '''
        @param srcs (self_type...)|src_self The element(s) this is derived from
        @param overwrite If False, srcs that are already non-empty are kept
        '''
        if not overwrite and self.srcs != (): return # already set
        
        # src_self is a sentinel, so match it by identity rather than through
        # the equality of whatever sequence was passed in
        if srcs is src_self: srcs = (self,)
        self.srcs = tuple(srcs) # make Col hashable
    
    def _compare_on(self):
        '''Returns a copy of the instance attrs, without srcs.'''
        compare_on = self.__dict__.copy()
        del compare_on['srcs'] # ignore
        return compare_on
215

    
216
def cols_srcs(cols):
    '''Collects the srcs of all the given cols, passing them through
    iters.flatten() and then lists.uniqify().'''
    all_srcs = iters.flatten((col.srcs for col in cols))
    return lists.uniqify(all_srcs)
217

    
218
##### Tables
219

    
220
class Table(Derived):
    '''A table reference, optionally qualified with a schema.'''
    
    def __init__(self, name, schema=None, srcs=(), is_temp=False):
        '''
        @param name If a string, it is passed through truncate()
        @param schema str|None (for no schema)
        @param srcs (Table...)|src_self See Derived.set_srcs()
        @param is_temp Stored as-is on self.is_temp
        '''
        Derived.__init__(self, srcs)
        
        if util.is_str(name): name = truncate(name)
        
        self.name = name
        self.schema = schema
        self.is_temp = is_temp
        self.order_by = None
        self.index_cols = {}
    
    def to_str(self, db):
        '''Renders as [schema.]name, with each part converted by as_Name().'''
        str_ = ''
        # Identity test, so a Code object used as the schema is never asked to
        # compare itself to None
        if self.schema is not None: str_ += as_Name(self.schema).to_str(db)+'.'
        str_ += as_Name(self.name).to_str(db)
        return str_
    
    def to_Table(self): return self
    
    def _compare_on(self):
        '''Same as Derived._compare_on(), but also without order_by and
        index_cols.'''
        compare_on = Derived._compare_on(self)
        del compare_on['order_by'] # ignore
        del compare_on['index_cols'] # ignore
        return compare_on
249

    
250
def is_underlying_table(table):
    '''Whether table is a Table whose to_Table() is the table itself.'''
    if not isinstance(table, Table): return False
    return table.to_Table() is table
252

    
253
class NoUnderlyingTableException(Exception):
    '''Raised when a reference can't be resolved to an underlying table.
    The offending reference is available as self.ref.'''
    
    def __init__(self, ref):
        msg = 'for: '+strings.as_tt(strings.urepr(ref))
        Exception.__init__(self, msg)
        self.ref = ref
257

    
258
def underlying_table(table):
    '''Resolves a table reference to the table behind it.
    Any NamedTable rename is removed, and a table that has srcs is replaced by
    its (single) source.
    @raise NoUnderlyingTableException If the result is not an underlying table
    '''
    table = remove_table_rename(table)
    # The renamed code may be a FunctionCall or Expr, which have no srcs attr.
    # Treat that like having no sources, so that the exception callers catch
    # is raised instead of an AttributeError. (This also covers None.)
    srcs = getattr(table, 'srcs', ())
    if srcs: table, = srcs # for derived tables or row vars
    if not is_underlying_table(table): raise NoUnderlyingTableException(table)
    return table
264

    
265
def as_Table(table, schema=None):
    '''Returns None and Code objects unchanged; otherwise creates a Table.
    @param schema Only used when a new Table is created
    '''
    # Identity test, so Code objects aren't asked to compare themselves to None
    if table is None or isinstance(table, Code): return table
    return Table(table, schema)
268

    
269
def suffixed_table(table, suffix):
    '''Returns a shallow copy of table whose name has suffix added using
    concat().'''
    renamed = copy.copy(table) # don't modify input!
    renamed.name = concat(renamed.name, suffix)
    return renamed
273

    
274
class NamedTable(Table):
    '''Code that is given a table alias (`code AS name [(cols)]`).'''
    
    def __init__(self, name, code, cols=None):
        '''
        @param code Converted with as_Table(). Wrapped in an Expr unless the
            result is a Table, FunctionCall, or Expr.
        @param cols If set, column names to list after the alias
        '''
        Table.__init__(self, name)
        
        code = as_Table(code)
        if not isinstance(code, (Table, FunctionCall, Expr)): code = Expr(code)
        if cols is not None:
            cols = [to_name_only_col(c).to_Col() for c in cols]
        
        self.code = code
        self.cols = cols
    
    def to_str(self, db):
        str_ = self.code.to_str(db)
        # Put the alias on its own line if the code spans multiple lines
        if '\n' in str_: whitespace = '\n'
        else: whitespace = ' '
        str_ += whitespace+'AS '+Table.to_str(self, db)
        if self.cols is not None:
            str_ += ' ('+(', '.join((c.to_str(db) for c in self.cols)))+')'
        return str_
    
    def to_Table(self): return Table(self.name)
295

    
296
def remove_table_rename(table):
    '''Returns the code inside a NamedTable. Anything else is returned
    unchanged.'''
    if not isinstance(table, NamedTable): return table
    return table.code
299

    
300
##### Columns
301

    
302
class Col(Derived):
    '''A column reference, optionally qualified with a table.'''
    
    def __init__(self, name, table=None, srcs=()):
        '''
        @param name If a string, it is passed through truncate()
        @param table Table|None (for no table). A string is converted to a
            Table.
        @param srcs (Col...)|src_self See Derived.set_srcs()
        '''
        Derived.__init__(self, srcs)
        
        if util.is_str(name): name = truncate(name)
        if util.is_str(table): table = Table(table)
        # Identity test, so the Table isn't asked to compare itself to None
        assert table is None or isinstance(table, Table)
        
        self.name = name
        self.table = table
    
    def to_str(self, db, for_str=False):
        '''
        @param for_str If set, produces the form used by __str__(): quote
            characters are removed and the table part is added using concat()
        '''
        str_ = as_Name(self.name).to_str(db)
        if for_str: str_ = clean_name(str_)
        if self.table is not None:
            table = self.table.to_Table()
            if for_str: str_ = concat(strings.ustr(table), '.'+str_)
            else: str_ = table.to_str(db)+'.'+str_
        return str_
    
    def __str__(self): return self.to_str(mockDb, for_str=True)
    
    def to_Col(self): return self
329

    
330
def is_col(col):
    '''Whether col is an instance of Col.'''
    return isinstance(col, Col)
331

    
332
def is_table_col(col):
    '''Whether col is a Col that has a table.'''
    # Identity test, so the Table isn't asked to compare itself to None
    return is_col(col) and col.table is not None
333

    
334
def index_col(col):
    '''Looks up col's name in its table's index_cols.
    @return A Col with the name found there, on col's table and with col's
        srcs, or None if col has no table or there is no entry for it
    '''
    if not is_table_col(col): return None
    
    table = col.table
    try: index_name = table.index_cols[col.name]
    except KeyError: return None
    return Col(index_name, table, col.srcs)
341

    
342
def is_temp_col(col):
    '''Whether col is a table column whose table has is_temp set.'''
    on_table = is_table_col(col)
    return on_table and col.table.is_temp
343

    
344
def as_Col(col, table=None, name=None):
    '''Converts a value to a column-like Code object.
    * Code objects are returned unchanged
    * strings become a Col on the given table
    * anything else becomes a Literal
    @param table The table for a Col that is created from a string
    @param name If not None, any non-Col input will be renamed using NamedCol.
    '''
    # Identity test, so a non-string name isn't asked to compare itself to None
    if name is not None:
        col = as_Value(col)
        if not isinstance(col, Col): col = NamedCol(name, col)
    
    if isinstance(col, Code): return col
    elif util.is_str(col): return Col(col, table)
    else: return Literal(col)
355

    
356
def with_table(col, table):
    '''Returns col placed on the given table, without modifying the input.
    * NamedCol: returned unchanged
    * FunctionCall: deep-copied, with the table set on its first arg
    * other Col: shallow-copied, with the table set
    * anything else: returned unchanged
    '''
    if isinstance(col, NamedCol): return col # doesn't take a table
    
    if isinstance(col, FunctionCall):
        col = copy.deepcopy(col) # don't modify input!
        col.args[0].table = table
    elif isinstance(col, Col):
        col = copy.copy(col) # don't modify input!
        col.table = table
    return col
365

    
366
def with_default_table(col, table):
    '''Converts col with as_Col() and, if it has no table yet, places it on the
    given table using with_table().'''
    col = as_Col(col)
    # Identity test, so the Table isn't asked to compare itself to None
    if col.table is None: col = with_table(col, table)
    return col
370

    
371
def set_cols_table(table, cols):
    '''Converts each entry of cols with as_Col() and sets its table.
    @param table Converted with as_Table()
    @param cols A mutable sequence. Both the sequence and the column objects
        in it are modified in place.
    '''
    table = as_Table(table)
    
    for i, orig_col in enumerate(cols):
        col = as_Col(orig_col)
        cols[i] = col
        col.table = table
377

    
378
def to_name_only_col(col, check_table=None):
    '''Returns a Col with just col's name. A value that is not a table column
    is returned as converted by as_Col().
    @param check_table If set, asserts that col's table equals it
    '''
    col = as_Col(col)
    if not is_table_col(col): return col
    
    # Identity tests against None, so Tables aren't asked to compare
    # themselves to it
    if check_table is not None:
        table = col.table
        assert table is None or table == check_table
    return Col(col.name)
386

    
387
def suffixed_col(col, suffix):
    '''Returns a new Col with suffix added to col's name using concat(),
    keeping col's table and srcs.'''
    new_name = concat(col.name, suffix)
    return Col(new_name, col.table, col.srcs)
389

    
390
def has_srcs(col):
    '''
    @return col.srcs (which is truthy only if non-empty) if col is a Col,
        otherwise False
    '''
    if not is_col(col): return False
    return col.srcs
391

    
392
def cross_join_srcs(cols):
    '''Returns one Col for each combination of the cols' source names. Each is
    named with the combination's names joined by ",".'''
    # empty srcs will mess up the cross join
    src_names = [[src.name for src in col.srcs] for col in cols
        if has_srcs(col)]
    if not src_names: return [] # itertools.product() returns [()] for empty input
    return [Col(','.join(combo)) for combo in itertools.product(*src_names)]
397

    
398
class NamedCol(Col):
    '''A value that is given a column alias (`code AS name`).'''
    
    def __init__(self, name, code):
        Col.__init__(self, name)
        self.code = as_Value(code)
    
    def to_str(self, db):
        code_str = self.code.to_str(db)
        alias = Col.to_str(self, db)
        return code_str+' AS '+alias
    
    def to_Col(self):
        return Col(self.name) # just the alias, without the code
410

    
411
def remove_col_rename(col):
    '''Returns the code inside a NamedCol. Anything else is returned
    unchanged.'''
    if not isinstance(col, NamedCol): return col
    return col.code
414

    
415
def underlying_col(col):
    '''Returns col (with any rename removed) on its underlying table.
    @raise NoUnderlyingTableException If the unrenamed value is not a Col, or
        if underlying_table() raises it
    '''
    col = remove_col_rename(col)
    if isinstance(col, Col):
        return Col(col.name, underlying_table(col.table), col.srcs)
    raise NoUnderlyingTableException(col)
420

    
421
def wrap(wrap_func, value):
    '''Applies wrap_func to a value. If the value is a NamedCol, the code
    inside it is wrapped instead and the same name is applied to the result.'''
    if not isinstance(value, NamedCol): return wrap_func(value)
    
    # Wrap what's inside the rename, then reapply the rename
    return NamedCol(value.name, wrap_func(value.code))
426

    
427
class ColDict(dicts.DictProxy):
    '''A dict that automatically makes inserted entries Col objects.
    Anything that isn't a column is wrapped in a NamedCol with the key's column
    name by `as_Col(value, name=key.name)`.
    '''
    
    def __init__(self, db, keys_table, dict_=None):
        '''
        @param db Used to look up column defaults (see __setitem__())
        @param keys_table The table that string keys are placed on
        @param dict_ Initial entries, if any
        '''
        dicts.DictProxy.__init__(self, OrderedDict())
        
        keys_table = as_Table(keys_table)
        if dict_ is None: dict_ = {} # instead of a shared mutable default
        
        self.db = db
        self.table = keys_table
        self.update(dict_) # after setting vars because __setitem__() needs them
    
    def copy(self): return ColDict(self.db, self.table, self.inner.copy())
    
    def __getitem__(self, key):
        return dicts.DictProxy.__getitem__(self, self._key(key))
    
    def __setitem__(self, key, value):
        '''Sets an entry. A value of None is replaced by the default from
        db.col_info() for the key, if that lookup succeeds.'''
        key = self._key(key)
        # Identity test, so Code values aren't asked to compare themselves to
        # None
        if value is None:
            try: value = self.db.col_info(key).default
            except NoUnderlyingTableException: pass # not a table column
        dicts.DictProxy.__setitem__(self, key, as_Col(value, name=key.name))
    
    def _key(self, key): return as_Col(key, self.table)
455

    
456
##### Definitions
457

    
458
class TypedCol(Col):
    '''A column definition: name, type, and optional NOT NULL, DEFAULT, and
    constraints.'''
    
    def __init__(self, name, type_, default=None, nullable=True,
        constraints=None):
        '''
        @param type_ Converted with as_Code() when rendered
        @param default Code|None (for no DEFAULT clause)
        @param nullable If False, NOT NULL is added
        @param constraints str|None Text to add at the end
        '''
        # Identity test, so the Code isn't asked to compare itself to None
        assert default is None or isinstance(default, Code)
        
        Col.__init__(self, name)
        
        self.type = type_
        self.default = default
        self.nullable = nullable
        self.constraints = constraints
    
    def to_str(self, db):
        str_ = Col.to_str(self, db)+' '+as_Code(self.type).to_str(db)
        if not self.nullable: str_ += ' NOT NULL'
        if self.default is not None: str_ += ' DEFAULT '+self.default.to_str(db)
        if self.constraints is not None: str_ += ' '+self.constraints
        return str_
    
    def to_Col(self): return Col(self.name)
478

    
479
class SetOf(Code):
    '''A type rendered with a SETOF prefix.'''
    
    def __init__(self, type_):
        Code.__init__(self)
        self.type = type_
    
    def to_str(self, db):
        type_str = self.type.to_str(db)
        return 'SETOF '+type_str
487

    
488
class RowType(Code):
    '''A table rendered with a %ROWTYPE suffix.'''
    
    def __init__(self, table):
        Code.__init__(self)
        self.table = table
    
    def to_str(self, db):
        table_str = self.table.to_str(db)
        return table_str+'%ROWTYPE'
496

    
497
class ColType(Code):
    '''A column rendered with a %TYPE suffix.'''
    
    def __init__(self, col):
        Code.__init__(self)
        self.col = col
    
    def to_str(self, db):
        col_str = self.col.to_str(db)
        return col_str+'%TYPE'
505

    
506
class ArrayType(Code):
    '''An element type rendered with a [] suffix.'''
    
    def __init__(self, elem_type):
        Code.__init__(self)
        self.elem_type = as_Code(elem_type)
    
    def to_str(self, db):
        elem_str = self.elem_type.to_str(db)
        return elem_str+'[]'
515

    
516
##### Functions
517

    
518
# Functions are represented with the Table class
Function = Table
519
# Converts a value to a Function in the same way as_Table() does for tables
as_Function = as_Table
520

    
521
class InternalFunction(CustomCode):
    '''A function whose name is given verbatim as a string (see CustomCode).'''
522

    
523
#### Calls
524

    
525
class NamedArg(NamedCol):
    '''An argument that is passed by name (`name := value`).'''
    
    def __init__(self, name, value):
        NamedCol.__init__(self, name, value)
    
    def to_str(self, db):
        arg_name = Col.to_str(self, db)
        return arg_name+' := '+self.code.to_str(db)
531

    
532
class FunctionCall(Code):
    '''A call to a function with positional and/or named arguments.'''
    
    def __init__(self, function, *args, **kw_args):
        '''
        @param function Converted with as_Function()
        @param args [Code|literal-value...] The function's arguments
        @param kw_args Arguments to pass by name. These are added after the
            positional ones, as NamedArgs.
        '''
        Code.__init__(self)
        
        function = as_Function(function)
        
        def clean_arg(arg):
            '''Converts an arg to a value and removes any column rename.'''
            return remove_col_rename(as_Value(arg))
        
        all_args = [clean_arg(arg) for arg in args]
        for arg_name, arg in kw_args.iteritems():
            all_args.append(NamedArg(arg_name, clean_arg(arg)))
        
        self.function = function
        self.args = all_args
    
    def to_str(self, db):
        rendered_args = [arg.to_str(db) for arg in self.args]
        return self.function.to_str(db)+'('+', '.join(rendered_args)+')'
550

    
551
def wrap_in_func(function, value):
    '''Passes a value as the sole argument of a call to the given function.
    Any column renaming on the value is propagated to the result (see wrap()).
    '''
    def call_on(arg): return FunctionCall(function, arg)
    
    return wrap(call_on, value)
556

    
557
def unwrap_func_call(func_call, check_name=None):
    '''Unwraps any function call to its first argument.
    Also removes any column renaming.
    A value that is not a FunctionCall is returned with just the renaming
    removed.
    @param check_name If set, asserts that the function's name is None or
        equals it
    '''
    func_call = remove_col_rename(func_call)
    if not isinstance(func_call, FunctionCall): return func_call
    
    # Identity tests against None, so name objects aren't asked to compare
    # themselves to it
    if check_name is not None:
        name = func_call.function.name
        assert name is None or name == check_name
    return func_call.args[0]
568

    
569
#### Definitions
570

    
571
class FunctionDef(Code):
    '''A CREATE FUNCTION statement.'''
    
    def __init__(self, function, return_type, body, params=None,
        modifiers=None):
        '''
        @param function The function being defined (rendered with to_str())
        @param return_type Converted with as_Code()
        @param body Converted with as_Code(). Its lang attr is used for the
            LANGUAGE clause.
        @param params The params (each rendered with to_str()). Defaults to no
            params.
        @param modifiers str|None Text to add on its own line before the body
        '''
        Code.__init__(self)
        
        return_type = as_Code(return_type)
        body = as_Code(body)
        # Create the default here: a `params=[]` default would be a single list
        # object shared by every FunctionDef created without params
        if params is None: params = []
        
        self.function = function
        self.return_type = return_type
        self.body = body
        self.params = params
        self.modifiers = modifiers
    
    def to_str(self, db):
        params_str = ', '.join((p.to_str(db) for p in self.params))
        str_ = (
            'CREATE FUNCTION '+self.function.to_str(db)+'('+params_str+')\n'
            +'RETURNS '+self.return_type.to_str(db)+'\n'
            +'LANGUAGE '+self.body.lang+'\n'
        )
        if self.modifiers is not None: str_ += self.modifiers+'\n'
        str_ += 'AS $$\n'+self.body.to_str(db)+'\n$$;\n'
        return str_
598

    
599
class FunctionParam(TypedCol):
    '''A function parameter definition, optionally marked as OUT.'''
    
    def __init__(self, name, type_, default=None, out=False):
        '''
        @param out If set, the param is rendered with an OUT prefix
        '''
        TypedCol.__init__(self, name, type_, default)
        self.out = out
    
    def to_str(self, db):
        param_str = TypedCol.to_str(self, db)
        if not self.out: return param_str
        return 'OUT '+param_str
    
    def to_Col(self):
        return Col(self.name)
611

    
612
### PL/pgSQL
613

    
614
class ReturnQuery(Code):
    '''A RETURN QUERY statement for the given query.'''
    
    def __init__(self, query):
        Code.__init__(self)
        self.query = as_Code(query)
    
    def to_str(self, db):
        query_str = strings.indent(self.query.to_str(db))
        return 'RETURN QUERY\n'+query_str+';\n'
624

    
625
## Exceptions
626

    
627
class BaseExcHandler(BasicObject):
    '''Base class for exception handlers, which are rendered around a body.'''
    
    def to_str(self, db, body):
        '''Renders the handler around body. Subclasses must override.'''
        raise NotImplementedError()
    
    def __repr__(self):
        return self.to_str(mockDb, '<body>') # placeholder for the body
631

    
632
# Handler code used by ExcHandler when no handler is given
suppress_exc = 'NULL;\n'
633

    
634
# Statement that raises again with the caught error's SQLSTATE and SQLERRM
reraise_exc = 'RAISE USING ERRCODE = SQLSTATE, MESSAGE = SQLERRM;\n'
635

    
636
class ExcHandler(BaseExcHandler):
    '''Renders a body inside a BEGIN ... EXCEPTION WHEN ... END block.'''
    
    def __init__(self, exc, handler=None):
        '''
        @param exc str The condition name to put after WHEN
        @param handler Code to run for that condition (converted with
            as_Code()). If None, suppress_exc is used.
        '''
        # Identity test, so a Code handler isn't asked to compare itself to
        # None
        if handler is not None: handler = as_Code(handler)
        
        self.exc = exc
        self.handler = handler
    
    def to_str(self, db, body):
        body = as_Code(body)
        
        if self.handler is not None:
            # on its own lines, indented under the WHEN
            handler_str = '\n'+strings.indent(self.handler.to_str(db), 2)
        else: handler_str = ' '+suppress_exc
        
        # Note that there is no newline after the final END;
        return (
            'BEGIN\n'
            +strings.indent(body.to_str(db))
            +'EXCEPTION\n'
            +'    WHEN '+self.exc+' THEN'+handler_str
            +'END;'
        )
658

    
659
class NestedExcHandler(BaseExcHandler):
    '''Applies several exception handlers, one inside the other.'''
    
    def __init__(self, *handlers):
        '''
        @param handlers Sorted from outermost to innermost
        '''
        self.handlers = handlers
    
    def to_str(self, db, body):
        # Apply the innermost handler first, so that the first handler ends up
        # outermost
        wrapped = body
        for handler in reversed(self.handlers):
            wrapped = handler.to_str(db, wrapped)
        return wrapped
669

    
670
class ExcToWarning(Code):
    '''Handler code that raises the error message as a warning and then runs a
    return statement.'''
    
    def __init__(self, return_):
        '''
        @param return_ Statement to return a default value in case of error
        '''
        Code.__init__(self)
        self.return_ = as_Code(return_)
    
    def to_str(self, db):
        warning = "RAISE WARNING '%', SQLERRM;\n"
        return warning+self.return_.to_str(db)
683

    
684
# Suppresses unique_violation errors (no handler code is given); this is the
# default exc_handler of RowExcIgnore
unique_violation_handler = ExcHandler('unique_violation')
685

    
686
# Note doubled "\"s because inside Python string
687
plpythonu_error_handler = ExcHandler('internal_error', '''\
688
-- Handle PL/Python exceptions
689
DECLARE
690
    matches text[] := regexp_matches(SQLERRM,
691
        E'^(?:PL/Python: )?(\\\\w+): (.*)$'); -- .* also matches \\n
692
    exc_name text := matches[1];
693
    msg text := matches[2];
694
BEGIN
695
    /* Re-raise PL/Python exceptions with the PL/Python prefix removed.
696
    This allows the exception to be parsed like a native exception.
697
    Always raise as data_exception so it goes in the errors table. */
698
    IF exc_name IS NOT NULL THEN
699
        RAISE data_exception USING MESSAGE = msg;
700
    -- Re-raise non-PL/Python exceptions
701
    ELSE
702
        '''+reraise_exc+'''\
703
    END IF;
704
END;
705
''')
706

    
707
def data_exception_handler(handler):
    '''Creates an ExcHandler that runs handler on data_exception errors.'''
    exc_name = 'data_exception'
    return ExcHandler(exc_name, handler)
709

    
710
# Default row variable of RowExcIgnore, which declares it when it is used
row_var = Table('row')
711

    
712
class RowExcIgnore(Code):
    '''A PL/pgSQL loop that runs code for each row of a query, with each
    iteration wrapped in an exception handler.'''
    
    def __init__(self, row_type, select_query, with_row, cols=None,
        exc_handler=unique_violation_handler, row_var=row_var):
        '''
        @param row_type Ignored if a custom row_var is used.
        @param select_query The query to loop over
        @param with_row The code to run for each row
        @param cols If set, the loop assigns to these cols of the row_var
            instead of to the row_var as a whole
        @param exc_handler The handler to wrap around with_row
        @pre If a custom row_var is used, it must already be defined.
        '''
        Code.__init__(self, lang='plpgsql')
        
        row_type = as_Code(row_type)
        select_query = as_Code(select_query)
        with_row = as_Code(with_row)
        row_var = as_Table(row_var)
        
        self.row_type = row_type
        self.select_query = select_query
        self.with_row = with_row
        self.cols = cols
        self.exc_handler = exc_handler
        self.row_var = row_var
    
    def to_str(self, db):
        # Identity test: cols is a sequence, which shouldn't be compared to
        # None by value
        if self.cols is None: row_vars = [self.row_var]
        else: row_vars = [Col(c.name, self.row_var) for c in self.cols]
        
        # Need an EXCEPTION block for each individual row because "When an error
        # is caught by an EXCEPTION clause, [...] all changes to persistent
        # database state within the block are rolled back."
        # This is unfortunate because "A block containing an EXCEPTION clause is
        # significantly more expensive to enter and exit than a block without
        # one."
        # (http://www.postgresql.org/docs/8.3/static/\
        # plpgsql-control-structures.html#PLPGSQL-ERROR-TRAPPING)
        str_ = (
            'FOR '+(', '.join((v.to_str(db) for v in row_vars)))+' IN\n'
            +strings.indent(self.select_query.to_str(db))
            +'LOOP\n'
            +strings.indent(self.exc_handler.to_str(db, self.with_row))
            +'END LOOP;\n'
        )
        # `row_var` here is the module-level default; only that one is declared
        if self.row_var == row_var:
            str_ = (
                'DECLARE\n'
                +'    '+self.row_var.to_str(db)+' '+self.row_type.to_str(db)
                +';\n'
                +'BEGIN\n'
                +strings.indent(str_)
                +'END;\n'
            )
        return str_
761

    
762
##### Casts
763

    
764
class Cast(FunctionCall):
    '''A CAST(value AS type) expression.'''
    
    def __init__(self, type_, value):
        '''
        @param type_ Converted with as_Code()
        @param value Converted with as_Value()
        '''
        # Run the base Code setup so that the lang attr exists on Casts too.
        # FunctionCall.__init__() is deliberately not used, because a cast
        # stores its own type_/value attrs instead of function/args.
        Code.__init__(self)
        
        type_ = as_Code(type_)
        value = as_Value(value)
        
        self.type_ = type_
        self.value = value
    
    def to_str(self, db):
        return 'CAST('+self.value.to_str(db)+' AS '+self.type_.to_str(db)+')'
774

    
775
def cast_literal(value):
    '''Wraps a string Literal in a cast to text. Anything else is returned
    unchanged.'''
    if is_literal(value) and util.is_str(value.value):
        return Cast('text', value)
    return value
780

    
781
##### Conditions
782

    
783
class NotCond(Code):
    '''A condition rendered with a NOT prefix.'''
    
    def __init__(self, cond):
        Code.__init__(self)
        self.cond = cond
    
    def to_str(self, db):
        cond_str = self.cond.to_str(db)
        return 'NOT '+cond_str
790

    
791
class ColValueCond(Code):
    '''A ValueCond applied to a particular column.'''
    
    def __init__(self, col, value):
        '''
        @param col The left side, which is passed to the ValueCond's to_str()
        @param value Converted with as_ValueCond()
        '''
        Code.__init__(self)
        self.col = col
        self.value = as_ValueCond(value)
    
    def to_str(self, db):
        cond = self.value
        return cond.to_str(db, self.col)
801

    
802
def combine_conds(conds, keyword=None):
    '''Joins conditions with AND, one per line.
    @param conds Iterable of condition strings
    @param keyword The keyword to add before the conditions, if any
    @return The combined string. With a keyword, a single condition follows it
        on the same line, and multiple conditions start on the next line.
    '''
    # Accept any iterable: comparing to [] only recognized an empty *list*, and
    # len() fails on one-shot iterators
    conds = list(conds)
    
    str_ = ''
    if keyword is not None:
        if not conds: whitespace = ''
        elif len(conds) == 1: whitespace = ' '
        else: whitespace = '\n'
        str_ += keyword+whitespace
    
    str_ += '\nAND '.join(conds)
    return str_
815

    
816
##### Condition column comparisons
817

    
818
class ValueCond(BasicObject):
    '''Base class for conditions that are applied to a left-hand value.'''
    
    def __init__(self, value):
        '''
        @param value Converted with as_Value(); any column rename is removed
        '''
        value = remove_col_rename(as_Value(value))
        
        self.value = value
    
    def to_str(self, db, left_value):
        '''
        @param left_value The Code object that the condition is being applied on
        '''
        # NotImplemented is the constant returned by binary operator methods
        # and is not callable; NotImplementedError is the exception to raise
        raise NotImplementedError()
    
    def __repr__(self): return self.to_str(mockDb, '<left_value>')
831

    
832
class CompareCond(ValueCond):
    '''Compares the left value to this condition's value with an operator.'''
    
    def __init__(self, value, operator='='):
        '''
        @param operator By default, compares NULL values literally. Use '~=' or
            '~!=' to pass NULLs through.
        '''
        ValueCond.__init__(self, value)
        self.operator = operator
    
    def to_str(self, db, left_value):
        lhs = remove_col_rename(as_Col(left_value))
        rhs = self.value
        
        # Parse operator: an optional "~" prefix (pass NULLs through), then an
        # optional "!" prefix (negate), then the comparison itself
        passthru_null = [False]
        op = strings.remove_prefix('~', self.operator, passthru_null)
        negate = [False]
        op = strings.remove_prefix('!', op, negate)
        is_equality = op.endswith('=') # also includes <=, >=
        
        # Handle nullable columns
        add_null_check = False
        if not passthru_null[0]: # NULLs compare equal
            try: lhs = ensure_not_null(db, lhs)
            except ensure_not_null_excs: # fall back to alternate method
                add_null_check = is_equality and isinstance(rhs, Col)
            else:
                if isinstance(lhs, EnsureNotNull):
                    # apply same function to both sides
                    rhs = ensure_not_null(db, rhs, lhs.type)
        
        if is_equality and is_null(rhs): op = 'IS'
        
        lhs_str = lhs.to_str(db)
        rhs_str = rhs.to_str(db)
        
        # Create str
        cond = lhs_str+' '+op+' '+rhs_str
        if add_null_check:
            cond = ('('+cond+' OR ('+lhs_str+' IS NULL AND '+rhs_str
                +' IS NULL))')
        if negate[0]: cond = 'NOT '+cond
        return cond
876

    
877
# Tells as_ValueCond() to assume a non-ValueCond is a literal value
878
assume_literal = object() # sentinel; as_ValueCond() checks for it by identity
879

    
880
def as_ValueCond(value, default_table=assume_literal):
    '''Returns ValueConds unchanged; wraps anything else in a CompareCond.
    @param default_table If given, the value is first passed through
        with_default_table() using this table. Otherwise, the value is wrapped
        as it is.
    '''
    if isinstance(value, ValueCond): return value
    
    if default_table is not assume_literal:
        value = with_default_table(value, default_table)
    return CompareCond(value)
886

    
887
##### Joins
888

    
889
# Sentinel for the values of Join's mapping
join_same = object() # tells Join the left and right columns have the same name
890

    
891
# Tells Join the left and right columns have the same name and are never NULL
892
join_same_not_null = object() # sentinel for the values of Join's mapping
893

    
894
# Sentinel for Join's type_ param
filter_out = object() # tells Join to filter out rows that match the join
895

    
896
class Join(BasicObject):
    '''A JOIN clause onto a table.'''
    
    def __init__(self, table, mapping=None, type_=None):
        '''
        @param table Table|str The table to join onto
        @param mapping dict(right_table_col=left_table_col, ...)
            * if left_table_col is join_same: left_table_col = right_table_col
              * Note that right_table_col must be a string
            * if left_table_col is join_same_not_null:
              left_table_col = right_table_col and both have NOT NULL constraint
              * Note that right_table_col must be a string
            Defaults to an empty mapping (no join condition).
        @param type_ None (for plain join)|str (e.g. 'LEFT')|filter_out
            * filter_out: equivalent to 'LEFT' with the query filtered by
              `table_pkey IS NULL` (indicating no match)
        '''
        if util.is_str(table): table = Table(table)
        assert type_ is None or util.is_str(type_) or type_ is filter_out
        # Create the default here: a `mapping={}` default would be a single
        # dict object shared by every Join created without a mapping
        if mapping is None: mapping = {}
        
        self.table = table
        self.mapping = mapping
        self.type_ = type_
    
    def to_str(self, db, left_table_):
        '''
        @param left_table_ The table on the left side of the join
        '''
        def join(entry):
            '''Parses non-USING joins'''
            right_table_col, left_table_col = entry
            
            # Switch order (right_table_col is on the left in the comparison)
            left = right_table_col
            right = left_table_col
            left_table = self.table
            right_table = left_table_
            
            # Parse left side
            left = with_default_table(left, left_table)
            
            # Parse special values
            left_on_right = Col(left.name, right_table)
            if right is join_same: right = left_on_right
            elif right is join_same_not_null:
                right = CompareCond(left_on_right, '~=')
            
            # Parse right side
            right = as_ValueCond(right, right_table)
            
            return right.to_str(db, left)
        
        # Create join condition
        type_ = self.type_
        joins = self.mapping
        if not joins: join_cond = None
        elif type_ is not filter_out and all(
            (v is join_same_not_null for v in joins.values())):
            # all cols w/ USING, so can use simpler USING syntax
            cols = [to_name_only_col(c) for c in joins]
            join_cond = 'USING ('+(', '.join((c.to_str(db) for c in cols)))+')'
        else:
            join_cond = combine_conds([join(e) for e in joins.items()], 'ON')
        
        if isinstance(self.table, NamedTable): whitespace = '\n'
        else: whitespace = ' '
        
        # Create join
        if type_ is filter_out: type_ = 'LEFT'
        str_ = ''
        if type_ is not None: str_ += type_+' '
        str_ += 'JOIN'+whitespace+self.table.to_str(db)
        if join_cond is not None: str_ += whitespace+join_cond
        return str_
    
    def __repr__(self): return self.to_str(mockDb, '<left_table>')
964

    
965
##### Value exprs
966

    
967
# Verbatim `*`, for use in place of a column (e.g. in row_count)
all_cols = CustomCode('*')
968

    
969
# Verbatim DEFAULT keyword, for use in place of a value
default = CustomCode('DEFAULT')
970

    
971
# Renders as COUNT(*)
row_count = FunctionCall(InternalFunction('COUNT'), all_cols)
972

    
973
class Coalesce(FunctionCall):
974
    def __init__(self, *args):
975
        FunctionCall.__init__(self, InternalFunction('COALESCE'), *args)
976

    
977
class Nullif(FunctionCall):
978
    def __init__(self, *args):
979
        FunctionCall.__init__(self, InternalFunction('NULLIF'), *args)
980

    
981
null_as_str = Cast('text', 'NULL')
982

    
983
def to_text(value): return Coalesce(Cast('text', value), null_as_str)
984

    
985
# See <http://www.postgresql.org/docs/8.3/static/datatype-numeric.html>
986
null_sentinels = {
987
    'character varying': r'\N',
988
    'double precision': 'NaN',
989
    'integer': 2147483647,
990
    'text': r'\N',
991
    'date': 'infinity',
992
    'timestamp with time zone': 'infinity',
993
    'taxonrank': 'unknown',
994
}
995

    
996
class EnsureNotNull(Coalesce):
997
    def __init__(self, value, type_):
998
        if isinstance(type_, ArrayType): null = []
999
        else: null = null_sentinels[type_]
1000
        Coalesce.__init__(self, as_Col(value), Cast(type_, null))
1001
        
1002
        self.type = type_
1003
    
1004
    def to_str(self, db):
1005
        col = self.args[0]
1006
        index_col_ = index_col(col)
1007
        if index_col_ != None: return index_col_.to_str(db)
1008
        return Coalesce.to_str(self, db)
1009

    
1010
#### Arrays
1011

    
1012
class ArrayMerge(FunctionCall):
1013
    def __init__(self, sep, array):
1014
        array = to_Array(array)
1015
        FunctionCall.__init__(self, InternalFunction('array_to_string'), array,
1016
            sep)
1017

    
1018
def merge_not_null(db, sep, values):
1019
    return ArrayMerge(sep, map(to_text, values))
1020

    
1021
##### Table exprs
1022

    
1023
class Values(Code):
1024
    def __init__(self, values):
1025
        '''
1026
        @param values [...]|[[...], ...] Can be one or multiple rows.
1027
        '''
1028
        Code.__init__(self)
1029
        
1030
        rows = values
1031
        if len(values) >= 1 and not lists.is_seq(values[0]): # only one row
1032
            rows = [values]
1033
        for i, row in enumerate(rows):
1034
            rows[i] = map(remove_col_rename, map(as_Value, row))
1035
        
1036
        self.rows = rows
1037
    
1038
    def to_str(self, db):
1039
        return 'VALUES '+(', '.join((Tuple(*r).to_str(db) for r in self.rows)))
1040

    
1041
def NamedValues(name, cols, values):
1042
    '''
1043
    @param cols None|[...]
1044
    @post `cols` will be changed to Col objects with the table set to `name`.
1045
    '''
1046
    table = NamedTable(name, Values(values), cols)
1047
    if cols != None: set_cols_table(table, cols)
1048
    return table
1049

    
1050
##### Database structure
1051

    
1052
def is_nullable(db, value):
1053
    if not is_table_col(value): return is_null(value)
1054
    try: return db.col_info(value).nullable
1055
    except NoUnderlyingTableException: return True # not a table column
1056

    
1057
text_types = set(['character varying', 'text'])
1058

    
1059
def is_text_type(type_): return type_ in text_types
1060

    
1061
def is_text_col(db, col): return is_text_type(db.col_info(col).type)
1062

    
1063
def canon_type(type_):
1064
    if type_ in text_types: return 'text'
1065
    else: return type_
1066

    
1067
ensure_not_null_excs = (NoUnderlyingTableException, KeyError)
1068

    
1069
def ensure_not_null(db, col, type_=None):
1070
    '''
1071
    @param col If type_ is not set, must have an underlying column.
1072
    @param type_ If set, overrides the underlying column's type and casts the
1073
        column to it if needed.
1074
    @return EnsureNotNull|Col
1075
    @throws ensure_not_null_excs
1076
    '''
1077
    col = remove_col_rename(col)
1078
    
1079
    try: col_type = db.col_info(underlying_col(col)).type
1080
    except NoUnderlyingTableException:
1081
        if type_ == None and is_null(col): raise # NULL has no type
1082
    else:
1083
        if type_ == None: type_ = col_type
1084
        elif type_ != col_type: col = Cast(type_, col)
1085
    
1086
    if is_nullable(db, col):
1087
        try: col = EnsureNotNull(col, type_)
1088
        except KeyError, e:
1089
            # Warn of no null sentinel for type, even if caller catches error
1090
            warnings.warn(UserWarning(exc.str_(e)))
1091
            raise
1092
    
1093
    return col
1094

    
1095
def try_mk_not_null(db, value):
1096
    '''
1097
    Warning: This function does not guarantee that its result is NOT NULL.
1098
    '''
1099
    try: return ensure_not_null(db, value)
1100
    except ensure_not_null_excs: return value
1101

    
1102
##### Expression transforming
1103

    
1104
true_expr = 'true'
1105
false_expr = 'false'
1106

    
1107
true_re = true_expr
1108
false_re = false_expr
1109
bool_re = r'(?:'+true_re+r'|'+false_re+r')'
1110
atom_re = r'(?:'+bool_re+r'|\([^()]*\)'+r')'
1111

    
1112
def logic_op_re(op, value_re, expr_re=''):
1113
    op_re = ' '+op+' '
1114
    return '(?:'+expr_re+op_re+value_re+'|'+value_re+op_re+expr_re+')'
1115

    
1116
not_re = r'\bNOT '
1117
not_false_re = not_re+false_re+r'\b'
1118
not_true_re = not_re+true_re+r'\b'
1119
and_false_re = logic_op_re('AND', false_re, atom_re)
1120
and_false_not_true_re = '(?:'+not_true_re+'|'+and_false_re+')'
1121
and_true_re = logic_op_re('AND', true_re)
1122
or_re = logic_op_re('OR', bool_re)
1123
or_and_true_re = '(?:'+and_true_re+'|'+or_re+')'
1124

    
1125
def simplify_parens(expr):
1126
    return regexp.sub_nested(r'\(('+atom_re+')\)', r'\1', expr)
1127

    
1128
def simplify_recursive(sub_func, expr):
1129
    '''
1130
    @param sub_func See regexp.sub_recursive() sub_func param
1131
    '''
1132
    return regexp.sub_recursive(lambda s: sub_func(simplify_parens(s)), expr)
1133
        # simplify_parens() is also done at end in final iteration
1134

    
1135
def simplify_expr(expr):
1136
    def simplify_logic_ops(expr):
1137
        total_n = 0
1138
        expr, n = re.subn(not_false_re, true_re, expr)
1139
        total_n += n
1140
        expr, n = re.subn(and_false_not_true_re, false_expr, expr)
1141
        total_n += n
1142
        expr, n = re.subn(or_and_true_re, r'', expr)
1143
        total_n += n
1144
        return expr, total_n
1145
    
1146
    expr = expr.replace('(NULL IS NULL)', true_expr)
1147
    expr = expr.replace('(NULL IS NOT NULL)', false_expr)
1148
    expr = simplify_recursive(simplify_logic_ops, expr)
1149
    return expr
1150

    
1151
name_re = r'(?:\w+|(?:"[^"]*")+)'
1152

    
1153
def parse_expr_col(str_):
1154
    match = re.match(r'^\('+name_re+r'\(('+name_re+r').*\)\)$', str_)
1155
    if match: str_ = match.group(1)
1156
    return unesc_name(str_)
1157

    
1158
def map_expr(db, expr, mapping, in_cols_found=None):
1159
    '''Replaces output columns with input columns in an expression.
1160
    @param in_cols_found If set, will be filled in with the expr's (input) cols
1161
    '''
1162
    for out, in_ in mapping.iteritems():
1163
        orig_expr = expr
1164
        out = to_name_only_col(out)
1165
        in_str = to_name_only_col(remove_col_rename(in_)).to_str(db)
1166
        
1167
        # Replace out both with and without quotes
1168
        expr = expr.replace(out.to_str(db), in_str)
1169
        expr = re.sub(r'(?<!["\'\.=\[])\b'+out.name+r'\b(?!["\',\.=\]])',
1170
            in_str, expr)
1171
        
1172
        if in_cols_found != None and expr != orig_expr: # replaced something
1173
            in_cols_found.append(in_)
1174
    
1175
    return simplify_expr(expr)
(29-29/42)