From 370c1f838d1363df4ef903794dbd487f386e8370 Mon Sep 17 00:00:00 2001 From: Oleg Silkin Date: Tue, 13 Aug 2019 00:30:19 -0400 Subject: [PATCH] Adds prototype query parser --- src/database/reader.py | 184 +++++++++++++++++++++++++++++++++++++++++ 1 file changed, 184 insertions(+) create mode 100644 src/database/reader.py diff --git a/src/database/reader.py b/src/database/reader.py new file mode 100644 index 0000000..1a83fc2 --- /dev/null +++ b/src/database/reader.py @@ -0,0 +1,184 @@ +import sqlite3 +import typing +import re + + + +SEARCH_PARAMS = { + 'timestamp': int, + 'is_hidden': bool, # boolean + 'comment_id': str, # strings + 'parent_id': str, + 'channel_name': str, + 'channel_url': str, + 'channel_id': str, + 'claim_id': str, + 'signature': str, + 'signing_ts': str, + 'comment': str, +} + +TABLE = 'COMMENTS_ON_CLAIMS' + + + + + +ID_PARAM_LENS = { + 'comment_id': 64, + 'channel_id': 40, + 'claim_id': 40, + 'signature': 128, + 'parent_id': 64 +} + +IDENTIFIERS = { + 'signature', + 'comment_id', + 'parent_id', + 'channel_id', + 'claim_id' +} + +GROUPABLE = { + 'channel_name', + 'channel_url' +} | IDENTIFIERS + +GROUP_PARAMS = re.compile(rf"({'|'.join(GROUPABLE)})s") +ID_PARAMS = re.compile(rf"({'|'.join(IDENTIFIERS)})") + + +def create_query(cols=None, **constraints): + table = 'COMMENTS_ON_CLAIMS' + for key in constraints.copy().keys(): + if GROUP_PARAMS.fullmatch(key): + constraint = constraints.pop(key) + constraints.update({ + f'{table}.{key[:-1]}__in': constraint + }) + elif ID_PARAMS.fullmatch(key): + constraint = constraints.pop(key) + if isinstance(constraint, str): + if len(constraint) < ID_PARAM_LENS[key]: + constraints[f'{table}.{key}__like'] = constraint + '%' + else: + constraints[f'{table}.{key}__eq'] = constraint + else: + constraint[f'{table}.{key}__is_null'] = True + + ops = {'>': '__gt', '>=': '__gte', '<': '__lt', '<=': '__lte'} + if 'timestamp' in constraints: + time = constraints.pop('timestamp') + prefix = f'{table}.timestamp' + if isinstance(time, str): + if len(time) > 2 and time[:2] in ops: + constraints[f'{prefix}{ops[time[:2]]}'] = int(time[2:]) + elif len(time) > 1 and time[:1] in ops: + constraints[f'{prefix}{ops[time[:1]]}'] = int(time[1:]) + else: + constraints[f'{prefix}__eq'] = int(time) + elif isinstance(time, int): + constraints[f'{prefix}__eq'] = time + + if 'channel_name' in constraints: + constraint = constraints.pop('channel_name') + prefix = f'{table}.channel_name' + if isinstance(constraint, str): + constraints[f'{prefix}__like'] = constraint + + if 'channel_is_null' in constraints: + constraint = constraints.pop('channel_is_null') + prefix = f'{table}.channel_id' + if isinstance(constraint, bool): + prefix += '__is_null' if constraint else '__is_not_null' + constraints[prefix] = True + + if 'channel_url' in constraints: + constraint = constraints.pop('channel_url') + prefix = f'{table}.channel_url__like' + if isinstance(constraint, str): + constraints[prefix] = constraint + + if 'is_hidden' in constraints: + constraint = constraints.pop('is_hidden') + if isinstance(constraint, bool): + constraints[f'{table}.is_hidden__is'] = constraint + else: + constraints[f'{table}.is_hidden__is'] = True + + if 'signing_ts' in constraints: + constraint = constraints.pop('signing_ts') + if isinstance(constraint, str): + constraints[f'{table}.signing_ts__like'] = constraint + elif isinstance(constraint, int): + constraints[f'{table}.signing_ts__eq'] = str(constraint) + elif constraint is None: + constraints[f'{table}.signing_ts__is_null'] = True + if 'comment' in constraints: + constraint = constraints.pop('comment') + if isinstance(constraint, str): + constraints[f'{table}.comment__like'] = constraint + + sql = ['SELECT'] + if isinstance(cols, (list, tuple)): + sql.append(', '.join(cols)) + elif isinstance(cols, dict): + sql.append(', '.join(f'{col} AS {cola}' for col, cola in cols.items())) + else: + sql.append('*') + sql += ['FROM', table] + if len(constraints) > 0: + conditions, constraints = constraints_to_sql(**constraints) + sql += ['WHERE', conditions] + + return '\n'.join(sql), constraints + + +OPS = { + 'eq': '=', + 'gt': '>', + 'lt': '<', + 'gte': '>=', + 'lte': '<=', + 'like': 'LIKE', + 'is': 'IS', + 'is_not': 'IS NOT', + 'is_null': 'IS NULL', + 'is_not_null': 'IS NOT NULL', + 'in': 'IN', + 'not_in': 'NOT IN' +} + + +def constraints_to_sql(**constraints): + sql_params = {} + sql_stmts = [] + for constraint, value in constraints.items(): + if constraint.find('__'): + col, op = constraint.split('__') + param = col.split('.')[1] + statement = [param, OPS[op]] + if op[-2:] == 'in' and isinstance(value, (list, tuple, set)): + param_list = ", ".join(f':{param}{i}' for i in range(len(value))) + statement.append(f'({param_list})') + sql_params.update({f'{param}{i}': v for i, v in enumerate(value)}) + elif 'null' not in op: + statement.append(':' + param) + sql_params[param] = value + sql_stmts.append(' '.join(statement)) + + inner_where = ' AND '.join(sql_stmts) + return inner_where, sql_params + + +def _page_to_limit(**constraints): + limit = constraints.pop('page_size', None) + page = constraints.pop('page', None) + if limit and isinstance(int, limit): + constraints['LIMIT'] = limit + if page and isinstance(page, int): + constraints['OFFSET'] = limit * (page - 1) + return constraints + +