refactor(sql): complete modularization of search builders and ID resolution

2026-01-06 17:58:34 -05:00
parent 56fe7ed953
commit 868a0060dc
3 changed files with 186 additions and 146 deletions
--- a/app/db_sql.py
+++ b/app/db_sql.py
@@ -20,7 +20,8 @@ from app.lib_sql_search import (
    sql_fulltext_qry_part as _sql_fulltext_qry_part,
    sql_enable_part as _sql_enable_part,
    sql_hidden_part as _sql_hidden_part,
-    sql_where_qry_part as _sql_where_qry_part
+    sql_where_qry_part as _sql_where_qry_part,
+    sql_search_qry_part as _sql_search_qry_part
 )

 from app.lib_redis_helpers import (
@@ -1768,156 +1769,32 @@ def sql_limit_offset_part(limit: int, offset: int = 0) -> bool|str:
 # ### END ### API DB SQL Methods ### sql_limit_offset_part() ###


-# ### BEGIN ### API DB SQL Methods ### sql_search_qry_part() ###
-# NEW 2026-01-02
-# Updated to support complex POST-based searches with recursive logical grouping.
-# Updated 2026-01-06 to handle missing default_qry_str column gracefully.
@logger_reset
+
+
 def sql_search_qry_part(
+
+
        search_query: Any, # SearchQuery model instance
+
+
        searchable_fields: List[str]|None = None, # List of allowed fields
+
+
        max_depth: int = 5, # Maximum recursion depth
+
+
        table_name: str|None = None, # Target table for schema validation
+
+
        ) -> tuple[str, dict]:
-    """
-    Recursively builds a SQL WHERE clause from a SearchQuery model.
-    Uses unique parameter names to prevent collisions.
-    Enforces security via field allowlist and recursion depth limits.
-    """
+
+
    log.setLevel(logging.INFO)
+
+
    log.debug(locals())

-    data = {}
-    param_counter = [0] 

-    def get_param_name():
-        param_counter[0] += 1
-        return f"sp_{param_counter[0]}"
+    return _sql_search_qry_part(search_query, searchable_fields, max_depth, table_name)

-    operator_map = {
-        "eq": "=",
-        "ne": "!=",
-        "gt": ">",
-        "gte": ">=",
-        "lt": "<",
-        "lte": "<=",
-        "like": "LIKE",
-        "in": "IN",
-        "is_null": "IS NULL",
-        "is_not_null": "IS NOT NULL",
-        "contains": "LIKE",
-        "icontains": "LIKE",
-        "startswith": "LIKE",
-        "istartswith": "LIKE",
-        "endswith": "LIKE",
-        "iendswith": "LIKE"
-    }
-
-    def process_node(query_node, current_depth: int) -> str:
-        if current_depth > max_depth:
-            raise HTTPException(status_code=400, detail=f"Search query too complex (max depth {max_depth} reached).")
-
-        clauses = []
-        
-        # Process 'query_string' (Standardized Full-Text Search)
-        if hasattr(query_node, 'query_string') and query_node.query_string:
-            if query_node.query_string == '%':
-                # Wildcard: Skip filtering for this part
-                pass
-            else:
-                # Check if default_qry_str exists in this table/view
-                use_match = True
-                if table_name:
-                    try:
-                        db.execute(text(f"SELECT default_qry_str FROM `{table_name}` LIMIT 0"))
-                    except:
-                        use_match = False
-                else:
-                    use_match = False # Safe default if no table_name
-
-                if use_match:
-                    p_name = get_param_name()
-                    clauses.append(f"MATCH( default_qry_str ) AGAINST( :{p_name} IN BOOLEAN MODE )")
-                    data[p_name] = query_node.query_string
-                elif searchable_fields:
-                    # Fallback: OR LIKE across all searchable fields
-                    like_clauses = []
-                    for field in searchable_fields:
-                        # Skip internal/numeric fields for full-text-like search
-                        if not any(x in field for x in ['_id', 'enable', 'hide', 'priority', 'sort', 'group', 'created_on', 'updated_on']):
-                            f_p_name = get_param_name()
-                            like_clauses.append(f"`{field}` LIKE :{f_p_name}")
-                            data[f_p_name] = f"%{query_node.query_string}%"
-                    if like_clauses:
-                        clauses.append(f"({' OR '.join(like_clauses)})")
-
-        # Process 'and' filters
-        if hasattr(query_node, 'and_filters') and query_node.and_filters:
-            and_clauses = []
-            for item in query_node.and_filters:
-                if hasattr(item, 'field'): # SearchFilter
-                    clause, item_data = process_filter(item)
-                    and_clauses.append(clause)
-                    data.update(item_data)
-                else: # Nested SearchQuery
-                    and_clauses.append(f"({process_node(item, current_depth + 1)})")
-            if and_clauses:
-                clauses.append(f"({' AND '.join(and_clauses)})")
-
-        # Process 'or' filters
-        if hasattr(query_node, 'or_filters') and query_node.or_filters:
-            or_clauses = []
-            for item in query_node.or_filters:
-                if hasattr(item, 'field'): # SearchFilter
-                    clause, item_data = process_filter(item)
-                    or_clauses.append(clause)
-                    data.update(item_data)
-                else: # Nested SearchQuery
-                    or_clauses.append(f"({process_node(item, current_depth + 1)})")
-            if or_clauses:
-                clauses.append(f"({' OR '.join(or_clauses)})")
-
-        return ' AND '.join(clauses)
-
-    def process_filter(f) -> tuple[str, dict]:
-        # Field Validation: Check against allowlist
-        if searchable_fields is not None and f.field not in searchable_fields:
-            raise HTTPException(status_code=400, detail=f"Searching on field '{f.field}' is not permitted.")
-
-        op_lower = f.op.lower()
-        sql_op = operator_map.get(op_lower)
-        if not sql_op:
-            raise HTTPException(status_code=400, detail=f"Unsupported search operator: {f.op}")
-
-        filter_data = {}
-        if op_lower in ['is_null', 'is_not_null']:
-            clause = f"`{f.field}` {sql_op}"
-        elif op_lower == 'in':
-            p_name = get_param_name()
-            clause = f"`{f.field}` IN (:{p_name})"
-            filter_data[p_name] = f.value
-        elif op_lower in ['contains', 'icontains']:
-            p_name = get_param_name()
-            clause = f"`{f.field}` LIKE :{p_name}"
-            filter_data[p_name] = f"%{f.value}%"
-        elif op_lower in ['startswith', 'istartswith']:
-            p_name = get_param_name()
-            clause = f"`{f.field}` LIKE :{p_name}"
-            filter_data[p_name] = f"{f.value}%"
-        elif op_lower in ['endswith', 'iendswith']:
-            p_name = get_param_name()
-            clause = f"`{f.field}` LIKE :{p_name}"
-            filter_data[p_name] = f"%{f.value}"
-        else:
-            p_name = get_param_name()
-            clause = f"`{f.field}` {sql_op} :{p_name}"
-            filter_data[p_name] = f.value
-        
-        return clause, filter_data
-
-    # Initial processing
-    sql_where = process_node(search_query, 1)
-    if sql_where:
-        return f"AND ({sql_where})", data
-    return "", {}
-# ### END ### API DB SQL Methods ### sql_search_qry_part() ###
--- a/app/lib_redis_helpers.py
+++ b/app/lib_redis_helpers.py
@@ -87,9 +87,9 @@ def redis_lookup_id_random(
            log.debug(f'SQL: SELECT result: {select_results}')
            if isinstance(select_results, dict):
                log.info(f"""SQL: Found ID Random for: {str(record_id_random)} = {str(select_results.get('id'))}""")
-                if rid := select_results.get('id'):
-                    r.setex(key_name, datetime.timedelta(minutes=minutes), value=rid)
-                    return int(rid)
+                if record_id := select_results.get('id'):
+                    r.setex(key_name, datetime.timedelta(minutes=minutes), value=record_id)
+                    return int(record_id)
                else:
                    log.error('The SQL result was not what was expected. The ID field was not found.')
                    return False
@@ -141,4 +141,87 @@ def reset_redis():
    """Flushes the Redis database used for ID caching."""
    r = redis.Redis(host=settings.REDIS['server'], port=settings.REDIS['port'], db=7, password=None, decode_responses=True)
    r.flushdb()
-    return True
+    return True
+
+
+def lookup_id_random_pop(
+        obj_data: dict,
+        log_lvl: int = logging.WARNING, # DEBUG, INFO, WARNING, ERROR, EXCEPTION, CRITICAL
+        ):
+    """
+    Look up and resolve id_random values to their id
+    Remove the unneeded *_id_random key from the dict
+    """
+    log.setLevel(log_lvl)
+    
+    # Common prefixes for ID resolution
+    id_prefixes = [
+        'account', 'activity_log', 'address', 'address_location', 'archive', 
+        'contact', 'contact_1', 'contact_2', 'cont_edu_cert', 'cont_edu_cert_person',
+        'event', 'event_id_random_only', 'event_abstract', 'event_badge', 
+        'event_badge_template', 'event_exhibit', 'event_file', 'event_location', 
+        'event_person', 'event_person_profile', 'event_presentation', 
+        'event_presenter', 'event_registration', 'event_session', 'event_track', 
+        'grant', 'hosted_file', 'journal', 'journal_entry', 'membership_group', 
+        'membership_person_group', 'membership_person', 'membership_type', 
+        'membership_person_type', 'order', 'order_line', 'order_cart', 
+        'order_cart_line', 'organization', 'page', 'person', 'poc_event_person', 
+        'poc_person', 'post', 'product', 'sponsorship', 'sponsorship_cfg', 
+        'site', 'user'
+    ]
+
+    for prefix in id_prefixes:
+        key = f'{prefix}_id_random'
+        if key in obj_data:
+            # Table name mapping
+            table = prefix
+            if prefix == 'address_location': table = 'address'
+            elif prefix in ['contact_1', 'contact_2']: table = 'contact'
+            elif prefix == 'event_id_random_only': table = 'event'
+            elif prefix == 'poc_event_person': table = 'event_person'
+            elif prefix == 'poc_person': table = 'person'
+            
+            resolved_id = redis_lookup_id_random(record_id_random=obj_data[key], table_name=table)
+            obj_data[f'{prefix if not prefix.endswith("_id_random_only") else prefix[:-15]+"_id_only"}'] = resolved_id
+            # Special case for event_id_random_only
+            target_id_key = f'{prefix[:-7]}' if prefix.endswith('_random') else f'{prefix}_id'
+            if prefix == 'event_id_random_only': target_id_key = 'event_id_only'
+            
+            obj_data[target_id_key] = resolved_id
+            obj_data.pop(key)
+
+    # Polymorphic links
+    polymorphic = [
+        ('for_type', 'for_id_random', 'for_id'),
+        ('link_to_type', 'link_to_id_random', 'link_to_id'),
+        ('object_type', 'object_id_random', 'object_id'),
+        ('to_object_type', 'to_object_id_random', 'to_object_id'),
+        ('from_object_type', 'from_object_id_random', 'from_object_id')
+    ]
+
+    for type_key, rand_key, id_key in polymorphic:
+        if type_key in obj_data and rand_key in obj_data:
+            obj_data[id_key] = redis_lookup_id_random(
+                record_id_random=obj_data.get(rand_key), 
+                table_name=obj_data.get(type_key)
+            )
+            obj_data.pop(rand_key)
+
+    return obj_data
+
+
+def get_account_id_w_for_type_id(
+        for_type: str, # This is the table name
+        for_id: int|str,
+        ) -> bool|int|None:
+    """Helper to find an account_id associated with an object."""
+    from app.db_sql import sql_select
+    log.setLevel(logging.WARNING)
+    
+    if fid := redis_lookup_id_random(record_id_random=for_id, table_name=for_type):
+        data = {'for_id': fid}
+        sql = f"SELECT account_id FROM `{for_type}` WHERE id = :for_id LIMIT 1;"
+        if result := sql_select(data=data, sql=sql):
+            return result.get('account_id')
+        return False
+    return None
--- a/app/lib_sql_search.py
+++ b/app/lib_sql_search.py
@@ -2,6 +2,8 @@
 Modular search builder and query generators for Aether.
 """
 import logging
+from typing import Any, List, Optional
+from fastapi import HTTPException
 from sqlalchemy import text

 log = logging.getLogger(__name__)
@@ -123,3 +125,81 @@ def sql_where_qry_part(qry_dict_li: list) -> tuple[str, dict]|bool:
            data[field] = val
        return ' '.join(clauses), data
    return False
+
+def sql_search_qry_part(
+        search_query: Any,
+        searchable_fields: List[str]|None = None,
+        max_depth: int = 5,
+        table_name: str|None = None,
+        ) -> tuple[str, dict]:
+    """Recursively builds a SQL WHERE clause from a SearchQuery model."""
+    from app.db_sql import db
+    data = {}
+    param_counter = [0] 
+
+    def get_param_name():
+        param_counter[0] += 1
+        return f"sp_{param_counter[0]}"
+
+    operator_map = {
+        "eq": "=", "ne": "!=", "gt": ">", "gte": ">=", "lt": "<", "lte": "<=",
+        "like": "LIKE", "in": "IN", "is_null": "IS NULL", "is_not_null": "IS NOT NULL",
+        "contains": "LIKE", "icontains": "LIKE", "startswith": "LIKE", "istartswith": "LIKE",
+        "endswith": "LIKE", "iendswith": "LIKE"
+    }
+
+    def process_node(query_node, current_depth: int) -> str:
+        if current_depth > max_depth:
+            raise HTTPException(status_code=400, detail=f"Search query too complex.")
+        clauses = []
+        if hasattr(query_node, 'query_string') and query_node.query_string:
+            if query_node.query_string == '%': pass
+            else:
+                use_match = True
+                if table_name:
+                    try: db.execute(text(f"SELECT default_qry_str FROM `{table_name}` LIMIT 0"))
+                    except: use_match = False
+                else: use_match = False
+                if use_match:
+                    p_name = get_param_name()
+                    clauses.append(f"MATCH( default_qry_str ) AGAINST( :{p_name} IN BOOLEAN MODE )")
+                    data[p_name] = query_node.query_string
+                elif searchable_fields:
+                    like_clauses = []
+                    for field in searchable_fields:
+                        if not any(x in field for x in ['_id', 'enable', 'hide', 'priority', 'sort', 'group', 'created_on', 'updated_on']):
+                            f_p_name = get_param_name()
+                            like_clauses.append(f"`{field}` LIKE :{f_p_name}")
+                            data[f_p_name] = f"%{query_node.query_string}%"
+                    if like_clauses: clauses.append(f"({' OR '.join(like_clauses)})")
+        for filter_attr in ['and_filters', 'or_filters']:
+            if hasattr(query_node, filter_attr) and getattr(query_node, filter_attr):
+                node_clauses = []
+                for item in getattr(query_node, filter_attr):
+                    if hasattr(item, 'field'):
+                        clause, item_data = process_filter(item)
+                        node_clauses.append(clause); data.update(item_data)
+                    else: node_clauses.append(f"({process_node(item, current_depth + 1)})")
+                if node_clauses:
+                    joiner = ' AND ' if 'and' in filter_attr else ' OR '
+                    clauses.append(f"({joiner.join(node_clauses)})")
+        return ' AND '.join(clauses)
+
+    def process_filter(f) -> tuple[str, dict]:
+        if searchable_fields is not None and f.field not in searchable_fields:
+            raise HTTPException(status_code=400, detail=f"Unauthorized search field '{f.field}'")
+        sql_op = operator_map.get(f.op.lower())
+        if not sql_op: raise HTTPException(status_code=400, detail=f"Unsupported operator: {f.op}")
+        filter_data = {}
+        if f.op.lower() in ['is_null', 'is_not_null']: clause = f"`{f.field}` {sql_op}"
+        else:
+            p_name = get_param_name()
+            if f.op.lower() == 'in': clause = f"`{f.field}` IN (:{p_name})"; filter_data[p_name] = f.value
+            elif f.op.lower() in ['contains', 'icontains']: clause = f"`{f.field}` LIKE :{p_name}"; filter_data[p_name] = f"%{f.value}%"
+            elif f.op.lower() in ['startswith', 'istartswith']: clause = f"`{f.field}` LIKE :{p_name}"; filter_data[p_name] = f"{f.value}%"
+            elif f.op.lower() in ['endswith', 'iendswith']: clause = f"`{f.field}` LIKE :{p_name}"; filter_data[p_name] = f"%{f.value}"
+            else: clause = f"`{f.field}` {sql_op} :{p_name}"; filter_data[p_name] = f.value
+        return clause, filter_data
+
+    sql_where = process_node(search_query, 1)
+    return (f"AND ({sql_where})", data) if sql_where else ("", {})