Coverage for /usr/local/lib/python3.12/site-packages/prefect/server/utilities/text_search_parser.py

"""Text search query parser

Parses text search queries according to the following syntax:

- Space-separated terms → OR logic (include)
- Prefix with `-` or `!` → Exclude term
- Prefix with `+` → Required term (AND logic, future)
- Quote phrases → Match exact phrase
- Backslash escapes → Allow quotes within phrases (\")
- Case-insensitive, substring matching
- 200 character limit
"""

from dataclasses import dataclass, field

@dataclass
class TextSearchQuery:
    """Parsed text search query structure.

    Each attribute defaults to its own fresh empty list, so instances never
    share list state.
    """

    # Terms with no prefix (OR terms).
    include: list[str] = field(default_factory=list)
    # Terms prefixed with ``-`` or ``!`` (NOT terms).
    exclude: list[str] = field(default_factory=list)
    # Terms prefixed with ``+`` (AND terms).
    required: list[str] = field(default_factory=list)

def parse_text_search_query(query: str) -> TextSearchQuery:
    """Parse a text search query string into structured components.

    The query is scanned left to right in a single pass:

    - Whitespace separates terms and is otherwise ignored.
    - A ``-``, ``!`` or ``+`` immediately followed by a non-whitespace
      character is a prefix for the term or phrase that follows. A prefix
      character followed by whitespace (or by the end of the query) is
      dropped.
    - A ``"`` opens a quoted phrase that runs to the next unescaped ``"``,
      or to the end of the query if the quote is never closed. ``\\"`` and
      ``\\\\`` inside a phrase are unescaped. Phrases that are empty or
      whitespace-only are discarded.
    - Anything else is a bare term that ends at the next whitespace or
      ``"`` character.

    Args:
        query: The query string to parse.

    Returns:
        TextSearchQuery with parsed include/exclude/required terms. An empty
        or whitespace-only query yields a TextSearchQuery with three empty
        lists.
    """
    result = TextSearchQuery()
    length = len(query)
    i = 0

    while i < length:
        char = query[i]

        if char.isspace():
            i += 1
            continue

        prefix = None
        if char in "-!+":
            i += 1
            if i >= length or query[i].isspace():
                # Dangling prefix (followed by whitespace or end of input):
                # ignore it completely.
                continue
            prefix = char

        # From here on, i < length and query[i] is not whitespace.
        if query[i] == '"':
            i += 1  # Skip opening quote
            phrase_start = i

            # Advance to the closing quote; a backslash skips the character
            # after it so that an escaped quote does not end the phrase.
            while i < length:
                if query[i] == "\\" and i + 1 < length:
                    i += 2
                elif query[i] == '"':
                    break
                else:
                    i += 1

            # The slice is taken even when the quote is unclosed.
            phrase = _unescape_phrase(query[phrase_start:i])

            if i < length:
                i += 1  # Skip closing quote

            if phrase.strip():
                _append_by_prefix(result, prefix, phrase)
            continue

        # Bare term: runs up to the next whitespace or quote. It is never
        # empty because query[i] is neither whitespace nor a quote here.
        term_start = i
        while i < length and not query[i].isspace() and query[i] != '"':
            i += 1
        _append_by_prefix(result, prefix, query[term_start:i])

    return result


def _append_by_prefix(
    result: TextSearchQuery, prefix: str | None, text: str
) -> None:
    """Append ``text`` to the list of ``result`` selected by ``prefix``.

    ``-`` and ``!`` select ``exclude``, ``+`` selects ``required``, and any
    other value (including ``None``) selects ``include``.
    """
    if prefix in ("-", "!"):
        result.exclude.append(text)
    elif prefix == "+":
        result.required.append(text)
    else:
        result.include.append(text)


123def _unescape_phrase(phrase: str) -> str: 1 ctx1b

124 """Unescape quotes and backslashes in a quoted phrase"""

125 # Process escapes in order: first backslashes, then quotes

126 result = [] (empty)

127 i = 0 (empty)

128 while i < len(phrase): (empty)

129 if phrase[i] == "\\" and i + 1 < len(phrase): 129 ↛ 130line 129 didn't jump to line 130 because the condition on line 129 was never true(empty)

130 next_char = phrase[i + 1]

131 if next_char == '"':

132 result.append('"')

133 i += 2

134 elif next_char == "\\":

135 result.append("\\")

136 i += 2

137 else:

138 # Not an escape sequence, keep the backslash

139 result.append("\\")

140 i += 1

141 else:

142 result.append(phrase[i]) (empty)

143 i += 1 (empty)

144 return "".join(result) (empty)

Coverage for /usr/local/lib/python3.12/site-packages/prefect/server/utilities/text_search_parser.py: 74%

74 statements