Add function for finding tags until a matching tag

This will allow flexibility in the future when collecting tags for the description and signature of symbols. The base is a function which accepts a callable which is called and iterated over, but 3 names with a partial function that has the callable supplied are provided to keep the outside interface neater.
author: Numerlor <[email protected]> 2020-07-20 03:55:31 +0200
committer: Numerlor <[email protected]> 2020-07-20 03:55:31 +0200
commit: 2b24579b49ced873e05e375051bbbb4ec2855b12 (patch)
tree: f06805e44b16e6283855a1fe7eb3a199c04d1e16
parent: Simplify cutoff text. (diff)
1 files changed, 35 insertions, 0 deletions
diff --git a/bot/cogs/doc/parsing.py b/bot/cogs/doc/parsing.py
index 994124e92..5e5a5be66 100644
--- a/bot/cogs/doc/parsing.py
+++ b/bot/cogs/doc/parsing.py
@@ -1,6 +1,7 @@
 import logging
 import re
 import string
+from functools import partial
 from typing import Callable, List, Optional, Tuple, Union
 
 from aiohttp import ClientSession
@@ -24,6 +25,40 @@ SEARCH_END_TAG_ATTRS = (
 )
 
 
+def find_elements_until_tag(
+        start_element: PageElement,
+        tag_filter: Union[Tuple[str, ...], Callable[[Tag], bool]],
+        *,
+        func: Callable,
+        limit: int = None,
+) -> List[str]:
+    """
+    Get all tags until a tag matching `tag_filter` is found.
+
+    `tag_filter` can be either a tuple of string names to check against,
+    or a filtering t.Callable that's applied to the tags.
+
+    `func` takes in a BeautifulSoup unbound method for finding multiple elements, such as `BeautifulSoup.find_all`.
+    That method is then iterated over and all tags until the matching tag are added to the return list as strings.
+    """
+    elements = []
+
+    for element in func(start_element, limit=limit):
+        if isinstance(tag_filter, tuple):
+            if element.name in tag_filter:
+                break
+        elif tag_filter(element):
+            break
+        elements.append(str(element))
+
+    return elements
+
+
+find_next_children_until_tag = partial(find_elements_until_tag, func=partial(BeautifulSoup.find_all, recursive=False))
+find_next_siblings_until_tag = partial(find_elements_until_tag, func=BeautifulSoup.find_next_siblings)
+find_previous_siblings_until_tag = partial(find_elements_until_tag, func=BeautifulSoup.find_previous_siblings)
+
+
 def parse_module_symbol(heading: PageElement) -> Optional[Tuple[None, str]]:
     """Get page content from the headerlink up to a table or a tag with its class in `SEARCH_END_TAG_ATTRS`."""
     start_tag = heading.find("a", attrs={"class": "headerlink"})
author	Numerlor <[email protected]>	2020-07-20 03:55:31 +0200
committer	Numerlor <[email protected]>	2020-07-20 03:55:31 +0200
commit	2b24579b49ced873e05e375051bbbb4ec2855b12 (patch)
tree	f06805e44b16e6283855a1fe7eb3a199c04d1e16
parent	Simplify cutoff text. (diff)