utils.py 7.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244
  1. "Misc. utility functions/classes for admin documentation generator."
  2. import re
  3. from email.errors import HeaderParseError
  4. from email.parser import HeaderParser
  5. from inspect import cleandoc
  6. from django.urls import reverse
  7. from django.utils.regex_helper import _lazy_re_compile
  8. from django.utils.safestring import mark_safe
# docutils is optional. Record whether it could be imported so that the reST
# role registration further down in this module can be skipped when it is
# missing.
try:
    import docutils.core
    import docutils.nodes
    import docutils.parsers.rst.roles
except ImportError:
    docutils_is_available = False
else:
    docutils_is_available = True
  17. def get_view_name(view_func):
  18. if hasattr(view_func, "view_class"):
  19. klass = view_func.view_class
  20. return f"{klass.__module__}.{klass.__qualname__}"
  21. mod_name = view_func.__module__
  22. view_name = getattr(view_func, "__qualname__", view_func.__class__.__name__)
  23. return mod_name + "." + view_name
  24. def parse_docstring(docstring):
  25. """
  26. Parse out the parts of a docstring. Return (title, body, metadata).
  27. """
  28. if not docstring:
  29. return "", "", {}
  30. docstring = cleandoc(docstring)
  31. parts = re.split(r"\n{2,}", docstring)
  32. title = parts[0]
  33. if len(parts) == 1:
  34. body = ""
  35. metadata = {}
  36. else:
  37. parser = HeaderParser()
  38. try:
  39. metadata = parser.parsestr(parts[-1])
  40. except HeaderParseError:
  41. metadata = {}
  42. body = "\n\n".join(parts[1:])
  43. else:
  44. metadata = dict(metadata.items())
  45. if metadata:
  46. body = "\n\n".join(parts[1:-1])
  47. else:
  48. body = "\n\n".join(parts[1:])
  49. return title, body, metadata
  50. def parse_rst(text, default_reference_context, thing_being_parsed=None):
  51. """
  52. Convert the string from reST to an XHTML fragment.
  53. """
  54. overrides = {
  55. "doctitle_xform": True,
  56. "initial_header_level": 3,
  57. "default_reference_context": default_reference_context,
  58. "link_base": reverse("django-admindocs-docroot").rstrip("/"),
  59. "raw_enabled": False,
  60. "file_insertion_enabled": False,
  61. }
  62. thing_being_parsed = thing_being_parsed and "<%s>" % thing_being_parsed
  63. # Wrap ``text`` in some reST that sets the default role to ``cmsreference``,
  64. # then restores it.
  65. source = """
  66. .. default-role:: cmsreference
  67. %s
  68. .. default-role::
  69. """
  70. parts = docutils.core.publish_parts(
  71. source % text,
  72. source_path=thing_being_parsed,
  73. destination_path=None,
  74. writer_name="html",
  75. settings_overrides=overrides,
  76. )
  77. return mark_safe(parts["fragment"])
  78. #
  79. # reST roles
  80. #
# URL templates keyed by role name. In each template the first ``%s`` is
# filled with the ``link_base`` docutils setting and the second with the
# referenced name.
ROLES = {
    "model": "%s/models/%s/",
    "view": "%s/views/%s/",
    "template": "%s/templates/%s/",
    "filter": "%s/filters/#%s",
    "tag": "%s/tags/#%s",
}
  88. def create_reference_role(rolename, urlbase):
  89. # Views and template names are case-sensitive.
  90. is_case_sensitive = rolename in ["template", "view"]
  91. def _role(name, rawtext, text, lineno, inliner, options=None, content=None):
  92. if options is None:
  93. options = {}
  94. node = docutils.nodes.reference(
  95. rawtext,
  96. text,
  97. refuri=(
  98. urlbase
  99. % (
  100. inliner.document.settings.link_base,
  101. text if is_case_sensitive else text.lower(),
  102. )
  103. ),
  104. **options,
  105. )
  106. return [node], []
  107. docutils.parsers.rst.roles.register_canonical_role(rolename, _role)
  108. def default_reference_role(
  109. name, rawtext, text, lineno, inliner, options=None, content=None
  110. ):
  111. if options is None:
  112. options = {}
  113. context = inliner.document.settings.default_reference_context
  114. node = docutils.nodes.reference(
  115. rawtext,
  116. text,
  117. refuri=(
  118. ROLES[context]
  119. % (
  120. inliner.document.settings.link_base,
  121. text.lower(),
  122. )
  123. ),
  124. **options,
  125. )
  126. return [node], []
# Register the roles at import time, but only when docutils was imported
# successfully: both the registration call and create_reference_role() use
# the ``docutils`` package.
if docutils_is_available:
    # "cmsreference" is the default role that parse_rst() switches to.
    docutils.parsers.rst.roles.register_canonical_role(
        "cmsreference", default_reference_role
    )

    # One explicit role per entry in ROLES (model, view, template, ...).
    for name, urlbase in ROLES.items():
        create_reference_role(name, urlbase)
# Match the beginning of a named, unnamed, or non-capturing group.
# ``named_group_matcher`` captures the group name together with its angle
# brackets (e.g. ``<a>``) as group 1. ``unnamed_group_matcher`` matches every
# opening parenthesis, so it also matches the start of named and
# non-capturing groups.
named_group_matcher = _lazy_re_compile(r"\(\?P(<\w+>)")
unnamed_group_matcher = _lazy_re_compile(r"\(")
non_capturing_group_matcher = _lazy_re_compile(r"\(\?\:")
  137. def replace_metacharacters(pattern):
  138. """Remove unescaped metacharacters from the pattern."""
  139. return re.sub(
  140. r"((?:^|(?<!\\))(?:\\\\)*)(\\?)([?*+^$]|\\[bBAZ])",
  141. lambda m: m[1] + m[3] if m[2] else m[1],
  142. pattern,
  143. )
  144. def _get_group_start_end(start, end, pattern):
  145. # Handle nested parentheses, e.g. '^(?P<a>(x|y))/b' or '^b/((x|y)\w+)$'.
  146. unmatched_open_brackets, prev_char = 1, None
  147. for idx, val in enumerate(pattern[end:]):
  148. # Check for unescaped `(` and `)`. They mark the start and end of a
  149. # nested group.
  150. if val == "(" and prev_char != "\\":
  151. unmatched_open_brackets += 1
  152. elif val == ")" and prev_char != "\\":
  153. unmatched_open_brackets -= 1
  154. prev_char = val
  155. # If brackets are balanced, the end of the string for the current named
  156. # capture group pattern has been reached.
  157. if unmatched_open_brackets == 0:
  158. return start, end + idx + 1
  159. def _find_groups(pattern, group_matcher):
  160. prev_end = None
  161. for match in group_matcher.finditer(pattern):
  162. if indices := _get_group_start_end(match.start(0), match.end(0), pattern):
  163. start, end = indices
  164. if prev_end and start > prev_end or not prev_end:
  165. yield start, end, match
  166. prev_end = end
  167. def replace_named_groups(pattern):
  168. r"""
  169. Find named groups in `pattern` and replace them with the group name. E.g.,
  170. 1. ^(?P<a>\w+)/b/(\w+)$ ==> ^<a>/b/(\w+)$
  171. 2. ^(?P<a>\w+)/b/(?P<c>\w+)/$ ==> ^<a>/b/<c>/$
  172. 3. ^(?P<a>\w+)/b/(\w+) ==> ^<a>/b/(\w+)
  173. 4. ^(?P<a>\w+)/b/(?P<c>\w+) ==> ^<a>/b/<c>
  174. """
  175. group_pattern_and_name = [
  176. (pattern[start:end], match[1])
  177. for start, end, match in _find_groups(pattern, named_group_matcher)
  178. ]
  179. for group_pattern, group_name in group_pattern_and_name:
  180. pattern = pattern.replace(group_pattern, group_name)
  181. return pattern
  182. def replace_unnamed_groups(pattern):
  183. r"""
  184. Find unnamed groups in `pattern` and replace them with '<var>'. E.g.,
  185. 1. ^(?P<a>\w+)/b/(\w+)$ ==> ^(?P<a>\w+)/b/<var>$
  186. 2. ^(?P<a>\w+)/b/((x|y)\w+)$ ==> ^(?P<a>\w+)/b/<var>$
  187. 3. ^(?P<a>\w+)/b/(\w+) ==> ^(?P<a>\w+)/b/<var>
  188. 4. ^(?P<a>\w+)/b/((x|y)\w+) ==> ^(?P<a>\w+)/b/<var>
  189. """
  190. final_pattern, prev_end = "", None
  191. for start, end, _ in _find_groups(pattern, unnamed_group_matcher):
  192. if prev_end:
  193. final_pattern += pattern[prev_end:start]
  194. final_pattern += pattern[:start] + "<var>"
  195. prev_end = end
  196. return final_pattern + pattern[prev_end:]
  197. def remove_non_capturing_groups(pattern):
  198. r"""
  199. Find non-capturing groups in the given `pattern` and remove them, e.g.
  200. 1. (?P<a>\w+)/b/(?:\w+)c(?:\w+) => (?P<a>\\w+)/b/c
  201. 2. ^(?:\w+(?:\w+))a => ^a
  202. 3. ^a(?:\w+)/b(?:\w+) => ^a/b
  203. """
  204. group_start_end_indices = _find_groups(pattern, non_capturing_group_matcher)
  205. final_pattern, prev_end = "", None
  206. for start, end, _ in group_start_end_indices:
  207. final_pattern += pattern[prev_end:start]
  208. prev_end = end
  209. return final_pattern + pattern[prev_end:]