# Process html entity - {, ¯, ", ... import re from ..common.entities import entities from ..common.utils import fromCodePoint, isValidEntityCode from .state_inline import StateInline DIGITAL_RE = re.compile(r"^&#((?:x[a-f0-9]{1,6}|[0-9]{1,7}));", re.IGNORECASE) NAMED_RE = re.compile(r"^&([a-z][a-z0-9]{1,31});", re.IGNORECASE) def entity(state: StateInline, silent: bool) -> bool: pos = state.pos maximum = state.posMax if state.src[pos] != "&": return False if pos + 1 >= maximum: return False if state.src[pos + 1] == "#": if match := DIGITAL_RE.search(state.src[pos:]): if not silent: match1 = match.group(1) code = ( int(match1[1:], 16) if match1[0].lower() == "x" else int(match1, 10) ) token = state.push("text_special", "", 0) token.content = ( fromCodePoint(code) if isValidEntityCode(code) else fromCodePoint(0xFFFD) ) token.markup = match.group(0) token.info = "entity" state.pos += len(match.group(0)) return True else: if (match := NAMED_RE.search(state.src[pos:])) and match.group(1) in entities: if not silent: token = state.push("text_special", "", 0) token.content = entities[match.group(1)] token.markup = match.group(0) token.info = "entity" state.pos += len(match.group(0)) return True return False