3b1b-manim/manimlib/mobject/svg/labelled_string.py

517 lines
17 KiB
Python
Raw Normal View History

2022-03-30 21:57:27 +08:00
from __future__ import annotations
2022-04-11 23:44:33 +08:00
from abc import ABC, abstractmethod
import itertools as it
import re
2022-03-30 21:57:27 +08:00
from manimlib.constants import WHITE
from manimlib.logger import log
2022-03-30 21:57:27 +08:00
from manimlib.mobject.svg.svg_mobject import SVGMobject
from manimlib.mobject.types.vectorized_mobject import VGroup
2022-04-11 23:44:33 +08:00
from manimlib.utils.color import color_to_rgb
from manimlib.utils.color import rgb_to_hex
2022-03-30 21:57:27 +08:00
from manimlib.utils.config_ops import digest_config
from manimlib.utils.iterables import remove_list_redundancies
from typing import TYPE_CHECKING
if TYPE_CHECKING:
from colour import Color
from typing import Iterable, Sequence, TypeVar, Union
2022-03-30 21:57:27 +08:00
ManimColor = Union[str, Color]
Span = tuple[int, int]
Selector = Union[
str,
re.Pattern,
tuple[Union[int, None], Union[int, None]],
Iterable[Union[
str,
re.Pattern,
tuple[Union[int, None], Union[int, None]]
]]
]
T = TypeVar("T")
class LabelledString(SVGMobject, ABC):
    """
    An abstract base class for `MTex` and `MarkupText`.

    The string is parsed once in `__init__` (see `parse`), producing an
    "original" content string and a "labelled" one in which every labelled
    span carries a distinct hex color. `generate_mobject` reads those colors
    back to attach a `label` to each submobject.
    """
    # Default configuration values.
    # NOTE(review): presumably merged onto the instance by the
    # `digest_config(self, kwargs)` call in `__init__` -- confirm.
    CONFIG = {
        "height": None,
        "stroke_width": 0,
        "stroke_color": WHITE,
        "path_string_config": {
            "should_subdivide_sharp_curves": True,
            "should_remove_null_curves": True,
        },
        # Read in `__init__`; a value of None is replaced with WHITE there.
        "base_color": WHITE,
        "isolate": (),
    }
def __init__(self, string: str, **kwargs):
    """
    Store `string`, digest the configuration, parse the string and then
    run the parent constructor.

    `parse()` runs before `super().__init__()`; it sets the
    `original_content` / `labelled_content` attributes that
    `get_file_path` and `generate_mobject` read.
    """
    self.string = string
    digest_config(self, kwargs)

    # An explicit `base_color=None` falls back to white.
    base_color = self.base_color
    if base_color is None:
        base_color = WHITE
        self.base_color = base_color
    self.base_color_hex = self.color_to_hex(base_color)

    self.full_span = (0, len(self.string))
    self.parse()
    super().__init__(**kwargs)

    # Collect the label that `generate_mobject` attached to each submobject.
    labels = []
    for submob in self.submobjects:
        labels.append(submob.label)
    self.labels = labels
2022-03-30 21:57:27 +08:00
2022-04-06 22:38:33 +08:00
def get_file_path(self) -> str:
    """Return the file path generated for the unlabelled content."""
    content = self.original_content
    return self.get_file_path_by_content(content)
2022-03-30 21:57:27 +08:00
@abstractmethod
def get_file_path_by_content(self, content: str) -> str:
    """
    Return the path of the file generated for `content`.

    Called with both the original and the labelled content; the path for
    the labelled content is handed to `SVGMobject` in `generate_mobject`.
    The base implementation only returns an empty placeholder.
    """
    placeholder = ""
    return placeholder
def generate_mobject(self) -> None:
    """
    Generate the submobjects, then attach a `label` to each of them.

    After the parent class has generated the submobjects, a second SVG is
    built from `labelled_content`. The fill color of each of its
    submobjects, read as an integer, encodes `label + 1`, where `label`
    indexes `self.labelled_spans`; color 0 means "unlabelled" and yields
    the label -1.

    If the two SVGs have a different number of submobjects, or a color
    exceeds the number of labelled spans, a warning is logged and every
    submobject gets the label -1. In that case no re-matching is
    attempted, so a shorter labelled SVG can no longer cause an
    IndexError.
    """
    super().generate_mobject()

    file_path = self.get_file_path_by_content(self.labelled_content)
    labelled_svg = SVGMobject(file_path)
    num_submobjects = len(self.submobjects)

    # Stays None whenever the labelling process has to be skipped.
    submob_color_ints = None
    if num_submobjects != len(labelled_svg.submobjects):
        log.warning(
            "Cannot align submobjects of the labelled svg "
            "to the original svg. Skip the labelling process."
        )
    else:
        color_ints = [
            self.hex_to_int(self.color_to_hex(submob.get_fill_color()))
            for submob in labelled_svg.submobjects
        ]
        num_labels = len(self.labelled_spans)
        unrecognized_colors = [
            color_int for color_int in color_ints
            if color_int > num_labels
        ]
        if unrecognized_colors:
            log.warning(
                "Unrecognized color label(s) detected (%s, etc). "
                "Skip the labelling process.",
                self.int_to_hex(unrecognized_colors[0])
            )
        else:
            submob_color_ints = color_ints

    if submob_color_ints is None:
        for submob in self.submobjects:
            submob.label = -1
        return

    # TODO (carried over from the original code): this position-based
    # re-matching is meant to be removed or made optional.
    # Submobjects of the two SVGs are paired by the rank of their centers
    # in lexicographic order rather than by their index.
    submob_indices = sorted(
        range(num_submobjects),
        key=lambda index: tuple(
            self.submobjects[index].get_center()
        )
    )
    labelled_submob_indices = sorted(
        range(num_submobjects),
        key=lambda index: tuple(
            labelled_svg.submobjects[index].get_center()
        )
    )
    # Inverse permutation, replacing a `list.index` call per submobject.
    rank_by_index = {
        submob_index: rank
        for rank, submob_index in enumerate(submob_indices)
    }
    for index, submob in enumerate(self.submobjects):
        matched_index = labelled_submob_indices[rank_by_index[index]]
        submob.label = submob_color_ints[matched_index] - 1
2022-03-30 21:57:27 +08:00
#@property
#@abstractmethod
#def sort_labelled_submobs(self) -> bool:
# return False
2022-04-10 08:36:13 +08:00
2022-03-30 21:57:27 +08:00
# Toolkits
2022-04-06 22:38:33 +08:00
def get_substr(self, span: Span) -> str:
    """Return the part of `self.string` covered by `span`."""
    bounds = slice(*span)
    return self.string[bounds]
def find_spans(self, pattern: str) -> list[Span]:
    """Return the span of every match of the regex `pattern` in `self.string`."""
    spans = []
    for match_obj in re.finditer(pattern, self.string):
        spans.append(match_obj.span())
    return spans
2022-04-06 22:38:33 +08:00
def find_spans_by_selector(self, selector: Selector) -> list[Span]:
    """
    Resolve `selector` into a list of spans of `self.string`.

    A single selector is one of:
    - a `str`: every literal occurrence (the text is regex-escaped);
    - a compiled `re.Pattern`: every match or, when the pattern defines
      capturing groups, every group that took part in a match;
    - a 2-tuple of `int | None`: one slice-like span. Negative indices
      count from the end of the string, out-of-range indices are clamped,
      and `None` falls back to the corresponding end of the full span.

    Anything else is treated as an iterable of single selectors whose
    spans are concatenated in order.

    The spans are returned as found: they are neither sorted nor
    de-duplicated, and empty spans are kept.

    Raises:
        TypeError: if `selector`, or one of its items, is not a valid
            selector.
    """
    def find_spans_by_single_selector(sel):
        # Returns None when `sel` is not a single selector.
        if isinstance(sel, str):
            return self.find_spans(re.escape(sel))
        if isinstance(sel, re.Pattern):
            result_iterator = sel.finditer(self.string)
            if not sel.groups:
                return [
                    match_obj.span()
                    for match_obj in result_iterator
                ]
            # `regs[0]` is the whole match; groups that did not take part
            # are reported as (-1, -1).
            return [
                span
                for match_obj in result_iterator
                for span in match_obj.regs[1:]
                if span != (-1, -1)
            ]
        if isinstance(sel, tuple) and len(sel) == 2 and all(
            index is None or isinstance(index, int)
            for index in sel
        ):
            length = self.full_span[1]
            # The None check must come first: comparing None with an int
            # raises TypeError.
            span = tuple(
                default_index if index is None
                else min(index, length) if index >= 0
                else max(index + length, 0)
                for index, default_index in zip(sel, self.full_span)
            )
            return [span]
        return None

    result = find_spans_by_single_selector(selector)
    if result is not None:
        return result

    try:
        sub_selectors = iter(selector)
    except TypeError:
        raise TypeError(f"Invalid selector: '{selector}'") from None

    result = []
    for sel in sub_selectors:
        spans = find_spans_by_single_selector(sel)
        if spans is None:
            raise TypeError(f"Invalid selector: '{sel}'")
        result.extend(spans)
    return result
2022-03-30 21:57:27 +08:00
@staticmethod
def chain(*iterables: Iterable[T]) -> list[T]:
    """Concatenate the items of all `iterables` into a single list."""
    return list(it.chain.from_iterable(iterables))
2022-03-30 21:57:27 +08:00
2022-04-06 22:38:33 +08:00
@staticmethod
def remove_redundancies(vals: Sequence[T]) -> list[T]:
    """
    Delegate to `remove_list_redundancies` and return its result.

    NOTE(review): presumably this drops duplicate items -- confirm
    against `manimlib.utils.iterables`.
    """
    unique_vals = remove_list_redundancies(vals)
    return unique_vals
2022-04-06 22:38:33 +08:00
@staticmethod
def get_neighbouring_pairs(vals: Sequence[T]) -> list[tuple[T, T]]:
    """Return every pair of adjacent items of `vals`, in order."""
    heads = vals[:-1]
    tails = vals[1:]
    return list(zip(heads, tails))
2022-04-06 22:38:33 +08:00
2022-03-30 21:57:27 +08:00
@staticmethod
def compress_neighbours(vals: Sequence[T]) -> list[tuple[T, Span]]:
    """
    Collapse runs of equal adjacent items.

    Returns one `(value, (start, stop))` pair per run, where
    `vals[start:stop]` is the run. An empty input gives an empty list.
    """
    if not vals:
        return []

    runs = []
    run_val = vals[0]
    run_start = 0
    for position, val in enumerate(vals):
        if val == run_val:
            continue
        # A new value closes the current run and opens the next one.
        runs.append((run_val, (run_start, position)))
        run_val = val
        run_start = position
    runs.append((run_val, (run_start, len(vals))))
    return runs
2022-03-30 21:57:27 +08:00
@staticmethod
def sort_obj_pairs_by_spans(
    obj_pairs: list[tuple[Span, tuple[T, T]]]
) -> list[tuple[int, T]]:
    """
    Flatten `(span, (begin_obj, end_obj))` items into a sorted list of
    `(index, obj)` pairs.

    `begin_obj` is placed at `span[0]` and `end_obj` at `span[1]`. Items
    are ordered by index; at equal indices, the one whose opposite span
    end is larger comes first. Remaining ties keep the order "begin
    objects in input order, then end objects in reversed input order"
    (the sort is stable).
    """
    keyed_objs = []
    for span, (begin_obj, _) in obj_pairs:
        keyed_objs.append((span, begin_obj))
    # End objects are keyed by the reversed span, so that key[0] is always
    # the index at which the object is placed.
    for span, (_, end_obj) in reversed(obj_pairs):
        keyed_objs.append((span[::-1], end_obj))
    keyed_objs.sort(key=lambda item: (item[0][0], -item[0][1]))

    placed_objs = []
    for (position, _), obj in keyed_objs:
        placed_objs.append((position, obj))
    return placed_objs
2022-03-30 21:57:27 +08:00
@staticmethod
def span_contains(span_0: Span, span_1: Span) -> bool:
    """Return whether `span_1` lies entirely within `span_0`."""
    if span_0[0] > span_1[0]:
        return False
    return span_0[1] >= span_1[1]
2022-03-30 21:57:27 +08:00
@staticmethod
def get_complement_spans(
    universal_span: Span, interval_spans: list[Span]
) -> list[Span]:
    """
    Return the pieces of `universal_span` left between `interval_spans`.

    The result always has one more span than `interval_spans`: the piece
    before the first interval, one piece between each pair of consecutive
    intervals, and the piece after the last. The intervals are used in
    the order given; pieces may be empty.
    """
    if not interval_spans:
        return [universal_span]

    interval_begins, interval_ends = zip(*interval_spans)
    # Each piece starts where an interval ends and ends where the next
    # interval begins.
    piece_begins = (universal_span[0],) + interval_ends
    piece_ends = interval_begins + (universal_span[1],)
    return list(zip(piece_begins, piece_ends))
2022-03-30 21:57:27 +08:00
2022-05-04 22:18:19 +08:00
def replace_string(
    self, span: Span, repl_items: list[tuple[Span, str]]
) -> str:
    """
    Return the substring at `span` with the given replacements applied.

    Args:
        span: the span of `self.string` to rebuild.
        repl_items: `(repl_span, repl_str)` pairs. The text covered by
            each `repl_span` is replaced with `repl_str`; an empty span
            `(i, i)` inserts `repl_str` at index `i`. Items are sorted by
            span (stably) before use.

    Returns:
        The rebuilt string, or the plain substring when `repl_items` is
        empty.
    """
    if not repl_items:
        return self.get_substr(span)

    repl_spans, repl_strs = zip(*sorted(
        repl_items, key=lambda item: item[0]
    ))
    # The untouched text between the replaced spans.
    pieces = [
        self.get_substr(piece_span)
        for piece_span in self.get_complement_spans(span, repl_spans)
    ]
    # There is one more piece than replacements; pad so that zip keeps
    # the trailing piece.
    padded_repl_strs = [*repl_strs, ""]
    return "".join(self.chain(*zip(pieces, padded_repl_strs)))
2022-03-30 21:57:27 +08:00
@staticmethod
def color_to_hex(color: ManimColor) -> str:
    """Convert `color` to a hex string, going through its RGB form."""
    rgb = color_to_rgb(color)
    return rgb_to_hex(rgb)
2022-03-30 21:57:27 +08:00
2022-04-11 23:44:33 +08:00
@staticmethod
def hex_to_int(rgb_hex: str) -> int:
    """Parse a hex color string such as "#0000FF" into an integer."""
    # Skip the first character (the "#" in strings made by `int_to_hex`).
    digits = rgb_hex[1:]
    return int(digits, 16)
2022-04-11 23:44:33 +08:00
@staticmethod
def int_to_hex(rgb_int: int) -> str:
    """Format an integer as an upper-case hex color string like "#0000FF"."""
    # At least six hex digits, zero-padded on the left.
    return "#" + format(rgb_int, "06X")
2022-03-31 10:36:14 +08:00
@staticmethod
@abstractmethod
def get_tag_string_pair(
    attr_dict: dict[str, str], label_hex: str | None
) -> tuple[str, str]:
    """
    Return the `(begin, end)` strings to insert around a labelled span.

    `parse` inserts the first string at the start of the span and the
    second at its end. `label_hex` is the hex color encoding the span's
    label, or None when the unlabelled content is being built.
    The base implementation only returns empty placeholders.
    """
    begin_tag, end_tag = "", ""
    return (begin_tag, end_tag)
2022-03-30 21:57:27 +08:00
# Parsing
def parse(self) -> None:
    """
    Parse `self.string` and build both content strings.

    Sets, in this order: `cmd_span_items`, `command_repl_items`,
    `specified_spans`, `labelled_spans`, and finally `original_content`
    and `labelled_content`.

    Raises:
        ValueError: if level-opening and level-closing commands do not
            match up, if there are too many labelled spans, or if two
            labelled spans partially overlap.
    """
    begin_cmd_spans, end_cmd_spans, cmd_spans = self.get_command_spans()

    # Tag each command span with its level shift: +1 opens a level,
    # -1 closes one, 0 leaves the level unchanged.
    flagged_spans = self.chain(
        [(span, 1) for span in begin_cmd_spans],
        [(span, -1) for span in end_cmd_spans],
        [(span, 0) for span in cmd_spans],
    )
    cmd_span_items = sorted(flagged_spans, key=lambda item: item[0])
    # Must be set before `split_span_by_levels` is called below.
    self.cmd_span_items = cmd_span_items

    # Pair every closing command with the most recent unmatched opener.
    cmd_span_pairs = []
    open_spans = []
    for cmd_span, flag in cmd_span_items:
        if flag == 1:
            open_spans.append(cmd_span)
            continue
        if flag != -1:
            continue
        if not open_spans:
            raise ValueError("Missing '{' inserted")
        cmd_span_pairs.append((open_spans.pop(), cmd_span))
    if open_spans:
        raise ValueError("Missing '}' inserted")

    specified_items = self.get_specified_items(cmd_span_pairs)
    split_items = []
    for specified_span, attr_dict in specified_items:
        for span in self.split_span_by_levels(specified_span)[0]:
            split_items.append((span, attr_dict))

    command_repl_items = [
        (span, self.get_replaced_substr(self.get_substr(span), flag))
        for span, flag in cmd_span_items
    ]
    self.command_repl_items = command_repl_items
    self.specified_spans = [span for span, _ in specified_items]

    labelled_spans = [span for span, _ in split_items]
    # Labels are written as six-digit hex colors (see `int_to_hex`);
    # presumably this bound keeps `label + 1` within 0xFFFFFF.
    if len(labelled_spans) >= 16777216:
        raise ValueError("Cannot handle that many substrings")
    for span_0, span_1 in it.product(labelled_spans, repeat=2):
        if span_0[0] < span_1[0] < span_0[1] < span_1[1]:
            raise ValueError(
                "Partially overlapping substrings detected: "
                f"'{self.get_substr(span_0)}' and '{self.get_substr(span_1)}'"
            )
    self.labelled_spans = labelled_spans

    def build_content(is_labelled):
        # One (begin, end) string pair per labelled span; the label color
        # is only supplied for the labelled variant.
        tag_pairs = [
            (span, self.get_tag_string_pair(
                attr_dict,
                label_hex=self.int_to_hex(label + 1) if is_labelled else None
            ))
            for label, (span, attr_dict) in enumerate(split_items)
        ]
        # Insertions are expressed as replacements of empty spans.
        tag_repl_items = [
            ((index, index), inserted_str)
            for index, inserted_str in self.sort_obj_pairs_by_spans(tag_pairs)
        ]
        replaced = self.replace_string(
            self.full_span, self.chain(command_repl_items, tag_repl_items)
        )
        return self.get_full_content_string(replaced, is_labelled=is_labelled)

    original_content = build_content(False)
    labelled_content = build_content(True)
    self.original_content, self.labelled_content = (
        original_content, labelled_content
    )
2022-05-04 22:18:19 +08:00
def split_span_by_levels(
    self, arbitrary_span: Span
) -> tuple[list[Span], int, int]:
    """
    Split `arbitrary_span` at the commands it leaves unmatched.

    The span is first clipped so that neither end lies inside a command
    span. Level-opening and level-closing commands inside it are then
    matched against each other; the span is cut at every command left
    without a partner.

    Returns:
        `(pieces, num_unopened, num_unclosed)`: the resulting spans, the
        number of closing commands without an opener inside the span, and
        the number of opening commands without a closer inside the span.
        `([], 0, 0)` is returned when the clipped span is inverted.
    """
    cmd_items = self.cmd_span_items
    cmd_spans = [span for span, _ in cmd_items]
    span_begin = arbitrary_span[0]
    span_end = arbitrary_span[1]

    # Index range of the commands taken into account: those beginning at
    # or after the span's start and ending at or before the span's end.
    first_index = sum(
        1 for cmd_begin, _ in cmd_spans if span_begin > cmd_begin
    )
    stop_index = sum(
        1 for _, cmd_end in cmd_spans if span_end >= cmd_end
    )

    gaps = self.get_complement_spans(self.full_span, cmd_spans)
    clipped_begin = max(span_begin, gaps[first_index][0])
    clipped_end = min(span_end, gaps[stop_index][1])
    if clipped_begin > clipped_end:
        return [], 0, 0

    unclosed = []
    unopened = []
    for cmd_index in range(first_index, stop_index):
        _, level_shift = cmd_items[cmd_index]
        if level_shift == 1:
            unclosed.append(cmd_index)
        elif level_shift == -1:
            if unclosed:
                # Matches the most recent opener inside the span.
                unclosed.pop()
            else:
                unopened.append(cmd_index)

    unmatched_spans = [
        cmd_spans[cmd_index]
        for cmd_index in self.chain(unopened, unclosed)
    ]
    pieces = self.get_complement_spans(
        (clipped_begin, clipped_end), unmatched_spans
    )
    return pieces, len(unopened), len(unclosed)
2022-03-30 21:57:27 +08:00
@abstractmethod
def get_command_spans(self) -> tuple[list[Span], list[Span], list[Span]]:
    """
    Return the command spans found in `self.string`, as three lists.

    `parse` treats the first list as commands opening a level, the second
    as commands closing a level, and the third as commands that leave the
    level unchanged. The base implementation returns three empty lists.
    """
    begin_cmd_spans, end_cmd_spans, cmd_spans = [], [], []
    return begin_cmd_spans, end_cmd_spans, cmd_spans
2022-03-30 21:57:27 +08:00
@abstractmethod
def get_specified_items(
    self, cmd_span_pairs: list[tuple[Span, Span]]
) -> list[tuple[Span, dict[str, str]]]:
    """
    Return the `(span, attr_dict)` items that should be labelled.

    `cmd_span_pairs` holds the matched `(begin, end)` command span pairs
    found by `parse`. The base implementation returns an empty list.
    """
    specified_items = []
    return specified_items
@abstractmethod
def get_replaced_substr(self, substr: str, flag: int) -> str:
    """
    Return the text that replaces the command `substr` in the content.

    `flag` is the command's level shift as tagged by `parse` (1, -1 or 0).
    The base implementation only returns an empty placeholder.
    """
    placeholder = ""
    return placeholder
@abstractmethod
def get_full_content_string(self, content_string: str, is_labelled: bool) -> str:
    """
    Return the final content built from `content_string`.

    `parse` calls this once with `is_labelled=False` and once with
    `is_labelled=True`, storing the results as `original_content` and
    `labelled_content`. The base implementation only returns an empty
    placeholder.
    """
    placeholder = ""
    return placeholder
# Selector
2022-04-10 08:36:13 +08:00
@abstractmethod
def get_cleaned_substr(self, span: Span) -> str:
    """
    Return the text for `span` as reported by `get_group_part_items`.

    The base implementation only returns an empty placeholder.
    """
    placeholder = ""
    return placeholder
2022-03-30 21:57:27 +08:00
def get_group_part_items(self) -> list[tuple[str, list[int]]]:
    """
    Group consecutive submobjects that share a label.

    Returns one `(substring, submobject_indices)` item per run of equal
    labels in `self.labels`, or an empty list when there are no labels.
    """
    if not self.labels:
        return []

    group_labels, labelled_submob_ranges = zip(
        *self.compress_neighbours(self.labels)
    )

    # The label -1 (unlabelled) stands for the whole string.
    ordered_spans = []
    for label in group_labels:
        if label == -1:
            ordered_spans.append(self.full_span)
        else:
            ordered_spans.append(self.labelled_spans[label])

    # Between two neighbouring groups, work out the interval separating
    # their substrings. When one span contains the other, the boundary is
    # taken from the contained span's side.
    interval_spans = []
    for prev_span, next_span in self.get_neighbouring_pairs(ordered_spans):
        if self.span_contains(prev_span, next_span):
            interval_begin = next_span[0]
        else:
            interval_begin = prev_span[1]
        if self.span_contains(next_span, prev_span):
            interval_end = prev_span[1]
        else:
            interval_end = next_span[0]
        interval_spans.append((interval_begin, interval_end))

    covering_span = (ordered_spans[0][0], ordered_spans[-1][1])
    group_substrs = []
    for span in self.get_complement_spans(covering_span, interval_spans):
        # Empty or inverted spans contribute an empty substring.
        if span[0] < span[1]:
            group_substrs.append(self.get_cleaned_substr(span))
        else:
            group_substrs.append("")

    submob_indices_lists = []
    for submob_range in labelled_submob_ranges:
        submob_indices_lists.append(list(range(*submob_range)))
    return list(zip(group_substrs, submob_indices_lists))
def get_submob_indices_list_by_span(
    self, arbitrary_span: Span
) -> list[int]:
    """
    Return the indices of the submobjects whose labelled span lies
    entirely within `arbitrary_span`. Unlabelled submobjects (label -1)
    are never included.
    """
    submob_indices = []
    for submob_index, label in enumerate(self.labels):
        if label == -1:
            continue
        if self.span_contains(arbitrary_span, self.labelled_spans[label]):
            submob_indices.append(submob_index)
    return submob_indices
2022-04-10 08:36:13 +08:00
def get_specified_part_items(self) -> list[tuple[str, list[int]]]:
    """
    Return one `(substring, submobject_indices)` item for each span in
    `self.specified_spans`, in order.
    """
    part_items = []
    for span in self.specified_spans:
        substr = self.get_substr(span)
        submob_indices = self.get_submob_indices_list_by_span(span)
        part_items.append((substr, submob_indices))
    return part_items
2022-03-30 21:57:27 +08:00
def get_submob_indices_lists_by_selector(
    self, selector: Selector
) -> list[list[int]]:
    """
    Return one list of submobject indices for each span matched by
    `selector`, leaving out spans that cover no submobject.
    """
    indices_lists = []
    for span in self.find_spans_by_selector(selector):
        indices_list = self.get_submob_indices_list_by_span(span)
        if indices_list:
            indices_lists.append(indices_list)
    return indices_lists
2022-03-30 21:57:27 +08:00
def build_parts_from_indices_lists(
    self, indices_lists: list[list[int]]
) -> VGroup:
    """
    Build a `VGroup` holding one inner `VGroup` per list of indices, each
    containing the submobjects at those indices.
    """
    parts = []
    for indices_list in indices_lists:
        part_submobs = [
            self.submobjects[submob_index]
            for submob_index in indices_list
        ]
        parts.append(VGroup(*part_submobs))
    return VGroup(*parts)
2022-05-04 22:18:19 +08:00
def build_groups(self) -> VGroup:
    """Build the parts for the groups reported by `get_group_part_items`."""
    indices_lists = []
    for _, indices_list in self.get_group_part_items():
        indices_lists.append(indices_list)
    return self.build_parts_from_indices_lists(indices_lists)
def select_parts(self, selector: Selector) -> VGroup:
    """Return the parts of the mobject matched by `selector`."""
    indices_lists = self.get_submob_indices_lists_by_selector(selector)
    return self.build_parts_from_indices_lists(indices_lists)
def select_part(self, selector: Selector, index: int = 0) -> VGroup:
    """
    Return the `index`-th part matched by `selector` (the first one by
    default).
    """
    parts = self.select_parts(selector)
    return parts[index]
2022-03-30 21:57:27 +08:00
def set_parts_color(self, selector: Selector, color: ManimColor):
    """Color every part matched by `selector`; returns `self` for chaining."""
    parts = self.select_parts(selector)
    parts.set_color(color)
    return self
def set_parts_color_by_dict(self, color_map: dict[Selector, ManimColor]):
    """
    Apply `set_parts_color` for every `selector: color` entry of
    `color_map`, in the mapping's order; returns `self` for chaining.
    """
    for selector in color_map:
        self.set_parts_color(selector, color_map[selector])
    return self
def get_string(self) -> str:
    """Return the string this mobject was constructed from."""
    string = self.string
    return string