summaryrefslogtreecommitdiff
path: root/src/layout/shaping.rs
diff options
context:
space:
mode:
authorMartin <mhaug@live.de>2021-04-07 13:50:21 +0200
committerGitHub <noreply@github.com>2021-04-07 13:50:21 +0200
commitdf58a4d89b67783b1ffc5c3b7282302d59db8c70 (patch)
tree2bdc3a7ad1704ccee7c14972df1fa3cb9c77097a /src/layout/shaping.rs
parent318eb9021edc493f5181247dbb7963de34126688 (diff)
parent3d2ee54848db80a8ede7e00fd5a53bc059138122 (diff)
Merge pull request #19 from typst/shape-runs 🔀
Text work
Diffstat (limited to 'src/layout/shaping.rs')
-rw-r--r--src/layout/shaping.rs396
1 files changed, 314 insertions, 82 deletions
diff --git a/src/layout/shaping.rs b/src/layout/shaping.rs
index 8d035516..faa178d3 100644
--- a/src/layout/shaping.rs
+++ b/src/layout/shaping.rs
@@ -1,30 +1,219 @@
+use std::borrow::Cow;
+use std::fmt::{self, Debug, Formatter};
+use std::ops::Range;
+
use fontdock::FaceId;
use rustybuzz::UnicodeBuffer;
use ttf_parser::GlyphId;
-use super::{Element, Frame, ShapedText};
+use super::{Element, Frame, Glyph, LayoutContext, Text};
use crate::env::FontLoader;
use crate::exec::FontProps;
-use crate::geom::{Point, Size};
+use crate::font::FaceBuf;
+use crate::geom::{Dir, Length, Point, Size};
+use crate::util::SliceExt;
+
+/// The result of shaping text.
+///
+/// This type contains owned or borrowed shaped text runs, which can be
+/// measured, used to reshape substrings more quickly and converted into a
+/// frame.
+pub struct ShapedText<'a> {
+ /// The text that was shaped.
+ pub text: &'a str,
+ /// The text direction.
+ pub dir: Dir,
+ /// The properties used for font selection.
+ pub props: &'a FontProps,
+ /// The font size.
+ pub size: Size,
+ /// The baseline from the top of the frame.
+ pub baseline: Length,
+ /// The shaped glyphs.
+ pub glyphs: Cow<'a, [ShapedGlyph]>,
+}
+
+/// A single glyph resulting from shaping.
+#[derive(Debug, Copy, Clone)]
+pub struct ShapedGlyph {
+ /// The font face the glyph is contained in.
+ pub face_id: FaceId,
+ /// The glyph's ID in the face.
+ pub glyph_id: GlyphId,
+ /// The advance width of the glyph.
+ pub x_advance: i32,
+ /// The horizontal offset of the glyph.
+ pub x_offset: i32,
+ /// The start index of the glyph in the source text.
+ pub text_index: usize,
+ /// Whether splitting the shaping result before this glyph would yield the
+ /// same results as shaping the parts to both sides of `text_index`
+ /// separately.
+ pub safe_to_break: bool,
+}
+
+/// A visual side.
+enum Side {
+ Left,
+ Right,
+}
+
+impl<'a> ShapedText<'a> {
+ /// Build the shaped text's frame.
+ pub fn build(&self, ctx: &mut LayoutContext) -> Frame {
+ let mut frame = Frame::new(self.size, self.baseline);
+ let mut offset = Length::ZERO;
+
+ for (face_id, group) in self.glyphs.as_ref().group_by_key(|g| g.face_id) {
+ let pos = Point::new(offset, self.baseline);
+ let mut text = Text {
+ face_id,
+ size: self.props.size,
+ color: self.props.color,
+ glyphs: vec![],
+ };
+
+ let face = ctx.env.fonts.face(face_id);
+ for glyph in group {
+ let x_advance = face.convert(glyph.x_advance).scale(self.props.size);
+ let x_offset = face.convert(glyph.x_offset).scale(self.props.size);
+ text.glyphs.push(Glyph { id: glyph.glyph_id, x_advance, x_offset });
+ offset += x_advance;
+ }
+
+ frame.push(pos, Element::Text(text));
+ }
+
+ frame
+ }
+
+ /// Reshape a range of the shaped text, reusing information from this
+ /// shaping process if possible.
+ pub fn reshape(
+ &'a self,
+ ctx: &mut LayoutContext,
+ text_range: Range<usize>,
+ ) -> ShapedText<'a> {
+ if let Some(glyphs) = self.slice_safe_to_break(text_range.clone()) {
+ let (size, baseline) = measure(&mut ctx.env.fonts, glyphs, self.props);
+ Self {
+ text: &self.text[text_range],
+ dir: self.dir,
+ props: self.props,
+ size,
+ baseline,
+ glyphs: Cow::Borrowed(glyphs),
+ }
+ } else {
+ shape(ctx, &self.text[text_range], self.dir, self.props)
+ }
+ }
+
+ /// Find the subslice of glyphs that represent the given text range if both
+ /// sides are safe to break.
+ fn slice_safe_to_break(&self, text_range: Range<usize>) -> Option<&[ShapedGlyph]> {
+ let Range { mut start, mut end } = text_range;
+ if !self.dir.is_positive() {
+ std::mem::swap(&mut start, &mut end);
+ }
+
+ let left = self.find_safe_to_break(start, Side::Left)?;
+ let right = self.find_safe_to_break(end, Side::Right)?;
+ Some(&self.glyphs[left .. right])
+ }
+
+ /// Find the glyph offset matching the text index that is most towards the
+ /// given side and safe-to-break.
+ fn find_safe_to_break(&self, text_index: usize, towards: Side) -> Option<usize> {
+ let ltr = self.dir.is_positive();
+
+ // Handle edge cases.
+ let len = self.glyphs.len();
+ if text_index == 0 {
+ return Some(if ltr { 0 } else { len });
+ } else if text_index == self.text.len() {
+ return Some(if ltr { len } else { 0 });
+ }
+
+ // Find any glyph with the text index.
+ let mut idx = self
+ .glyphs
+ .binary_search_by(|g| {
+ let ordering = g.text_index.cmp(&text_index);
+ if ltr { ordering } else { ordering.reverse() }
+ })
+ .ok()?;
+
+ let next = match towards {
+ Side::Left => usize::checked_sub,
+ Side::Right => usize::checked_add,
+ };
+
+ // Search for the outermost glyph with the text index.
+ while let Some(next) = next(idx, 1) {
+ if self.glyphs.get(next).map_or(true, |g| g.text_index != text_index) {
+ break;
+ }
+ idx = next;
+ }
+
+ // RTL needs offset one because the left side of the range should be
+ // exclusive and the right side inclusive, contrary to the normal
+ // behaviour of ranges.
+ if !ltr {
+ idx += 1;
+ }
+
+ self.glyphs[idx].safe_to_break.then(|| idx)
+ }
+}
-/// Shape text into a frame containing [`ShapedText`] runs.
-pub fn shape(text: &str, loader: &mut FontLoader, props: &FontProps) -> Frame {
- let mut frame = Frame::new(Size::ZERO);
- shape_segment(&mut frame, text, loader, props, props.families.iter(), None);
- frame
+impl Debug for ShapedText<'_> {
+ fn fmt(&self, f: &mut Formatter) -> fmt::Result {
+ write!(f, "Shaped({:?})", self.text)
+ }
+}
+
+/// Shape text into [`ShapedText`].
+pub fn shape<'a>(
+ ctx: &mut LayoutContext,
+ text: &'a str,
+ dir: Dir,
+ props: &'a FontProps,
+) -> ShapedText<'a> {
+ let loader = &mut ctx.env.fonts;
+
+ let mut glyphs = vec![];
+ let families = props.families.iter();
+ if !text.is_empty() {
+ shape_segment(loader, &mut glyphs, 0, text, dir, props, families, None);
+ }
+
+ let (size, baseline) = measure(loader, &glyphs, props);
+
+ ShapedText {
+ text,
+ dir,
+ props,
+ size,
+ baseline,
+ glyphs: Cow::Owned(glyphs),
+ }
}
-/// Shape text into a frame with font fallback using the `families` iterator.
+/// Shape text with font fallback using the `families` iterator.
fn shape_segment<'a>(
- frame: &mut Frame,
- text: &str,
loader: &mut FontLoader,
+ glyphs: &mut Vec<ShapedGlyph>,
+ base: usize,
+ text: &str,
+ dir: Dir,
props: &FontProps,
mut families: impl Iterator<Item = &'a str> + Clone,
- mut first: Option<FaceId>,
+ mut first_face: Option<FaceId>,
) {
// Select the font family.
- let (id, fallback) = loop {
+ let (face_id, fallback) = loop {
// Try to load the next available font family.
match families.next() {
Some(family) => match loader.query(family, props.variant) {
@@ -33,97 +222,140 @@ fn shape_segment<'a>(
},
// We're out of families, so we don't do any more fallback and just
// shape the tofus with the first face we originally used.
- None => match first {
+ None => match first_face {
Some(id) => break (id, false),
None => return,
},
}
};
- // Register that this is the first available font.
- if first.is_none() {
- first = Some(id);
- }
-
- // Find out some metrics and prepare the shaped text container.
- let face = loader.face(id);
- let ttf = face.ttf();
- let units_per_em = f64::from(ttf.units_per_em().unwrap_or(1000));
- let convert = |units| f64::from(units) / units_per_em * props.size;
- let top = convert(i32::from(props.top_edge.lookup(ttf)));
- let bottom = convert(i32::from(props.bottom_edge.lookup(ttf)));
- let mut shaped = ShapedText::new(id, props.size, top, bottom, props.color);
+ // Remember the id if this the first available face since we use that one to
+ // shape tofus.
+ first_face.get_or_insert(face_id);
// Fill the buffer with our text.
let mut buffer = UnicodeBuffer::new();
buffer.push_str(text);
- buffer.guess_segment_properties();
-
- // Find out the text direction.
- // TODO: Replace this once we do BiDi.
- let rtl = matches!(buffer.direction(), rustybuzz::Direction::RightToLeft);
+ buffer.set_direction(match dir {
+ Dir::LTR => rustybuzz::Direction::LeftToRight,
+ Dir::RTL => rustybuzz::Direction::RightToLeft,
+ _ => unimplemented!(),
+ });
// Shape!
- let glyphs = rustybuzz::shape(face.buzz(), &[], buffer);
- let info = glyphs.glyph_infos();
- let pos = glyphs.glyph_positions();
- let mut iter = info.iter().zip(pos).peekable();
-
- while let Some((info, pos)) = iter.next() {
- // Do font fallback if the glyph is a tofu.
- if info.codepoint == 0 && fallback {
- // Flush what we have so far.
- if !shaped.glyphs.is_empty() {
- place(frame, shaped);
- shaped = ShapedText::new(id, props.size, top, bottom, props.color);
- }
+ let buffer = rustybuzz::shape(loader.face(face_id).ttf(), &[], buffer);
+ let infos = buffer.glyph_infos();
+ let pos = buffer.glyph_positions();
+
+ // Collect the shaped glyphs, doing fallback and shaping parts again with
+ // the next font if necessary.
+ let mut i = 0;
+ while i < infos.len() {
+ let info = &infos[i];
+ let cluster = info.cluster as usize;
- // Determine the start and end cluster index of the tofu sequence.
- let mut start = info.cluster as usize;
- let mut end = info.cluster as usize;
- while let Some((info, _)) = iter.peek() {
- if info.codepoint != 0 {
- break;
+ if info.codepoint != 0 || !fallback {
+ // Add the glyph to the shaped output.
+ // TODO: Don't ignore y_advance and y_offset.
+ glyphs.push(ShapedGlyph {
+ face_id,
+ glyph_id: GlyphId(info.codepoint as u16),
+ x_advance: pos[i].x_advance,
+ x_offset: pos[i].x_offset,
+ text_index: base + cluster,
+ safe_to_break: !info.unsafe_to_break(),
+ });
+ } else {
+ // Determine the source text range for the tofu sequence.
+ let range = {
+ // First, search for the end of the tofu sequence.
+ let k = i;
+ while infos.get(i + 1).map_or(false, |info| info.codepoint == 0) {
+ i += 1;
}
- end = info.cluster as usize;
- iter.next();
- }
- // Because Harfbuzz outputs glyphs in visual order, the start
- // cluster actually corresponds to the last codepoint in
- // right-to-left text.
- if rtl {
- assert!(end <= start);
- std::mem::swap(&mut start, &mut end);
- }
+ // Then, determine the start and end text index.
+ //
+ // Examples:
+ // Everything is shown in visual order. Tofus are written as "_".
+ // We want to find out that the tofus span the text `2..6`.
+ // Note that the clusters are longer than 1 char.
+ //
+ // Left-to-right:
+ // Text: h a l i h a l l o
+ // Glyphs: A _ _ C E
+ // Clusters: 0 2 4 6 8
+ // k=1 i=2
+ //
+ // Right-to-left:
+ // Text: O L L A H I L A H
+ // Glyphs: E C _ _ A
+ // Clusters: 8 6 4 2 0
+ // k=2 i=3
+
+ let ltr = dir.is_positive();
+ let first = if ltr { k } else { i };
+ let start = infos[first].cluster as usize;
+
+ let last = if ltr { i.checked_add(1) } else { k.checked_sub(1) };
+ let end = last
+ .and_then(|last| infos.get(last))
+ .map_or(text.len(), |info| info.cluster as usize);
- // The end cluster index points right before the last character that
- // mapped to the tofu sequence. So we have to offset the end by one
- // char.
- let offset = text[end ..].chars().next().unwrap().len_utf8();
- let range = start .. end + offset;
+ start .. end
+ };
// Recursively shape the tofu sequence with the next family.
- shape_segment(frame, &text[range], loader, props, families.clone(), first);
- } else {
- // Add the glyph to the shaped output.
- // TODO: Don't ignore y_advance and y_offset.
- let glyph = GlyphId(info.codepoint as u16);
- shaped.glyphs.push(glyph);
- shaped.offsets.push(shaped.width + convert(pos.x_offset));
- shaped.width += convert(pos.x_advance);
+ shape_segment(
+ loader,
+ glyphs,
+ base + range.start,
+ &text[range],
+ dir,
+ props,
+ families.clone(),
+ first_face,
+ );
}
- }
- if !shaped.glyphs.is_empty() {
- place(frame, shaped)
+ i += 1;
}
}
-/// Place shaped text into a frame.
-fn place(frame: &mut Frame, shaped: ShapedText) {
- let offset = frame.size.width;
- frame.size.width += shaped.width;
- frame.size.height = frame.size.height.max(shaped.top - shaped.bottom);
- frame.push(Point::new(offset, shaped.top), Element::Text(shaped));
+/// Measure the size and baseline of a run of shaped glyphs with the given
+/// properties.
+fn measure(
+ loader: &mut FontLoader,
+ glyphs: &[ShapedGlyph],
+ props: &FontProps,
+) -> (Size, Length) {
+ let mut width = Length::ZERO;
+ let mut top = Length::ZERO;
+ let mut bottom = Length::ZERO;
+ let mut expand_vertical = |face: &FaceBuf| {
+ top = top.max(face.vertical_metric(props.top_edge).scale(props.size));
+ bottom = bottom.max(-face.vertical_metric(props.bottom_edge).scale(props.size));
+ };
+
+ if glyphs.is_empty() {
+ // When there are no glyphs, we just use the vertical metrics of the
+ // first available font.
+ for family in props.families.iter() {
+ if let Some(face_id) = loader.query(family, props.variant) {
+ expand_vertical(loader.face(face_id));
+ break;
+ }
+ }
+ } else {
+ for (face_id, group) in glyphs.group_by_key(|g| g.face_id) {
+ let face = loader.face(face_id);
+ expand_vertical(face);
+
+ for glyph in group {
+ width += face.convert(glyph.x_advance).scale(props.size);
+ }
+ }
+ }
+
+ (Size::new(width, top + bottom), top)
}