123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616 |
- // SPDX-License-Identifier: Unlicense OR MIT
- package text
- import (
- "bufio"
- "io"
- "strings"
- "unicode/utf8"
- giofont "gioui.org/font"
- "gioui.org/io/system"
- "gioui.org/op"
- "gioui.org/op/clip"
- "github.com/go-text/typesetting/font"
- "golang.org/x/image/math/fixed"
- )
- // WrapPolicy configures strategies for choosing where to break lines of text for line
- // wrapping.
- type WrapPolicy uint8
- const (
- // WrapHeuristically tries to minimize breaking within words (UAX#14 text segments)
- // while also ensuring that text fits within the given MaxWidth. It will only break
- // a line within a word (on a UAX#29 grapheme cluster boundary) when that word cannot
- // fit on a line by itself. Additionally, when the final word of a line is being
- // truncated, this policy will preserve as many symbols of that word as
- // possible before the truncator.
- WrapHeuristically WrapPolicy = iota
- // WrapWords does not permit words (UAX#14 text segments) to be broken across lines.
- // This means that sometimes long words will exceed the MaxWidth they are wrapped with.
- WrapWords
- // WrapGraphemes will maximize the amount of text on each line at the expense of readability,
- // breaking any word across lines on UAX#29 grapheme cluster boundaries to maximize the number of
- // grapheme clusters on each line.
- WrapGraphemes
- )
- // Parameters are static text shaping attributes applied to the entire shaped text.
- type Parameters struct {
- // Font describes the preferred typeface.
- Font giofont.Font
- // Alignment characterizes the positioning of text within the line. It does not directly
- // impact shaping, but is provided in order to allow efficient offset computation.
- Alignment Alignment
- // PxPerEm is the pixels-per-em to shape the text with.
- PxPerEm fixed.Int26_6
- // MaxLines limits the quantity of shaped lines. Zero means no limit.
- MaxLines int
- // Truncator is a string of text to insert where the shaped text was truncated, which
- // can currently ohly happen if MaxLines is nonzero and the text on the final line is
- // truncated.
- Truncator string
- // WrapPolicy configures how line breaks will be chosen when wrapping text across lines.
- WrapPolicy WrapPolicy
- // MinWidth and MaxWidth provide the minimum and maximum horizontal space constraints
- // for the shaped text.
- MinWidth, MaxWidth int
- // Locale provides primary direction and language information for the shaped text.
- Locale system.Locale
- // LineHeightScale is a scaling factor applied to the LineHeight of a paragraph. If zero, a default
- // value of 1.2 will be used.
- LineHeightScale float32
- // LineHeight is the distance between the baselines of two lines of text. If zero, the PxPerEm
- // of the any given paragraph will set the LineHeight of that paragraph. This value will be
- // scaled by LineHeightScale, so applications desiring a specific fixed value
- // should set LineHeightScale to 1.
- LineHeight fixed.Int26_6
- // forceTruncate controls whether the truncator string is inserted on the final line of
- // text with a MaxLines. It is unexported because this behavior only makes sense for the
- // shaper to control when it iterates paragraphs of text.
- forceTruncate bool
- // DisableSpaceTrim prevents the width of the final whitespace glyph on a line from being zeroed.
- // This is desirable for text editors (so that the whitespace can be selected), but is undesirable
- // for ordinary display text.
- DisableSpaceTrim bool
- }
- type FontFace = giofont.FontFace
- // Glyph describes a shaped font glyph. Many fields are distances relative
- // to the "dot", which is a point on the baseline (the line upon which glyphs
- // visually rest) for the line of text containing the glyph.
- //
- // Glyphs are organized into "glyph clusters," which are sequences that
- // may represent an arbitrary number of runes.
- //
- // Sequences of glyph clusters that share style parameters are grouped into "runs."
- //
- // "Document coordinates" are pixel values relative to the text's origin at (0,0)
- // in the upper-left corner" Displaying each shaped glyph at the document
- // coordinates of its dot will correctly visualize the text.
- type Glyph struct {
- // ID is a unique, per-shaper identifier for the shape of the glyph.
- // Glyphs from the same shaper will share an ID when they are from
- // the same face and represent the same glyph at the same size.
- ID GlyphID
- // X is the x coordinate of the dot for this glyph in document coordinates.
- X fixed.Int26_6
- // Y is the y coordinate of the dot for this glyph in document coordinates.
- Y int32
- // Advance is the logical width of the glyph. The glyph may be visually
- // wider than this.
- Advance fixed.Int26_6
- // Ascent is the distance from the dot to the logical top of glyphs in
- // this glyph's face. The specific glyph may be shorter than this.
- Ascent fixed.Int26_6
- // Descent is the distance from the dot to the logical bottom of glyphs
- // in this glyph's face. The specific glyph may descend less than this.
- Descent fixed.Int26_6
- // Offset encodes the origin of the drawing coordinate space for this glyph
- // relative to the dot. This value is used when converting glyphs to paths.
- Offset fixed.Point26_6
- // Bounds encodes the visual dimensions of the glyph relative to the dot.
- Bounds fixed.Rectangle26_6
- // Runes is the number of runes represented by the glyph cluster this glyph
- // belongs to. If Flags does not contain FlagClusterBreak, this value will
- // always be zero. The final glyph in the cluster contains the runes count
- // for the entire cluster.
- Runes uint16
- // Flags encode special properties of this glyph.
- Flags Flags
- }
- type Flags uint16
- const (
- // FlagTowardOrigin is set for glyphs in runs that flow
- // towards the origin (RTL).
- FlagTowardOrigin Flags = 1 << iota
- // FlagLineBreak is set for the last glyph in a line.
- FlagLineBreak
- // FlagRunBreak is set for the last glyph in a run. A run is a sequence of
- // glyphs sharing constant style properties (same size, same face, same
- // direction, etc...).
- FlagRunBreak
- // FlagClusterBreak is set for the last glyph in a glyph cluster. A glyph cluster is a
- // sequence of glyphs which are logically a single unit, but require multiple
- // symbols from a font to display.
- FlagClusterBreak
- // FlagParagraphBreak indicates that the glyph cluster does not represent actual
- // font glyphs, but was inserted by the shaper to represent line-breaking
- // whitespace characters. After a glyph with FlagParagraphBreak set, the shaper
- // will always return a glyph with FlagParagraphStart providing the X and Y
- // coordinates of the start of the next line, even if that line has no contents.
- FlagParagraphBreak
- // FlagParagraphStart indicates that the glyph starts a new paragraph.
- FlagParagraphStart
- // FlagTruncator indicates that the glyph is part of a special truncator run that
- // represents the portion of text removed due to truncation. A glyph with both
- // FlagTruncator and FlagClusterBreak will have a Runes field accounting for all
- // runes truncated.
- FlagTruncator
- )
- func (f Flags) String() string {
- var b strings.Builder
- if f&FlagParagraphStart != 0 {
- b.WriteString("S")
- } else {
- b.WriteString("_")
- }
- if f&FlagParagraphBreak != 0 {
- b.WriteString("P")
- } else {
- b.WriteString("_")
- }
- if f&FlagTowardOrigin != 0 {
- b.WriteString("T")
- } else {
- b.WriteString("_")
- }
- if f&FlagLineBreak != 0 {
- b.WriteString("L")
- } else {
- b.WriteString("_")
- }
- if f&FlagRunBreak != 0 {
- b.WriteString("R")
- } else {
- b.WriteString("_")
- }
- if f&FlagClusterBreak != 0 {
- b.WriteString("C")
- } else {
- b.WriteString("_")
- }
- if f&FlagTruncator != 0 {
- b.WriteString("…")
- } else {
- b.WriteString("_")
- }
- return b.String()
- }
- type GlyphID uint64
- // Shaper converts strings of text into glyphs that can be displayed. The same
- // Shaper should not be used in different goroutines.
- //
- // The Shaper controls text layout and has a cache, implemented as a map, and
- // so laying out text in two different goroutines can easily result in
- // concurrent access to said map, resulting in a panic.
- //
- // Practically speaking, this means you should use different Shapers for
- // different top-level windows.
- type Shaper struct {
- config struct {
- disableSystemFonts bool
- collection []FontFace
- }
- initialized bool
- shaper shaperImpl
- pathCache pathCache
- bitmapShapeCache bitmapShapeCache
- layoutCache layoutCache
- reader *bufio.Reader
- paragraph []byte
- // Iterator state.
- brokeParagraph bool
- pararagraphStart Glyph
- txt document
- line int
- run int
- glyph int
- // advance is the width of glyphs from the current run that have already been displayed.
- advance fixed.Int26_6
- // done tracks whether iteration is over.
- done bool
- err error
- }
- // ShaperOptions configure text shapers.
- type ShaperOption func(*Shaper)
- // NoSystemFonts can be used to disable system font loading.
- func NoSystemFonts() ShaperOption {
- return func(s *Shaper) {
- s.config.disableSystemFonts = true
- }
- }
- // WithCollection can be used to provide a collection of pre-loaded fonts to the shaper.
- func WithCollection(collection []FontFace) ShaperOption {
- return func(s *Shaper) {
- s.config.collection = collection
- }
- }
- // NewShaper constructs a shaper with the provided options.
- //
- // NewShaper must be called after [app.NewWindow], unless the [NoSystemFonts]
- // option is specified. This is an unfortunate restriction caused by some platforms
- // such as Android.
- func NewShaper(options ...ShaperOption) *Shaper {
- l := &Shaper{}
- for _, opt := range options {
- opt(l)
- }
- l.init()
- return l
- }
- func (l *Shaper) init() {
- if l.initialized {
- return
- }
- l.initialized = true
- l.reader = bufio.NewReader(nil)
- l.shaper = *newShaperImpl(!l.config.disableSystemFonts, l.config.collection)
- }
- // Layout text from an io.Reader according to a set of options. Results can be retrieved by
- // iteratively calling NextGlyph.
- func (l *Shaper) Layout(params Parameters, txt io.Reader) {
- l.init()
- l.layoutText(params, txt, "")
- }
- // LayoutString is Layout for strings.
- func (l *Shaper) LayoutString(params Parameters, str string) {
- l.init()
- l.layoutText(params, nil, str)
- }
- func (l *Shaper) reset(align Alignment) {
- l.line, l.run, l.glyph, l.advance = 0, 0, 0, 0
- l.done = false
- l.txt.reset()
- l.txt.alignment = align
- }
- // layoutText lays out a large text document by breaking it into paragraphs and laying
- // out each of them separately. This allows the shaping results to be cached independently
- // by paragraph. Only one of txt and str should be provided.
- func (l *Shaper) layoutText(params Parameters, txt io.Reader, str string) {
- l.reset(params.Alignment)
- if txt == nil && len(str) == 0 {
- l.txt.append(l.layoutParagraph(params, "", nil))
- return
- }
- l.reader.Reset(txt)
- truncating := params.MaxLines > 0
- var done bool
- var endByte int
- for !done {
- l.paragraph = l.paragraph[:0]
- if txt != nil {
- for {
- b, err := l.reader.ReadByte()
- if err != nil {
- // EOF or any other error ends processing here.
- done = true
- break
- }
- l.paragraph = append(l.paragraph, b)
- if b == '\n' {
- break
- }
- }
- if !done {
- _, re := l.reader.ReadByte()
- done = re != nil
- if !done {
- _ = l.reader.UnreadByte()
- }
- }
- } else {
- idx := strings.IndexByte(str, '\n')
- if idx == -1 {
- done = true
- endByte = len(str)
- } else {
- endByte = idx + 1
- done = endByte == len(str)
- }
- }
- if len(str[:endByte]) > 0 || (len(l.paragraph) > 0 || len(l.txt.lines) == 0) {
- params.forceTruncate = truncating && !done
- lines := l.layoutParagraph(params, str[:endByte], l.paragraph)
- if truncating {
- params.MaxLines -= len(lines.lines)
- if params.MaxLines == 0 {
- done = true
- // We've truncated the text, but we need to account for all of the runes we never
- // decoded in the truncator.
- var unreadRunes int
- if txt == nil {
- unreadRunes = utf8.RuneCountInString(str[endByte:])
- } else {
- for {
- _, _, e := l.reader.ReadRune()
- if e != nil {
- break
- }
- unreadRunes++
- }
- }
- l.txt.unreadRuneCount = unreadRunes
- }
- }
- l.txt.append(lines)
- }
- if done {
- return
- }
- str = str[endByte:]
- }
- }
- // layoutParagraph shapes and wraps a paragraph using the provided parameters.
- // It accepts the paragraph data in either string or rune format, preferring the
- // string in order to hit the shaper cache more quickly.
- func (l *Shaper) layoutParagraph(params Parameters, asStr string, asBytes []byte) document {
- if l == nil {
- return document{}
- }
- if len(asStr) == 0 && len(asBytes) > 0 {
- asStr = string(asBytes)
- }
- // Alignment is not part of the cache key because changing it does not impact shaping.
- lk := layoutKey{
- ppem: params.PxPerEm,
- maxWidth: params.MaxWidth,
- minWidth: params.MinWidth,
- maxLines: params.MaxLines,
- truncator: params.Truncator,
- locale: params.Locale,
- font: params.Font,
- forceTruncate: params.forceTruncate,
- wrapPolicy: params.WrapPolicy,
- str: asStr,
- lineHeight: params.LineHeight,
- lineHeightScale: params.LineHeightScale,
- }
- if l, ok := l.layoutCache.Get(lk); ok {
- return l
- }
- lines := l.shaper.LayoutRunes(params, []rune(asStr))
- l.layoutCache.Put(lk, lines)
- return lines
- }
- // NextGlyph returns the next glyph from the most recent shaping operation, if
- // any. If there are no more glyphs, ok will be false.
- func (l *Shaper) NextGlyph() (_ Glyph, ok bool) {
- l.init()
- if l.done {
- return Glyph{}, false
- }
- for {
- if l.line == len(l.txt.lines) {
- if l.brokeParagraph {
- l.brokeParagraph = false
- return l.pararagraphStart, true
- }
- if l.err == nil {
- l.err = io.EOF
- }
- return Glyph{}, false
- }
- line := l.txt.lines[l.line]
- if l.run == len(line.runs) {
- l.line++
- l.run = 0
- continue
- }
- run := line.runs[l.run]
- align := l.txt.alignment.Align(line.direction, line.width, l.txt.alignWidth)
- if l.line == 0 && l.run == 0 && len(run.Glyphs) == 0 {
- // The very first run is empty, which will only happen when the
- // entire text is a shaped empty string. Return a single synthetic
- // glyph to provide ascent/descent information to the caller.
- l.done = true
- return Glyph{
- X: align,
- Y: int32(line.yOffset),
- Runes: 0,
- Flags: FlagLineBreak | FlagClusterBreak | FlagRunBreak,
- Ascent: line.ascent,
- Descent: line.descent,
- }, true
- }
- if l.glyph == len(run.Glyphs) {
- l.run++
- l.glyph = 0
- l.advance = 0
- continue
- }
- glyphIdx := l.glyph
- rtl := run.Direction.Progression() == system.TowardOrigin
- if rtl {
- // If RTL, traverse glyphs backwards to ensure rune order.
- glyphIdx = len(run.Glyphs) - 1 - glyphIdx
- }
- g := run.Glyphs[glyphIdx]
- if rtl {
- // Modify the advance prior to computing runOffset to ensure that the
- // current glyph's width is subtracted in RTL.
- l.advance += g.xAdvance
- }
- // runOffset computes how far into the run the dot should be positioned.
- runOffset := l.advance
- if rtl {
- runOffset = run.Advance - l.advance
- }
- glyph := Glyph{
- ID: g.id,
- X: align + run.X + runOffset,
- Y: int32(line.yOffset),
- Ascent: line.ascent,
- Descent: line.descent,
- Advance: g.xAdvance,
- Runes: uint16(g.runeCount),
- Offset: fixed.Point26_6{
- X: g.xOffset,
- Y: g.yOffset,
- },
- Bounds: g.bounds,
- }
- if run.truncator {
- glyph.Flags |= FlagTruncator
- }
- l.glyph++
- if !rtl {
- l.advance += g.xAdvance
- }
- endOfRun := l.glyph == len(run.Glyphs)
- if endOfRun {
- glyph.Flags |= FlagRunBreak
- }
- endOfLine := endOfRun && l.run == len(line.runs)-1
- if endOfLine {
- glyph.Flags |= FlagLineBreak
- }
- endOfText := endOfLine && l.line == len(l.txt.lines)-1
- nextGlyph := l.glyph
- if rtl {
- nextGlyph = len(run.Glyphs) - 1 - nextGlyph
- }
- endOfCluster := endOfRun || run.Glyphs[nextGlyph].clusterIndex != g.clusterIndex
- if run.truncator {
- // Only emit a single cluster for the entire truncator sequence.
- endOfCluster = endOfRun
- }
- if endOfCluster {
- glyph.Flags |= FlagClusterBreak
- if run.truncator {
- glyph.Runes += uint16(l.txt.unreadRuneCount)
- }
- } else {
- glyph.Runes = 0
- }
- if run.Direction.Progression() == system.TowardOrigin {
- glyph.Flags |= FlagTowardOrigin
- }
- if l.brokeParagraph {
- glyph.Flags |= FlagParagraphStart
- l.brokeParagraph = false
- }
- if g.glyphCount == 0 {
- glyph.Flags |= FlagParagraphBreak
- l.brokeParagraph = true
- if endOfText {
- l.pararagraphStart = Glyph{
- Ascent: glyph.Ascent,
- Descent: glyph.Descent,
- Flags: FlagParagraphStart | FlagLineBreak | FlagRunBreak | FlagClusterBreak,
- }
- // If a glyph is both a paragraph break and the final glyph, it's a newline
- // at the end of the text. We must inform widgets like the text editor
- // of a valid cursor position they can use for "after" such a newline,
- // taking text alignment into account.
- l.pararagraphStart.X = l.txt.alignment.Align(line.direction, 0, l.txt.alignWidth)
- l.pararagraphStart.Y = glyph.Y + int32((glyph.Ascent + glyph.Descent).Ceil())
- }
- }
- return glyph, true
- }
- }
- const (
- facebits = 16
- sizebits = 16
- gidbits = 64 - facebits - sizebits
- )
- // newGlyphID encodes a face and a glyph id into a GlyphID.
- func newGlyphID(ppem fixed.Int26_6, faceIdx int, gid font.GID) GlyphID {
- if gid&^((1<<gidbits)-1) != 0 {
- panic("glyph id out of bounds")
- }
- if faceIdx&^((1<<facebits)-1) != 0 {
- panic("face index out of bounds")
- }
- if ppem&^((1<<sizebits)-1) != 0 {
- panic("ppem out of bounds")
- }
- // Mask off the upper 16 bits of ppem. This still allows values up to
- // 1023.
- ppem &= ((1 << sizebits) - 1)
- return GlyphID(faceIdx)<<(gidbits+sizebits) | GlyphID(ppem)<<(gidbits) | GlyphID(gid)
- }
- // splitGlyphID is the opposite of newGlyphID.
- func splitGlyphID(g GlyphID) (fixed.Int26_6, int, font.GID) {
- faceIdx := int(uint64(g) >> (gidbits + sizebits))
- ppem := fixed.Int26_6((g & ((1<<sizebits - 1) << gidbits)) >> gidbits)
- gid := font.GID(g) & (1<<gidbits - 1)
- return ppem, faceIdx, gid
- }
- // Shape converts the provided glyphs into a path. The path will enclose the forms
- // of all vector glyphs.
- // All glyphs are expected to be from a single line of text (their Y offsets are ignored).
- func (l *Shaper) Shape(gs []Glyph) clip.PathSpec {
- l.init()
- key := l.pathCache.hashGlyphs(gs)
- shape, ok := l.pathCache.Get(key, gs)
- if ok {
- return shape
- }
- pathOps := new(op.Ops)
- shape = l.shaper.Shape(pathOps, gs)
- l.pathCache.Put(key, gs, shape)
- return shape
- }
- // Bitmaps extracts bitmap glyphs from the provided slice and creates an op.CallOp to present
- // them. The returned op.CallOp will align correctly with the return value of Shape() for the
- // same gs slice.
- // All glyphs are expected to be from a single line of text (their Y offsets are ignored).
- func (l *Shaper) Bitmaps(gs []Glyph) op.CallOp {
- l.init()
- key := l.bitmapShapeCache.hashGlyphs(gs)
- call, ok := l.bitmapShapeCache.Get(key, gs)
- if ok {
- return call
- }
- callOps := new(op.Ops)
- call = l.shaper.Bitmaps(callOps, gs)
- l.bitmapShapeCache.Put(key, gs, call)
- return call
- }
|