From 4482a914f52311356f6f4b7a695d4075ca22c0c6 Mon Sep 17 00:00:00 2001
From: Meng Zhuo <mzh@golangcn.org>
Date: Tue, 17 Nov 2020 16:53:38 +0800
Subject: [PATCH 01/40] internal/language: fix resizeRange index wrong way

Fixes golang/go#42536

Change-Id: I572cdbb26d320c4d9a972d555ddc6427ce1f0348
Reviewed-on: https://go-review.googlesource.com/c/text/+/270697
Run-TryBot: Meng Zhuo <mzh@golangcn.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
Trust: Meng Zhuo <mzh@golangcn.org>
---
 internal/language/parse.go | 11 ++++++-----
 language/parse_test.go     |  1 +
 2 files changed, 7 insertions(+), 5 deletions(-)

diff --git a/internal/language/parse.go b/internal/language/parse.go
index 2be83e1da..a2fdad89d 100644
--- a/internal/language/parse.go
+++ b/internal/language/parse.go
@@ -133,14 +133,15 @@ func (s *scanner) resizeRange(oldStart, oldEnd, newSize int) {
 	s.start = oldStart
 	if end := oldStart + newSize; end != oldEnd {
 		diff := end - oldEnd
-		if end < cap(s.b) {
-			b := make([]byte, len(s.b)+diff)
+		var b []byte
+		if n := len(s.b) + diff; n > cap(s.b) {
+			b = make([]byte, n)
 			copy(b, s.b[:oldStart])
-			copy(b[end:], s.b[oldEnd:])
-			s.b = b
 		} else {
-			s.b = append(s.b[end:], s.b[oldEnd:]...)
+			b = s.b[:n:n]
 		}
+		copy(b[end:], s.b[oldEnd:])
+		s.b = b
 		s.next = end + (s.next - s.end)
 		s.end = end
 	}
diff --git a/language/parse_test.go b/language/parse_test.go
index 2ff28bfd3..041660c4e 100644
--- a/language/parse_test.go
+++ b/language/parse_test.go
@@ -318,6 +318,7 @@ func TestParseAcceptLanguage(t *testing.T) {
 		{nil, "aa;q", false},
 		{nil, "aa;q=", false},
 		{nil, "aa;q=.", false},
+		{nil, "00-t-0o", false},
 
 		// odd fallbacks
 		{

From 967b8f6126b019daebc17c221889cb59560fa8d1 Mon Sep 17 00:00:00 2001
From: Patrick Gundlach <gundlach@speedata.de>
Date: Thu, 5 Nov 2020 13:15:10 +0100
Subject: [PATCH 02/40] text/unicode/bidi: implement API, remove panics

The bidi API splits strings with mixed left-to-right (ltr) and
right-to-left (rtl) parts into substrings (segments). Each segment
contains a substring, a direction of text flow (either ltr or rtl)
and the start and end positions in the input.

The paragraph validators do not panic, instead the newParagraph function
returns an error message in case the input is invalid.

Fixes golang/go#42356

Change-Id: I90cafc8fadb0cf6936dfb1ab373586017147d709
Reviewed-on: https://go-review.googlesource.com/c/text/+/267857
Trust: Ian Lance Taylor <iant@golang.org>
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
---
 unicode/bidi/bidi.go      | 221 ++++++++++++++++++++----
 unicode/bidi/bidi_test.go | 347 ++++++++++++++++++++++++++++++++++++++
 unicode/bidi/core.go      |  63 ++++---
 unicode/bidi/core_test.go |  10 +-
 4 files changed, 584 insertions(+), 57 deletions(-)
 create mode 100644 unicode/bidi/bidi_test.go

diff --git a/unicode/bidi/bidi.go b/unicode/bidi/bidi.go
index e8edc54cc..fd057601b 100644
--- a/unicode/bidi/bidi.go
+++ b/unicode/bidi/bidi.go
@@ -12,15 +12,14 @@
 // and without notice.
 package bidi // import "golang.org/x/text/unicode/bidi"
 
-// TODO:
-// The following functionality would not be hard to implement, but hinges on
-// the definition of a Segmenter interface. For now this is up to the user.
-// - Iterate over paragraphs
-// - Segmenter to iterate over runs directly from a given text.
-// Also:
+// TODO
 // - Transformer for reordering?
 // - Transformer (validator, really) for Bidi Rule.
 
+import (
+	"bytes"
+)
+
 // This API tries to avoid dealing with embedding levels for now. Under the hood
 // these will be computed, but the question is to which extent the user should
 // know they exist. We should at some point allow the user to specify an
@@ -49,7 +48,9 @@ const (
 	Neutral
 )
 
-type options struct{}
+type options struct {
+	defaultDirection Direction
+}
 
 // An Option is an option for Bidi processing.
 type Option func(*options)
@@ -66,12 +67,62 @@ type Option func(*options)
 // DefaultDirection sets the default direction for a Paragraph. The direction is
 // overridden if the text contains directional characters.
 func DefaultDirection(d Direction) Option {
-	panic("unimplemented")
+	return func(opts *options) {
+		opts.defaultDirection = d
+	}
 }
 
 // A Paragraph holds a single Paragraph for Bidi processing.
 type Paragraph struct {
-	// buffers
+	p          []byte
+	o          Ordering
+	opts       []Option
+	types      []Class
+	pairTypes  []bracketType
+	pairValues []rune
+	runes      []rune
+	options    options
+}
+
+// Initialize the p.pairTypes, p.pairValues and p.types from the input previously
+// set by p.SetBytes() or p.SetString(). Also limit the input up to (and including) a paragraph
+// separator (bidi class B).
+//
+// The function p.Order() needs these values to be set, so this preparation could be postponed.
+// But since the SetBytes and SetString functions return the length of the input up to the paragraph
+// separator, the whole input needs to be processed anyway and should not be done twice.
+//
+// The function has the same return values as SetBytes() / SetString()
+func (p *Paragraph) prepareInput() (n int, err error) {
+	p.runes = bytes.Runes(p.p)
+	bytecount := 0
+	// clear slices from previous SetString or SetBytes
+	p.pairTypes = nil
+	p.pairValues = nil
+	p.types = nil
+
+	for _, r := range p.runes {
+		props, i := LookupRune(r)
+		bytecount += i
+		cls := props.Class()
+		if cls == B {
+			return bytecount, nil
+		}
+		p.types = append(p.types, cls)
+		if props.IsOpeningBracket() {
+			p.pairTypes = append(p.pairTypes, bpOpen)
+			p.pairValues = append(p.pairValues, r)
+		} else if props.IsBracket() {
+			// this must be a closing bracket,
+			// since IsOpeningBracket is not true
+			p.pairTypes = append(p.pairTypes, bpClose)
+			p.pairValues = append(p.pairValues, r)
+		} else {
+			p.pairTypes = append(p.pairTypes, bpNone)
+			p.pairValues = append(p.pairValues, 0)
+		}
+	}
+	return bytecount, nil
 }
 
 // SetBytes configures p for the given paragraph text. It replaces text
@@ -80,70 +131,150 @@ type Paragraph struct {
 // consumed from b including this separator. Error may be non-nil if options are
 // given.
 func (p *Paragraph) SetBytes(b []byte, opts ...Option) (n int, err error) {
-	panic("unimplemented")
+	p.p = b
+	p.opts = opts
+	return p.prepareInput()
 }
 
-// SetString configures p for the given paragraph text. It replaces text
-// previously set by SetBytes or SetString. If b contains a paragraph separator
+// SetString configures p for the given paragraph text. It replaces text
+// previously set by SetBytes or SetString. If s contains a paragraph separator
 // it will only process the first paragraph and report the number of bytes
-// consumed from b including this separator. Error may be non-nil if options are
+// consumed from s including this separator. Error may be non-nil if options are
 // given.
 func (p *Paragraph) SetString(s string, opts ...Option) (n int, err error) {
-	panic("unimplemented")
+	p.p = []byte(s)
+	p.opts = opts
+	return p.prepareInput()
 }
 
 // IsLeftToRight reports whether the principle direction of rendering for this
 // paragraphs is left-to-right. If this returns false, the principle direction
 // of rendering is right-to-left.
 func (p *Paragraph) IsLeftToRight() bool {
-	panic("unimplemented")
+	return p.Direction() == LeftToRight
 }
 
 // Direction returns the direction of the text of this paragraph.
 //
 // The direction may be LeftToRight, RightToLeft, Mixed, or Neutral.
 func (p *Paragraph) Direction() Direction {
-	panic("unimplemented")
+	return p.o.Direction()
 }
 
+// TODO: what happens if the position is > len(input)? This should return an error.
+
 // RunAt reports the Run at the given position of the input text.
 //
 // This method can be used for computing line breaks on paragraphs.
 func (p *Paragraph) RunAt(pos int) Run {
-	panic("unimplemented")
+	c := 0 // number of runes covered by the runs visited so far
+	for i, r := range p.o.runes {
+		c += len(r)
+		if pos < c {
+			// First run that extends past pos; return now so later runs cannot override it.
+			return p.o.Run(i)
+		}
+	}
+	return p.o.Run(0) // pos lies beyond the last run: keep the previous fallback to the first run
+}
+
+// calculateOrdering splits runes into maximal runs of a single direction. Even
+// levels (0,2,4,...) are left to right, odd levels (1,3,5,...) right to left.
+func calculateOrdering(levels []level, runes []rune) Ordering {
+	var curDir Direction
+	prevDir := Neutral
+	prevI := 0
+	o := Ordering{}
+	// Only runes[:len(levels)] is covered by levels; prepareInput keeps every
+	// rune of the input but stops classifying at a paragraph separator.
+	for i, lvl := range levels {
+		if lvl%2 == 0 {
+			curDir = LeftToRight
+		} else {
+			curDir = RightToLeft
+		}
+		if curDir != prevDir {
+			if i > 0 {
+				o.runes = append(o.runes, runes[prevI:i])
+				o.directions = append(o.directions, prevDir)
+				o.startpos = append(o.startpos, prevI)
+			}
+			prevI = i
+			prevDir = curDir
+		}
+	}
+	o.runes = append(o.runes, runes[prevI:len(levels)])
+	o.directions = append(o.directions, prevDir)
+	o.startpos = append(o.startpos, prevI)
+	return o
 }
 
 // Order computes the visual ordering of all the runs in a Paragraph.
 func (p *Paragraph) Order() (Ordering, error) {
-	panic("unimplemented")
+	if len(p.types) == 0 {
+		return Ordering{}, nil
+	}
+
+	for _, fn := range p.opts {
+		fn(&p.options)
+	}
+	lvl := level(-1)
+	if p.options.defaultDirection == RightToLeft {
+		lvl = 1
+	}
+	para, err := newParagraph(p.types, p.pairTypes, p.pairValues, lvl)
+	if err != nil {
+		return Ordering{}, err
+	}
+
+	levels := para.getLevels([]int{len(p.types)})
+
+	p.o = calculateOrdering(levels, p.runes)
+	return p.o, nil
 }
 
 // Line computes the visual ordering of runs for a single line starting and
 // ending at the given positions in the original text.
 func (p *Paragraph) Line(start, end int) (Ordering, error) {
-	panic("unimplemented")
+	lineTypes := p.types[start:end]
+	para, err := newParagraph(lineTypes, p.pairTypes[start:end], p.pairValues[start:end], -1)
+	if err != nil {
+		return Ordering{}, err
+	}
+	levels := para.getLevels([]int{len(lineTypes)})
+	o := calculateOrdering(levels, p.runes[start:end])
+	return o, nil
 }
 
 // An Ordering holds the computed visual order of runs of a Paragraph. Calling
 // SetBytes or SetString on the originating Paragraph invalidates an Ordering.
 // The methods of an Ordering should only be called by one goroutine at a time.
-type Ordering struct{}
+type Ordering struct {
+	runes      [][]rune
+	directions []Direction
+	startpos   []int
+}
 
 // Direction reports the directionality of the runs.
 //
 // The direction may be LeftToRight, RightToLeft, Mixed, or Neutral.
 func (o *Ordering) Direction() Direction {
-	panic("unimplemented")
+	return o.directions[0]
 }
 
 // NumRuns returns the number of runs.
 func (o *Ordering) NumRuns() int {
-	panic("unimplemented")
+	return len(o.runes)
 }
 
 // Run returns the ith run within the ordering.
 func (o *Ordering) Run(i int) Run {
-	panic("unimplemented")
+	r := Run{
+		runes:     o.runes[i],
+		direction: o.directions[i],
+		startpos:  o.startpos[i],
+	}
+	return r
 }
 
 // TODO: perhaps with options.
@@ -155,16 +286,19 @@ func (o *Ordering) Run(i int) Run {
 
 // A Run is a continuous sequence of characters of a single direction.
 type Run struct {
+	runes     []rune
+	direction Direction
+	startpos  int
 }
 
 // String returns the text of the run in its original order.
 func (r *Run) String() string {
-	panic("unimplemented")
+	return string(r.runes)
 }
 
 // Bytes returns the text of the run in its original order.
 func (r *Run) Bytes() []byte {
-	panic("unimplemented")
+	return []byte(r.String())
 }
 
 // TODO: methods for
@@ -174,25 +308,52 @@ func (r *Run) Bytes() []byte {
 
 // Direction reports the direction of the run.
 func (r *Run) Direction() Direction {
-	panic("unimplemented")
+	return r.direction
 }
 
-// Position of the Run within the text passed to SetBytes or SetString of the
+// Pos returns the position of the Run within the text passed to SetBytes or SetString of the
 // originating Paragraph value.
 func (r *Run) Pos() (start, end int) {
-	panic("unimplemented")
+	return r.startpos, r.startpos + len(r.runes) - 1
 }
 
 // AppendReverse reverses the order of characters of in, appends them to out,
 // and returns the result. Modifiers will still follow the runes they modify.
 // Brackets are replaced with their counterparts.
 func AppendReverse(out, in []byte) []byte {
-	panic("unimplemented")
+	ret := make([]byte, len(in)+len(out))
+	copy(ret, out)
+	inRunes := bytes.Runes(in)
+
+	for i, r := range inRunes {
+		prop, _ := LookupRune(r)
+		if prop.IsBracket() {
+			inRunes[i] = prop.reverseBracket(r)
+		}
+	}
+
+	for i, j := 0, len(inRunes)-1; i < j; i, j = i+1, j-1 {
+		inRunes[i], inRunes[j] = inRunes[j], inRunes[i]
+	}
+	copy(ret[len(out):], string(inRunes))
+
+	return ret
 }
 
 // ReverseString reverses the order of characters in s and returns a new string.
 // Modifiers will still follow the runes they modify. Brackets are replaced with
 // their counterparts.
 func ReverseString(s string) string {
-	panic("unimplemented")
+	input := []rune(s)
+	li := len(input)
+	ret := make([]rune, li)
+	for i, r := range input {
+		prop, _ := LookupRune(r)
+		if prop.IsBracket() {
+			ret[li-i-1] = prop.reverseBracket(r)
+		} else {
+			ret[li-i-1] = r
+		}
+	}
+	return string(ret)
 }
diff --git a/unicode/bidi/bidi_test.go b/unicode/bidi/bidi_test.go
new file mode 100644
index 000000000..88572f565
--- /dev/null
+++ b/unicode/bidi/bidi_test.go
@@ -0,0 +1,347 @@
+package bidi
+
+import (
+	"log"
+	"testing"
+)
+
+type runInformation struct {
+	str   string
+	dir   Direction
+	start int
+	end   int
+}
+
+func TestSimple(t *testing.T) {
+	str := "Hellö"
+	p := Paragraph{}
+	p.SetString(str)
+	order, err := p.Order()
+	if err != nil {
+		log.Fatal(err)
+	}
+	expectedRuns := []runInformation{
+		{"Hellö", LeftToRight, 0, 4},
+	}
+
+	if !p.IsLeftToRight() {
+		t.Error("p.IsLeftToRight() == false; want true")
+	}
+	if nr, want := order.NumRuns(), len(expectedRuns); nr != want {
+		t.Errorf("order.NumRuns() = %d; want %d", nr, want)
+	}
+	for i, want := range expectedRuns {
+		r := order.Run(i)
+		if got := r.String(); got != want.str {
+			t.Errorf("Run(%d) = %q; want %q", i, got, want.str)
+		}
+		if s, e := r.Pos(); s != want.start || e != want.end {
+			t.Errorf("Run(%d).start = %d, .end = %d; want start %d, end %d", i, s, e, want.start, want.end)
+		}
+		if d := r.Direction(); d != want.dir {
+			t.Errorf("Run(%d).Direction = %d; want %d", i, d, want.dir)
+		}
+	}
+}
+
+func TestMixed(t *testing.T) {
+	str := `العاشر ليونيكود (Unicode Conference)، الذي سيعقد في 10-12 آذار 1997 مبدينة`
+	p := Paragraph{}
+	p.SetString(str)
+	order, err := p.Order()
+	if err != nil {
+		log.Fatal(err)
+	}
+	if p.IsLeftToRight() {
+		t.Error("p.IsLeftToRight() == true; want false")
+	}
+
+	expectedRuns := []runInformation{
+		{"العاشر ليونيكود (", RightToLeft, 0, 16},
+		{"Unicode Conference", LeftToRight, 17, 34},
+		{")، الذي سيعقد في ", RightToLeft, 35, 51},
+		{"10", LeftToRight, 52, 53},
+		{"-", RightToLeft, 54, 54},
+		{"12", LeftToRight, 55, 56},
+		{" آذار ", RightToLeft, 57, 62},
+		{"1997", LeftToRight, 63, 66},
+		{" مبدينة", RightToLeft, 67, 73},
+	}
+
+	if nr, want := order.NumRuns(), len(expectedRuns); nr != want {
+		t.Errorf("order.NumRuns() = %d; want %d", nr, want)
+	}
+
+	for i, want := range expectedRuns {
+		r := order.Run(i)
+		if got := r.String(); got != want.str {
+			t.Errorf("Run(%d) = %q; want %q", i, got, want.str)
+		}
+		if s, e := r.Pos(); s != want.start || e != want.end {
+			t.Errorf("Run(%d).start = %d, .end = %d; want start = %d, end = %d", i, s, e, want.start, want.end)
+		}
+		if d := r.Direction(); d != want.dir {
+			t.Errorf("Run(%d).Direction = %d; want %d", i, d, want.dir)
+		}
+	}
+}
+
+func TestExplicitIsolate(t *testing.T) {
+	// https://www.w3.org/International/articles/inline-bidi-markup/uba-basics.en#beyond
+	str := "The names of these states in Arabic are \u2067مصر\u2069, \u2067البحرين\u2069 and \u2067الكويت\u2069 respectively."
+	p := Paragraph{}
+	p.SetString(str)
+	order, err := p.Order()
+	if err != nil {
+		log.Fatal(err)
+	}
+	if !p.IsLeftToRight() {
+		t.Error("p.IsLeftToRight() == false; want true")
+	}
+
+	expectedRuns := []runInformation{
+		{"The names of these states in Arabic are \u2067", LeftToRight, 0, 40},
+		{"مصر", RightToLeft, 41, 43},
+		{"\u2069, \u2067", LeftToRight, 44, 47},
+		{"البحرين", RightToLeft, 48, 54},
+		{"\u2069 and \u2067", LeftToRight, 55, 61},
+		{"الكويت", RightToLeft, 62, 67},
+		{"\u2069 respectively.", LeftToRight, 68, 82},
+	}
+
+	if nr, want := order.NumRuns(), len(expectedRuns); nr != want {
+		t.Errorf("order.NumRuns() = %d; want %d", nr, want)
+	}
+
+	for i, want := range expectedRuns {
+		r := order.Run(i)
+		if got := r.String(); got != want.str {
+			t.Errorf("Run(%d) = %q; want %q", i, got, want.str)
+		}
+		if s, e := r.Pos(); s != want.start || e != want.end {
+			t.Errorf("Run(%d).start = %d, .end = %d; want start = %d, end = %d", i, s, e, want.start, want.end)
+		}
+		if d := r.Direction(); d != want.dir {
+			t.Errorf("Run(%d).Direction = %d; want %d", i, d, want.dir)
+		}
+	}
+}
+
+func TestWithoutExplicitIsolate(t *testing.T) {
+	str := "The names of these states in Arabic are مصر, البحرين and الكويت respectively."
+	p := Paragraph{}
+	p.SetString(str)
+	order, err := p.Order()
+	if err != nil {
+		log.Fatal(err)
+	}
+	if !p.IsLeftToRight() {
+		t.Error("p.IsLeftToRight() == false; want true")
+	}
+
+	expectedRuns := []runInformation{
+		{"The names of these states in Arabic are ", LeftToRight, 0, 39},
+		{"مصر, البحرين", RightToLeft, 40, 51},
+		{" and ", LeftToRight, 52, 56},
+		{"الكويت", RightToLeft, 57, 62},
+		{" respectively.", LeftToRight, 63, 76},
+	}
+
+	if nr, want := order.NumRuns(), len(expectedRuns); nr != want {
+		t.Errorf("order.NumRuns() = %d; want %d", nr, want)
+	}
+
+	for i, want := range expectedRuns {
+		r := order.Run(i)
+		if got := r.String(); got != want.str {
+			t.Errorf("Run(%d) = %q; want %q", i, got, want.str)
+		}
+		if s, e := r.Pos(); s != want.start || e != want.end {
+			t.Errorf("Run(%d).start = %d, .end = %d; want start = %d, end = %d", i, s, e, want.start, want.end)
+		}
+		if d := r.Direction(); d != want.dir {
+			t.Errorf("Run(%d).Direction = %d; want %d", i, d, want.dir)
+		}
+	}
+}
+
+func TestLongUTF8(t *testing.T) {
+	str := `𠀀`
+	p := Paragraph{}
+	p.SetString(str)
+	order, err := p.Order()
+	if err != nil {
+		log.Fatal(err)
+	}
+	if !p.IsLeftToRight() {
+		t.Error("p.IsLeftToRight() == false; want true")
+	}
+
+	expectedRuns := []runInformation{
+		{"𠀀", LeftToRight, 0, 0},
+	}
+
+	if nr, want := order.NumRuns(), len(expectedRuns); nr != want {
+		t.Errorf("order.NumRuns() = %d; want %d", nr, want)
+	}
+
+	for i, want := range expectedRuns {
+		r := order.Run(i)
+		if got := r.String(); got != want.str {
+			t.Errorf("Run(%d) = %q; want %q", i, got, want.str)
+		}
+		if s, e := r.Pos(); s != want.start || e != want.end {
+			t.Errorf("Run(%d).start = %d, .end = %d; want start = %d, end = %d", i, s, e, want.start, want.end)
+		}
+		if d := r.Direction(); d != want.dir {
+			t.Errorf("Run(%d).Direction = %d; want %d", i, d, want.dir)
+		}
+	}
+}
+
+func TestLLongUTF8(t *testing.T) {
+	strTester := []struct {
+		str string
+		l   int
+	}{
+		{"ö", 2},
+		{"ॡ", 3},
+		{`𠀀`, 4},
+	}
+	for _, st := range strTester {
+		str := st.str
+		want := st.l
+		if _, l := LookupString(str); l != want {
+			t.Errorf("LookupString(%q) length = %d; want %d", str, l, want)
+		}
+
+	}
+
+}
+
+func TestMixedSimple(t *testing.T) {
+	str := `Uا`
+	p := Paragraph{}
+	p.SetString(str)
+	order, err := p.Order()
+	if err != nil {
+		log.Fatal(err)
+	}
+	if !p.IsLeftToRight() {
+		t.Error("p.IsLeftToRight() == false; want true")
+	}
+
+	expectedRuns := []runInformation{
+		{"U", LeftToRight, 0, 0},
+		{"ا", RightToLeft, 1, 1},
+	}
+
+	if nr, want := order.NumRuns(), len(expectedRuns); nr != want {
+		t.Errorf("order.NumRuns() = %d; want %d", nr, want)
+	}
+
+	for i, want := range expectedRuns {
+		r := order.Run(i)
+		if got := r.String(); got != want.str {
+			t.Errorf("Run(%d) = %q; want %q", i, got, want.str)
+		}
+		if s, e := r.Pos(); s != want.start || e != want.end {
+			t.Errorf("Run(%d).start = %d, .end = %d; want start = %d, end = %d", i, s, e, want.start, want.end)
+		}
+		if d := r.Direction(); d != want.dir {
+			t.Errorf("Run(%d).Direction = %d; want %d", i, d, want.dir)
+		}
+	}
+}
+
+func TestDefaultDirection(t *testing.T) {
+	str := "+"
+	p := Paragraph{}
+	p.SetString(str, DefaultDirection(RightToLeft))
+	_, err := p.Order()
+	if err != nil {
+		t.Error(err)
+		t.Fail()
+	}
+	if want, dir := false, p.IsLeftToRight(); want != dir {
+		t.Errorf("p.IsLeftToRight() = %t; want %t", dir, want)
+	}
+	p.SetString(str, DefaultDirection(LeftToRight))
+	_, err = p.Order()
+	if err != nil {
+		t.Error(err)
+		t.Fail()
+	}
+	if want, dir := true, p.IsLeftToRight(); want != dir {
+		t.Errorf("p.IsLeftToRight() = %t; want %t", dir, want)
+	}
+
+}
+
+func TestEmpty(t *testing.T) {
+	p := Paragraph{}
+	p.SetBytes([]byte{})
+	o, err := p.Order()
+	if err != nil {
+		t.Error("p.Order() return err != nil; want err == nil")
+	}
+	if nr := o.NumRuns(); nr != 0 {
+		t.Errorf("o.NumRuns() = %d; want 0", nr)
+	}
+}
+
+func TestNewline(t *testing.T) {
+	str := "Hello\nworld"
+	p := Paragraph{}
+	n, err := p.SetString(str)
+	if err != nil {
+		t.Error(err)
+	}
+	// 6 is the length up to and including the \n
+	if want := 6; n != want {
+		t.Errorf("SetString(%q) = nil, %d; want nil, %d", str, n, want)
+	}
+}
+
+func TestDoubleSetString(t *testing.T) {
+	str := "العاشر ليونيكود (Unicode Conference)،"
+	p := Paragraph{}
+	_, err := p.SetString(str)
+	if err != nil {
+		t.Error(err)
+	}
+	_, err = p.SetString(str)
+	if err != nil {
+		t.Error(err)
+	}
+	_, err = p.Order()
+	if err != nil {
+		t.Error(err)
+	}
+}
+
+func TestReverseString(t *testing.T) {
+	input := "(Hello)"
+	want := "(olleH)"
+	if str := ReverseString(input); str != want {
+		t.Errorf("ReverseString(%s) = %q; want %q", input, str, want)
+	}
+}
+
+func TestAppendReverse(t *testing.T) {
+	testcase := []struct {
+		inString  string
+		outString string
+		want      string
+	}{
+		{"", "Hëllo", "Hëllo"},
+		{"nice (wörld)", "", "(dlröw) ecin"},
+		{"nice (wörld)", "Hëllo", "Hëllo(dlröw) ecin"},
+	}
+	for _, tc := range testcase {
+		if r := AppendReverse([]byte(tc.outString), []byte(tc.inString)); string(r) != tc.want {
+			t.Errorf("AppendReverse([]byte(%q), []byte(%q) = %q; want %q", tc.outString, tc.inString, string(r), tc.want)
+		}
+	}
+
+}
diff --git a/unicode/bidi/core.go b/unicode/bidi/core.go
index 50deb6600..e4c081101 100644
--- a/unicode/bidi/core.go
+++ b/unicode/bidi/core.go
@@ -4,7 +4,10 @@
 
 package bidi
 
-import "log"
+import (
+	"fmt"
+	"log"
+)
 
 // This implementation is a port based on the reference implementation found at:
 // https://www.unicode.org/Public/PROGRAMS/BidiReferenceJava/
@@ -97,13 +100,20 @@ type paragraph struct {
 // rune (suggested is the rune of the open bracket for opening and matching
 // close brackets, after normalization). The embedding levels are optional, but
 // may be supplied to encode embedding levels of styled text.
-//
-// TODO: return an error.
-func newParagraph(types []Class, pairTypes []bracketType, pairValues []rune, levels level) *paragraph {
-	validateTypes(types)
-	validatePbTypes(pairTypes)
-	validatePbValues(pairValues, pairTypes)
-	validateParagraphEmbeddingLevel(levels)
+func newParagraph(types []Class, pairTypes []bracketType, pairValues []rune, levels level) (*paragraph, error) {
+	var err error
+	if err = validateTypes(types); err != nil {
+		return nil, err
+	}
+	if err = validatePbTypes(pairTypes); err != nil {
+		return nil, err
+	}
+	if err = validatePbValues(pairValues, pairTypes); err != nil {
+		return nil, err
+	}
+	if err = validateParagraphEmbeddingLevel(levels); err != nil {
+		return nil, err
+	}
 
 	p := &paragraph{
 		initialTypes:   append([]Class(nil), types...),
@@ -115,7 +125,7 @@ func newParagraph(types []Class, pairTypes []bracketType, pairValues []rune, lev
 		resultTypes: append([]Class(nil), types...),
 	}
 	p.run()
-	return p
+	return p, nil
 }
 
 func (p *paragraph) Len() int { return len(p.initialTypes) }
@@ -1001,58 +1011,61 @@ func typeForLevel(level level) Class {
 	return R
 }
 
-// TODO: change validation to not panic
-
-func validateTypes(types []Class) {
+func validateTypes(types []Class) error {
 	if len(types) == 0 {
-		log.Panic("types is null")
+		return fmt.Errorf("types is null")
 	}
 	for i, t := range types[:len(types)-1] {
 		if t == B {
-			log.Panicf("B type before end of paragraph at index: %d", i)
+			return fmt.Errorf("B type before end of paragraph at index: %d", i)
 		}
 	}
+	return nil
 }
 
-func validateParagraphEmbeddingLevel(embeddingLevel level) {
+func validateParagraphEmbeddingLevel(embeddingLevel level) error {
 	if embeddingLevel != implicitLevel &&
 		embeddingLevel != 0 &&
 		embeddingLevel != 1 {
-		log.Panicf("illegal paragraph embedding level: %d", embeddingLevel)
+		return fmt.Errorf("illegal paragraph embedding level: %d", embeddingLevel)
 	}
+	return nil
 }
 
-func validateLineBreaks(linebreaks []int, textLength int) {
+func validateLineBreaks(linebreaks []int, textLength int) error {
 	prev := 0
 	for i, next := range linebreaks {
 		if next <= prev {
-			log.Panicf("bad linebreak: %d at index: %d", next, i)
+			return fmt.Errorf("bad linebreak: %d at index: %d", next, i)
 		}
 		prev = next
 	}
 	if prev != textLength {
-		log.Panicf("last linebreak was %d, want %d", prev, textLength)
+		return fmt.Errorf("last linebreak was %d, want %d", prev, textLength)
 	}
+	return nil
 }
 
-func validatePbTypes(pairTypes []bracketType) {
+func validatePbTypes(pairTypes []bracketType) error {
 	if len(pairTypes) == 0 {
-		log.Panic("pairTypes is null")
+		return fmt.Errorf("pairTypes is null")
 	}
 	for i, pt := range pairTypes {
 		switch pt {
 		case bpNone, bpOpen, bpClose:
 		default:
-			log.Panicf("illegal pairType value at %d: %v", i, pairTypes[i])
+			return fmt.Errorf("illegal pairType value at %d: %v", i, pairTypes[i])
 		}
 	}
+	return nil
 }
 
-func validatePbValues(pairValues []rune, pairTypes []bracketType) {
+func validatePbValues(pairValues []rune, pairTypes []bracketType) error {
 	if pairValues == nil {
-		log.Panic("pairValues is null")
+		return fmt.Errorf("pairValues is null")
 	}
 	if len(pairTypes) != len(pairValues) {
-		log.Panic("pairTypes is different length from pairValues")
+		return fmt.Errorf("pairTypes is different length from pairValues")
 	}
+	return nil
 }
diff --git a/unicode/bidi/core_test.go b/unicode/bidi/core_test.go
index b653399c4..1c928af96 100644
--- a/unicode/bidi/core_test.go
+++ b/unicode/bidi/core_test.go
@@ -55,7 +55,10 @@ func TestBidiCore(t *testing.T) {
 				continue
 			}
 			lev := level(int(i) - 1)
-			par := newParagraph(types, pairTypes, pairValues, lev)
+			par, err := newParagraph(types, pairTypes, pairValues, lev)
+			if err != nil {
+				t.Error(err)
+			}
 
 			if *testLevels {
 				levels := par.getLevels([]int{len(types)})
@@ -142,7 +145,10 @@ func TestBidiCharacters(t *testing.T) {
 				pairValues = append(pairValues, p.reverseBracket(r))
 			}
 		}
-		par := newParagraph(types, pairTypes, pairValues, parLevel)
+		par, err := newParagraph(types, pairTypes, pairValues, parLevel)
+		if err != nil {
+			t.Error(err)
+		}
 
 		// Test results:
 		if got := par.embeddingLevel; got != wantLevel {

From 72ead5faa1c2426bebe794973c1cbbcf0cb89e5c Mon Sep 17 00:00:00 2001
From: Timothy Gu <timothygu99@gmail.com>
Date: Thu, 1 Oct 2020 13:29:14 -0400
Subject: [PATCH 03/40] internal/export/idna: Allow specifying CheckHyphens and
 CheckJoiners

This aligns with the options in the latest version of UTS 46, and in
particular allows implementing the WHATWG URL Standard.

Fixes golang/go#41732.

Change-Id: Iab577eff4303f3eea64512d07d968c891acf126f
Reviewed-on: https://go-review.googlesource.com/c/text/+/258837
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
Reviewed-by: Nigel Tao <nigeltao@golang.org>
Run-TryBot: Marcel van Lohuizen <mpvl@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Trust: Nigel Tao <nigeltao@golang.org>
---
 internal/export/idna/idna10.0.0.go      | 113 ++++++++++++++++--------
 internal/export/idna/idna10.0.0_test.go |   8 ++
 internal/export/idna/idna9.0.0.go       |  93 +++++++++++++------
 internal/export/idna/idna9.0.0_test.go  |   8 ++
 4 files changed, 154 insertions(+), 68 deletions(-)

diff --git a/internal/export/idna/idna10.0.0.go b/internal/export/idna/idna10.0.0.go
index 1244f9ce9..2ceb32768 100644
--- a/internal/export/idna/idna10.0.0.go
+++ b/internal/export/idna/idna10.0.0.go
@@ -65,15 +65,14 @@ func Transitional(transitional bool) Option {
 
 // VerifyDNSLength sets whether a Profile should fail if any of the IDN parts
 // are longer than allowed by the RFC.
+//
+// This option corresponds to the VerifyDnsLength flag in UTS #46.
 func VerifyDNSLength(verify bool) Option {
 	return func(o *options) { o.verifyDNSLength = verify }
 }
 
 // RemoveLeadingDots removes leading label separators. Leading runes that map to
 // dots, such as U+3002 IDEOGRAPHIC FULL STOP, are removed as well.
-//
-// This is the behavior suggested by the UTS #46 and is adopted by some
-// browsers.
 func RemoveLeadingDots(remove bool) Option {
 	return func(o *options) { o.removeLeadingDots = remove }
 }
@@ -81,6 +80,8 @@ func RemoveLeadingDots(remove bool) Option {
 // ValidateLabels sets whether to check the mandatory label validation criteria
 // as defined in Section 5.4 of RFC 5891. This includes testing for correct use
 // of hyphens ('-'), normalization, validity of runes, and the context rules.
+// In particular, ValidateLabels also sets the CheckHyphens and CheckJoiners flags
+// in UTS #46.
 func ValidateLabels(enable bool) Option {
 	return func(o *options) {
 		// Don't override existing mappings, but set one that at least checks
@@ -89,25 +90,48 @@ func ValidateLabels(enable bool) Option {
 			o.mapping = normalize
 		}
 		o.trie = trie
-		o.validateLabels = enable
-		o.fromPuny = validateFromPunycode
+		o.checkJoiners = enable
+		o.checkHyphens = enable
+		if enable {
+			o.fromPuny = validateFromPunycode
+		} else {
+			o.fromPuny = nil
+		}
+	}
+}
+
+// CheckHyphens sets whether to check for correct use of hyphens ('-') in
+// labels. Most web browsers do not have this option set, since labels such as
+// "r3---sn-apo3qvuoxuxbt-j5pe" are in common use.
+//
+// This option corresponds to the CheckHyphens flag in UTS #46.
+func CheckHyphens(enable bool) Option {
+	return func(o *options) { o.checkHyphens = enable }
+}
+
+// CheckJoiners sets whether to check the ContextJ rules as defined in Appendix
+// A of RFC 5892, concerning the use of joiner runes.
+//
+// This option corresponds to the CheckJoiners flag in UTS #46.
+func CheckJoiners(enable bool) Option {
+	return func(o *options) {
+		o.trie = trie
+		o.checkJoiners = enable
 	}
 }
 
 // StrictDomainName limits the set of permissible ASCII characters to those
 // allowed in domain names as defined in RFC 1034 (A-Z, a-z, 0-9 and the
-// hyphen). This is set by default for MapForLookup and ValidateForRegistration.
+// hyphen). This is set by default for MapForLookup and ValidateForRegistration,
+// but is only useful if ValidateLabels is set.
 //
 // This option is useful, for instance, for browsers that allow characters
 // outside this range, for example a '_' (U+005F LOW LINE). See
-// http://www.rfc-editor.org/std/std3.txt for more details This option
-// corresponds to the UseSTD3ASCIIRules option in UTS #46.
+// http://www.rfc-editor.org/std/std3.txt for more details.
+//
+// This option corresponds to the UseSTD3ASCIIRules flag in UTS #46.
 func StrictDomainName(use bool) Option {
-	return func(o *options) {
-		o.trie = trie
-		o.useSTD3Rules = use
-		o.fromPuny = validateFromPunycode
-	}
+	return func(o *options) { o.useSTD3Rules = use }
 }
 
 // NOTE: the following options pull in tables. The tables should not be linked
@@ -115,6 +139,8 @@ func StrictDomainName(use bool) Option {
 
 // BidiRule enables the Bidi rule as defined in RFC 5893. Any application
 // that relies on proper validation of labels should include this rule.
+//
+// This option corresponds to the CheckBidi flag in UTS #46.
 func BidiRule() Option {
 	return func(o *options) { o.bidirule = bidirule.ValidString }
 }
@@ -150,7 +176,8 @@ func MapForLookup() Option {
 type options struct {
 	transitional      bool
 	useSTD3Rules      bool
-	validateLabels    bool
+	checkHyphens      bool
+	checkJoiners      bool
 	verifyDNSLength   bool
 	removeLeadingDots bool
 
@@ -223,8 +250,11 @@ func (p *Profile) String() string {
 	if p.useSTD3Rules {
 		s += ":UseSTD3Rules"
 	}
-	if p.validateLabels {
-		s += ":ValidateLabels"
+	if p.checkHyphens {
+		s += ":CheckHyphens"
+	}
+	if p.checkJoiners {
+		s += ":CheckJoiners"
 	}
 	if p.verifyDNSLength {
 		s += ":VerifyDNSLength"
@@ -252,26 +282,29 @@ var (
 
 	punycode = &Profile{}
 	lookup   = &Profile{options{
-		transitional:   true,
-		useSTD3Rules:   true,
-		validateLabels: true,
-		trie:           trie,
-		fromPuny:       validateFromPunycode,
-		mapping:        validateAndMap,
-		bidirule:       bidirule.ValidString,
+		transitional: true,
+		useSTD3Rules: true,
+		checkHyphens: true,
+		checkJoiners: true,
+		trie:         trie,
+		fromPuny:     validateFromPunycode,
+		mapping:      validateAndMap,
+		bidirule:     bidirule.ValidString,
 	}}
 	display = &Profile{options{
-		useSTD3Rules:   true,
-		validateLabels: true,
-		trie:           trie,
-		fromPuny:       validateFromPunycode,
-		mapping:        validateAndMap,
-		bidirule:       bidirule.ValidString,
+		useSTD3Rules: true,
+		checkHyphens: true,
+		checkJoiners: true,
+		trie:         trie,
+		fromPuny:     validateFromPunycode,
+		mapping:      validateAndMap,
+		bidirule:     bidirule.ValidString,
 	}}
 	registration = &Profile{options{
 		useSTD3Rules:    true,
-		validateLabels:  true,
 		verifyDNSLength: true,
+		checkHyphens:    true,
+		checkJoiners:    true,
 		trie:            trie,
 		fromPuny:        validateFromPunycode,
 		mapping:         validateRegistration,
@@ -338,7 +371,7 @@ func (p *Profile) process(s string, toASCII bool) (string, error) {
 			}
 			isBidi = isBidi || bidirule.DirectionString(u) != bidi.LeftToRight
 			labels.set(u)
-			if err == nil && p.validateLabels {
+			if err == nil && p.fromPuny != nil {
 				err = p.fromPuny(p, u)
 			}
 			if err == nil {
@@ -679,16 +712,18 @@ func (p *Profile) validateLabel(s string) (err error) {
 		}
 		return nil
 	}
-	if !p.validateLabels {
-		return nil
-	}
-	trie := p.trie // p.validateLabels is only set if trie is set.
-	if len(s) > 4 && s[2] == '-' && s[3] == '-' {
-		return &labelError{s, "V2"}
+	if p.checkHyphens {
+		if len(s) > 4 && s[2] == '-' && s[3] == '-' {
+			return &labelError{s, "V2"}
+		}
+		if s[0] == '-' || s[len(s)-1] == '-' {
+			return &labelError{s, "V3"}
+		}
 	}
-	if s[0] == '-' || s[len(s)-1] == '-' {
-		return &labelError{s, "V3"}
+	if !p.checkJoiners {
+		return nil
 	}
+	trie := p.trie // p.checkJoiners is only set if trie is set.
 	// TODO: merge the use of this in the trie.
 	v, sz := trie.lookupString(s)
 	x := info(v)
diff --git a/internal/export/idna/idna10.0.0_test.go b/internal/export/idna/idna10.0.0_test.go
index ed01f9343..66ea636db 100644
--- a/internal/export/idna/idna10.0.0_test.go
+++ b/internal/export/idna/idna10.0.0_test.go
@@ -31,6 +31,8 @@ func TestLabelErrors(t *testing.T) {
 	lengthA := kind{"CheckLengthA", p.ToASCII}
 	p = New(MapForLookup(), StrictDomainName(false))
 	std3 := kind{"STD3", p.ToASCII}
+	p = New(MapForLookup(), CheckHyphens(false))
+	hyphens := kind{"CheckHyphens", p.ToASCII}
 
 	testCases := []struct {
 		kind
@@ -85,6 +87,12 @@ func TestLabelErrors(t *testing.T) {
 		{display, "*.foo.com", "*.foo.com", "P1"},
 		{std3, "*.foo.com", "*.foo.com", ""},
 
+		// Hyphens
+		{display, "r3---sn-apo3qvuoxuxbt-j5pe.googlevideo.com", "r3---sn-apo3qvuoxuxbt-j5pe.googlevideo.com", "V2"},
+		{hyphens, "r3---sn-apo3qvuoxuxbt-j5pe.googlevideo.com", "r3---sn-apo3qvuoxuxbt-j5pe.googlevideo.com", ""},
+		{display, "-label-.com", "-label-.com", "V3"},
+		{hyphens, "-label-.com", "-label-.com", ""},
+
 		// Don't map U+2490 (DIGIT NINE FULL STOP). This is the behavior of
 		// Chrome, Safari, and IE. Firefox will first map ⒐ to 9. and return
 		// lab9.be.
diff --git a/internal/export/idna/idna9.0.0.go b/internal/export/idna/idna9.0.0.go
index 25f2ac3e8..1ea943136 100644
--- a/internal/export/idna/idna9.0.0.go
+++ b/internal/export/idna/idna9.0.0.go
@@ -64,15 +64,14 @@ func Transitional(transitional bool) Option {
 
 // VerifyDNSLength sets whether a Profile should fail if any of the IDN parts
 // are longer than allowed by the RFC.
+//
+// This option corresponds to the VerifyDnsLength flag in UTS #46.
 func VerifyDNSLength(verify bool) Option {
 	return func(o *options) { o.verifyDNSLength = verify }
 }
 
 // RemoveLeadingDots removes leading label separators. Leading runes that map to
 // dots, such as U+3002 IDEOGRAPHIC FULL STOP, are removed as well.
-//
-// This is the behavior suggested by the UTS #46 and is adopted by some
-// browsers.
 func RemoveLeadingDots(remove bool) Option {
 	return func(o *options) { o.removeLeadingDots = remove }
 }
@@ -80,6 +79,8 @@ func RemoveLeadingDots(remove bool) Option {
 // ValidateLabels sets whether to check the mandatory label validation criteria
 // as defined in Section 5.4 of RFC 5891. This includes testing for correct use
 // of hyphens ('-'), normalization, validity of runes, and the context rules.
+// In particular, ValidateLabels also sets the CheckHyphens and CheckJoiners flags
+// in UTS #46.
 func ValidateLabels(enable bool) Option {
 	return func(o *options) {
 		// Don't override existing mappings, but set one that at least checks
@@ -88,25 +89,48 @@ func ValidateLabels(enable bool) Option {
 			o.mapping = normalize
 		}
 		o.trie = trie
-		o.validateLabels = enable
-		o.fromPuny = validateFromPunycode
+		o.checkJoiners = enable
+		o.checkHyphens = enable
+		if enable {
+			o.fromPuny = validateFromPunycode
+		} else {
+			o.fromPuny = nil
+		}
+	}
+}
+
+// CheckHyphens sets whether to check for correct use of hyphens ('-') in
+// labels. Most web browsers do not have this option set, since labels such as
+// "r3---sn-apo3qvuoxuxbt-j5pe" are in common use.
+//
+// This option corresponds to the CheckHyphens flag in UTS #46.
+func CheckHyphens(enable bool) Option {
+	return func(o *options) { o.checkHyphens = enable }
+}
+
+// CheckJoiners sets whether to check the ContextJ rules as defined in Appendix
+// A of RFC 5892, concerning the use of joiner runes.
+//
+// This option corresponds to the CheckJoiners flag in UTS #46.
+func CheckJoiners(enable bool) Option {
+	return func(o *options) {
+		o.trie = trie
+		o.checkJoiners = enable
 	}
 }
 
 // StrictDomainName limits the set of permissable ASCII characters to those
 // allowed in domain names as defined in RFC 1034 (A-Z, a-z, 0-9 and the
-// hyphen). This is set by default for MapForLookup and ValidateForRegistration.
+// hyphen). This is set by default for MapForLookup and ValidateForRegistration,
+// but is only useful if ValidateLabels is set.
 //
 // This option is useful, for instance, for browsers that allow characters
 // outside this range, for example a '_' (U+005F LOW LINE). See
-// http://www.rfc-editor.org/std/std3.txt for more details This option
-// corresponds to the UseSTD3ASCIIRules option in UTS #46.
+// http://www.rfc-editor.org/std/std3.txt for more details.
+//
+// This option corresponds to the UseSTD3ASCIIRules flag in UTS #46.
 func StrictDomainName(use bool) Option {
-	return func(o *options) {
-		o.trie = trie
-		o.useSTD3Rules = use
-		o.fromPuny = validateFromPunycode
-	}
+	return func(o *options) { o.useSTD3Rules = use }
 }
 
 // NOTE: the following options pull in tables. The tables should not be linked
@@ -114,6 +138,8 @@ func StrictDomainName(use bool) Option {
 
 // BidiRule enables the Bidi rule as defined in RFC 5893. Any application
 // that relies on proper validation of labels should include this rule.
+//
+// This option corresponds to the CheckBidi flag in UTS #46.
 func BidiRule() Option {
 	return func(o *options) { o.bidirule = bidirule.ValidString }
 }
@@ -150,7 +176,8 @@ func MapForLookup() Option {
 type options struct {
 	transitional      bool
 	useSTD3Rules      bool
-	validateLabels    bool
+	checkHyphens      bool
+	checkJoiners      bool
 	verifyDNSLength   bool
 	removeLeadingDots bool
 
@@ -223,8 +250,11 @@ func (p *Profile) String() string {
 	if p.useSTD3Rules {
 		s += ":UseSTD3Rules"
 	}
-	if p.validateLabels {
-		s += ":ValidateLabels"
+	if p.checkHyphens {
+		s += ":CheckHyphens"
+	}
+	if p.checkJoiners {
+		s += ":CheckJoiners"
 	}
 	if p.verifyDNSLength {
 		s += ":VerifyDNSLength"
@@ -253,9 +283,10 @@ var (
 	punycode = &Profile{}
 	lookup   = &Profile{options{
 		transitional:      true,
-		useSTD3Rules:      true,
-		validateLabels:    true,
 		removeLeadingDots: true,
+		useSTD3Rules:      true,
+		checkHyphens:      true,
+		checkJoiners:      true,
 		trie:              trie,
 		fromPuny:          validateFromPunycode,
 		mapping:           validateAndMap,
@@ -263,8 +294,9 @@ var (
 	}}
 	display = &Profile{options{
 		useSTD3Rules:      true,
-		validateLabels:    true,
 		removeLeadingDots: true,
+		checkHyphens:      true,
+		checkJoiners:      true,
 		trie:              trie,
 		fromPuny:          validateFromPunycode,
 		mapping:           validateAndMap,
@@ -272,8 +304,9 @@ var (
 	}}
 	registration = &Profile{options{
 		useSTD3Rules:    true,
-		validateLabels:  true,
 		verifyDNSLength: true,
+		checkHyphens:    true,
+		checkJoiners:    true,
 		trie:            trie,
 		fromPuny:        validateFromPunycode,
 		mapping:         validateRegistration,
@@ -337,7 +370,7 @@ func (p *Profile) process(s string, toASCII bool) (string, error) {
 				continue
 			}
 			labels.set(u)
-			if err == nil && p.validateLabels {
+			if err == nil && p.fromPuny != nil {
 				err = p.fromPuny(p, u)
 			}
 			if err == nil {
@@ -627,16 +660,18 @@ func (p *Profile) validateLabel(s string) error {
 	if p.bidirule != nil && !p.bidirule(s) {
 		return &labelError{s, "B"}
 	}
-	if !p.validateLabels {
-		return nil
-	}
-	trie := p.trie // p.validateLabels is only set if trie is set.
-	if len(s) > 4 && s[2] == '-' && s[3] == '-' {
-		return &labelError{s, "V2"}
+	if p.checkHyphens {
+		if len(s) > 4 && s[2] == '-' && s[3] == '-' {
+			return &labelError{s, "V2"}
+		}
+		if s[0] == '-' || s[len(s)-1] == '-' {
+			return &labelError{s, "V3"}
+		}
 	}
-	if s[0] == '-' || s[len(s)-1] == '-' {
-		return &labelError{s, "V3"}
+	if !p.checkJoiners {
+		return nil
 	}
+	trie := p.trie // p.checkJoiners is only set if trie is set.
 	// TODO: merge the use of this in the trie.
 	v, sz := trie.lookupString(s)
 	x := info(v)
diff --git a/internal/export/idna/idna9.0.0_test.go b/internal/export/idna/idna9.0.0_test.go
index 7047d744a..03b1267c3 100644
--- a/internal/export/idna/idna9.0.0_test.go
+++ b/internal/export/idna/idna9.0.0_test.go
@@ -31,6 +31,8 @@ func TestLabelErrors(t *testing.T) {
 	lengthA := kind{"CheckLengthA", p.ToASCII}
 	p = New(MapForLookup(), StrictDomainName(false))
 	std3 := kind{"STD3", p.ToASCII}
+	p = New(MapForLookup(), CheckHyphens(false))
+	hyphens := kind{"CheckHyphens", p.ToASCII}
 
 	testCases := []struct {
 		kind
@@ -81,6 +83,12 @@ func TestLabelErrors(t *testing.T) {
 		{display, "*.foo.com", "*.foo.com", "P1"},
 		{std3, "*.foo.com", "*.foo.com", ""},
 
+		// Hyphens
+		{display, "r3---sn-apo3qvuoxuxbt-j5pe.googlevideo.com", "r3---sn-apo3qvuoxuxbt-j5pe.googlevideo.com", "V2"},
+		{hyphens, "r3---sn-apo3qvuoxuxbt-j5pe.googlevideo.com", "r3---sn-apo3qvuoxuxbt-j5pe.googlevideo.com", ""},
+		{display, "-label-.com", "-label-.com", "V3"},
+		{hyphens, "-label-.com", "-label-.com", ""},
+
 		// Don't map U+2490 (DIGIT NINE FULL STOP). This is the behavior of
 		// Chrome, Safari, and IE. Firefox will first map ⒐ to 9. and return
 		// lab9.be.

From 305da72387dee5313eca46df90087abcbeb3f520 Mon Sep 17 00:00:00 2001
From: "igor.bolotnikov" <igor.v.bolotnikov@gmail.com>
Date: Mon, 26 Oct 2020 17:55:30 +0300
Subject: [PATCH 04/40] internal/number: avoid possible out-of-range panic

Handle the case where r.Increment > 0 and r.IncrementScale == len(scales)
in the (*Decimal).ConvertFloat method. Previously, this case indexed past
the end of the scales table and caused an unexpected index-out-of-range
panic.

Fixes golang/go#42147

Change-Id: Ic26e67010b766bdbd322a3853489f6d1ecb0dcfc
Reviewed-on: https://go-review.googlesource.com/c/text/+/265021
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
Trust: Russ Cox <rsc@golang.org>
---
 internal/number/decimal.go      | 2 +-
 internal/number/decimal_test.go | 5 +++++
 2 files changed, 6 insertions(+), 1 deletion(-)

diff --git a/internal/number/decimal.go b/internal/number/decimal.go
index 9b4035ec4..cb656db6c 100644
--- a/internal/number/decimal.go
+++ b/internal/number/decimal.go
@@ -379,7 +379,7 @@ func (d *Decimal) ConvertFloat(r RoundingContext, x float64, size int) {
 	if r.Increment > 0 {
 		scale := int(r.IncrementScale)
 		mult := 1.0
-		if scale > len(scales) {
+		if scale >= len(scales) {
 			mult = math.Pow(10, float64(scale))
 		} else {
 			mult = scales[scale]
diff --git a/internal/number/decimal_test.go b/internal/number/decimal_test.go
index 97c7e25b6..670e806e5 100644
--- a/internal/number/decimal_test.go
+++ b/internal/number/decimal_test.go
@@ -248,6 +248,10 @@ func TestConvert(t *testing.T) {
 	inc0_05 := RoundingContext{Increment: 5, IncrementScale: 2}
 	inc0_05.SetScale(2)
 	inc50 := RoundingContext{Increment: 50}
+	incScaleEqualToScalesLen := RoundingContext{Increment: 1, IncrementScale: 0}
+	if len(scales) <= math.MaxUint8 {
+		incScaleEqualToScalesLen.IncrementScale = uint8(len(scales))
+	}
 	prec3 := RoundingContext{}
 	prec3.SetPrecision(3)
 	roundShift := RoundingContext{DigitShift: 2, MaxFractionDigits: 2}
@@ -309,6 +313,7 @@ func TestConvert(t *testing.T) {
 		{math.Inf(-1), inc50, "-Inf"},
 		{math.NaN(), inc50, "NaN"},
 		{"clearly not a number", scale2, "NaN"},
+		{0.0, incScaleEqualToScalesLen, "0"},
 	}
 	for _, tc := range testCases {
 		var d Decimal

From c27b9fd57aec08b1104313fb190f0ecc6d23095f Mon Sep 17 00:00:00 2001
From: Garry McNulty <garrmcnu@gmail.com>
Date: Mon, 24 Feb 2020 21:48:34 +0000
Subject: [PATCH 05/40] encoding/simplifiedchinese: fix incorrect transform
 count to avoid infinite loop

If the final character in the source buffer is a single '~' escape
character, size is not updated. The loop then either makes no progress
(if size is zero) or reuses the size left over from a previous
iteration, which may report an incorrect count of source bytes consumed.
Count the single '~' as 1 byte consumed.

Fixes golang/go#35118

Change-Id: I3eadf1b4cb632a7c4dc4255325b467a6907c10c0
Reviewed-on: https://go-review.googlesource.com/c/text/+/220460
Reviewed-by: Nigel Tao <nigeltao@golang.org>
Trust: Nigel Tao <nigeltao@golang.org>
Trust: Marcel van Lohuizen <mpvl@golang.org>
---
 encoding/simplifiedchinese/all_test.go | 2 ++
 encoding/simplifiedchinese/hzgb2312.go | 2 +-
 2 files changed, 3 insertions(+), 1 deletion(-)

diff --git a/encoding/simplifiedchinese/all_test.go b/encoding/simplifiedchinese/all_test.go
index b369da21a..a556c94dd 100644
--- a/encoding/simplifiedchinese/all_test.go
+++ b/encoding/simplifiedchinese/all_test.go
@@ -53,6 +53,8 @@ func TestNonRepertoire(t *testing.T) {
 		{dec, GB18030, strings.Repeat("\xfe\x30", n), strings.Repeat("\ufffd0", n)},
 
 		{dec, HZGB2312, "~/", "\ufffd"},
+		{dec, HZGB2312, "~", "\ufffd"},
+		{dec, HZGB2312, "~~~", "~\ufffd"},
 		{dec, HZGB2312, "~{a\x80", "\ufffd"},
 		{dec, HZGB2312, "~{a\x80", "\ufffd"},
 		{dec, HZGB2312, "~{" + strings.Repeat("z~", n), strings.Repeat("\ufffd", n)},
diff --git a/encoding/simplifiedchinese/hzgb2312.go b/encoding/simplifiedchinese/hzgb2312.go
index eb3157f0b..e15b7bf6a 100644
--- a/encoding/simplifiedchinese/hzgb2312.go
+++ b/encoding/simplifiedchinese/hzgb2312.go
@@ -57,7 +57,7 @@ loop:
 					err = transform.ErrShortSrc
 					break loop
 				}
-				r = utf8.RuneError
+				r, size = utf8.RuneError, 1
 				goto write
 			}
 			size = 2

From 75a595aef632b07c6eeaaa805adb6f0f66e4130e Mon Sep 17 00:00:00 2001
From: Julie Qiu <julie@golang.org>
Date: Mon, 7 Dec 2020 16:52:09 -0500
Subject: [PATCH 06/40] README.md: add badge to pkg.go.dev

Change-Id: Iae82dbce741d2eaa03bcae046842589f0764c933
Reviewed-on: https://go-review.googlesource.com/c/text/+/275890
Reviewed-by: Dmitri Shuralyov <dmitshur@golang.org>
Run-TryBot: Julie Qiu <julie@golang.org>
Trust: Julie Qiu <julie@golang.org>
---
 README.md | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/README.md b/README.md
index 61d5ee4d1..85cd3d001 100644
--- a/README.md
+++ b/README.md
@@ -1,5 +1,7 @@
 # Go Text
 
+[![Go Reference](https://pkg.go.dev/badge/golang.org/x/text.svg)](https://pkg.go.dev/golang.org/x/text)
+
 This repository holds supplementary Go libraries for text processing, many involving Unicode.
 
 ## Semantic Versioning

From 8f690f22cf1c026c950adddf3d45258bfd0912f0 Mon Sep 17 00:00:00 2001
From: Russ Cox <rsc@golang.org>
Date: Fri, 19 Feb 2021 18:54:44 -0500
Subject: [PATCH 07/40] all: go fmt ./...

Make all our package sources use Go 1.17 gofmt format
(adding //go:build lines).

Not strictly necessary but will avoid spurious changes
as files are edited.

Part of //go:build change (#41184).
See https://golang.org/design/draft-gobuild

Change-Id: I8f1f65728dad29d63bc5a1ea5fdb4cbac255c7e5
Reviewed-on: https://go-review.googlesource.com/c/text/+/294372
Trust: Russ Cox <rsc@golang.org>
Run-TryBot: Russ Cox <rsc@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Jason A. Donenfeld <Jason@zx2c4.com>
Reviewed-by: Ian Lance Taylor <iant@golang.org>
---
 cases/gen.go                              | 1 +
 cases/gen_trieval.go                      | 1 +
 cases/icu.go                              | 1 +
 cases/icu_test.go                         | 1 +
 cases/tables10.0.0.go                     | 1 +
 cases/tables10.0.0_test.go                | 1 +
 cases/tables11.0.0.go                     | 1 +
 cases/tables11.0.0_test.go                | 1 +
 cases/tables12.0.0.go                     | 1 +
 cases/tables12.0.0_test.go                | 1 +
 cases/tables13.0.0.go                     | 1 +
 cases/tables13.0.0_test.go                | 1 +
 cases/tables9.0.0.go                      | 1 +
 cases/tables9.0.0_test.go                 | 1 +
 cmd/gotext/examples/rewrite/printer.go    | 1 +
 collate/maketables.go                     | 1 +
 collate/tools/colcmp/darwin.go            | 1 +
 collate/tools/colcmp/icu.go               | 1 +
 currency/gen.go                           | 1 +
 currency/gen_common.go                    | 1 +
 date/gen.go                               | 1 +
 encoding/charmap/maketables.go            | 1 +
 encoding/htmlindex/gen.go                 | 1 +
 encoding/ianaindex/ascii.go               | 4 ++--
 encoding/ianaindex/ascii_test.go          | 2 +-
 encoding/ianaindex/gen.go                 | 1 +
 encoding/internal/identifier/gen.go       | 1 +
 encoding/japanese/maketables.go           | 1 +
 encoding/korean/maketables.go             | 1 +
 encoding/simplifiedchinese/maketables.go  | 1 +
 encoding/traditionalchinese/maketables.go | 1 +
 feature/plural/gen.go                     | 1 +
 feature/plural/gen_common.go              | 1 +
 gen.go                                    | 1 +
 internal/export/idna/gen.go               | 1 +
 internal/export/idna/gen10.0.0_test.go    | 1 +
 internal/export/idna/gen9.0.0_test.go     | 1 +
 internal/export/idna/gen_common.go        | 1 +
 internal/export/idna/gen_trieval.go       | 1 +
 internal/export/idna/idna10.0.0.go        | 2 ++
 internal/export/idna/idna10.0.0_test.go   | 1 +
 internal/export/idna/idna9.0.0.go         | 2 ++
 internal/export/idna/idna9.0.0_test.go    | 1 +
 internal/export/idna/tables10.0.0.go      | 1 +
 internal/export/idna/tables11.0.0.go      | 1 +
 internal/export/idna/tables12.0.0.go      | 1 +
 internal/export/idna/tables13.0.0.go      | 1 +
 internal/export/idna/tables9.0.0.go       | 1 +
 internal/export/unicode/gen.go            | 1 +
 internal/language/compact/gen.go          | 1 +
 internal/language/compact/gen_index.go    | 1 +
 internal/language/compact/gen_parents.go  | 1 +
 internal/language/gen.go                  | 1 +
 internal/language/gen_common.go           | 1 +
 internal/number/gen.go                    | 1 +
 internal/number/gen_common.go             | 1 +
 internal/testtext/gc.go                   | 1 +
 internal/testtext/gccgo.go                | 1 +
 internal/testtext/go1_6.go                | 1 +
 internal/testtext/go1_7.go                | 1 +
 internal/triegen/data_test.go             | 1 +
 internal/triegen/gen_test.go              | 1 +
 language/display/maketables.go            | 1 +
 language/gen.go                           | 1 +
 language/go1_1.go                         | 1 +
 language/go1_2.go                         | 1 +
 message/catalog/go19.go                   | 1 +
 message/catalog/gopre19.go                | 1 +
 message/pipeline/go19_test.go             | 1 +
 secure/bidirule/bidirule10.0.0.go         | 1 +
 secure/bidirule/bidirule10.0.0_test.go    | 1 +
 secure/bidirule/bidirule9.0.0.go          | 1 +
 secure/bidirule/bidirule9.0.0_test.go     | 1 +
 secure/precis/benchmark_test.go           | 1 +
 secure/precis/enforce10.0.0_test.go       | 1 +
 secure/precis/enforce9.0.0_test.go        | 1 +
 secure/precis/gen.go                      | 1 +
 secure/precis/gen_trieval.go              | 1 +
 secure/precis/tables10.0.0.go             | 1 +
 secure/precis/tables11.0.0.go             | 1 +
 secure/precis/tables12.0.0.go             | 1 +
 secure/precis/tables13.0.0.go             | 1 +
 secure/precis/tables9.0.0.go              | 1 +
 unicode/bidi/gen.go                       | 1 +
 unicode/bidi/gen_ranges.go                | 1 +
 unicode/bidi/gen_trieval.go               | 1 +
 unicode/bidi/tables10.0.0.go              | 1 +
 unicode/bidi/tables11.0.0.go              | 1 +
 unicode/bidi/tables12.0.0.go              | 1 +
 unicode/bidi/tables13.0.0.go              | 1 +
 unicode/bidi/tables9.0.0.go               | 1 +
 unicode/cldr/makexml.go                   | 1 +
 unicode/norm/data10.0.0_test.go           | 1 +
 unicode/norm/data11.0.0_test.go           | 1 +
 unicode/norm/data12.0.0_test.go           | 1 +
 unicode/norm/data13.0.0_test.go           | 1 +
 unicode/norm/data9.0.0_test.go            | 1 +
 unicode/norm/forminfo_test.go             | 1 +
 unicode/norm/maketables.go                | 1 +
 unicode/norm/tables10.0.0.go              | 1 +
 unicode/norm/tables11.0.0.go              | 1 +
 unicode/norm/tables12.0.0.go              | 1 +
 unicode/norm/tables13.0.0.go              | 1 +
 unicode/norm/tables9.0.0.go               | 1 +
 unicode/norm/triegen.go                   | 1 +
 unicode/rangetable/gen.go                 | 1 +
 unicode/rangetable/tables10.0.0.go        | 1 +
 unicode/rangetable/tables11.0.0.go        | 1 +
 unicode/rangetable/tables12.0.0.go        | 1 +
 unicode/rangetable/tables13.0.0.go        | 1 +
 unicode/rangetable/tables9.0.0.go         | 1 +
 unicode/runenames/gen.go                  | 1 +
 unicode/runenames/tables10.0.0.go         | 1 +
 unicode/runenames/tables11.0.0.go         | 1 +
 unicode/runenames/tables12.0.0.go         | 1 +
 unicode/runenames/tables13.0.0.go         | 1 +
 unicode/runenames/tables9.0.0.go          | 1 +
 width/gen.go                              | 1 +
 width/gen_common.go                       | 1 +
 width/gen_trieval.go                      | 1 +
 width/tables10.0.0.go                     | 1 +
 width/tables11.0.0.go                     | 1 +
 width/tables12.0.0.go                     | 1 +
 width/tables13.0.0.go                     | 1 +
 width/tables9.0.0.go                      | 1 +
 125 files changed, 128 insertions(+), 3 deletions(-)

diff --git a/cases/gen.go b/cases/gen.go
index e7bccc8be..a041fede1 100644
--- a/cases/gen.go
+++ b/cases/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // This program generates the trie for casing operations. The Unicode casing
diff --git a/cases/gen_trieval.go b/cases/gen_trieval.go
index 26fadd6c5..6c7222a73 100644
--- a/cases/gen_trieval.go
+++ b/cases/gen_trieval.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/cases/icu.go b/cases/icu.go
index 46530d1e4..2dc84b39e 100644
--- a/cases/icu.go
+++ b/cases/icu.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build icu
 // +build icu
 
 package cases
diff --git a/cases/icu_test.go b/cases/icu_test.go
index e2b0adafd..f3ed83834 100644
--- a/cases/icu_test.go
+++ b/cases/icu_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build icu
 // +build icu
 
 package cases
diff --git a/cases/tables10.0.0.go b/cases/tables10.0.0.go
index 5c87950cc..ca9923105 100644
--- a/cases/tables10.0.0.go
+++ b/cases/tables10.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package cases
diff --git a/cases/tables10.0.0_test.go b/cases/tables10.0.0_test.go
index 186065c9f..779eaf56d 100644
--- a/cases/tables10.0.0_test.go
+++ b/cases/tables10.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package cases
diff --git a/cases/tables11.0.0.go b/cases/tables11.0.0.go
index 84d270183..b1106b417 100644
--- a/cases/tables11.0.0.go
+++ b/cases/tables11.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package cases
diff --git a/cases/tables11.0.0_test.go b/cases/tables11.0.0_test.go
index 2f441af6b..bc8fc54ba 100644
--- a/cases/tables11.0.0_test.go
+++ b/cases/tables11.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package cases
diff --git a/cases/tables12.0.0.go b/cases/tables12.0.0.go
index edee17d09..ae7dc2407 100644
--- a/cases/tables12.0.0.go
+++ b/cases/tables12.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package cases
diff --git a/cases/tables12.0.0_test.go b/cases/tables12.0.0_test.go
index b017b4385..04f3b6b80 100644
--- a/cases/tables12.0.0_test.go
+++ b/cases/tables12.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package cases
diff --git a/cases/tables13.0.0.go b/cases/tables13.0.0.go
index 90a2453fc..cd874775b 100644
--- a/cases/tables13.0.0.go
+++ b/cases/tables13.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package cases
diff --git a/cases/tables13.0.0_test.go b/cases/tables13.0.0_test.go
index 82f3e19c5..57c78a81f 100644
--- a/cases/tables13.0.0_test.go
+++ b/cases/tables13.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package cases
diff --git a/cases/tables9.0.0.go b/cases/tables9.0.0.go
index 4949fa724..636d5d14d 100644
--- a/cases/tables9.0.0.go
+++ b/cases/tables9.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package cases
diff --git a/cases/tables9.0.0_test.go b/cases/tables9.0.0_test.go
index 398d25331..ac804f48b 100644
--- a/cases/tables9.0.0_test.go
+++ b/cases/tables9.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package cases
diff --git a/cmd/gotext/examples/rewrite/printer.go b/cmd/gotext/examples/rewrite/printer.go
index 9ed055620..309d19573 100644
--- a/cmd/gotext/examples/rewrite/printer.go
+++ b/cmd/gotext/examples/rewrite/printer.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/collate/maketables.go b/collate/maketables.go
index 3b25d7bfa..59afeb9c2 100644
--- a/collate/maketables.go
+++ b/collate/maketables.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // Collation table generator.
diff --git a/collate/tools/colcmp/darwin.go b/collate/tools/colcmp/darwin.go
index d2300e3e2..1be326751 100644
--- a/collate/tools/colcmp/darwin.go
+++ b/collate/tools/colcmp/darwin.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build darwin
 // +build darwin
 
 package main
diff --git a/collate/tools/colcmp/icu.go b/collate/tools/colcmp/icu.go
index 76de40427..b816acf7c 100644
--- a/collate/tools/colcmp/icu.go
+++ b/collate/tools/colcmp/icu.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build icu
 // +build icu
 
 package main
diff --git a/currency/gen.go b/currency/gen.go
index da7712fc5..4a2c85549 100644
--- a/currency/gen.go
+++ b/currency/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // Generator for currency-related data.
diff --git a/currency/gen_common.go b/currency/gen_common.go
index e1cea2494..e483bed26 100644
--- a/currency/gen_common.go
+++ b/currency/gen_common.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/date/gen.go b/date/gen.go
index 1fff91905..b58b9f75d 100644
--- a/date/gen.go
+++ b/date/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/encoding/charmap/maketables.go b/encoding/charmap/maketables.go
index f7941701e..70bf360c4 100644
--- a/encoding/charmap/maketables.go
+++ b/encoding/charmap/maketables.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/encoding/htmlindex/gen.go b/encoding/htmlindex/gen.go
index ac6b4a77f..d47f8dbd8 100644
--- a/encoding/htmlindex/gen.go
+++ b/encoding/htmlindex/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/encoding/ianaindex/ascii.go b/encoding/ianaindex/ascii.go
index 9792f8137..2b9824f82 100644
--- a/encoding/ianaindex/ascii.go
+++ b/encoding/ianaindex/ascii.go
@@ -10,8 +10,8 @@ import (
 
 	"golang.org/x/text/encoding"
 	"golang.org/x/text/encoding/internal"
-	"golang.org/x/text/transform"
 	"golang.org/x/text/encoding/internal/identifier"
+	"golang.org/x/text/transform"
 )
 
 type asciiDecoder struct {
@@ -22,7 +22,7 @@ func (d asciiDecoder) Transform(dst, src []byte, atEOF bool) (nDst, nSrc int, er
 	for _, c := range src {
 		if c > unicode.MaxASCII {
 			r := unicode.ReplacementChar
-			if nDst + utf8.RuneLen(r) > len(dst) {
+			if nDst+utf8.RuneLen(r) > len(dst) {
 				err = transform.ErrShortDst
 				break
 			}
diff --git a/encoding/ianaindex/ascii_test.go b/encoding/ianaindex/ascii_test.go
index a184ab970..873ec7e6f 100644
--- a/encoding/ianaindex/ascii_test.go
+++ b/encoding/ianaindex/ascii_test.go
@@ -5,8 +5,8 @@
 package ianaindex
 
 import (
-	"unicode"
 	"testing"
+	"unicode"
 
 	"golang.org/x/text/encoding"
 )
diff --git a/encoding/ianaindex/gen.go b/encoding/ianaindex/gen.go
index 1b61b820d..61d236621 100644
--- a/encoding/ianaindex/gen.go
+++ b/encoding/ianaindex/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/encoding/internal/identifier/gen.go b/encoding/internal/identifier/gen.go
index 26cfef9c6..039cb270c 100644
--- a/encoding/internal/identifier/gen.go
+++ b/encoding/internal/identifier/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/encoding/japanese/maketables.go b/encoding/japanese/maketables.go
index 023957a67..3066a39c0 100644
--- a/encoding/japanese/maketables.go
+++ b/encoding/japanese/maketables.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/encoding/korean/maketables.go b/encoding/korean/maketables.go
index c84034fb6..9552286f6 100644
--- a/encoding/korean/maketables.go
+++ b/encoding/korean/maketables.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/encoding/simplifiedchinese/maketables.go b/encoding/simplifiedchinese/maketables.go
index 55016c786..44988bfd1 100644
--- a/encoding/simplifiedchinese/maketables.go
+++ b/encoding/simplifiedchinese/maketables.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/encoding/traditionalchinese/maketables.go b/encoding/traditionalchinese/maketables.go
index cf7fdb31a..33f790598 100644
--- a/encoding/traditionalchinese/maketables.go
+++ b/encoding/traditionalchinese/maketables.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/feature/plural/gen.go b/feature/plural/gen.go
index 42f2f8676..b9c5f2493 100644
--- a/feature/plural/gen.go
+++ b/feature/plural/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/feature/plural/gen_common.go b/feature/plural/gen_common.go
index 24aa41505..bd92a4d45 100644
--- a/feature/plural/gen_common.go
+++ b/feature/plural/gen_common.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/gen.go b/gen.go
index 177bc0bda..04ff6035c 100644
--- a/gen.go
+++ b/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // gen runs go generate on Unicode- and CLDR-related package in the text
diff --git a/internal/export/idna/gen.go b/internal/export/idna/gen.go
index 4ad98046f..1109c1895 100644
--- a/internal/export/idna/gen.go
+++ b/internal/export/idna/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // This program generates the trie for idna operations. The Unicode casing
diff --git a/internal/export/idna/gen10.0.0_test.go b/internal/export/idna/gen10.0.0_test.go
index c5dfdde61..0ac9497d3 100644
--- a/internal/export/idna/gen10.0.0_test.go
+++ b/internal/export/idna/gen10.0.0_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.10
 // +build go1.10
 
 package idna
diff --git a/internal/export/idna/gen9.0.0_test.go b/internal/export/idna/gen9.0.0_test.go
index 0e66f0b16..47b9ef90f 100644
--- a/internal/export/idna/gen9.0.0_test.go
+++ b/internal/export/idna/gen9.0.0_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !go1.10
 // +build !go1.10
 
 package idna
diff --git a/internal/export/idna/gen_common.go b/internal/export/idna/gen_common.go
index 360a02b8e..8d87ba28d 100644
--- a/internal/export/idna/gen_common.go
+++ b/internal/export/idna/gen_common.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/internal/export/idna/gen_trieval.go b/internal/export/idna/gen_trieval.go
index 0de99b08a..9d92407f2 100644
--- a/internal/export/idna/gen_trieval.go
+++ b/internal/export/idna/gen_trieval.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/internal/export/idna/idna10.0.0.go b/internal/export/idna/idna10.0.0.go
index 2ceb32768..3e7bac3cb 100644
--- a/internal/export/idna/idna10.0.0.go
+++ b/internal/export/idna/idna10.0.0.go
@@ -2,7 +2,9 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.10
 // +build go1.10
+
 //go:generate go run gen.go gen_trieval.go gen_common.go
 
 // Package idna implements IDNA2008 using the compatibility processing
diff --git a/internal/export/idna/idna10.0.0_test.go b/internal/export/idna/idna10.0.0_test.go
index 66ea636db..4142bfa84 100644
--- a/internal/export/idna/idna10.0.0_test.go
+++ b/internal/export/idna/idna10.0.0_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.10
 // +build go1.10
 
 package idna
diff --git a/internal/export/idna/idna9.0.0.go b/internal/export/idna/idna9.0.0.go
index 1ea943136..7acecb800 100644
--- a/internal/export/idna/idna9.0.0.go
+++ b/internal/export/idna/idna9.0.0.go
@@ -2,7 +2,9 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !go1.10
 // +build !go1.10
+
 //go:generate go run gen.go gen_trieval.go gen_common.go
 
 // Package idna implements IDNA2008 using the compatibility processing
diff --git a/internal/export/idna/idna9.0.0_test.go b/internal/export/idna/idna9.0.0_test.go
index 03b1267c3..b76b79628 100644
--- a/internal/export/idna/idna9.0.0_test.go
+++ b/internal/export/idna/idna9.0.0_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !go1.10
 // +build !go1.10
 
 package idna
diff --git a/internal/export/idna/tables10.0.0.go b/internal/export/idna/tables10.0.0.go
index 54fddb4b1..d1d62ef45 100644
--- a/internal/export/idna/tables10.0.0.go
+++ b/internal/export/idna/tables10.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package idna
diff --git a/internal/export/idna/tables11.0.0.go b/internal/export/idna/tables11.0.0.go
index 8ce0811fd..167efba71 100644
--- a/internal/export/idna/tables11.0.0.go
+++ b/internal/export/idna/tables11.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package idna
diff --git a/internal/export/idna/tables12.0.0.go b/internal/export/idna/tables12.0.0.go
index f39f0cb4c..ab40f7bcc 100644
--- a/internal/export/idna/tables12.0.0.go
+++ b/internal/export/idna/tables12.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package idna
diff --git a/internal/export/idna/tables13.0.0.go b/internal/export/idna/tables13.0.0.go
index e8c7a36d7..390c5e56d 100644
--- a/internal/export/idna/tables13.0.0.go
+++ b/internal/export/idna/tables13.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package idna
diff --git a/internal/export/idna/tables9.0.0.go b/internal/export/idna/tables9.0.0.go
index 8b65fa167..4074b5332 100644
--- a/internal/export/idna/tables9.0.0.go
+++ b/internal/export/idna/tables9.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package idna
diff --git a/internal/export/unicode/gen.go b/internal/export/unicode/gen.go
index afdc94de6..9e4114fc3 100644
--- a/internal/export/unicode/gen.go
+++ b/internal/export/unicode/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // Unicode table generator.
diff --git a/internal/language/compact/gen.go b/internal/language/compact/gen.go
index 0c36a052f..400c1f08f 100644
--- a/internal/language/compact/gen.go
+++ b/internal/language/compact/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // Language tag table generator.
diff --git a/internal/language/compact/gen_index.go b/internal/language/compact/gen_index.go
index 136cefaf0..51c0d2d36 100644
--- a/internal/language/compact/gen_index.go
+++ b/internal/language/compact/gen_index.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/internal/language/compact/gen_parents.go b/internal/language/compact/gen_parents.go
index 9543d5832..1f4a6e855 100644
--- a/internal/language/compact/gen_parents.go
+++ b/internal/language/compact/gen_parents.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/internal/language/gen.go b/internal/language/gen.go
index cdcc7febc..27c43dc96 100644
--- a/internal/language/gen.go
+++ b/internal/language/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // Language tag table generator.
diff --git a/internal/language/gen_common.go b/internal/language/gen_common.go
index c419ceeb1..84dd4de1d 100644
--- a/internal/language/gen_common.go
+++ b/internal/language/gen_common.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/internal/number/gen.go b/internal/number/gen.go
index c836221bf..5341747fe 100644
--- a/internal/number/gen.go
+++ b/internal/number/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/internal/number/gen_common.go b/internal/number/gen_common.go
index b1b41a73a..f20ad7fef 100644
--- a/internal/number/gen_common.go
+++ b/internal/number/gen_common.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/internal/testtext/gc.go b/internal/testtext/gc.go
index a54e1bcbd..a6365f9b4 100644
--- a/internal/testtext/gc.go
+++ b/internal/testtext/gc.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !gccgo
 // +build !gccgo
 
 package testtext
diff --git a/internal/testtext/gccgo.go b/internal/testtext/gccgo.go
index 30e98efff..e880af3da 100644
--- a/internal/testtext/gccgo.go
+++ b/internal/testtext/gccgo.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build gccgo
 // +build gccgo
 
 package testtext
diff --git a/internal/testtext/go1_6.go b/internal/testtext/go1_6.go
index 7b2384738..f633e8956 100644
--- a/internal/testtext/go1_6.go
+++ b/internal/testtext/go1_6.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !go1.7
 // +build !go1.7
 
 package testtext
diff --git a/internal/testtext/go1_7.go b/internal/testtext/go1_7.go
index 66f9cf787..228bf4249 100644
--- a/internal/testtext/go1_7.go
+++ b/internal/testtext/go1_7.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.7
 // +build go1.7
 
 package testtext
diff --git a/internal/triegen/data_test.go b/internal/triegen/data_test.go
index 91de547a5..a47efacd0 100644
--- a/internal/triegen/data_test.go
+++ b/internal/triegen/data_test.go
@@ -1,4 +1,5 @@
 // This file is generated with "go test -tags generate". DO NOT EDIT!
+//go:build !generate
 // +build !generate
 
 package triegen_test
diff --git a/internal/triegen/gen_test.go b/internal/triegen/gen_test.go
index 831627d7a..6bd137dd6 100644
--- a/internal/triegen/gen_test.go
+++ b/internal/triegen/gen_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build generate
 // +build generate
 
 package triegen_test
diff --git a/language/display/maketables.go b/language/display/maketables.go
index b520e8ae6..a6cbcc6d6 100644
--- a/language/display/maketables.go
+++ b/language/display/maketables.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // Generator for display name tables.
diff --git a/language/gen.go b/language/gen.go
index 3004eb42c..445882e56 100644
--- a/language/gen.go
+++ b/language/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // Language tag table generator.
diff --git a/language/go1_1.go b/language/go1_1.go
index 380f4c09f..c7435583b 100644
--- a/language/go1_1.go
+++ b/language/go1_1.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !go1.2
 // +build !go1.2
 
 package language
diff --git a/language/go1_2.go b/language/go1_2.go
index 38268c57a..77aaaa299 100644
--- a/language/go1_2.go
+++ b/language/go1_2.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.2
 // +build go1.2
 
 package language
diff --git a/message/catalog/go19.go b/message/catalog/go19.go
index 147fc7cf5..4e5e87f8f 100644
--- a/message/catalog/go19.go
+++ b/message/catalog/go19.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.9
 // +build go1.9
 
 package catalog
diff --git a/message/catalog/gopre19.go b/message/catalog/gopre19.go
index a9753b905..9e14685a5 100644
--- a/message/catalog/gopre19.go
+++ b/message/catalog/gopre19.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !go1.9
 // +build !go1.9
 
 package catalog
diff --git a/message/pipeline/go19_test.go b/message/pipeline/go19_test.go
index c9517c130..10d9eda29 100644
--- a/message/pipeline/go19_test.go
+++ b/message/pipeline/go19_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.9
 // +build go1.9
 
 package pipeline
diff --git a/secure/bidirule/bidirule10.0.0.go b/secure/bidirule/bidirule10.0.0.go
index e4c62289f..8a7392c4a 100644
--- a/secure/bidirule/bidirule10.0.0.go
+++ b/secure/bidirule/bidirule10.0.0.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.10
 // +build go1.10
 
 package bidirule
diff --git a/secure/bidirule/bidirule10.0.0_test.go b/secure/bidirule/bidirule10.0.0_test.go
index 06ec5f5df..dd5271c0e 100644
--- a/secure/bidirule/bidirule10.0.0_test.go
+++ b/secure/bidirule/bidirule10.0.0_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.10
 // +build go1.10
 
 package bidirule
diff --git a/secure/bidirule/bidirule9.0.0.go b/secure/bidirule/bidirule9.0.0.go
index 02b9e1e9d..bb0a92001 100644
--- a/secure/bidirule/bidirule9.0.0.go
+++ b/secure/bidirule/bidirule9.0.0.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !go1.10
 // +build !go1.10
 
 package bidirule
diff --git a/secure/bidirule/bidirule9.0.0_test.go b/secure/bidirule/bidirule9.0.0_test.go
index 008874ed3..e0bd1b486 100644
--- a/secure/bidirule/bidirule9.0.0_test.go
+++ b/secure/bidirule/bidirule9.0.0_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !go1.10
 // +build !go1.10
 
 package bidirule
diff --git a/secure/precis/benchmark_test.go b/secure/precis/benchmark_test.go
index 6337d0063..faed65437 100644
--- a/secure/precis/benchmark_test.go
+++ b/secure/precis/benchmark_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.7
 // +build go1.7
 
 package precis
diff --git a/secure/precis/enforce10.0.0_test.go b/secure/precis/enforce10.0.0_test.go
index 34da1503b..7dd7bd550 100644
--- a/secure/precis/enforce10.0.0_test.go
+++ b/secure/precis/enforce10.0.0_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.10
 // +build go1.10
 
 package precis
diff --git a/secure/precis/enforce9.0.0_test.go b/secure/precis/enforce9.0.0_test.go
index 209745551..98765cd7c 100644
--- a/secure/precis/enforce9.0.0_test.go
+++ b/secure/precis/enforce9.0.0_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build !go1.10
 // +build !go1.10
 
 package precis
diff --git a/secure/precis/gen.go b/secure/precis/gen.go
index 946acbaa1..99ead4298 100644
--- a/secure/precis/gen.go
+++ b/secure/precis/gen.go
@@ -5,6 +5,7 @@
 // Unicode table generator.
 // Data read from the web.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/secure/precis/gen_trieval.go b/secure/precis/gen_trieval.go
index 308510c9a..6fc5d1e3d 100644
--- a/secure/precis/gen_trieval.go
+++ b/secure/precis/gen_trieval.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/secure/precis/tables10.0.0.go b/secure/precis/tables10.0.0.go
index 362d2729b..816474950 100644
--- a/secure/precis/tables10.0.0.go
+++ b/secure/precis/tables10.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package precis
diff --git a/secure/precis/tables11.0.0.go b/secure/precis/tables11.0.0.go
index 0db5a9e7b..a40e55d6c 100644
--- a/secure/precis/tables11.0.0.go
+++ b/secure/precis/tables11.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package precis
diff --git a/secure/precis/tables12.0.0.go b/secure/precis/tables12.0.0.go
index a2392892a..254bbc793 100644
--- a/secure/precis/tables12.0.0.go
+++ b/secure/precis/tables12.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package precis
diff --git a/secure/precis/tables13.0.0.go b/secure/precis/tables13.0.0.go
index e3ddd7302..aad68b35e 100644
--- a/secure/precis/tables13.0.0.go
+++ b/secure/precis/tables13.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package precis
diff --git a/secure/precis/tables9.0.0.go b/secure/precis/tables9.0.0.go
index dacaf6a4e..2292b7cb0 100644
--- a/secure/precis/tables9.0.0.go
+++ b/secure/precis/tables9.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package precis
diff --git a/unicode/bidi/gen.go b/unicode/bidi/gen.go
index 987fc169c..ab2b8bf6f 100644
--- a/unicode/bidi/gen.go
+++ b/unicode/bidi/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/unicode/bidi/gen_ranges.go b/unicode/bidi/gen_ranges.go
index 02c3b505d..10f09895f 100644
--- a/unicode/bidi/gen_ranges.go
+++ b/unicode/bidi/gen_ranges.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/unicode/bidi/gen_trieval.go b/unicode/bidi/gen_trieval.go
index 9cb994289..eac0f7645 100644
--- a/unicode/bidi/gen_trieval.go
+++ b/unicode/bidi/gen_trieval.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/unicode/bidi/tables10.0.0.go b/unicode/bidi/tables10.0.0.go
index d8c94e1bd..42fa8d72c 100644
--- a/unicode/bidi/tables10.0.0.go
+++ b/unicode/bidi/tables10.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package bidi
diff --git a/unicode/bidi/tables11.0.0.go b/unicode/bidi/tables11.0.0.go
index 16b11db53..56a0e1ea2 100644
--- a/unicode/bidi/tables11.0.0.go
+++ b/unicode/bidi/tables11.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package bidi
diff --git a/unicode/bidi/tables12.0.0.go b/unicode/bidi/tables12.0.0.go
index 647f2d427..baacf32b4 100644
--- a/unicode/bidi/tables12.0.0.go
+++ b/unicode/bidi/tables12.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package bidi
diff --git a/unicode/bidi/tables13.0.0.go b/unicode/bidi/tables13.0.0.go
index c937d0976..f248effae 100644
--- a/unicode/bidi/tables13.0.0.go
+++ b/unicode/bidi/tables13.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package bidi
diff --git a/unicode/bidi/tables9.0.0.go b/unicode/bidi/tables9.0.0.go
index 0ca0193eb..f517fdb20 100644
--- a/unicode/bidi/tables9.0.0.go
+++ b/unicode/bidi/tables9.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package bidi
diff --git a/unicode/cldr/makexml.go b/unicode/cldr/makexml.go
index eb26306df..3c1fd26ea 100644
--- a/unicode/cldr/makexml.go
+++ b/unicode/cldr/makexml.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // This tool generates types for the various XML formats of CLDR.
diff --git a/unicode/norm/data10.0.0_test.go b/unicode/norm/data10.0.0_test.go
index 56441e72f..54ee4d24f 100644
--- a/unicode/norm/data10.0.0_test.go
+++ b/unicode/norm/data10.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package norm
diff --git a/unicode/norm/data11.0.0_test.go b/unicode/norm/data11.0.0_test.go
index ee8ec8b53..5b0e03743 100644
--- a/unicode/norm/data11.0.0_test.go
+++ b/unicode/norm/data11.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package norm
diff --git a/unicode/norm/data12.0.0_test.go b/unicode/norm/data12.0.0_test.go
index 1555292a2..48cdbc5ff 100644
--- a/unicode/norm/data12.0.0_test.go
+++ b/unicode/norm/data12.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package norm
diff --git a/unicode/norm/data13.0.0_test.go b/unicode/norm/data13.0.0_test.go
index 9455866e5..3c390d02a 100644
--- a/unicode/norm/data13.0.0_test.go
+++ b/unicode/norm/data13.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package norm
diff --git a/unicode/norm/data9.0.0_test.go b/unicode/norm/data9.0.0_test.go
index b1be64d55..77175bc8f 100644
--- a/unicode/norm/data9.0.0_test.go
+++ b/unicode/norm/data9.0.0_test.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package norm
diff --git a/unicode/norm/forminfo_test.go b/unicode/norm/forminfo_test.go
index e15ba9bee..96f097088 100644
--- a/unicode/norm/forminfo_test.go
+++ b/unicode/norm/forminfo_test.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build test
 // +build test
 
 package norm
diff --git a/unicode/norm/maketables.go b/unicode/norm/maketables.go
index 30a3aa933..0d24d2117 100644
--- a/unicode/norm/maketables.go
+++ b/unicode/norm/maketables.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // Normalization table generator.
diff --git a/unicode/norm/tables10.0.0.go b/unicode/norm/tables10.0.0.go
index 26fbd55a1..f5a078827 100644
--- a/unicode/norm/tables10.0.0.go
+++ b/unicode/norm/tables10.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package norm
diff --git a/unicode/norm/tables11.0.0.go b/unicode/norm/tables11.0.0.go
index 2c58f09ba..cb7239c43 100644
--- a/unicode/norm/tables11.0.0.go
+++ b/unicode/norm/tables11.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package norm
diff --git a/unicode/norm/tables12.0.0.go b/unicode/norm/tables12.0.0.go
index 7e1ae096e..11b273300 100644
--- a/unicode/norm/tables12.0.0.go
+++ b/unicode/norm/tables12.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package norm
diff --git a/unicode/norm/tables13.0.0.go b/unicode/norm/tables13.0.0.go
index 9ea1b4214..96a130d30 100644
--- a/unicode/norm/tables13.0.0.go
+++ b/unicode/norm/tables13.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package norm
diff --git a/unicode/norm/tables9.0.0.go b/unicode/norm/tables9.0.0.go
index 942906929..0175eae50 100644
--- a/unicode/norm/tables9.0.0.go
+++ b/unicode/norm/tables9.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package norm
diff --git a/unicode/norm/triegen.go b/unicode/norm/triegen.go
index 45d711900..cce64352f 100644
--- a/unicode/norm/triegen.go
+++ b/unicode/norm/triegen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // Trie table generator.
diff --git a/unicode/rangetable/gen.go b/unicode/rangetable/gen.go
index c2d36741c..fc4eee0a9 100644
--- a/unicode/rangetable/gen.go
+++ b/unicode/rangetable/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/unicode/rangetable/tables10.0.0.go b/unicode/rangetable/tables10.0.0.go
index 3dfcd8293..a34fbe294 100644
--- a/unicode/rangetable/tables10.0.0.go
+++ b/unicode/rangetable/tables10.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package rangetable
diff --git a/unicode/rangetable/tables11.0.0.go b/unicode/rangetable/tables11.0.0.go
index 1df829f06..31949f0ff 100644
--- a/unicode/rangetable/tables11.0.0.go
+++ b/unicode/rangetable/tables11.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package rangetable
diff --git a/unicode/rangetable/tables12.0.0.go b/unicode/rangetable/tables12.0.0.go
index e9d25c51e..9d4d724a6 100644
--- a/unicode/rangetable/tables12.0.0.go
+++ b/unicode/rangetable/tables12.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package rangetable
diff --git a/unicode/rangetable/tables13.0.0.go b/unicode/rangetable/tables13.0.0.go
index 921e4f7b1..3dcaad44e 100644
--- a/unicode/rangetable/tables13.0.0.go
+++ b/unicode/rangetable/tables13.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package rangetable
diff --git a/unicode/rangetable/tables9.0.0.go b/unicode/rangetable/tables9.0.0.go
index aef876d96..32a7ac1ce 100644
--- a/unicode/rangetable/tables9.0.0.go
+++ b/unicode/rangetable/tables9.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package rangetable
diff --git a/unicode/runenames/gen.go b/unicode/runenames/gen.go
index 5633ba62d..4f4a0201a 100644
--- a/unicode/runenames/gen.go
+++ b/unicode/runenames/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/unicode/runenames/tables10.0.0.go b/unicode/runenames/tables10.0.0.go
index e74a21c2a..9ff9ad9cc 100644
--- a/unicode/runenames/tables10.0.0.go
+++ b/unicode/runenames/tables10.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package runenames
diff --git a/unicode/runenames/tables11.0.0.go b/unicode/runenames/tables11.0.0.go
index 8b41b53b3..ba179885b 100644
--- a/unicode/runenames/tables11.0.0.go
+++ b/unicode/runenames/tables11.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package runenames
diff --git a/unicode/runenames/tables12.0.0.go b/unicode/runenames/tables12.0.0.go
index 4f71b9af2..7355a569b 100644
--- a/unicode/runenames/tables12.0.0.go
+++ b/unicode/runenames/tables12.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package runenames
diff --git a/unicode/runenames/tables13.0.0.go b/unicode/runenames/tables13.0.0.go
index b08f64835..4b74848a3 100644
--- a/unicode/runenames/tables13.0.0.go
+++ b/unicode/runenames/tables13.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package runenames
diff --git a/unicode/runenames/tables9.0.0.go b/unicode/runenames/tables9.0.0.go
index 912c39613..0e8d95565 100644
--- a/unicode/runenames/tables9.0.0.go
+++ b/unicode/runenames/tables9.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package runenames
diff --git a/width/gen.go b/width/gen.go
index 092277e1f..36e4156b3 100644
--- a/width/gen.go
+++ b/width/gen.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 // This program generates the trie for width operations. The generated table
diff --git a/width/gen_common.go b/width/gen_common.go
index 601e75268..24c49ff55 100644
--- a/width/gen_common.go
+++ b/width/gen_common.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/width/gen_trieval.go b/width/gen_trieval.go
index c17334aa6..cf1a3b29f 100644
--- a/width/gen_trieval.go
+++ b/width/gen_trieval.go
@@ -2,6 +2,7 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build ignore
 // +build ignore
 
 package main
diff --git a/width/tables10.0.0.go b/width/tables10.0.0.go
index decb8e480..186b1d4ef 100644
--- a/width/tables10.0.0.go
+++ b/width/tables10.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.10 && !go1.13
 // +build go1.10,!go1.13
 
 package width
diff --git a/width/tables11.0.0.go b/width/tables11.0.0.go
index 3c75e428f..990f7622f 100644
--- a/width/tables11.0.0.go
+++ b/width/tables11.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.13 && !go1.14
 // +build go1.13,!go1.14
 
 package width
diff --git a/width/tables12.0.0.go b/width/tables12.0.0.go
index 543942b9e..85296297e 100644
--- a/width/tables12.0.0.go
+++ b/width/tables12.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.14 && !go1.16
 // +build go1.14,!go1.16
 
 package width
diff --git a/width/tables13.0.0.go b/width/tables13.0.0.go
index 804264ca6..bac3f1aee 100644
--- a/width/tables13.0.0.go
+++ b/width/tables13.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build go1.16
 // +build go1.16
 
 package width
diff --git a/width/tables9.0.0.go b/width/tables9.0.0.go
index 7069e2634..b3db84f6f 100644
--- a/width/tables9.0.0.go
+++ b/width/tables9.0.0.go
@@ -1,5 +1,6 @@
 // Code generated by running "go generate" in golang.org/x/text. DO NOT EDIT.
 
+//go:build !go1.10
 // +build !go1.10
 
 package width

From e3aa4adf54f644ca0cb35f1f1fb19b239c40ef04 Mon Sep 17 00:00:00 2001
From: Marcel van Lohuizen <mpvl@golang.org>
Date: Thu, 18 Feb 2021 08:31:59 +0100
Subject: [PATCH 08/40] language: allow variable number of types per key in -u-
 extension

This also fixes CVE-2020-28851. This was an off-by-one
error, but is fixed by handling all cases according to the spec.

These valid cases do not seem to be used much in practice,
if at all, but the main benefit is that it makes all valid BCP 47
language tags also valid -u extensions. Fixing the code
to handle BCP 47 results in cleaner and seemingly more
robust code.

The main difference is as follows. The old implementation
assumed a -u- extension of the form:

    <tag> "-u"  { "-" <attr> } { "-" <key> "-" <type> } [ <otherExtensions> ]

where <attr> and <type> are of length 3-8 and a <key> is of length 2.

According to the spec, though, the format is

    <tag> "-u"  { "-" <attr> } { "-" <key> { "-" <type> } } [ <otherExtensions> ]

So every key may be associated with zero or more types, instead of
exactly one.

The new code now handles this.

The language.Tag.TypeForKey method is now defined to only
return the first entry or nothing at all. This is for backwards
compatibility reasons.

Fixes golang/go#42535

Change-Id: I23aec4e1c4d8807fc2ffc0eb3a08de2d8150219f
Reviewed-on: https://go-review.googlesource.com/c/text/+/293549
Trust: Marcel van Lohuizen <mpvl@golang.org>
Run-TryBot: Marcel van Lohuizen <mpvl@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Russ Cox <rsc@golang.org>
---
 internal/language/language.go      | 90 ++++++++++++++----------------
 internal/language/language_test.go | 14 ++++-
 internal/language/parse.go         | 28 +++++-----
 internal/language/parse_test.go    | 23 ++++----
 language/language.go               |  4 ++
 language/language_test.go          | 13 +++++
 language/parse_test.go             | 22 ++++----
 7 files changed, 108 insertions(+), 86 deletions(-)

diff --git a/internal/language/language.go b/internal/language/language.go
index 1e74d1aff..f41aedcfc 100644
--- a/internal/language/language.go
+++ b/internal/language/language.go
@@ -303,9 +303,17 @@ func (t Tag) Extensions() []string {
 // are of the allowed values defined for the Unicode locale extension ('u') in
 // https://www.unicode.org/reports/tr35/#Unicode_Language_and_Locale_Identifiers.
 // TypeForKey will traverse the inheritance chain to get the correct value.
+//
+// If there are multiple types associated with a key, only the first will be
+// returned. If there is no type associated with a key, it returns the empty
+// string.
 func (t Tag) TypeForKey(key string) string {
-	if start, end, _ := t.findTypeForKey(key); end != start {
-		return t.str[start:end]
+	if _, start, end, _ := t.findTypeForKey(key); end != start {
+		s := t.str[start:end]
+		if p := strings.IndexByte(s, '-'); p >= 0 {
+			s = s[:p]
+		}
+		return s
 	}
 	return ""
 }
@@ -329,13 +337,13 @@ func (t Tag) SetTypeForKey(key, value string) (Tag, error) {
 
 	// Remove the setting if value is "".
 	if value == "" {
-		start, end, _ := t.findTypeForKey(key)
-		if start != end {
-			// Remove key tag and leading '-'.
-			start -= 4
-
+		start, sep, end, _ := t.findTypeForKey(key)
+		if start != sep {
 			// Remove a possible empty extension.
-			if (end == len(t.str) || t.str[end+2] == '-') && t.str[start-2] == '-' {
+			switch {
+			case t.str[start-2] != '-': // has previous elements.
+			case end == len(t.str), // end of string
+				end+2 < len(t.str) && t.str[end+2] == '-': // end of extension
 				start -= 2
 			}
 			if start == int(t.pVariant) && end == len(t.str) {
@@ -381,14 +389,14 @@ func (t Tag) SetTypeForKey(key, value string) (Tag, error) {
 		t.str = string(buf[:uStart+len(b)])
 	} else {
 		s := t.str
-		start, end, hasExt := t.findTypeForKey(key)
-		if start == end {
+		start, sep, end, hasExt := t.findTypeForKey(key)
+		if start == sep {
 			if hasExt {
 				b = b[2:]
 			}
-			t.str = fmt.Sprintf("%s-%s%s", s[:start], b, s[end:])
+			t.str = fmt.Sprintf("%s-%s%s", s[:sep], b, s[end:])
 		} else {
-			t.str = fmt.Sprintf("%s%s%s", s[:start], value, s[end:])
+			t.str = fmt.Sprintf("%s-%s%s", s[:start+3], value, s[end:])
 		}
 	}
 	return t, nil
@@ -399,10 +407,10 @@ func (t Tag) SetTypeForKey(key, value string) (Tag, error) {
 // wasn't found. The hasExt return value reports whether an -u extension was present.
 // Note: the extensions are typically very small and are likely to contain
 // only one key-type pair.
-func (t Tag) findTypeForKey(key string) (start, end int, hasExt bool) {
+func (t Tag) findTypeForKey(key string) (start, sep, end int, hasExt bool) {
 	p := int(t.pExt)
 	if len(key) != 2 || p == len(t.str) || p == 0 {
-		return p, p, false
+		return p, p, p, false
 	}
 	s := t.str
 
@@ -410,10 +418,10 @@ func (t Tag) findTypeForKey(key string) (start, end int, hasExt bool) {
 	for p++; s[p] != 'u'; p++ {
 		if s[p] > 'u' {
 			p--
-			return p, p, false
+			return p, p, p, false
 		}
 		if p = nextExtension(s, p); p == len(s) {
-			return len(s), len(s), false
+			return len(s), len(s), len(s), false
 		}
 	}
 	// Proceed to the hyphen following the extension name.
@@ -424,40 +432,28 @@ func (t Tag) findTypeForKey(key string) (start, end int, hasExt bool) {
 
 	// Iterate over keys until we get the end of a section.
 	for {
-		// p points to the hyphen preceding the current token.
-		if p3 := p + 3; s[p3] == '-' {
-			// Found a key.
-			// Check whether we just processed the key that was requested.
-			if curKey == key {
-				return start, p, true
-			}
-			// Set to the next key and continue scanning type tokens.
-			curKey = s[p+1 : p3]
-			if curKey > key {
-				return p, p, true
-			}
-			// Start of the type token sequence.
-			start = p + 4
-			// A type is at least 3 characters long.
-			p += 7 // 4 + 3
-		} else {
-			// Attribute or type, which is at least 3 characters long.
-			p += 4
-		}
-		// p points past the third character of a type or attribute.
-		max := p + 5 // maximum length of token plus hyphen.
-		if len(s) < max {
-			max = len(s)
+		end = p
+		for p++; p < len(s) && s[p] != '-'; p++ {
 		}
-		for ; p < max && s[p] != '-'; p++ {
+		n := p - end - 1
+		if n <= 2 && curKey == key {
+			if sep < end {
+				sep++
+			}
+			return start, sep, end, true
 		}
-		// Bail if we have exhausted all tokens or if the next token starts
-		// a new extension.
-		if p == len(s) || s[p+2] == '-' {
-			if curKey == key {
-				return start, p, true
+		switch n {
+		case 0, // invalid string
+			1: // next extension
+			return end, end, end, true
+		case 2:
+			// next key
+			curKey = s[end+1 : p]
+			if curKey > key {
+				return end, end, end, true
 			}
-			return p, p, true
+			start = end
+			sep = p
 		}
 	}
 }
diff --git a/internal/language/language_test.go b/internal/language/language_test.go
index 6c7c10836..8244c1c8a 100644
--- a/internal/language/language_test.go
+++ b/internal/language/language_test.go
@@ -432,7 +432,9 @@ func TestSetTypeForKey(t *testing.T) {
 		{"co", "pinyin", "en-u-co-phonebk-cu-xau", "en-u-co-pinyin-cu-xau", false},
 		{"co", "pinyin", "en-u-co-phonebk-v-xx", "en-u-co-pinyin-v-xx", false},
 		{"co", "pinyin", "en-u-co-phonebk-x-x", "en-u-co-pinyin-x-x", false},
+		{"co", "pinyin", "en-u-co-x-x", "en-u-co-pinyin-x-x", false},
 		{"nu", "arabic", "en-u-co-phonebk-nu-vaai", "en-u-co-phonebk-nu-arabic", false},
+		{"nu", "arabic", "en-u-co-phonebk-nu", "en-u-co-phonebk-nu-arabic", false},
 		// add to existing -u extension
 		{"co", "pinyin", "en-u-ca-gregory", "en-u-ca-gregory-co-pinyin", false},
 		{"co", "pinyin", "en-u-ca-gregory-nu-vaai", "en-u-ca-gregory-co-pinyin-nu-vaai", false},
@@ -441,8 +443,12 @@ func TestSetTypeForKey(t *testing.T) {
 		{"ca", "gregory", "en-u-co-pinyin", "en-u-ca-gregory-co-pinyin", false},
 		// remove pair
 		{"co", "", "en-u-co-phonebk", "en", false},
+		{"co", "", "en-u-co", "en", false},
+		{"co", "", "en-u-co-v", "en", false},
+		{"co", "", "en-u-co-v-", "en", false},
 		{"co", "", "en-u-ca-gregory-co-phonebk", "en-u-ca-gregory", false},
 		{"co", "", "en-u-co-phonebk-nu-arabic", "en-u-nu-arabic", false},
+		{"co", "", "en-u-co-nu-arabic", "en-u-nu-arabic", false},
 		{"co", "", "en", "en", false},
 		// add -u extension
 		{"co", "pinyin", "en", "en-u-co-pinyin", false},
@@ -504,6 +510,8 @@ func TestFindKeyAndType(t *testing.T) {
 		{"cu", false, "en-a-va-v-va", "en-a-va"},
 		{"cu", false, "en-x-a", "en"},
 		// Tags with the -u extension.
+		{"nu", true, "en-u-cu-nu", "en-u-cu"},
+		{"cu", true, "en-u-cu-nu", "en-u"},
 		{"co", true, "en-u-co-standard", "standard"},
 		{"co", true, "yue-u-co-pinyin", "pinyin"},
 		{"co", true, "en-u-co-abc", "abc"},
@@ -519,9 +527,9 @@ func TestFindKeyAndType(t *testing.T) {
 		{"cu", true, "en-u-co-abc-def-nu-arabic", "en-u-co-abc-def"},
 	}
 	for i, tt := range tests {
-		start, end, hasExt := Make(tt.in).findTypeForKey(tt.key)
-		if start != end {
-			res := tt.in[start:end]
+		start, sep, end, hasExt := Make(tt.in).findTypeForKey(tt.key)
+		if sep != end {
+			res := tt.in[sep:end]
 			if res != tt.out {
 				t.Errorf("%d:%s: was %q; want %q", i, tt.in, res, tt.out)
 			}
diff --git a/internal/language/parse.go b/internal/language/parse.go
index a2fdad89d..c696fd0bd 100644
--- a/internal/language/parse.go
+++ b/internal/language/parse.go
@@ -138,7 +138,7 @@ func (s *scanner) resizeRange(oldStart, oldEnd, newSize int) {
 			b = make([]byte, n)
 			copy(b, s.b[:oldStart])
 		} else {
-			b = s.b[:n:n]
+			b = s.b[:n]
 		}
 		copy(b[end:], s.b[oldEnd:])
 		s.b = b
@@ -483,7 +483,7 @@ func parseExtensions(scan *scanner) int {
 func parseExtension(scan *scanner) int {
 	start, end := scan.start, scan.end
 	switch scan.token[0] {
-	case 'u':
+	case 'u': // https://www.ietf.org/rfc/rfc6067.txt
 		attrStart := end
 		scan.scan()
 		for last := []byte{}; len(scan.token) > 2; scan.scan() {
@@ -503,27 +503,29 @@ func parseExtension(scan *scanner) int {
 			last = scan.token
 			end = scan.end
 		}
+		// Scan key-type sequences. A key is of length 2 and may be followed
+		// by 0 or more "type" subtags from 3 to the maximum of 8 letters.
 		var last, key []byte
 		for attrEnd := end; len(scan.token) == 2; last = key {
 			key = scan.token
-			keyEnd := scan.end
-			end = scan.acceptMinSize(3)
+			end = scan.end
+			for scan.scan(); end < scan.end && len(scan.token) > 2; scan.scan() {
+				end = scan.end
+			}
 			// TODO: check key value validity
-			if keyEnd == end || bytes.Compare(key, last) != 1 {
+			if bytes.Compare(key, last) != 1 || scan.err != nil {
 				// We have an invalid key or the keys are not sorted.
 				// Start scanning keys from scratch and reorder.
 				p := attrEnd + 1
 				scan.next = p
 				keys := [][]byte{}
 				for scan.scan(); len(scan.token) == 2; {
-					keyStart, keyEnd := scan.start, scan.end
-					end = scan.acceptMinSize(3)
-					if keyEnd != end {
-						keys = append(keys, scan.b[keyStart:end])
-					} else {
-						scan.setError(ErrSyntax)
-						end = keyStart
+					keyStart := scan.start
+					end = scan.end
+					for scan.scan(); end < scan.end && len(scan.token) > 2; scan.scan() {
+						end = scan.end
 					}
+					keys = append(keys, scan.b[keyStart:end])
 				}
 				sort.Stable(bytesSort{keys, 2})
 				if n := len(keys); n > 0 {
@@ -547,7 +549,7 @@ func parseExtension(scan *scanner) int {
 				break
 			}
 		}
-	case 't':
+	case 't': // https://www.ietf.org/rfc/rfc6497.txt
 		scan.scan()
 		if n := len(scan.token); n >= 2 && n <= 3 && isAlpha(scan.token[1]) {
 			_, end = parseTag(scan)
diff --git a/internal/language/parse_test.go b/internal/language/parse_test.go
index 0cc97d7a5..e1d428aa6 100644
--- a/internal/language/parse_test.go
+++ b/internal/language/parse_test.go
@@ -164,13 +164,13 @@ func parseTests() []parseTest {
 		{in: "en-9-aa-0-aa-z-bb-x-a", lang: "en", extList: []string{"0-aa", "9-aa", "z-bb", "x-a"}, changed: true},
 		{in: "en-u-c", lang: "en", ext: "", invalid: true},
 		{in: "en-u-co-phonebk", lang: "en", ext: "u-co-phonebk"},
-		{in: "en-u-co-phonebk-ca", lang: "en", ext: "u-co-phonebk", invalid: true},
-		{in: "en-u-nu-arabic-co-phonebk-ca", lang: "en", ext: "u-co-phonebk-nu-arabic", invalid: true, changed: true},
-		{in: "en-u-nu-arabic-co-phonebk-ca-x", lang: "en", ext: "u-co-phonebk-nu-arabic", invalid: true, changed: true},
-		{in: "en-u-nu-arabic-co-phonebk-ca-s", lang: "en", ext: "u-co-phonebk-nu-arabic", invalid: true, changed: true},
-		{in: "en-u-nu-arabic-co-phonebk-ca-a12345678", lang: "en", ext: "u-co-phonebk-nu-arabic", invalid: true, changed: true},
-		{in: "en-u-co-phonebook", lang: "en", ext: "", invalid: true},
-		{in: "en-u-co-phonebook-cu-xau", lang: "en", ext: "u-cu-xau", invalid: true, changed: true},
+		{in: "en-u-co-phonebk-ca", lang: "en", ext: "u-ca-co-phonebk", changed: true},
+		{in: "en-u-nu-arabic-co-phonebk-ca", lang: "en", ext: "u-ca-co-phonebk-nu-arabic", changed: true},
+		{in: "en-u-nu-arabic-co-phonebk-ca-x", lang: "en", ext: "u-ca-co-phonebk-nu-arabic", invalid: true, changed: true},
+		{in: "en-u-nu-arabic-co-phonebk-ca-s", lang: "en", ext: "u-ca-co-phonebk-nu-arabic", invalid: true, changed: true},
+		{in: "en-u-nu-arabic-co-phonebk-ca-a12345678", lang: "en", ext: "u-ca-co-phonebk-nu-arabic", invalid: true, changed: true},
+		{in: "en-u-co-phonebook", lang: "en", ext: "u-co", invalid: true},
+		{in: "en-u-co-phonebook-cu-xau", lang: "en", ext: "u-co-cu-xau", invalid: true, changed: true},
 		{in: "en-Cyrl-u-co-phonebk", lang: "en", script: "Cyrl", ext: "u-co-phonebk"},
 		{in: "en-US-u-co-phonebk", lang: "en", region: "US", ext: "u-co-phonebk"},
 		{in: "en-US-u-co-phonebk-cu-xau", lang: "en", region: "US", ext: "u-co-phonebk-cu-xau"},
@@ -179,9 +179,8 @@ func parseTests() []parseTest {
 		{in: "en-u-def-abc-cu-xua-co-phonebk", lang: "en", ext: "u-abc-def-co-phonebk-cu-xua", changed: true},
 		{in: "en-u-def-abc", lang: "en", ext: "u-abc-def", changed: true},
 		{in: "en-u-cu-xua-co-phonebk-a-cd", lang: "en", extList: []string{"a-cd", "u-co-phonebk-cu-xua"}, changed: true},
-		// Invalid "u" extension. Drop invalid parts.
-		{in: "en-u-cu-co-phonebk", lang: "en", extList: []string{"u-co-phonebk"}, invalid: true, changed: true},
-		{in: "en-u-cu-xau-co", lang: "en", extList: []string{"u-cu-xau"}, invalid: true},
+		{in: "en-u-cu-co-phonebk", lang: "en", extList: []string{"u-co-phonebk-cu"}, changed: true},
+		{in: "en-u-cu-xau-co", lang: "en", extList: []string{"u-co-cu-xau"}, changed: true},
 		// LDML spec is not specific about it, but remove duplicates and return an error if the values differ.
 		{in: "en-u-cu-xau-co-phonebk-cu-xau", lang: "en", ext: "u-co-phonebk-cu-xau", changed: true},
 		// No change as the result is a substring of the original!
@@ -351,8 +350,8 @@ func TestErrors(t *testing.T) {
 		{"aa-AB", mkInvalid("AB")},
 		// ill-formed wins over invalid.
 		{"ac-u", ErrSyntax},
-		{"ac-u-ca", ErrSyntax},
-		{"ac-u-ca-co-pinyin", ErrSyntax},
+		{"ac-u-ca", mkInvalid("ac")},
+		{"ac-u-ca-co-pinyin", mkInvalid("ac")},
 		{"noob", ErrSyntax},
 	}
 	for _, tt := range tests {
diff --git a/language/language.go b/language/language.go
index abfa17f66..289b3a36d 100644
--- a/language/language.go
+++ b/language/language.go
@@ -412,6 +412,10 @@ func (t Tag) Extensions() []Extension {
 // are of the allowed values defined for the Unicode locale extension ('u') in
 // https://www.unicode.org/reports/tr35/#Unicode_Language_and_Locale_Identifiers.
 // TypeForKey will traverse the inheritance chain to get the correct value.
+//
+// If there are multiple types associated with a key, only the first will be
+// returned. If there is no type associated with a key, it returns the empty
+// string.
 func (t Tag) TypeForKey(key string) string {
 	if !compact.Tag(t).MayHaveExtensions() {
 		if key != "rg" && key != "va" {
diff --git a/language/language_test.go b/language/language_test.go
index f7711ba34..b2e3ce3c5 100644
--- a/language/language_test.go
+++ b/language/language_test.go
@@ -523,6 +523,13 @@ func TestCanonicalize(t *testing.T) {
 		{"en-GB-u-rg-usz", "en-GB-u-rg-usz", Raw},
 		{"en-GB-u-rg-usz-va-posix", "en-GB-u-rg-usz-va-posix", Raw},
 		{"en-GB-u-rg-usz-co-phonebk", "en-GB-u-co-phonebk-rg-usz", Raw},
+
+		// CVE-2020-28851
+		// invalid key-value pair of -u- extension.
+		{"ES-u-000-00", "es-u-000-00", Raw},
+		{"ES-u-000-00-v-00", "es-u-000-00-v-00", Raw},
+		// reordered and unknown extension.
+		{"ES-v-00-u-000-00", "es-u-000-00-v-00", Raw},
 	}
 	for i, tt := range tests {
 		in, _ := Raw.Parse(tt.in)
@@ -553,6 +560,12 @@ func TestTypeForKey(t *testing.T) {
 		{"rg", "en-u-rg-gbzzzz", "gbzzzz"},
 		{"nu", "en-u-co-phonebk-nu-arabic", "arabic"},
 		{"kc", "cmn-u-co-stroke", ""},
+		{"rg", "cmn-u-rg", ""},
+		{"rg", "cmn-u-rg-co-stroke", ""},
+		{"co", "cmn-u-rg-co-stroke", "stroke"},
+		{"co", "cmn-u-co-rg-gbzzzz", ""},
+		{"rg", "cmn-u-co-rg-gbzzzz", "gbzzzz"},
+		{"rg", "cmn-u-rg-gbzzzz-nlzzzz", "gbzzzz"},
 	}
 	for _, tt := range tests {
 		if v := Make(tt.in).TypeForKey(tt.key); v != tt.out {
diff --git a/language/parse_test.go b/language/parse_test.go
index 041660c4e..4b7e64db3 100644
--- a/language/parse_test.go
+++ b/language/parse_test.go
@@ -101,13 +101,13 @@ func parseTests() []parseTest {
 		{in: "en-9-aa-0-aa-z-bb-x-a", lang: "en", extList: []string{"0-aa", "9-aa", "z-bb", "x-a"}, changed: true},
 		{in: "en-u-c", lang: "en", ext: "", invalid: true},
 		{in: "en-u-co-phonebk", lang: "en", ext: "u-co-phonebk"},
-		{in: "en-u-co-phonebk-ca", lang: "en", ext: "u-co-phonebk", invalid: true},
-		{in: "en-u-nu-arabic-co-phonebk-ca", lang: "en", ext: "u-co-phonebk-nu-arabic", invalid: true, changed: true},
-		{in: "en-u-nu-arabic-co-phonebk-ca-x", lang: "en", ext: "u-co-phonebk-nu-arabic", invalid: true, changed: true},
-		{in: "en-u-nu-arabic-co-phonebk-ca-s", lang: "en", ext: "u-co-phonebk-nu-arabic", invalid: true, changed: true},
-		{in: "en-u-nu-arabic-co-phonebk-ca-a12345678", lang: "en", ext: "u-co-phonebk-nu-arabic", invalid: true, changed: true},
-		{in: "en-u-co-phonebook", lang: "en", ext: "", invalid: true},
-		{in: "en-u-co-phonebook-cu-xau", lang: "en", ext: "u-cu-xau", invalid: true, changed: true},
+		{in: "en-u-co-phonebk-ca", lang: "en", ext: "u-ca-co-phonebk", invalid: true},
+		{in: "en-u-nu-arabic-co-phonebk-ca", lang: "en", ext: "u-ca-co-phonebk-nu-arabic", invalid: true, changed: true},
+		{in: "en-u-nu-arabic-co-phonebk-ca-x", lang: "en", ext: "u-ca-co-phonebk-nu-arabic", invalid: true, changed: true},
+		{in: "en-u-nu-arabic-co-phonebk-ca-s", lang: "en", ext: "u-ca-co-phonebk-nu-arabic", invalid: true, changed: true},
+		{in: "en-u-nu-arabic-co-phonebk-ca-a12345678", lang: "en", ext: "u-ca-co-phonebk-nu-arabic", invalid: true, changed: true},
+		{in: "en-u-co-phonebook", lang: "en", ext: "u-co", invalid: true},
+		{in: "en-u-co-phonebook-cu-xau", lang: "en", ext: "u-co-cu-xau", invalid: true, changed: true},
 		{in: "en-Cyrl-u-co-phonebk", lang: "en", script: "Cyrl", ext: "u-co-phonebk"},
 		{in: "en-US-u-co-phonebk", lang: "en", region: "US", ext: "u-co-phonebk"},
 		{in: "en-US-u-co-phonebk-cu-xau", lang: "en", region: "US", ext: "u-co-phonebk-cu-xau"},
@@ -117,8 +117,8 @@ func parseTests() []parseTest {
 		{in: "en-u-def-abc", lang: "en", ext: "u-abc-def", changed: true},
 		{in: "en-u-cu-xua-co-phonebk-a-cd", lang: "en", extList: []string{"a-cd", "u-co-phonebk-cu-xua"}, changed: true},
 		// Invalid "u" extension. Drop invalid parts.
-		{in: "en-u-cu-co-phonebk", lang: "en", extList: []string{"u-co-phonebk"}, invalid: true, changed: true},
-		{in: "en-u-cu-xau-co", lang: "en", extList: []string{"u-cu-xau"}, invalid: true},
+		{in: "en-u-cu-co-phonebk", lang: "en", extList: []string{"u-co-phonebk-cu"}, invalid: true, changed: true},
+		{in: "en-u-cu-xau-co", lang: "en", extList: []string{"u-co-cu-xau"}, invalid: true},
 		// We allow duplicate keys as the LDML spec does not explicitly prohibit it.
 		// TODO: Consider eliminating duplicates and returning an error.
 		{in: "en-u-cu-xau-co-phonebk-cu-xau", lang: "en", ext: "u-co-phonebk-cu-xau", changed: true},
@@ -219,8 +219,8 @@ func TestErrors(t *testing.T) {
 		{"aa-AB", mkInvalid("AB")},
 		// ill-formed wins over invalid.
 		{"ac-u", errSyntax},
-		{"ac-u-ca", errSyntax},
-		{"ac-u-ca-co-pinyin", errSyntax},
+		{"ac-u-ca", mkInvalid("ac")},
+		{"ac-u-ca-co-pinyin", mkInvalid("ac")},
 		{"noob", errSyntax},
 	}
 	for _, tt := range tests {

From e328d63cff14134669501e0e154e4f141c784322 Mon Sep 17 00:00:00 2001
From: Marcel van Lohuizen <mpvl@golang.org>
Date: Mon, 29 Mar 2021 16:31:20 +0200
Subject: [PATCH 09/40] language: fix off-by-one error

Regions are encoded starting from 1. However, one of the
region-related tables assumed 0-based indices. This
caused a crash when used with ZZ, the largest region.

Fixes golang/go#43834

Change-Id: Iaed6b9d2683cd50504e6d33c8a6df8b21dd1687d
Reviewed-on: https://go-review.googlesource.com/c/text/+/305469
Trust: Marcel van Lohuizen <mpvl@golang.org>
Run-TryBot: Marcel van Lohuizen <mpvl@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Seth Vargo <sethvargo@google.com>
Reviewed-by: Ian Lance Taylor <iant@golang.org>
---
 language/gen.go        |  4 +++-
 language/match_test.go | 14 ++++++++++++++
 language/tables.go     |  8 ++++----
 3 files changed, 21 insertions(+), 5 deletions(-)

diff --git a/language/gen.go b/language/gen.go
index 445882e56..60bdf64d0 100644
--- a/language/gen.go
+++ b/language/gen.go
@@ -150,7 +150,9 @@ func (b *builder) writeMatchData() {
 		regions := strings.Split(g.Contains, " ")
 		regionHierarchy[g.Type] = append(regionHierarchy[g.Type], regions...)
 	}
-	regionToGroups := make([]uint8, language.NumRegions)
+	// Regions start at 1, so the slice must be one larger than the number of
+	// regions.
+	regionToGroups := make([]uint8, language.NumRegions+1)
 
 	idToIndex := map[string]uint8{}
 	for i, mv := range lm[0].MatchVariable {
diff --git a/language/match_test.go b/language/match_test.go
index c21b86372..a6df3e1dc 100644
--- a/language/match_test.go
+++ b/language/match_test.go
@@ -224,6 +224,20 @@ func (t haveTag) String() string {
 	return fmt.Sprintf("%v:%d:%v:%v-%v|%v", t.tag, t.index, t.conf, t.maxRegion, t.maxScript, t.altScript)
 }
 
+func TestIssue43834(t *testing.T) {
+	matcher := NewMatcher([]Tag{English})
+
+	// ZZ is the largest region code and should not cause overflow.
+	desired, _, err := ParseAcceptLanguage("en-ZZ")
+	if err != nil {
+		t.Error(err)
+	}
+	_, i, _ := matcher.Match(desired...)
+	if i != 0 {
+		t.Errorf("got %v; want 0", i)
+	}
+}
+
 func TestBestMatchAlloc(t *testing.T) {
 	m := NewMatcher(makeTagList("en sr nl"))
 	// Go allocates when creating a list of tags from a single tag!
diff --git a/language/tables.go b/language/tables.go
index 87e58a02a..96b57f610 100644
--- a/language/tables.go
+++ b/language/tables.go
@@ -47,7 +47,7 @@ const (
 	_Zzzz = 251
 )
 
-var regionToGroups = []uint8{ // 357 elements
+var regionToGroups = []uint8{ // 358 elements
 	// Entry 0 - 3F
 	0x00, 0x00, 0x00, 0x04, 0x04, 0x00, 0x00, 0x04,
 	0x00, 0x00, 0x00, 0x00, 0x04, 0x04, 0x04, 0x00,
@@ -98,8 +98,8 @@ var regionToGroups = []uint8{ // 357 elements
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
-	0x00, 0x00, 0x00, 0x00, 0x00,
-} // Size: 381 bytes
+	0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
+} // Size: 382 bytes
 
 var paradigmLocales = [][3]uint16{ // 3 elements
 	0: [3]uint16{0x139, 0x0, 0x7b},
@@ -295,4 +295,4 @@ var matchRegion = []regionIntelligibility{ // 15 elements
 	14: {lang: 0x529, script: 0x3c, group: 0x80, distance: 0x5},
 } // Size: 114 bytes
 
-// Total table size 1471 bytes (1KiB); checksum: 4CB1CD46
+// Total table size 1472 bytes (1KiB); checksum: F86C669

From c2d28a6ddf6cb833e996ccb00cbb4206394958d2 Mon Sep 17 00:00:00 2001
From: Carl Menezes <carleeto@gmail.com>
Date: Sun, 11 Apr 2021 00:32:09 +0000
Subject: [PATCH 10/40] number: match input example to be Dutch as in the
 output

Change-Id: I5d1eaf79aa267121ce08dc3990b86ff30c8e0505
GitHub-Last-Rev: 0421867699811a7e6569e1d1d38943118d5c282d
GitHub-Pull-Request: golang/text#21
Reviewed-on: https://go-review.googlesource.com/c/text/+/297589
Reviewed-by: Emmanuel Odeke <emmanuel@orijtech.com>
Reviewed-by: Tobias Klauser <tobias.klauser@gmail.com>
Run-TryBot: Emmanuel Odeke <emmanuel@orijtech.com>
TryBot-Result: Go Bot <gobot@golang.org>
---
 number/doc.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/number/doc.go b/number/doc.go
index 2ad8d431a..925383acc 100644
--- a/number/doc.go
+++ b/number/doc.go
@@ -19,7 +19,7 @@
 //
 //    p := message.NewPrinter(language.Dutch)
 //
-//    p.Printf("There are %v bikes per household.", number.Decimal(1.2))
+//    p.Printf("Er zijn %v fietsen per huishouden.", number.Decimal(1.2))
 //    // Prints: Er zijn 1,2 fietsen per huishouden.
 //
 //

From 5c7c50ebbd4f5b0d53b9b2fcdbeb92ffb732a06e Mon Sep 17 00:00:00 2001
From: "Bryan C. Mills" <bcmills@google.com>
Date: Fri, 30 Apr 2021 09:29:37 -0400
Subject: [PATCH 11/40] go.mod: upgrade to go 1.17

This change was produced using 'go mod tidy -go=1.17'
with a go command built at CL 315210.

This activates lazy loading, and updates the go.mod file to maintain
the lazy-loading invariants (namely, including an explicit requirement
for every package transitively imported by the main module).

Note that this does *not* prevent users with earlier go versions from
successfully building packages from this module.

For golang/go#36460

Change-Id: Iabb65fc3ed9727abecc3926abcecd445c967d0a9
Reviewed-on: https://go-review.googlesource.com/c/text/+/315571
Trust: Bryan C. Mills <bcmills@google.com>
Run-TryBot: Bryan C. Mills <bcmills@google.com>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Alexander Rakoczy <alex@golang.org>
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
---
 go.mod | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/go.mod b/go.mod
index 8ff7ecb6f..63bc05f20 100644
--- a/go.mod
+++ b/go.mod
@@ -2,4 +2,4 @@ module golang.org/x/text
 
 require golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e
 
-go 1.11
+go 1.17

From 3115f89c4b99a620c7f1a4395a2b4405e95b82b6 Mon Sep 17 00:00:00 2001
From: Deepak S <deepakspavoodath@gmail.com>
Date: Sat, 22 May 2021 08:20:00 +0000
Subject: [PATCH 12/40] language: use multiple runs in TestBestMatchAlloc

AllocsPerRun sets runtime.GOMAXPROCS to 1, but it doesn't prevent the runtime from descheduling a goroutine
and performing an allocation somewhere in the background.
This commit changes the test to use a number of runs large enough to average away the occasional noisy allocation.

Fixes golang/go#45809

Change-Id: Ibf904016d0c067740469c8e861079611440222a1
GitHub-Last-Rev: 1606b6969a4d462804dda8d98b9c4432241e87ea
GitHub-Pull-Request: golang/text#23
Reviewed-on: https://go-review.googlesource.com/c/text/+/321737
Reviewed-by: Bryan C. Mills <bcmills@google.com>
Trust: Michael Knyszek <mknyszek@google.com>
---
 language/match_test.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/language/match_test.go b/language/match_test.go
index a6df3e1dc..313580b60 100644
--- a/language/match_test.go
+++ b/language/match_test.go
@@ -242,7 +242,7 @@ func TestBestMatchAlloc(t *testing.T) {
 	m := NewMatcher(makeTagList("en sr nl"))
 	// Go allocates when creating a list of tags from a single tag!
 	list := []Tag{English}
-	avg := testtext.AllocsPerRun(1, func() {
+	avg := testtext.AllocsPerRun(100, func() {
 		m.Match(list...)
 	})
 	if avg > 0 {

From 383b2e75a7a4198c42f8f87833eefb772868a56f Mon Sep 17 00:00:00 2001
From: Russ Cox <rsc@golang.org>
Date: Mon, 9 Aug 2021 15:09:12 -0400
Subject: [PATCH 13/40] language: turn parsing panics into ErrSyntax

We keep finding new panics in the language parser.
Limit the damage by reporting those inputs as syntax errors.

Change-Id: I786fe127c3df7e4c8e042d15095d3acf3c4e4a50
Reviewed-on: https://go-review.googlesource.com/c/text/+/340830
Trust: Russ Cox <rsc@golang.org>
Run-TryBot: Russ Cox <rsc@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Roland Shoemaker <roland@golang.org>
---
 internal/language/language.go | 43 +++++++++++++++++++++++++++++++----
 internal/language/parse.go    |  7 ++++++
 language/parse.go             | 22 ++++++++++++++++++
 3 files changed, 68 insertions(+), 4 deletions(-)

diff --git a/internal/language/language.go b/internal/language/language.go
index f41aedcfc..6105bc7fa 100644
--- a/internal/language/language.go
+++ b/internal/language/language.go
@@ -251,6 +251,13 @@ func (t Tag) Parent() Tag {
 
 // ParseExtension parses s as an extension and returns it on success.
 func ParseExtension(s string) (ext string, err error) {
+	defer func() {
+		if recover() != nil {
+			ext = ""
+			err = ErrSyntax
+		}
+	}()
+
 	scan := makeScannerString(s)
 	var end int
 	if n := len(scan.token); n != 1 {
@@ -461,7 +468,14 @@ func (t Tag) findTypeForKey(key string) (start, sep, end int, hasExt bool) {
 // ParseBase parses a 2- or 3-letter ISO 639 code.
 // It returns a ValueError if s is a well-formed but unknown language identifier
 // or another error if another error occurred.
-func ParseBase(s string) (Language, error) {
+func ParseBase(s string) (l Language, err error) {
+	defer func() {
+		if recover() != nil {
+			l = 0
+			err = ErrSyntax
+		}
+	}()
+
 	if n := len(s); n < 2 || 3 < n {
 		return 0, ErrSyntax
 	}
@@ -472,7 +486,14 @@ func ParseBase(s string) (Language, error) {
 // ParseScript parses a 4-letter ISO 15924 code.
 // It returns a ValueError if s is a well-formed but unknown script identifier
 // or another error if another error occurred.
-func ParseScript(s string) (Script, error) {
+func ParseScript(s string) (scr Script, err error) {
+	defer func() {
+		if recover() != nil {
+			scr = 0
+			err = ErrSyntax
+		}
+	}()
+
 	if len(s) != 4 {
 		return 0, ErrSyntax
 	}
@@ -489,7 +510,14 @@ func EncodeM49(r int) (Region, error) {
 // ParseRegion parses a 2- or 3-letter ISO 3166-1 or a UN M.49 code.
 // It returns a ValueError if s is a well-formed but unknown region identifier
 // or another error if another error occurred.
-func ParseRegion(s string) (Region, error) {
+func ParseRegion(s string) (r Region, err error) {
+	defer func() {
+		if recover() != nil {
+			r = 0
+			err = ErrSyntax
+		}
+	}()
+
 	if n := len(s); n < 2 || 3 < n {
 		return 0, ErrSyntax
 	}
@@ -578,7 +606,14 @@ type Variant struct {
 
 // ParseVariant parses and returns a Variant. An error is returned if s is not
 // a valid variant.
-func ParseVariant(s string) (Variant, error) {
+func ParseVariant(s string) (v Variant, err error) {
+	defer func() {
+		if recover() != nil {
+			v = Variant{}
+			err = ErrSyntax
+		}
+	}()
+
 	s = strings.ToLower(s)
 	if id, ok := variantIndex[s]; ok {
 		return Variant{id, s}, nil
diff --git a/internal/language/parse.go b/internal/language/parse.go
index c696fd0bd..47ee0fed1 100644
--- a/internal/language/parse.go
+++ b/internal/language/parse.go
@@ -232,6 +232,13 @@ func Parse(s string) (t Tag, err error) {
 	if s == "" {
 		return Und, ErrSyntax
 	}
+	defer func() {
+		if recover() != nil {
+			t = Und
+			err = ErrSyntax
+			return
+		}
+	}()
 	if len(s) <= maxAltTaglen {
 		b := [maxAltTaglen]byte{}
 		for i, c := range s {
diff --git a/language/parse.go b/language/parse.go
index 11acfd885..59b041008 100644
--- a/language/parse.go
+++ b/language/parse.go
@@ -43,6 +43,13 @@ func Parse(s string) (t Tag, err error) {
 // https://www.unicode.org/reports/tr35/#Unicode_Language_and_Locale_Identifiers.
 // The resulting tag is canonicalized using the canonicalization type c.
 func (c CanonType) Parse(s string) (t Tag, err error) {
+	defer func() {
+		if recover() != nil {
+			t = Tag{}
+			err = language.ErrSyntax
+		}
+	}()
+
 	tt, err := language.Parse(s)
 	if err != nil {
 		return makeTag(tt), err
@@ -79,6 +86,13 @@ func Compose(part ...interface{}) (t Tag, err error) {
 // tag is returned after canonicalizing using CanonType c. If one or more errors
 // are encountered, one of the errors is returned.
 func (c CanonType) Compose(part ...interface{}) (t Tag, err error) {
+	defer func() {
+		if recover() != nil {
+			t = Tag{}
+			err = language.ErrSyntax
+		}
+	}()
+
 	var b language.Builder
 	if err = update(&b, part...); err != nil {
 		return und, err
@@ -142,6 +156,14 @@ var errInvalidWeight = errors.New("ParseAcceptLanguage: invalid weight")
 // Tags with a weight of zero will be dropped. An error will be returned if the
 // input could not be parsed.
 func ParseAcceptLanguage(s string) (tag []Tag, q []float32, err error) {
+	defer func() {
+		if recover() != nil {
+			tag = nil
+			q = nil
+			err = language.ErrSyntax
+		}
+	}()
+
 	var entry string
 	for s != "" {
 		if entry, s = split(s, ','); entry == "" {

From 2ca5a52dcb2f184d71fbbf2a28372c5882d990a8 Mon Sep 17 00:00:00 2001
From: Rich Hong <hong.rich@gmail.com>
Date: Mon, 28 Sep 2020 16:32:38 -0400
Subject: [PATCH 14/40] internal/language: fix canonicalization of extlang

parseTag tries to replace <lang>-<extlang> with <extlang>, but <extlang>
itself can also be replaced with its canonical form which can be a
different length than the original <extlang>. The existing
implementation assumes that the length of <extlang> is 3 and would leave
scanner positions in an incorrect state if the length of <extlang> is
not 3.

Fixes golang/go#41617

Change-Id: Ie0da320530e2545f9b521e7b8cf503d854c50b45
Reviewed-on: https://go-review.googlesource.com/c/text/+/260177
Run-TryBot: Alberto Donizetti <alb.donizetti@gmail.com>
TryBot-Result: Go Bot <gobot@golang.org>
Trust: Alberto Donizetti <alb.donizetti@gmail.com>
Trust: Cherry Mui <cherryyz@google.com>
Trust: Marcel van Lohuizen <mpvl@golang.org>
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
---
 internal/language/compact/parse_test.go |  5 +++++
 internal/language/language_test.go      |  2 ++
 internal/language/parse.go              | 24 ++++++++++++++----------
 internal/language/parse_test.go         | 10 +++++++++-
 language/language_test.go               |  2 ++
 language/parse_test.go                  |  5 +++++
 6 files changed, 37 insertions(+), 11 deletions(-)

diff --git a/internal/language/compact/parse_test.go b/internal/language/compact/parse_test.go
index abe3a58c0..2db200b88 100644
--- a/internal/language/compact/parse_test.go
+++ b/internal/language/compact/parse_test.go
@@ -122,6 +122,11 @@ func parseTests() []parseTest {
 		{in: "en-t-nl-abcd", lang: "en", ext: "t-nl", invalid: true},
 		{in: "en-t-nl-latn", lang: "en", ext: "t-nl-latn"},
 		{in: "en-t-t0-abcd-x-a", lang: "en", extList: []string{"t-t0-abcd", "x-a"}},
+		{in: "en_t_pt_MLt", lang: "en", ext: "t-pt-mlt", changed: true},
+		{in: "en-t-fr-est", lang: "en", ext: "t-fr-est", changed: false},
+		{in: "fr-est", lang: "et", changed: true},
+		{in: "fr-est-t-fr-est", lang: "et", ext: "t-fr-est", changed: true},
+		{in: "fr-est-Cyrl", lang: "et", script: "Cyrl", changed: true},
 		// invalid
 		{in: "", lang: "und", invalid: true},
 		{in: "-", lang: "und", invalid: true},
diff --git a/internal/language/language_test.go b/internal/language/language_test.go
index 8244c1c8a..668034d03 100644
--- a/internal/language/language_test.go
+++ b/internal/language/language_test.go
@@ -681,6 +681,8 @@ var (
 		"en-t-t0-abcd",
 		"en-t-nl-latn",
 		"en-t-t0-abcd-x-a",
+		"en_t_pt_MLt",
+		"en-t-fr-est",
 	}
 	// Change, but not memory allocation required.
 	benchSimpleChange = []string{
diff --git a/internal/language/parse.go b/internal/language/parse.go
index 47ee0fed1..aad1e0acf 100644
--- a/internal/language/parse.go
+++ b/internal/language/parse.go
@@ -270,7 +270,7 @@ func parse(scan *scanner, s string) (t Tag, err error) {
 	} else if n >= 4 {
 		return Und, ErrSyntax
 	} else { // the usual case
-		t, end = parseTag(scan)
+		t, end = parseTag(scan, true)
 		if n := len(scan.token); n == 1 {
 			t.pExt = uint16(end)
 			end = parseExtensions(scan)
@@ -296,7 +296,8 @@ func parse(scan *scanner, s string) (t Tag, err error) {
 
 // parseTag parses language, script, region and variants.
 // It returns a Tag and the end position in the input that was parsed.
-func parseTag(scan *scanner) (t Tag, end int) {
+// If doNorm is true, then <lang>-<extlang> will be normalized to <extlang>.
+func parseTag(scan *scanner, doNorm bool) (t Tag, end int) {
 	var e error
 	// TODO: set an error if an unknown lang, script or region is encountered.
 	t.LangID, e = getLangID(scan.token)
@@ -307,14 +308,17 @@ func parseTag(scan *scanner) (t Tag, end int) {
 	for len(scan.token) == 3 && isAlpha(scan.token[0]) {
 		// From http://tools.ietf.org/html/bcp47, <lang>-<extlang> tags are equivalent
 		// to a tag of the form <extlang>.
-		lang, e := getLangID(scan.token)
-		if lang != 0 {
-			t.LangID = lang
-			copy(scan.b[langStart:], lang.String())
-			scan.b[langStart+3] = '-'
-			scan.start = langStart + 4
+		if doNorm {
+			lang, e := getLangID(scan.token)
+			if lang != 0 {
+				t.LangID = lang
+				langStr := lang.String()
+				copy(scan.b[langStart:], langStr)
+				scan.b[langStart+len(langStr)] = '-'
+				scan.start = langStart + len(langStr) + 1
+			}
+			scan.gobble(e)
 		}
-		scan.gobble(e)
 		end = scan.scan()
 	}
 	if len(scan.token) == 4 && isAlpha(scan.token[0]) {
@@ -559,7 +563,7 @@ func parseExtension(scan *scanner) int {
 	case 't': // https://www.ietf.org/rfc/rfc6497.txt
 		scan.scan()
 		if n := len(scan.token); n >= 2 && n <= 3 && isAlpha(scan.token[1]) {
-			_, end = parseTag(scan)
+			_, end = parseTag(scan, false)
 			scan.toLower(start, end)
 		}
 		for len(scan.token) == 2 && !isAlpha(scan.token[1]) {
diff --git a/internal/language/parse_test.go b/internal/language/parse_test.go
index e1d428aa6..0af9e8a25 100644
--- a/internal/language/parse_test.go
+++ b/internal/language/parse_test.go
@@ -192,6 +192,14 @@ func parseTests() []parseTest {
 		{in: "en-t-nl-abcd", lang: "en", ext: "t-nl", invalid: true},
 		{in: "en-t-nl-latn", lang: "en", ext: "t-nl-latn"},
 		{in: "en-t-t0-abcd-x-a", lang: "en", extList: []string{"t-t0-abcd", "x-a"}},
+		{in: "en_t_pt_MLt", lang: "en", ext: "t-pt-mlt", changed: true},
+		{in: "en-t-fr-est", lang: "en", ext: "t-fr-est", changed: false},
+		{in: "fr-est", lang: "et", changed: false},
+		{in: "fr-est-Cyrl", lang: "et", script: "Cyrl", changed: false},
+		// The same input here is used in both TestParse and TestParseExtensions.
+		// changed should be true for this input in TestParse but changed should be false for this input in TestParseExtensions
+		// because the entire input has been reformatted but the extension part hasn't.
+		// {in: "fr-est-t-fr-est", lang: "et", ext: "t-fr-est", changed: true},
 		// invalid
 		{in: "", lang: "und", invalid: true},
 		{in: "-", lang: "und", invalid: true},
@@ -299,7 +307,7 @@ func TestParseTag(t *testing.T) {
 			return Tag{}, true
 		}
 		scan := makeScannerString(tt.in)
-		id, end := parseTag(&scan)
+		id, end := parseTag(&scan, true)
 		id.str = string(scan.b[:end])
 		tt.ext = ""
 		tt.extList = []string{}
diff --git a/language/language_test.go b/language/language_test.go
index b2e3ce3c5..d45706c98 100644
--- a/language/language_test.go
+++ b/language/language_test.go
@@ -723,6 +723,8 @@ var (
 		"en-t-t0-abcd",
 		"en-t-nl-latn",
 		"en-t-t0-abcd-x-a",
+		"en_t_pt_MLt",
+		"en-t-fr-est",
 	}
 	// Change, but not memory allocation required.
 	benchSimpleChange = []string{
diff --git a/language/parse_test.go b/language/parse_test.go
index 4b7e64db3..e1e5653ad 100644
--- a/language/parse_test.go
+++ b/language/parse_test.go
@@ -129,6 +129,11 @@ func parseTests() []parseTest {
 		{in: "en-t-nl-abcd", lang: "en", ext: "t-nl", invalid: true},
 		{in: "en-t-nl-latn", lang: "en", ext: "t-nl-latn"},
 		{in: "en-t-t0-abcd-x-a", lang: "en", extList: []string{"t-t0-abcd", "x-a"}},
+		{in: "en_t_pt_MLt", lang: "en", ext: "t-pt-mlt", changed: true},
+		{in: "en-t-fr-est", lang: "en", ext: "t-fr-est", changed: false},
+		{in: "fr-est", lang: "et", changed: true},
+		{in: "fr-est-t-fr-est", lang: "et", ext: "t-fr-est", changed: true},
+		{in: "fr-est-Cyrl", lang: "et", script: "Cyrl", changed: true},
 		// invalid
 		{in: "", lang: "und", invalid: true},
 		{in: "-", lang: "und", invalid: true},

From 29bf0102df0c3c8844ae296826d1a9e7302f26df Mon Sep 17 00:00:00 2001
From: Marcel van Lohuizen <mpvl@golang.org>
Date: Mon, 3 May 2021 20:14:09 +0000
Subject: [PATCH 15/40] Revert "number: match input example to be Dutch as in
 the output"

This reverts commit c2d28a6ddf6cb833e996ccb00cbb4206394958d2.

Reason for revert: This change was incorrect. The examples were supposed to demonstrate that the API can provide translations.

Change-Id: I247d5509136d34ce4c82a8ac2de50dad3f652a78
Reviewed-on: https://go-review.googlesource.com/c/text/+/316529
Reviewed-by: Emmanuel Odeke <emmanuel@orijtech.com>
Reviewed-by: Alberto Donizetti <alb.donizetti@gmail.com>
Run-TryBot: Emmanuel Odeke <emmanuel@orijtech.com>
Run-TryBot: Alberto Donizetti <alb.donizetti@gmail.com>
Trust: Cherry Mui <cherryyz@google.com>
---
 number/doc.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/number/doc.go b/number/doc.go
index 925383acc..2ad8d431a 100644
--- a/number/doc.go
+++ b/number/doc.go
@@ -19,7 +19,7 @@
 //
 //    p := message.NewPrinter(language.Dutch)
 //
-//    p.Printf("Er zijn %v fietsen per huishouden.", number.Decimal(1.2))
+//    p.Printf("There are %v bikes per household.", number.Decimal(1.2))
 //    // Prints: Er zijn 1,2 fietsen per huishouden.
 //
 //

From 22bfdb67013842b9fed978a6f362b3edee086066 Mon Sep 17 00:00:00 2001
From: Amelia Downs <adowns@vmware.com>
Date: Mon, 13 Sep 2021 16:17:04 -0400
Subject: [PATCH 16/40] language: fix ExampleMatcher output

This removes the "TODO" after the output section, which was preventing
this test from running properly and from running in pkg.go.dev. Fixing
this revealed that many of the outputs were out of date and needed to be
updated as well.

Fixes: golang/go#48361

Change-Id: I495e4eb83f071d4d9810bf44bfabe3258a6220c8
Reviewed-on: https://go-review.googlesource.com/c/text/+/349552
Trust: Alberto Donizetti <alb.donizetti@gmail.com>
Trust: Marcel van Lohuizen <mpvl@golang.org>
Run-TryBot: Alberto Donizetti <alb.donizetti@gmail.com>
Run-TryBot: Marcel van Lohuizen <mpvl@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Alberto Donizetti <alb.donizetti@gmail.com>
Reviewed-by: Amelia Downs <adowns@vmware.com>
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
---
 language/examples_test.go | 58 +++++++++++++++++++--------------------
 1 file changed, 28 insertions(+), 30 deletions(-)

diff --git a/language/examples_test.go b/language/examples_test.go
index ad089a3f4..61401f252 100644
--- a/language/examples_test.go
+++ b/language/examples_test.go
@@ -247,24 +247,28 @@ func ExampleMatcher() {
 	// This is the set of tags from which we want to pick the best match. These
 	// can be, for example, the supported languages for some package.
 	tags := []language.Tag{
-		language.English,
-		language.BritishEnglish,
-		language.French,
-		language.Afrikaans,
-		language.BrazilianPortuguese,
-		language.EuropeanPortuguese,
-		language.Croatian,
-		language.SimplifiedChinese,
-		language.Raw.Make("iw-IL"),
-		language.Raw.Make("iw"),
-		language.Raw.Make("he"),
+		language.English,             // en
+		language.BritishEnglish,      // en-GB
+		language.French,              // fr
+		language.Afrikaans,           // af
+		language.BrazilianPortuguese, // pt-BR
+		language.EuropeanPortuguese,  // pt-PT
+		language.SimplifiedChinese,   // zh-Hans
+		language.Raw.Make("iw-IL"),   // Hebrew from Israel
+		language.Raw.Make("iw"),      // Hebrew
+		language.Raw.Make("he"),      // Hebrew
 	}
 	m := language.NewMatcher(tags)
 
 	// A simple match.
 	fmt.Println(m.Match(language.Make("fr")))
 
-	// Australian English is closer to British than American English.
+	// Australian English is closer to British English than American English.
+	// The resulting match is "en-GB-u-rg-auzzzz". The first language listed,
+	// "en-GB", is the matched language. Next is the region override prefix
+	// "-u-rg-", the region override "au", and the region override suffix "zzzz".
+	// The region override is for things like currency, dates, and measurement
+	// systems.
 	fmt.Println(m.Match(language.Make("en-AU")))
 
 	// Default to the first tag passed to the Matcher if there is no match.
@@ -275,15 +279,12 @@ func ExampleMatcher() {
 
 	fmt.Println("----")
 
-	// Someone specifying sr-Latn is probably fine with getting Croatian.
-	fmt.Println(m.Match(language.Make("sr-Latn")))
-
 	// We match SimplifiedChinese, but with Low confidence.
 	fmt.Println(m.Match(language.TraditionalChinese))
 
-	// Serbian in Latin script is a closer match to Croatian than Traditional
-	// Chinese to Simplified Chinese.
-	fmt.Println(m.Match(language.TraditionalChinese, language.Make("sr-Latn")))
+	// British English is closer to Australian English than Traditional Chinese
+	// to Simplified Chinese.
+	fmt.Println(m.Match(language.TraditionalChinese, language.Make("en-AU")))
 
 	fmt.Println("----")
 
@@ -297,7 +298,7 @@ func ExampleMatcher() {
 
 	fmt.Println("----")
 
-	// If a Matcher is initialized with a language and it's deprecated version,
+	// If a Matcher is initialized with a language and its deprecated version,
 	// it will distinguish between them.
 	fmt.Println(m.Match(language.Raw.Make("iw")))
 
@@ -319,26 +320,23 @@ func ExampleMatcher() {
 
 	// Output:
 	// fr 2 Exact
-	// en-GB 1 High
+	// en-GB-u-rg-auzzzz 1 High
 	// en 0 No
 	// en 0 No
 	// ----
-	// hr 6 High
-	// zh-Hans 7 Low
-	// hr 6 High
+	// zh-Hans 6 Low
+	// en-GB-u-rg-auzzzz 1 High
 	// ----
-	// pt-BR 4 High
-	// fr 2 High
-	// af 3 High
+	// pt-BR 4 Exact
+	// fr-u-rg-bezzzz 2 High
+	// af-u-rg-nazzzz 3 High
 	// ----
-	// iw 9 Exact
-	// he 10 Exact
+	// iw-IL 7 Exact
+	// he-u-rg-ilzzzz 9 Exact
 	// ----
 	// fr-u-cu-frf 2 Exact
 	// fr-u-cu-frf 2 High
 	// en-u-co-phonebk 0 No
-
-	// TODO: "he" should be "he-u-rg-IL High"
 }
 
 func ExampleMatchStrings() {

From 1b993004bb667a0b60e9bff6aa6dd173d4103d42 Mon Sep 17 00:00:00 2001
From: "Bryan C. Mills" <bcmills@google.com>
Date: Thu, 30 Sep 2021 11:59:03 -0400
Subject: [PATCH 17/40] all: upgrade x/tools to latest

Apparently the x/text/message/pipeline test uses x/tools/go/ssa to
introspect something, and as of CL 352953 the 'runtime' package needs
a newer version of x/tools/go/ssa (probably to pick up CL 333110).

Fixes golang/go#48701
Updates golang/go#47091

Change-Id: I78474f5ad037744906f5c771a7af7e0195f65173
Reviewed-on: https://go-review.googlesource.com/c/text/+/353350
Trust: Bryan C. Mills <bcmills@google.com>
Trust: Josh Bleecher Snyder <josharian@gmail.com>
Run-TryBot: Bryan C. Mills <bcmills@google.com>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Josh Bleecher Snyder <josharian@gmail.com>
---
 go.mod                            |  8 +++++++-
 go.sum                            | 27 +++++++++++++++++++++++++-
 message/pipeline/pipeline_test.go | 32 ++++++++++++++++++++++++++++---
 3 files changed, 62 insertions(+), 5 deletions(-)

diff --git a/go.mod b/go.mod
index 63bc05f20..32d3aa025 100644
--- a/go.mod
+++ b/go.mod
@@ -1,5 +1,11 @@
 module golang.org/x/text
 
-require golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e
+require golang.org/x/tools v0.1.7
+
+require (
+	golang.org/x/mod v0.4.2 // indirect
+	golang.org/x/sys v0.0.0-20210809222454-d867a43fc93e // indirect
+	golang.org/x/xerrors v0.0.0-20200804184101-5ec99f83aff1 // indirect
+)
 
 go 1.17
diff --git a/go.sum b/go.sum
index 6a308d730..13ba81505 100644
--- a/go.sum
+++ b/go.sum
@@ -1,2 +1,27 @@
-golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e h1:FDhOuMEY4JVRztM/gsbk+IKUQ8kj74bxZrgw87eMMVc=
+github.com/yuin/goldmark v1.4.0/go.mod h1:mwnBkeHKe2W/ZEtQ+71ViKU8L12m81fl3OWwC1Zlc8k=
+golang.org/x/crypto v0.0.0-20190308221718-c2843e01d9a2/go.mod h1:djNgcEr1/C05ACkg1iLfiJU5Ep61QUkGW8qpdssI0+w=
+golang.org/x/crypto v0.0.0-20191011191535-87dc89f01550/go.mod h1:yigFU9vqHzYiE8UmvKecakEJjdnWj3jj499lnFckfCI=
+golang.org/x/mod v0.4.2 h1:Gz96sIWK3OalVv/I/qNygP42zyoKp3xptRVCWRFEBvo=
+golang.org/x/mod v0.4.2/go.mod h1:s0Qsj1ACt9ePp/hMypM3fl4fZqREWJwdYDEqhRiZZUA=
+golang.org/x/net v0.0.0-20190404232315-eb5bcb51f2a3/go.mod h1:t9HGtf8HONx5eT2rtn7q6eTqICYqUVnKs3thJo3Qplg=
+golang.org/x/net v0.0.0-20190620200207-3b0461eec859/go.mod h1:z5CRVTTTmAJ677TzLLGU+0bjPO0LkuOLi4/5GtJWs/s=
+golang.org/x/net v0.0.0-20210805182204-aaa1db679c0d/go.mod h1:9nx3DQGgdP8bBQD5qxJ1jj9UTztislL4KSBs9R2vV5Y=
+golang.org/x/sync v0.0.0-20190423024810-112230192c58/go.mod h1:RxMgew5VJxzue5/jJTE5uejpjVlOe/izrB70Jof72aM=
+golang.org/x/sync v0.0.0-20210220032951-036812b2e83c/go.mod h1:RxMgew5VJxzue5/jJTE5uejpjVlOe/izrB70Jof72aM=
+golang.org/x/sys v0.0.0-20190215142949-d0b11bdaac8a/go.mod h1:STP8DvDyc/dI5b8T5hshtkjS+E42TnysNCUPdjciGhY=
+golang.org/x/sys v0.0.0-20190412213103-97732733099d/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs=
+golang.org/x/sys v0.0.0-20201119102817-f84b799fce68/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs=
+golang.org/x/sys v0.0.0-20210423082822-04245dca01da/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs=
+golang.org/x/sys v0.0.0-20210809222454-d867a43fc93e h1:WUoyKPm6nCo1BnNUvPGnFG3T5DUVem42yDJZZ4CNxMA=
+golang.org/x/sys v0.0.0-20210809222454-d867a43fc93e/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
+golang.org/x/term v0.0.0-20201126162022-7de9c90e9dd1/go.mod h1:bj7SfCRtBDWHUb9snDiAeCFNEtKQo2Wmx5Cou7ajbmo=
+golang.org/x/text v0.3.0/go.mod h1:NqM8EUOU14njkJ3fqMW+pc6Ldnwhi/IjpwHt7yyuwOQ=
+golang.org/x/text v0.3.6/go.mod h1:5Zoc/QRtKVWzQhOtBMvqHzDpF6irO9z98xDceosuGiQ=
 golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e/go.mod h1:n7NCudcB/nEzxVGmLbDWY5pfWTLqBcC2KZ6jyYvM4mQ=
+golang.org/x/tools v0.0.0-20191119224855-298f0cb1881e/go.mod h1:b+2E5dAYhXwXZwtnZ6UAqBI28+e2cm9otk0dWdXHAEo=
+golang.org/x/tools v0.1.7 h1:6j8CgantCy3yc8JGBqkDLMKWqZ0RDU2g1HVgacojGWQ=
+golang.org/x/tools v0.1.7/go.mod h1:LGqMHiF4EqQNHR1JncWGqT5BVaXmza+X+BDGol+dOxo=
+golang.org/x/xerrors v0.0.0-20190717185122-a985d3407aa7/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=
+golang.org/x/xerrors v0.0.0-20191011141410-1b5146add898/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=
+golang.org/x/xerrors v0.0.0-20200804184101-5ec99f83aff1 h1:go1bK/D/BFZV2I8cIQd1NKEZ+0owSTG1fDTci4IqFcE=
+golang.org/x/xerrors v0.0.0-20200804184101-5ec99f83aff1/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=
diff --git a/message/pipeline/pipeline_test.go b/message/pipeline/pipeline_test.go
index fe3b5daff..51c14a50b 100644
--- a/message/pipeline/pipeline_test.go
+++ b/message/pipeline/pipeline_test.go
@@ -139,18 +139,44 @@ func initTestdataModule(t *testing.T, dst string) {
 	}
 
 	goMod := fmt.Sprintf(`module testdata
-go 1.11
-require golang.org/x/text v0.0.0-00010101000000-000000000000
-replace golang.org/x/text v0.0.0-00010101000000-000000000000 => %s
+
+replace golang.org/x/text => %s
 `, xTextDir)
 	if err := ioutil.WriteFile(filepath.Join(dst, "go.mod"), []byte(goMod), 0644); err != nil {
 		t.Fatal(err)
 	}
 
+	// Copy in the checksums from the parent module so that we won't
+	// need to re-fetch them from the checksum database.
 	data, err := ioutil.ReadFile(filepath.Join(xTextDir, "go.sum"))
+	if err != nil {
+		t.Fatal(err)
+	}
 	if err := ioutil.WriteFile(filepath.Join(dst, "go.sum"), data, 0644); err != nil {
 		t.Fatal(err)
 	}
+
+	// We've added a replacement for the parent version of x/text,
+	// but now we need to populate the correct version.
+	// (We can't just replace the zero-version because x/text
+	// may indirectly depend on some nonzero version of itself.)
+	//
+	// We use 'go get' instead of 'go mod tidy' to avoid the old-release
+	// compatibility check when graph pruning is enabled, and to avoid doing
+	// more work than necessary for test dependencies of imported packages
+	// (we're not going to run those tests here anyway).
+	//
+	// We 'go get' the packages in the testdata module — not specific dependencies
+	// of those packages — so that they will resolve to whatever version is
+	// already required in the (replaced) x/text go.mod file.
+
+	getCmd := exec.Command("go", "get", "-d", "./...")
+	getCmd.Dir = dst
+	getCmd.Env = append(os.Environ(), "PWD="+dst, "GOPROXY=off", "GOCACHE=off")
+	if out, err := getCmd.CombinedOutput(); err != nil {
+		t.Logf("%s", out)
+		t.Fatal(err)
+	}
 }
 
 func checkOutput(t *testing.T, gen string, testdataDir string) {

From 5bd84dd9b33bd2bdebd8a6a6477920a8e492d47f Mon Sep 17 00:00:00 2001
From: Alexander Yastrebov <yastrebov.alex@gmail.com>
Date: Sun, 3 Oct 2021 03:13:22 +0000
Subject: [PATCH 18/40] =?UTF-8?q?encoding/simplifiedchinese:=20Fixes=20?=
 =?UTF-8?q?=E2=82=AC=20encoding=20in=20GB18030?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The euro sign is an exception which is given a single byte code of 0x80
in Microsoft's later versions of CP936/GBK and a two byte code of A2 E3
in GB18030. https://en.wikipedia.org/wiki/GB_18030#cite_note-4

Fixes golang/go#48691

Change-Id: I6a4460274d4313ad1d03bcd8070373af674691eb
GitHub-Last-Rev: acbbc50f20d663452f8da77cf2a66d8d893bec1d
GitHub-Pull-Request: golang/text#26
Reviewed-on: https://go-review.googlesource.com/c/text/+/353712
Reviewed-by: Nigel Tao <nigeltao@golang.org>
Trust: Nigel Tao <nigeltao@golang.org>
Trust: Alberto Donizetti <alb.donizetti@gmail.com>
Run-TryBot: Nigel Tao <nigeltao@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
---
 encoding/simplifiedchinese/all_test.go | 10 ++++++++++
 encoding/simplifiedchinese/gbk.go      |  6 +++++-
 2 files changed, 15 insertions(+), 1 deletion(-)

diff --git a/encoding/simplifiedchinese/all_test.go b/encoding/simplifiedchinese/all_test.go
index a556c94dd..fbb623cd2 100644
--- a/encoding/simplifiedchinese/all_test.go
+++ b/encoding/simplifiedchinese/all_test.go
@@ -40,7 +40,9 @@ func TestNonRepertoire(t *testing.T) {
 		{enc, HZGB2312, "a갂", "a"},
 		{enc, HZGB2312, "\u6cf5갂", "~{1C~}"},
 
+		{dec, GBK, "\xa2\xe3", "€"},
 		{dec, GB18030, "\x80", "€"},
+
 		{dec, GB18030, "\x81", "\ufffd"},
 		{dec, GB18030, "\x81\x20", "\ufffd "},
 		{dec, GB18030, "\xfe\xfe", "\ufffd"},
@@ -125,6 +127,14 @@ func TestBasics(t *testing.T) {
 		encPrefix: "~{",
 		encoded:   ";(<dR;:x>F#,6@WCN^O`GW!#",
 		utf8:      "花间一壶酒，独酌无相亲。",
+	}, {
+		e:       GBK,
+		encoded: "\x80",
+		utf8:    "€",
+	}, {
+		e:       GB18030,
+		encoded: "\xa2\xe3",
+		utf8:    "€",
 	}}
 
 	for _, tc := range testCases {
diff --git a/encoding/simplifiedchinese/gbk.go b/encoding/simplifiedchinese/gbk.go
index b89c45b03..0e0fabfd6 100644
--- a/encoding/simplifiedchinese/gbk.go
+++ b/encoding/simplifiedchinese/gbk.go
@@ -55,6 +55,8 @@ loop:
 		// Microsoft's Code Page 936 extends GBK 1.0 to encode the euro sign U+20AC
 		// as 0x80. The HTML5 specification at http://encoding.spec.whatwg.org/#gbk
 		// says to treat "gbk" as Code Page 936.
+		// GBK’s decoder is gb18030’s decoder. https://encoding.spec.whatwg.org/#gbk-decoder
+		// If byte is 0x80, return code point U+20AC. https://encoding.spec.whatwg.org/#gb18030-decoder
 		case c0 == 0x80:
 			r, size = '€', 1
 
@@ -180,7 +182,9 @@ func (e gbkEncoder) Transform(dst, src []byte, atEOF bool) (nDst, nSrc int, err
 				// Microsoft's Code Page 936 extends GBK 1.0 to encode the euro sign U+20AC
 				// as 0x80. The HTML5 specification at http://encoding.spec.whatwg.org/#gbk
 				// says to treat "gbk" as Code Page 936.
-				if r == '€' {
+				// GBK’s encoder is gb18030’s encoder with its _is GBK_ set to true. https://encoding.spec.whatwg.org/#gbk-encoder
+				// If _is GBK_ is true and code point is U+20AC, return byte 0x80. https://encoding.spec.whatwg.org/#gb18030-encoder
+				if !e.gb18030 && r == '€' {
 					r = 0x80
 					goto write1
 				}

From bb1c79828956f0f6753be0920efcecf32ba55f93 Mon Sep 17 00:00:00 2001
From: Timothy Gu <timothygu99@gmail.com>
Date: Thu, 6 May 2021 12:39:25 -0700
Subject: [PATCH 19/40] internal/export/idna: make Transitional an actual
 toggle

Previously, it always enabled transitional processing instead of
toggling, despite the fact that it took a boolean argument.

For golang/go#30940.

Change-Id: I00ad51ec55abfb2de28deb8c98f949989ece1099
Reviewed-on: https://go-review.googlesource.com/c/text/+/317729
Reviewed-by: Ian Lance Taylor <iant@golang.org>
Reviewed-by: Damien Neil <dneil@google.com>
Trust: Damien Neil <dneil@google.com>
Run-TryBot: Damien Neil <dneil@google.com>
TryBot-Result: Go Bot <gobot@golang.org>
---
 internal/export/idna/conformance_test.go |  3 +++
 internal/export/idna/idna10.0.0.go       |  4 ++--
 internal/export/idna/idna10.0.0_test.go  | 12 +++++++++---
 internal/export/idna/idna9.0.0.go        |  4 ++--
 internal/export/idna/idna9.0.0_test.go   | 12 +++++++++---
 5 files changed, 25 insertions(+), 10 deletions(-)

diff --git a/internal/export/idna/conformance_test.go b/internal/export/idna/conformance_test.go
index 1cdf43ca9..3e0e87518 100644
--- a/internal/export/idna/conformance_test.go
+++ b/internal/export/idna/conformance_test.go
@@ -2,6 +2,9 @@
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.
 
+//go:build go1.10
+// +build go1.10
+
 package idna
 
 import (
diff --git a/internal/export/idna/idna10.0.0.go b/internal/export/idna/idna10.0.0.go
index 3e7bac3cb..e6b62a287 100644
--- a/internal/export/idna/idna10.0.0.go
+++ b/internal/export/idna/idna10.0.0.go
@@ -59,10 +59,10 @@ type Option func(*options)
 // Transitional sets a Profile to use the Transitional mapping as defined in UTS
 // #46. This will cause, for example, "ß" to be mapped to "ss". Using the
 // transitional mapping provides a compromise between IDNA2003 and IDNA2008
-// compatibility. It is used by most browsers when resolving domain names. This
+// compatibility. It is used by some browsers when resolving domain names. This
 // option is only meaningful if combined with MapForLookup.
 func Transitional(transitional bool) Option {
-	return func(o *options) { o.transitional = true }
+	return func(o *options) { o.transitional = transitional }
 }
 
 // VerifyDNSLength sets whether a Profile should fail if any of the IDN parts
diff --git a/internal/export/idna/idna10.0.0_test.go b/internal/export/idna/idna10.0.0_test.go
index 4142bfa84..0b9f7a862 100644
--- a/internal/export/idna/idna10.0.0_test.go
+++ b/internal/export/idna/idna10.0.0_test.go
@@ -34,6 +34,10 @@ func TestLabelErrors(t *testing.T) {
 	std3 := kind{"STD3", p.ToASCII}
 	p = New(MapForLookup(), CheckHyphens(false))
 	hyphens := kind{"CheckHyphens", p.ToASCII}
+	p = New(MapForLookup(), Transitional(true))
+	transitional := kind{"Transitional", p.ToASCII}
+	p = New(MapForLookup(), Transitional(false))
+	nontransitional := kind{"Nontransitional", p.ToASCII}
 
 	testCases := []struct {
 		kind
@@ -95,14 +99,16 @@ func TestLabelErrors(t *testing.T) {
 		{hyphens, "-label-.com", "-label-.com", ""},
 
 		// Don't map U+2490 (DIGIT NINE FULL STOP). This is the behavior of
-		// Chrome, Safari, and IE. Firefox will first map ⒐ to 9. and return
-		// lab9.be.
+		// Chrome, modern Firefox, Safari, and IE.
 		{resolve, "lab⒐be", "xn--labbe-zh9b", "P1"}, // encode("lab⒐be")
 		{display, "lab⒐be", "lab⒐be", "P1"},
-
 		{resolve, "plan⒐faß.de", "xn--planfass-c31e.de", "P1"}, // encode("plan⒐fass") + ".de"
 		{display, "Plan⒐faß.de", "plan⒐faß.de", "P1"},
 
+		// Transitional vs Nontransitional processing
+		{transitional, "Plan9faß.de", "plan9fass.de", ""},
+		{nontransitional, "Plan9faß.de", "xn--plan9fa-6va.de", ""},
+
 		// Chrome 54.0 recognizes the error and treats this input verbatim as a
 		// search string.
 		// Safari 10.0 (non-conform spec) decomposes "⒈" and computes the
diff --git a/internal/export/idna/idna9.0.0.go b/internal/export/idna/idna9.0.0.go
index 7acecb800..4979fdc17 100644
--- a/internal/export/idna/idna9.0.0.go
+++ b/internal/export/idna/idna9.0.0.go
@@ -58,10 +58,10 @@ type Option func(*options)
 // Transitional sets a Profile to use the Transitional mapping as defined in UTS
 // #46. This will cause, for example, "ß" to be mapped to "ss". Using the
 // transitional mapping provides a compromise between IDNA2003 and IDNA2008
-// compatibility. It is used by most browsers when resolving domain names. This
+// compatibility. It is used by some browsers when resolving domain names. This
 // option is only meaningful if combined with MapForLookup.
 func Transitional(transitional bool) Option {
-	return func(o *options) { o.transitional = true }
+	return func(o *options) { o.transitional = transitional }
 }
 
 // VerifyDNSLength sets whether a Profile should fail if any of the IDN parts
diff --git a/internal/export/idna/idna9.0.0_test.go b/internal/export/idna/idna9.0.0_test.go
index b76b79628..524727b1b 100644
--- a/internal/export/idna/idna9.0.0_test.go
+++ b/internal/export/idna/idna9.0.0_test.go
@@ -34,6 +34,10 @@ func TestLabelErrors(t *testing.T) {
 	std3 := kind{"STD3", p.ToASCII}
 	p = New(MapForLookup(), CheckHyphens(false))
 	hyphens := kind{"CheckHyphens", p.ToASCII}
+	p = New(MapForLookup(), Transitional(true))
+	transitional := kind{"Transitional", p.ToASCII}
+	p = New(MapForLookup(), Transitional(false))
+	nontransitional := kind{"Nontransitional", p.ToASCII}
 
 	testCases := []struct {
 		kind
@@ -91,14 +95,16 @@ func TestLabelErrors(t *testing.T) {
 		{hyphens, "-label-.com", "-label-.com", ""},
 
 		// Don't map U+2490 (DIGIT NINE FULL STOP). This is the behavior of
-		// Chrome, Safari, and IE. Firefox will first map ⒐ to 9. and return
-		// lab9.be.
+		// Chrome, modern Firefox, Safari, and IE.
 		{resolve, "lab⒐be", "xn--labbe-zh9b", "P1"}, // encode("lab⒐be")
 		{display, "lab⒐be", "lab⒐be", "P1"},
-
 		{resolve, "plan⒐faß.de", "xn--planfass-c31e.de", "P1"}, // encode("plan⒐fass") + ".de"
 		{display, "Plan⒐faß.de", "plan⒐faß.de", "P1"},
 
+		// Transitional vs Nontransitional processing
+		{transitional, "Plan9faß.de", "plan9fass.de", ""},
+		{nontransitional, "Plan9faß.de", "xn--plan9fa-6va.de", ""},
+
 		// Chrome 54.0 recognizes the error and treats this input verbatim as a
 		// search string.
 		// Safari 10.0 (non-conform spec) decomposes "⒈" and computes the

From 86e65b86426d37ada82226be2e8c1afae6bdc178 Mon Sep 17 00:00:00 2001
From: Timothy Gu <timothygu99@gmail.com>
Date: Thu, 6 May 2021 14:25:55 -0700
Subject: [PATCH 20/40] internal/export/idna: fix int32 overflows

Prefer multiplication (int64(b)*int64(c) > MaxInt32) over division (b >
MaxInt32/c) for overflow checking as it is a little faster on 386, and a
LOT faster on amd64.

For golang/go#28233.

Change-Id: Ibf42529b93b699417781adc7eca6e66474f00bbf
Reviewed-on: https://go-review.googlesource.com/c/text/+/317731
Run-TryBot: Ian Lance Taylor <iant@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Ian Lance Taylor <iant@golang.org>
Trust: Damien Neil <dneil@google.com>
---
 internal/export/idna/punycode.go      | 36 +++++++++++++++++++--------
 internal/export/idna/punycode_test.go |  1 +
 2 files changed, 26 insertions(+), 11 deletions(-)

diff --git a/internal/export/idna/punycode.go b/internal/export/idna/punycode.go
index f0cbd487b..7e96febf1 100644
--- a/internal/export/idna/punycode.go
+++ b/internal/export/idna/punycode.go
@@ -47,6 +47,7 @@ func decode(encoded string) (string, error) {
 		}
 	}
 	i, n, bias := int32(0), initialN, initialBias
+	overflow := false
 	for pos < len(encoded) {
 		oldI, w := i, int32(1)
 		for k := base; ; k += base {
@@ -58,29 +59,32 @@ func decode(encoded string) (string, error) {
 				return "", punyError(encoded)
 			}
 			pos++
-			i += digit * w
-			if i < 0 {
+			i, overflow = madd(i, digit, w)
+			if overflow {
 				return "", punyError(encoded)
 			}
 			t := k - bias
-			if t < tmin {
+			if k <= bias {
 				t = tmin
-			} else if t > tmax {
+			} else if k >= bias+tmax {
 				t = tmax
 			}
 			if digit < t {
 				break
 			}
-			w *= base - t
-			if w >= math.MaxInt32/base {
+			w, overflow = madd(0, w, base-t)
+			if overflow {
 				return "", punyError(encoded)
 			}
 		}
+		if len(output) >= 1024 {
+			return "", punyError(encoded)
+		}
 		x := int32(len(output) + 1)
 		bias = adapt(i-oldI, x, oldI == 0)
 		n += i / x
 		i %= x
-		if n > utf8.MaxRune || len(output) >= 1024 {
+		if n < 0 || n > utf8.MaxRune {
 			return "", punyError(encoded)
 		}
 		output = append(output, 0)
@@ -113,6 +117,7 @@ func encode(prefix, s string) (string, error) {
 	if b > 0 {
 		output = append(output, '-')
 	}
+	overflow := false
 	for remaining != 0 {
 		m := int32(0x7fffffff)
 		for _, r := range s {
@@ -120,8 +125,8 @@ func encode(prefix, s string) (string, error) {
 				m = r
 			}
 		}
-		delta += (m - n) * (h + 1)
-		if delta < 0 {
+		delta, overflow = madd(delta, m-n, h+1)
+		if overflow {
 			return "", punyError(s)
 		}
 		n = m
@@ -139,9 +144,9 @@ func encode(prefix, s string) (string, error) {
 			q := delta
 			for k := base; ; k += base {
 				t := k - bias
-				if t < tmin {
+				if k <= bias {
 					t = tmin
-				} else if t > tmax {
+				} else if k >= bias+tmax {
 					t = tmax
 				}
 				if q < t {
@@ -162,6 +167,15 @@ func encode(prefix, s string) (string, error) {
 	return string(output), nil
 }
 
+// madd computes a + (b * c), detecting overflow.
+func madd(a, b, c int32) (next int32, overflow bool) {
+	p := int64(b) * int64(c)
+	if p > math.MaxInt32-int64(a) {
+		return 0, true
+	}
+	return a + int32(p), false
+}
+
 func decodeDigit(x byte) (digit int32, ok bool) {
 	switch {
 	case '0' <= x && x <= '9':
diff --git a/internal/export/idna/punycode_test.go b/internal/export/idna/punycode_test.go
index 2d99239ec..5cf0c968a 100644
--- a/internal/export/idna/punycode_test.go
+++ b/internal/export/idna/punycode_test.go
@@ -177,6 +177,7 @@ var punycodeErrorTestCases = [...]string{
 	"decode 9999999999a",  // "9999999999a" overflows the int32 calculation.
 
 	"encode " + strings.Repeat("x", 65536) + "\uff00", // int32 overflow.
+	"encode " + strings.Repeat("x", 65666) + "\uffff", // int32 overflow. issue #28233
 }
 
 func TestPunycodeErrors(t *testing.T) {

From 593da8d90fd448917a9ef0ca582e8d2bbe50ab2b Mon Sep 17 00:00:00 2001
From: Damien Neil <dneil@google.com>
Date: Thu, 28 Oct 2021 17:50:34 -0700
Subject: [PATCH 21/40] internal/export/idna: avoid strconv.Unquote errors on
 surrogate halves

The IDNA test data includes surrogate halves, for which strconv.Unquote
reports an error as of Go 1.18.

Change-Id: I9eb954aa3ab3a177ab0984d0da7caee7a47920a5
Reviewed-on: https://go-review.googlesource.com/c/text/+/359554
Trust: Damien Neil <dneil@google.com>
Run-TryBot: Damien Neil <dneil@google.com>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Ian Lance Taylor <iant@golang.org>
---
 internal/export/idna/idna_test.go | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/internal/export/idna/idna_test.go b/internal/export/idna/idna_test.go
index 7235452c2..e568d3b90 100644
--- a/internal/export/idna/idna_test.go
+++ b/internal/export/idna/idna_test.go
@@ -5,7 +5,9 @@
 package idna
 
 import (
+	"encoding/hex"
 	"fmt"
+	"regexp"
 	"strconv"
 	"strings"
 	"testing"
@@ -99,12 +101,14 @@ func doTest(t *testing.T, f func(string) (string, error), name, input, want, err
 	})
 }
 
+var unescapeRE = regexp.MustCompile(`\\u([0-9a-zA-Z]{4})`)
+
 func unescape(s string) string {
-	s, err := strconv.Unquote(`"` + s + `"`)
-	if err != nil {
-		panic(err)
-	}
-	return s
+	return unescapeRE.ReplaceAllStringFunc(s, func(v string) string {
+		var d [2]byte
+		hex.Decode(d[:], []byte(v[2:]))
+		return string(rune(d[0])<<8 | rune(d[1]))
+	})
 }
 
 func BenchmarkProfile(b *testing.B) {

From 835dae61a3f3b1dd4f513e19a270937411e179f5 Mon Sep 17 00:00:00 2001
From: Damien Neil <dneil@google.com>
Date: Thu, 28 Oct 2021 17:47:46 -0700
Subject: [PATCH 22/40] internal/export/idna: use nontransitional processing in
 Go 1.18

Updates golang/go#46001
Updates golang/go#47510

Change-Id: I1e978a3c6230abfd0b1aaab0c7343b33dda1ba64
Reviewed-on: https://go-review.googlesource.com/c/text/+/359634
Trust: Damien Neil <dneil@google.com>
Run-TryBot: Damien Neil <dneil@google.com>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Timothy Gu <timothygu99@gmail.com>
Reviewed-by: Ian Lance Taylor <iant@golang.org>
---
 internal/export/idna/example_test.go    | 27 ++++++++++++-------------
 internal/export/idna/go118.go           | 12 +++++++++++
 internal/export/idna/idna10.0.0.go      |  2 +-
 internal/export/idna/idna10.0.0_test.go | 14 ++++++++++---
 internal/export/idna/idna_test.go       |  2 +-
 internal/export/idna/pre_go118.go       | 10 +++++++++
 6 files changed, 48 insertions(+), 19 deletions(-)
 create mode 100644 internal/export/idna/go118.go
 create mode 100644 internal/export/idna/pre_go118.go

diff --git a/internal/export/idna/example_test.go b/internal/export/idna/example_test.go
index 6e6b8727c..4c7352bdc 100644
--- a/internal/export/idna/example_test.go
+++ b/internal/export/idna/example_test.go
@@ -13,27 +13,26 @@ import (
 func ExampleProfile() {
 	// Raw Punycode has no restrictions and does no mappings.
 	fmt.Println(idna.ToASCII(""))
-	fmt.Println(idna.ToASCII("*.faß.com"))
-	fmt.Println(idna.Punycode.ToASCII("*.faß.com"))
+	fmt.Println(idna.ToASCII("*.GÖPHER.com"))
+	fmt.Println(idna.Punycode.ToASCII("*.GÖPHER.com"))
 
-	// Rewrite IDN for lookup. This (currently) uses transitional mappings to
-	// find a balance between IDNA2003 and IDNA2008 compatibility.
+	// Rewrite IDN for lookup.
 	fmt.Println(idna.Lookup.ToASCII(""))
-	fmt.Println(idna.Lookup.ToASCII("www.faß.com"))
+	fmt.Println(idna.Lookup.ToASCII("www.GÖPHER.com"))
 
-	// Convert an IDN to ASCII for registration purposes. This changes the
-	// encoding, but reports an error if the input was illformed.
-	fmt.Println(idna.Registration.ToASCII(""))
-	fmt.Println(idna.Registration.ToASCII("www.faß.com"))
+	// Convert an IDN to ASCII for registration purposes.
+	// This reports an error if the input was illformed.
+	fmt.Println(idna.Registration.ToASCII("www.GÖPHER.com"))
+	fmt.Println(idna.Registration.ToASCII("www.göpher.com"))
 
 	// Output:
 	//  <nil>
-	// *.xn--fa-hia.com <nil>
-	// *.xn--fa-hia.com <nil>
+	// *.xn--GPHER-1oa.com <nil>
+	// *.xn--GPHER-1oa.com <nil>
 	//  <nil>
-	// www.fass.com <nil>
-	//  idna: invalid label ""
-	// www.xn--fa-hia.com <nil>
+	// www.xn--gpher-jua.com <nil>
+	// www.xn--GPHER-1oa.com idna: disallowed rune U+0047
+	// www.xn--gpher-jua.com <nil>
 }
 
 func ExampleNew() {
diff --git a/internal/export/idna/go118.go b/internal/export/idna/go118.go
new file mode 100644
index 000000000..941a7aaff
--- /dev/null
+++ b/internal/export/idna/go118.go
@@ -0,0 +1,12 @@
+// Copyright 2021 The Go Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style
+// license that can be found in the LICENSE file.
+
+//go:build go1.18
+// +build go1.18
+
+package idna
+
+// Transitional processing is disabled by default in Go 1.18.
+// https://golang.org/issue/47510
+const transitionalLookup = false
diff --git a/internal/export/idna/idna10.0.0.go b/internal/export/idna/idna10.0.0.go
index e6b62a287..0e7571d16 100644
--- a/internal/export/idna/idna10.0.0.go
+++ b/internal/export/idna/idna10.0.0.go
@@ -284,7 +284,7 @@ var (
 
 	punycode = &Profile{}
 	lookup   = &Profile{options{
-		transitional: true,
+		transitional: transitionalLookup,
 		useSTD3Rules: true,
 		checkHyphens: true,
 		checkJoiners: true,
diff --git a/internal/export/idna/idna10.0.0_test.go b/internal/export/idna/idna10.0.0_test.go
index 0b9f7a862..c3365bc6a 100644
--- a/internal/export/idna/idna10.0.0_test.go
+++ b/internal/export/idna/idna10.0.0_test.go
@@ -102,7 +102,7 @@ func TestLabelErrors(t *testing.T) {
 		// Chrome, modern Firefox, Safari, and IE.
 		{resolve, "lab⒐be", "xn--labbe-zh9b", "P1"}, // encode("lab⒐be")
 		{display, "lab⒐be", "lab⒐be", "P1"},
-		{resolve, "plan⒐faß.de", "xn--planfass-c31e.de", "P1"}, // encode("plan⒐fass") + ".de"
+		{transitional, "plan⒐faß.de", "xn--planfass-c31e.de", "P1"}, // encode("plan⒐fass") + ".de"
 		{display, "Plan⒐faß.de", "plan⒐faß.de", "P1"},
 
 		// Transitional vs Nontransitional processing
@@ -115,10 +115,10 @@ func TestLabelErrors(t *testing.T) {
 		// punycode on the result using transitional mapping.
 		// Firefox 49.0.1 goes haywire on this string and prints a bunch of what
 		// seems to be nested punycode encodings.
-		{resolve, "日本⒈co.ßßß.de", "xn--co-wuw5954azlb.ssssss.de", "P1"},
+		{transitional, "日本⒈co.ßßß.de", "xn--co-wuw5954azlb.ssssss.de", "P1"},
 		{display, "日本⒈co.ßßß.de", "日本⒈co.ßßß.de", "P1"},
 
-		{resolve, "a\u200Cb", "ab", ""},
+		{transitional, "a\u200Cb", "ab", ""},
 		{display, "a\u200Cb", "a\u200Cb", "C"},
 
 		{resolve, encode("a\u200Cb"), encode("a\u200Cb"), "C"},
@@ -153,3 +153,11 @@ func TestLabelErrors(t *testing.T) {
 		doTest(t, tc.f, tc.name, tc.input, tc.want, tc.wantErr)
 	}
 }
+
+func TestTransitionalDefault(t *testing.T) {
+	want := "xn--strae-oqa.de"
+	if transitionalLookup {
+		want = "strasse.de"
+	}
+	doTest(t, Lookup.ToASCII, "Lookup", "straße.de", want, "")
+}
diff --git a/internal/export/idna/idna_test.go b/internal/export/idna/idna_test.go
index e568d3b90..a13b67348 100644
--- a/internal/export/idna/idna_test.go
+++ b/internal/export/idna/idna_test.go
@@ -45,7 +45,7 @@ func TestProfiles(t *testing.T) {
 			VerifyDNSLength(true),
 			BidiRule(),
 		)},
-		{"Lookup", lookup, New(MapForLookup(), BidiRule(), Transitional(true))},
+		{"Lookup", lookup, New(MapForLookup(), BidiRule(), Transitional(transitionalLookup))},
 		{"Display", display, New(MapForLookup(), BidiRule())},
 	}
 	for _, tc := range testCases {
diff --git a/internal/export/idna/pre_go118.go b/internal/export/idna/pre_go118.go
new file mode 100644
index 000000000..ab3fa2e8c
--- /dev/null
+++ b/internal/export/idna/pre_go118.go
@@ -0,0 +1,10 @@
+// Copyright 2021 The Go Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style
+// license that can be found in the LICENSE file.
+
+//go:build !go1.18
+// +build !go1.18
+
+package idna
+
+const transitionalLookup = true

From 8da7c0fd2b032cc0b7be90fcb2d361c5ebc40fef Mon Sep 17 00:00:00 2001
From: Damien Neil <dneil@google.com>
Date: Mon, 1 Nov 2021 13:27:11 -0700
Subject: [PATCH 23/40] gen.go: copy all tablesXX.X.X.go versions to
 golang.org/x/net

Remove logic that copies only the most current tablesXX.X.X.go,
renaming it to tables.go. The golang.org/x/net/idna package
currently contains all the versioned files and no tables.go,
so this change makes gen.go consistent with the last export.

Change-Id: Ic2797b45ec998873651eda04ed56ada29788f0f0
Reviewed-on: https://go-review.googlesource.com/c/text/+/360380
Trust: Damien Neil <dneil@google.com>
Trust: Marcel van Lohuizen <mpvl@golang.org>
Run-TryBot: Damien Neil <dneil@google.com>
Run-TryBot: Marcel van Lohuizen <mpvl@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
---
 gen.go | 6 ------
 1 file changed, 6 deletions(-)

diff --git a/gen.go b/gen.go
index 04ff6035c..fb2fb94a7 100644
--- a/gen.go
+++ b/gen.go
@@ -256,12 +256,6 @@ func copyPackage(dirSrc, dirDst, search, replace string) {
 			filepath.Dir(file) != dirSrc {
 			return nil
 		}
-		if strings.HasPrefix(base, "tables") {
-			if !strings.HasSuffix(base, gen.UnicodeVersion()+".go") {
-				return nil
-			}
-			base = "tables.go"
-		}
 		b, err := ioutil.ReadFile(file)
 		if err != nil || bytes.Contains(b, []byte("\n// +build ignore")) {
 			return err

From 85a1c56496a61b2c4e607faaf3369d473cf2589d Mon Sep 17 00:00:00 2001
From: Amelia Downs <adowns@vmware.com>
Date: Mon, 1 Nov 2021 16:41:32 -0400
Subject: [PATCH 24/40] text/collate: add testable examples

Change-Id: Id3915137c4d365ec82ce74d8212e7b6cfb6fb200
Reviewed-on: https://go-review.googlesource.com/c/text/+/360494
Run-TryBot: Ian Lance Taylor <iant@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
Reviewed-by: Ian Lance Taylor <iant@golang.org>
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
Trust: Marcel van Lohuizen <mpvl@golang.org>
---
 collate/example_sort_test.go | 56 +++++++++++++++++++++++++
 collate/examples_test.go     | 79 ++++++++++++++++++++++++++++++++++++
 2 files changed, 135 insertions(+)
 create mode 100644 collate/example_sort_test.go
 create mode 100644 collate/examples_test.go

diff --git a/collate/example_sort_test.go b/collate/example_sort_test.go
new file mode 100644
index 000000000..e86c02a7a
--- /dev/null
+++ b/collate/example_sort_test.go
@@ -0,0 +1,56 @@
+// Copyright 2021 The Go Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style
+// license that can be found in the LICENSE file.
+
+package collate_test
+
+import (
+	"fmt"
+
+	"golang.org/x/text/collate"
+	"golang.org/x/text/language"
+)
+
+type book struct {
+	title string
+}
+
+type bookcase struct {
+	books []book
+}
+
+func (bc bookcase) Len() int {
+	return len(bc.books)
+}
+
+func (bc bookcase) Swap(i, j int) {
+	temp := bc.books[i]
+	bc.books[i] = bc.books[j]
+	bc.books[j] = temp
+}
+
+func (bc bookcase) Bytes(i int) []byte {
+	// returns the bytes of text at index i
+	return []byte(bc.books[i].title)
+}
+
+func ExampleCollator_Sort() {
+	bc := bookcase{
+		books: []book{
+			{title: "If Cats Disappeared from the World"},
+			{title: "The Guest Cat"},
+			{title: "Catwings"},
+		},
+	}
+
+	cc := collate.New(language.English)
+	cc.Sort(bc)
+
+	for _, b := range bc.books {
+		fmt.Println(b.title)
+	}
+	// Output:
+	// Catwings
+	// If Cats Disappeared from the World
+	// The Guest Cat
+}
diff --git a/collate/examples_test.go b/collate/examples_test.go
new file mode 100644
index 000000000..0a42a6d21
--- /dev/null
+++ b/collate/examples_test.go
@@ -0,0 +1,79 @@
+// Copyright 2021 The Go Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style
+// license that can be found in the LICENSE file.
+
+package collate_test
+
+import (
+	"fmt"
+
+	"golang.org/x/text/collate"
+	"golang.org/x/text/language"
+)
+
+func ExampleNew() {
+	letters := []string{"ä", "å", "ö", "o", "a"}
+
+	ec := collate.New(language.English)
+	ec.SortStrings(letters)
+	fmt.Printf("English Sorting: %v\n", letters)
+
+	sc := collate.New(language.Swedish)
+	sc.SortStrings(letters)
+	fmt.Printf("Swedish Sorting: %v\n", letters)
+
+	numbers := []string{"0", "11", "01", "2", "3", "23"}
+
+	ec.SortStrings(numbers)
+	fmt.Printf("Alphabetic Sorting: %v\n", numbers)
+
+	nc := collate.New(language.English, collate.Numeric)
+	nc.SortStrings(numbers)
+	fmt.Printf("Numeric Sorting: %v\n", numbers)
+	// Output:
+	// English Sorting: [a å ä o ö]
+	// Swedish Sorting: [a o å ä ö]
+	// Alphabetic Sorting: [0 01 11 2 23 3]
+	// Numeric Sorting: [0 01 2 3 11 23]
+}
+
+func ExampleCollator_SortStrings() {
+	c := collate.New(language.English)
+	words := []string{"meow", "woof", "bark", "moo"}
+	c.SortStrings(words)
+	fmt.Println(words)
+	// Output:
+	// [bark meow moo woof]
+}
+
+func ExampleCollator_CompareString() {
+	c := collate.New(language.English)
+	r := c.CompareString("meow", "woof")
+	fmt.Println(r)
+
+	r = c.CompareString("woof", "meow")
+	fmt.Println(r)
+
+	r = c.CompareString("meow", "meow")
+	fmt.Println(r)
+	// Output:
+	// -1
+	// 1
+	// 0
+}
+
+func ExampleCollator_Compare() {
+	c := collate.New(language.English)
+	r := c.Compare([]byte("meow"), []byte("woof"))
+	fmt.Println(r)
+
+	r = c.Compare([]byte("woof"), []byte("meow"))
+	fmt.Println(r)
+
+	r = c.Compare([]byte("meow"), []byte("meow"))
+	fmt.Println(r)
+	// Output:
+	// -1
+	// 1
+	// 0
+}

From 459fa287ae002e3df243c0bd10ea915f5c64f687 Mon Sep 17 00:00:00 2001
From: Alexander Yastrebov <yastrebov.alex@gmail.com>
Date: Mon, 18 Oct 2021 14:56:52 +0000
Subject: [PATCH 25/40] text/currency: format currency amount according to the
 locale

Fixes golang/go#47623

Change-Id: Ie6be9db93bf58f597f1ea4d864fcb507235b1018
GitHub-Last-Rev: 4c8f3557daf5440390c0775ed6e71ec80f8c11e8
GitHub-Pull-Request: golang/text#27
Reviewed-on: https://go-review.googlesource.com/c/text/+/353935
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
Trust: Marcel van Lohuizen <mpvl@golang.org>
Trust: Ian Lance Taylor <iant@golang.org>
Run-TryBot: Marcel van Lohuizen <mpvl@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
---
 currency/format.go      | 36 +++++++++++++++++++++---------------
 currency/format_test.go | 23 ++++++++++++++++++++---
 2 files changed, 41 insertions(+), 18 deletions(-)

diff --git a/currency/format.go b/currency/format.go
index 11152632a..cc4570d3b 100644
--- a/currency/format.go
+++ b/currency/format.go
@@ -6,11 +6,13 @@ package currency
 
 import (
 	"fmt"
-	"io"
 	"sort"
 
 	"golang.org/x/text/internal/format"
 	"golang.org/x/text/internal/language/compact"
+	"golang.org/x/text/internal/number"
+
+	"golang.org/x/text/language"
 )
 
 // Amount is an amount-currency unit pair.
@@ -34,8 +36,6 @@ func (a Amount) Currency() Unit { return a.currency }
 //
 // Add/Sub/Div/Mul/Round.
 
-var space = []byte(" ")
-
 // Format implements fmt.Formatter. It accepts format.State for
 // language-specific rendering.
 func (a Amount) Format(s fmt.State, verb rune) {
@@ -58,9 +58,11 @@ type formattedValue struct {
 // Format implements fmt.Formatter. It accepts format.State for
 // language-specific rendering.
 func (v formattedValue) Format(s fmt.State, verb rune) {
+	var tag language.Tag
 	var lang compact.ID
 	if state, ok := s.(format.State); ok {
-		lang, _ = compact.RegionalID(compact.Tag(state.Language()))
+		tag = state.Language()
+		lang, _ = compact.RegionalID(compact.Tag(tag))
 	}
 
 	// Get the options. Use DefaultFormat if not present.
@@ -73,18 +75,22 @@ func (v formattedValue) Format(s fmt.State, verb rune) {
 		cur = opt.currency
 	}
 
-	// TODO: use pattern.
-	io.WriteString(s, opt.symbol(lang, cur))
+	sym := opt.symbol(lang, cur)
 	if v.amount != nil {
-		s.Write(space)
-
-		// TODO: apply currency-specific rounding
-		scale, _ := opt.kind.Rounding(cur)
-		if _, ok := s.Precision(); !ok {
-			fmt.Fprintf(s, "%.*f", scale, v.amount)
-		} else {
-			fmt.Fprint(s, v.amount)
-		}
+		var f number.Formatter
+		f.InitDecimal(tag)
+
+		scale, increment := opt.kind.Rounding(cur)
+		f.RoundingContext.SetScale(scale)
+		f.RoundingContext.Increment = uint32(increment)
+		f.RoundingContext.IncrementScale = uint8(scale)
+		f.RoundingContext.Mode = number.ToNearestAway
+
+		d := f.Append(nil, v.amount)
+
+		fmt.Fprint(s, sym, " ", string(d))
+	} else {
+		fmt.Fprint(s, sym)
 	}
 }
 
diff --git a/currency/format_test.go b/currency/format_test.go
index 0aa0d58af..5cb11ebc9 100644
--- a/currency/format_test.go
+++ b/currency/format_test.go
@@ -12,8 +12,10 @@ import (
 )
 
 var (
+	de    = language.German
 	en    = language.English
 	fr    = language.French
+	de_CH = language.MustParse("de-CH")
 	en_US = language.AmericanEnglish
 	en_GB = language.BritishEnglish
 	en_AU = language.MustParse("en-AU")
@@ -42,20 +44,35 @@ func TestFormatting(t *testing.T) {
 
 		9:  {en, 9.0, Symbol.Default(EUR), "€ 9.00"},
 		10: {en, 10.123, Symbol.Default(KRW), "₩ 10"},
-		11: {fr, 11.52, Symbol.Default(TWD), "TWD 11.52"},
+		11: {fr, 11.52, Symbol.Default(TWD), "TWD 11,52"},
 		12: {en, 12.123, Symbol.Default(czk), "CZK 12.12"},
 		13: {en, 13.123, Symbol.Default(czk).Kind(Cash), "CZK 13"},
 		14: {en, 14.12345, ISO.Default(MustParseISO("CLF")), "CLF 14.1235"},
 		15: {en, USD.Amount(15.00), ISO.Default(TWD), "USD 15.00"},
 		16: {en, KRW.Amount(16.00), ISO.Kind(Cash), "KRW 16"},
 
-		// TODO: support integers as well.
-
 		17: {en, USD, nil, "USD"},
 		18: {en, USD, ISO, "USD"},
 		19: {en, USD, Symbol, "$"},
 		20: {en_GB, USD, Symbol, "US$"},
 		21: {en_AU, USD, NarrowSymbol, "$"},
+
+		// https://en.wikipedia.org/wiki/Decimal_separator
+		22: {de, EUR.Amount(1234567.89), nil, "EUR 1.234.567,89"},
+		23: {fr, EUR.Amount(1234567.89), nil, "EUR 1\u00a0234\u00a0567,89"},
+		24: {en_AU, EUR.Amount(1234567.89), nil, "EUR 1,234,567.89"},
+		25: {de_CH, EUR.Amount(1234567.89), nil, "EUR 1’234’567.89"},
+
+		// https://en.wikipedia.org/wiki/Cash_rounding
+		26: {de, NOK.Amount(2.49), ISO.Kind(Cash), "NOK 2"},
+		27: {de, NOK.Amount(2.50), ISO.Kind(Cash), "NOK 3"},
+		28: {de, DKK.Amount(0.24), ISO.Kind(Cash), "DKK 0,00"},
+		29: {de, DKK.Amount(0.25), ISO.Kind(Cash), "DKK 0,50"},
+
+		// integers
+		30: {de, EUR.Amount(1234567), nil, "EUR 1.234.567,00"},
+		31: {en, CNY.Amount(0), NarrowSymbol, "¥ 0.00"},
+		32: {en, CNY.Amount(0), Symbol, "CN¥ 0.00"},
 	}
 	for i, tc := range testCases {
 		p := message.NewPrinter(tc.tag)

From 310d592b71f764a238114c372e0ce7db4ecb560a Mon Sep 17 00:00:00 2001
From: Sean Liao <seankhliao@gmail.com>
Date: Thu, 21 Oct 2021 19:49:33 +0200
Subject: [PATCH 26/40] cmd/gotext: only match files ending with pattern

Exclude files with other extensions, such as the .json.swp files created by editors.

Fixes golang/go#48983

Change-Id: Id74ca7ae208688cf900661d641e5403d453da33c
Reviewed-on: https://go-review.googlesource.com/c/text/+/357734
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
Trust: Marcel van Lohuizen <mpvl@golang.org>
Trust: Ian Lance Taylor <iant@golang.org>
Run-TryBot: Marcel van Lohuizen <mpvl@golang.org>
TryBot-Result: Go Bot <gobot@golang.org>
---
 cmd/gotext/main.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/cmd/gotext/main.go b/cmd/gotext/main.go
index f31dd4fbd..c8dc7990a 100644
--- a/cmd/gotext/main.go
+++ b/cmd/gotext/main.go
@@ -48,7 +48,7 @@ func config() (*pipeline.Config, error) {
 	return &pipeline.Config{
 		SourceLanguage:      tag,
 		Supported:           getLangs(),
-		TranslationsPattern: `messages\.(.*)\.json`,
+		TranslationsPattern: `messages\.(.*)\.json$`,
 		GenFile:             *out,
 	}, nil
 }

From 7d8748685ddeb50953764cb62aa1064f0d928d61 Mon Sep 17 00:00:00 2001
From: Shengyu Zhang <zhangshengyu.0@bytedance.com>
Date: Tue, 2 Nov 2021 09:32:53 +0000
Subject: [PATCH 27/40] text/unicode/bidi: remove duplicate assignment

Fixes golang/go#43623

Change-Id: I4da134cccaf6a9e5331229a0ac2a60e5cb711e92
GitHub-Last-Rev: ae0f2d91f86dfd045bb403f5906ba80d2b9092de
GitHub-Pull-Request: golang/text#29
Reviewed-on: https://go-review.googlesource.com/c/text/+/358834
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
Trust: Marcel van Lohuizen <mpvl@golang.org>
Trust: Ian Lance Taylor <iant@golang.org>
---
 unicode/bidi/core.go | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/unicode/bidi/core.go b/unicode/bidi/core.go
index e4c081101..fde188a33 100644
--- a/unicode/bidi/core.go
+++ b/unicode/bidi/core.go
@@ -495,9 +495,9 @@ func (s *isolatingRunSequence) resolveWeakTypes() {
 		if t == NSM {
 			s.types[i] = precedingCharacterType
 		} else {
-			if t.in(LRI, RLI, FSI, PDI) {
-				precedingCharacterType = ON
-			}
+			// if t.in(LRI, RLI, FSI, PDI) {
+			// 	precedingCharacterType = ON
+			// }
 			precedingCharacterType = t
 		}
 	}

From 18b340fc7af22495828ffbe71e9f9e22583bc7a9 Mon Sep 17 00:00:00 2001
From: Amelia Downs <adowns@vmware.com>
Date: Fri, 29 Oct 2021 13:32:13 -0400
Subject: [PATCH 28/40] language: fix typo in update docs

Change-Id: Ied188b87f0a9a1a4fb160b2a7ba239ed70b843a6
Reviewed-on: https://go-review.googlesource.com/c/text/+/359715
Reviewed-by: Ian Lance Taylor <iant@golang.org>
Reviewed-by: Amelia Downs <adowns@vmware.com>
Trust: Cherry Mui <cherryyz@google.com>
---
 language/match.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/language/match.go b/language/match.go
index f73492134..ee45f4947 100644
--- a/language/match.go
+++ b/language/match.go
@@ -545,7 +545,7 @@ type bestMatch struct {
 // match as the preferred match.
 //
 // If pin is true and have and tag are a strong match, it will henceforth only
-// consider matches for this language. This corresponds to the nothing that most
+// consider matches for this language. This corresponds to the idea that most
 // users have a strong preference for the first defined language. A user can
 // still prefer a second language over a dialect of the preferred language by
 // explicitly specifying dialects, e.g. "en, nl, en-GB". In this case pin should

From d1c84af989ab0f62cd853b5ae33b1b4db4f1e88b Mon Sep 17 00:00:00 2001
From: "Bryan C. Mills" <bcmills@google.com>
Date: Sun, 23 Jan 2022 16:23:19 -0500
Subject: [PATCH 29/40] message/pipeline: skip TestFullCycle on plan9-arm

This test has timed out several times recently on this builder. The
test is pretty slow even on Linux, and may be especially
filesystem-intensive.

For golang/go#49338

Change-Id: Ife2bb399b10f369f815055bb0ad44bb007f606b7
Reviewed-on: https://go-review.googlesource.com/c/text/+/380414
Trust: Bryan Mills <bcmills@google.com>
Run-TryBot: Bryan Mills <bcmills@google.com>
TryBot-Result: Gopher Robot <gobot@golang.org>
Reviewed-by: Ian Lance Taylor <iant@golang.org>
---
 message/pipeline/pipeline_test.go | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/message/pipeline/pipeline_test.go b/message/pipeline/pipeline_test.go
index 51c14a50b..2adb11fd2 100644
--- a/message/pipeline/pipeline_test.go
+++ b/message/pipeline/pipeline_test.go
@@ -33,6 +33,9 @@ func TestFullCycle(t *testing.T) {
 	if runtime.GOOS == "android" {
 		t.Skip("cannot load outside packages on android")
 	}
+	if b := os.Getenv("GO_BUILDER_NAME"); b == "plan9-arm" {
+		t.Skipf("skipping: test frequently times out on %s", b)
+	}
 	if _, err := exec.LookPath("go"); err != nil {
 		t.Skipf("skipping because 'go' command is unavailable: %v", err)
 	}

From 8db23f83d6d6c5a1bcecede55281db3c11fc7c60 Mon Sep 17 00:00:00 2001
From: Russ Cox <rsc@golang.org>
Date: Mon, 11 Apr 2022 13:13:21 -0400
Subject: [PATCH 30/40] all: gofmt

Gofmt to update doc comments to the new formatting.

For golang/go#51082.

Change-Id: I3e3c5666d5e901f2c5303911ddb548e3dd567fce
Reviewed-on: https://go-review.googlesource.com/c/text/+/399603
Run-TryBot: Russ Cox <rsc@golang.org>
TryBot-Result: Gopher Robot <gobot@golang.org>
Auto-Submit: Russ Cox <rsc@golang.org>
Reviewed-by: Ian Lance Taylor <iant@google.com>
---
 cases/gen_trieval.go                  | 73 ++++++++++++-----------
 cases/trieval.go                      | 73 ++++++++++++-----------
 cmd/gotext/doc.go                     | 39 ++++--------
 collate/build/builder.go              | 39 +++++++-----
 collate/build/colelem.go              |  8 ++-
 collate/build/contract.go             | 25 ++++----
 feature/plural/gen.go                 | 15 ++---
 feature/plural/message.go             | 14 ++---
 feature/plural/plural.go              | 51 ++++++++--------
 internal/catmsg/catmsg.go             | 50 ++++++++--------
 internal/cldrtree/cldrtree.go         |  1 -
 internal/colltab/collelem.go          | 39 ++++++------
 internal/export/idna/gen_trieval.go   | 34 +++++------
 internal/export/idna/trieval.go       | 34 +++++------
 internal/language/tables.go           | 17 +++---
 internal/number/decimal.go            | 48 +++++++--------
 internal/testtext/codesize.go         | 12 ++--
 internal/triegen/triegen.go           | 25 ++++----
 internal/utf8internal/utf8internal.go |  2 +-
 language/display/lookup.go            | 16 ++---
 language/doc.go                       | 44 +++++++-------
 message/catalog/catalog.go            | 85 +++++++++++++--------------
 message/doc.go                        | 50 ++++++++--------
 number/doc.go                         | 17 +++---
 unicode/bidi/core.go                  | 20 +++----
 unicode/cldr/collate.go               |  8 ++-
 unicode/norm/forminfo.go              |  9 +--
 unicode/norm/maketables.go            |  2 +
 unicode/norm/normalize.go             | 11 ++--
 width/tables10.0.0.go                 | 24 +++++---
 width/tables11.0.0.go                 | 24 +++++---
 width/tables12.0.0.go                 | 24 +++++---
 width/tables13.0.0.go                 | 24 +++++---
 width/tables9.0.0.go                  | 24 +++++---
 34 files changed, 528 insertions(+), 453 deletions(-)

diff --git a/cases/gen_trieval.go b/cases/gen_trieval.go
index 6c7222a73..14dd33b1d 100644
--- a/cases/gen_trieval.go
+++ b/cases/gen_trieval.go
@@ -19,19 +19,19 @@ package main
 //
 // The per-rune values have the following format:
 //
-//   if (exception) {
-//     15..4  unsigned exception index
-//   } else {
-//     15..8  XOR pattern or index to XOR pattern for case mapping
-//            Only 13..8 are used for XOR patterns.
-//         7  inverseFold (fold to upper, not to lower)
-//         6  index: interpret the XOR pattern as an index
-//            or isMid if case mode is cIgnorableUncased.
-//      5..4  CCC: zero (normal or break), above or other
-//   }
-//      3  exception: interpret this value as an exception index
-//         (TODO: is this bit necessary? Probably implied from case mode.)
-//   2..0  case mode
+//	if (exception) {
+//	  15..4  unsigned exception index
+//	} else {
+//	  15..8  XOR pattern or index to XOR pattern for case mapping
+//	         Only 13..8 are used for XOR patterns.
+//	      7  inverseFold (fold to upper, not to lower)
+//	      6  index: interpret the XOR pattern as an index
+//	         or isMid if case mode is cIgnorableUncased.
+//	   5..4  CCC: zero (normal or break), above or other
+//	}
+//	   3  exception: interpret this value as an exception index
+//	      (TODO: is this bit necessary? Probably implied from case mode.)
+//	2..0  case mode
 //
 // For the non-exceptional cases, a rune must be either uncased, lowercase or
 // uppercase. If the rune is cased, the XOR pattern maps either a lowercase
@@ -133,37 +133,40 @@ const (
 // The entry is pointed to by the exception index in an entry. It has the
 // following format:
 //
-// Header
-// byte 0:
-//  7..6  unused
-//  5..4  CCC type (same bits as entry)
-//     3  unused
-//  2..0  length of fold
+// Header:
 //
-// byte 1:
-//   7..6  unused
-//   5..3  length of 1st mapping of case type
-//   2..0  length of 2nd mapping of case type
+//	byte 0:
+//	 7..6  unused
+//	 5..4  CCC type (same bits as entry)
+//	    3  unused
+//	 2..0  length of fold
 //
-//   case     1st    2nd
-//   lower -> upper, title
-//   upper -> lower, title
-//   title -> lower, upper
+//	byte 1:
+//	  7..6  unused
+//	  5..3  length of 1st mapping of case type
+//	  2..0  length of 2nd mapping of case type
+//
+//	  case     1st    2nd
+//	  lower -> upper, title
+//	  upper -> lower, title
+//	  title -> lower, upper
 //
 // Lengths with the value 0x7 indicate no value and implies no change.
 // A length of 0 indicates a mapping to zero-length string.
 //
 // Body bytes:
-//   case folding bytes
-//   lowercase mapping bytes
-//   uppercase mapping bytes
-//   titlecase mapping bytes
-//   closure mapping bytes (for NFKC_Casefold). (TODO)
+//
+//	case folding bytes
+//	lowercase mapping bytes
+//	uppercase mapping bytes
+//	titlecase mapping bytes
+//	closure mapping bytes (for NFKC_Casefold). (TODO)
 //
 // Fallbacks:
-//   missing fold  -> lower
-//   missing title -> upper
-//   all missing   -> original rune
+//
+//	missing fold  -> lower
+//	missing title -> upper
+//	all missing   -> original rune
 //
 // exceptions starts with a dummy byte to enforce that there is no zero index
 // value.
diff --git a/cases/trieval.go b/cases/trieval.go
index 99e039628..4e4d13fe5 100644
--- a/cases/trieval.go
+++ b/cases/trieval.go
@@ -14,19 +14,19 @@ package cases
 //
 // The per-rune values have the following format:
 //
-//   if (exception) {
-//     15..4  unsigned exception index
-//   } else {
-//     15..8  XOR pattern or index to XOR pattern for case mapping
-//            Only 13..8 are used for XOR patterns.
-//         7  inverseFold (fold to upper, not to lower)
-//         6  index: interpret the XOR pattern as an index
-//            or isMid if case mode is cIgnorableUncased.
-//      5..4  CCC: zero (normal or break), above or other
-//   }
-//      3  exception: interpret this value as an exception index
-//         (TODO: is this bit necessary? Probably implied from case mode.)
-//   2..0  case mode
+//	if (exception) {
+//	  15..4  unsigned exception index
+//	} else {
+//	  15..8  XOR pattern or index to XOR pattern for case mapping
+//	         Only 13..8 are used for XOR patterns.
+//	      7  inverseFold (fold to upper, not to lower)
+//	      6  index: interpret the XOR pattern as an index
+//	         or isMid if case mode is cIgnorableUncased.
+//	   5..4  CCC: zero (normal or break), above or other
+//	}
+//	   3  exception: interpret this value as an exception index
+//	      (TODO: is this bit necessary? Probably implied from case mode.)
+//	2..0  case mode
 //
 // For the non-exceptional cases, a rune must be either uncased, lowercase or
 // uppercase. If the rune is cased, the XOR pattern maps either a lowercase
@@ -128,37 +128,40 @@ const (
 // The entry is pointed to by the exception index in an entry. It has the
 // following format:
 //
-// Header
-// byte 0:
-//  7..6  unused
-//  5..4  CCC type (same bits as entry)
-//     3  unused
-//  2..0  length of fold
+// Header:
 //
-// byte 1:
-//   7..6  unused
-//   5..3  length of 1st mapping of case type
-//   2..0  length of 2nd mapping of case type
+//	byte 0:
+//	 7..6  unused
+//	 5..4  CCC type (same bits as entry)
+//	    3  unused
+//	 2..0  length of fold
 //
-//   case     1st    2nd
-//   lower -> upper, title
-//   upper -> lower, title
-//   title -> lower, upper
+//	byte 1:
+//	  7..6  unused
+//	  5..3  length of 1st mapping of case type
+//	  2..0  length of 2nd mapping of case type
+//
+//	  case     1st    2nd
+//	  lower -> upper, title
+//	  upper -> lower, title
+//	  title -> lower, upper
 //
 // Lengths with the value 0x7 indicate no value and implies no change.
 // A length of 0 indicates a mapping to zero-length string.
 //
 // Body bytes:
-//   case folding bytes
-//   lowercase mapping bytes
-//   uppercase mapping bytes
-//   titlecase mapping bytes
-//   closure mapping bytes (for NFKC_Casefold). (TODO)
+//
+//	case folding bytes
+//	lowercase mapping bytes
+//	uppercase mapping bytes
+//	titlecase mapping bytes
+//	closure mapping bytes (for NFKC_Casefold). (TODO)
 //
 // Fallbacks:
-//   missing fold  -> lower
-//   missing title -> upper
-//   all missing   -> original rune
+//
+//	missing fold  -> lower
+//	missing title -> upper
+//	all missing   -> original rune
 //
 // exceptions starts with a dummy byte to enforce that there is no zero index
 // value.
diff --git a/cmd/gotext/doc.go b/cmd/gotext/doc.go
index fa247c6d3..d363ae25e 100644
--- a/cmd/gotext/doc.go
+++ b/cmd/gotext/doc.go
@@ -4,60 +4,47 @@
 //
 // Usage:
 //
-// 	gotext command [arguments]
+//	gotext command [arguments]
 //
 // The commands are:
 //
-// 	update      merge translations and generate catalog
-// 	extract     extracts strings to be translated from code
-// 	rewrite     rewrites fmt functions to use a message Printer
-// 	generate    generates code to insert translated messages
+//	update      merge translations and generate catalog
+//	extract     extracts strings to be translated from code
+//	rewrite     rewrites fmt functions to use a message Printer
+//	generate    generates code to insert translated messages
 //
 // Use "gotext help [command]" for more information about a command.
 //
 // Additional help topics:
 //
-//
 // Use "gotext help [topic]" for more information about that topic.
 //
-//
-// Merge translations and generate catalog
+// # Merge translations and generate catalog
 //
 // Usage:
 //
-// 	gotext update <package>* [-out <gofile>]
-//
-//
+//	gotext update <package>* [-out <gofile>]
 //
-//
-// Extracts strings to be translated from code
+// # Extracts strings to be translated from code
 //
 // Usage:
 //
-// 	gotext extract <package>*
-//
-//
+//	gotext extract <package>*
 //
-//
-// Rewrites fmt functions to use a message Printer
+// # Rewrites fmt functions to use a message Printer
 //
 // Usage:
 //
-// 	gotext rewrite <package>
+//	gotext rewrite <package>
 //
 // rewrite is typically done once for a project. It rewrites all usages of
 // fmt to use x/text's message package whenever a message.Printer is in scope.
 // It rewrites Print and Println calls with constant strings to the equivalent
 // using Printf to allow translators to reorder arguments.
 //
-//
-// Generates code to insert translated messages
+// # Generates code to insert translated messages
 //
 // Usage:
 //
-// 	gotext generate <package>
-//
-//
-//
-//
+//	gotext generate <package>
 package main
diff --git a/collate/build/builder.go b/collate/build/builder.go
index 092a4b506..3efb7387d 100644
--- a/collate/build/builder.go
+++ b/collate/build/builder.go
@@ -225,26 +225,37 @@ func (t *Tailoring) SetAnchorBefore(anchor string) error {
 //
 // Examples: create a tailoring for Swedish, where "ä" is ordered after "z"
 // at the primary sorting level:
-//      t := b.Tailoring("se")
-// 		t.SetAnchor("z")
-// 		t.Insert(colltab.Primary, "ä", "")
+//
+//	t := b.Tailoring("se")
+//	t.SetAnchor("z")
+//	t.Insert(colltab.Primary, "ä", "")
+//
 // Order "ü" after "ue" at the secondary sorting level:
-//		t.SetAnchor("ue")
-//		t.Insert(colltab.Secondary, "ü","")
+//
+//	t.SetAnchor("ue")
+//	t.Insert(colltab.Secondary, "ü","")
+//
 // or
-//		t.SetAnchor("u")
-//		t.Insert(colltab.Secondary, "ü", "e")
+//
+//	t.SetAnchor("u")
+//	t.Insert(colltab.Secondary, "ü", "e")
+//
 // Order "q" afer "ab" at the secondary level and "Q" after "q"
 // at the tertiary level:
-// 		t.SetAnchor("ab")
-// 		t.Insert(colltab.Secondary, "q", "")
-// 		t.Insert(colltab.Tertiary, "Q", "")
+//
+//	t.SetAnchor("ab")
+//	t.Insert(colltab.Secondary, "q", "")
+//	t.Insert(colltab.Tertiary, "Q", "")
+//
 // Order "b" before "a":
-//      t.SetAnchorBefore("a")
-//      t.Insert(colltab.Primary, "b", "")
+//
+//	t.SetAnchorBefore("a")
+//	t.Insert(colltab.Primary, "b", "")
+//
 // Order "0" after the last primary ignorable:
-//      t.SetAnchor("<last_primary_ignorable/>")
-//      t.Insert(colltab.Primary, "0", "")
+//
+//	t.SetAnchor("<last_primary_ignorable/>")
+//	t.Insert(colltab.Primary, "0", "")
 func (t *Tailoring) Insert(level colltab.Level, str, extend string) error {
 	if t.anchor == nil {
 		return fmt.Errorf("%s:Insert: no anchor point set for tailoring of %s", t.id, str)
diff --git a/collate/build/colelem.go b/collate/build/colelem.go
index 04fc3bfb7..1aaa062c5 100644
--- a/collate/build/colelem.go
+++ b/collate/build/colelem.go
@@ -51,6 +51,7 @@ func makeCE(ce rawCE) (uint32, error) {
 //   - n* is the size of the first node in the contraction trie.
 //   - i* is the index of the first node in the contraction trie.
 //   - b* is the offset into the contraction collation element table.
+//
 // See contract.go for details on the contraction trie.
 const (
 	contractID            = 0xC0000000
@@ -103,7 +104,8 @@ func makeExpansionHeader(n int) (uint32, error) {
 // The collation element, in this case, is of the form
 // 11110000 00000000 wwwwwwww vvvvvvvv, where
 //   - v* is the replacement tertiary weight for the first rune,
-//   - w* is the replacement tertiary weight for the second rune,
+//   - w* is the replacement tertiary weight for the second rune.
+//
 // Tertiary weights of subsequent runes should be replaced with maxTertiary.
 // See https://www.unicode.org/reports/tr10/#Compatibility_Decompositions for more details.
 const (
@@ -162,7 +164,9 @@ func implicitPrimary(r rune) int {
 // primaries (either double primaries or for illegal runes)
 // to our own representation.
 // A CJK character C is represented in the DUCET as
-//   [.FBxx.0020.0002.C][.BBBB.0000.0000.C]
+//
+//	[.FBxx.0020.0002.C][.BBBB.0000.0000.C]
+//
 // We will rewrite these characters to a single CE.
 // We assume the CJK values start at 0x8000.
 // See https://unicode.org/reports/tr10/#Implicit_Weights
diff --git a/collate/build/contract.go b/collate/build/contract.go
index e2df64f0c..5d79eb8bf 100644
--- a/collate/build/contract.go
+++ b/collate/build/contract.go
@@ -56,19 +56,22 @@ const (
 // entry might still resemble a completed suffix.
 // Examples:
 // The suffix strings "ab" and "ac" can be represented as:
-// []ctEntry{
-//     {'a', 1, 1, noIndex},  // 'a' by itself does not match, so i is 0xFF.
-//     {'b', 'c', 0, 1},   // "ab" -> 1, "ac" -> 2
-// }
+//
+//	[]ctEntry{
+//		{'a', 1, 1, noIndex},  // 'a' by itself does not match, so i is 0xFF.
+//		{'b', 'c', 0, 1},   // "ab" -> 1, "ac" -> 2
+//	}
 //
 // The suffix strings "ab", "abc", "abd", and "abcd" can be represented as:
-// []ctEntry{
-//     {'a', 1, 1, noIndex}, // 'a' must be followed by 'b'.
-//     {'b', 1, 2, 1},    // "ab" -> 1, may be followed by 'c' or 'd'.
-//     {'d', 'd', final, 3},  // "abd" -> 3
-//     {'c', 4, 1, 2},    // "abc" -> 2, may be followed by 'd'.
-//     {'d', 'd', final, 4},  // "abcd" -> 4
-// }
+//
+//	[]ctEntry{
+//		{'a', 1, 1, noIndex}, // 'a' must be followed by 'b'.
+//		{'b', 1, 2, 1},    // "ab" -> 1, may be followed by 'c' or 'd'.
+//		{'d', 'd', final, 3},  // "abd" -> 3
+//		{'c', 4, 1, 2},    // "abc" -> 2, may be followed by 'd'.
+//		{'d', 'd', final, 4},  // "abcd" -> 4
+//	}
+//
 // See genStateTests in contract_test.go for more examples.
 type ctEntry struct {
 	L uint8 // non-final: byte value to match; final: lowest match in range.
diff --git a/feature/plural/gen.go b/feature/plural/gen.go
index b9c5f2493..5f8f375fb 100644
--- a/feature/plural/gen.go
+++ b/feature/plural/gen.go
@@ -359,15 +359,16 @@ var operandIndex = map[string]opID{
 // the resulting or conditions to conds.
 //
 // Example rules:
-//   // Category "one" in English: only allow 1 with no visible fraction
-//   i = 1 and v = 0 @integer 1
 //
-//   // Category "few" in Czech: all numbers with visible fractions
-//   v != 0   @decimal ...
+//	// Category "one" in English: only allow 1 with no visible fraction
+//	i = 1 and v = 0 @integer 1
 //
-//   // Category "zero" in Latvian: all multiples of 10 or the numbers 11-19 or
-//   // numbers with a fraction 11..19 and no trailing zeros.
-//   n % 10 = 0 or n % 100 = 11..19 or v = 2 and f % 100 = 11..19 @integer ...
+//	// Category "few" in Czech: all numbers with visible fractions
+//	v != 0   @decimal ...
+//
+//	// Category "zero" in Latvian: all multiples of 10 or the numbers 11-19 or
+//	// numbers with a fraction 11..19 and no trailing zeros.
+//	n % 10 = 0 or n % 100 = 11..19 or v = 2 and f % 100 = 11..19 @integer ...
 //
 // @integer and @decimal are followed by examples and are not relevant for the
 // rule itself. The are used here to signal the termination of the rule.
diff --git a/feature/plural/message.go b/feature/plural/message.go
index f931f8a6a..6248d01cc 100644
--- a/feature/plural/message.go
+++ b/feature/plural/message.go
@@ -35,13 +35,13 @@ type Interface interface {
 // The cases argument are pairs of selectors and messages. Selectors are of type
 // string or Form. Messages are of type string or catalog.Message. A selector
 // matches an argument if:
-//    - it is "other" or Other
-//    - it matches the plural form of the argument: "zero", "one", "two", "few",
-//      or "many", or the equivalent Form
-//    - it is of the form "=x" where x is an integer that matches the value of
-//      the argument.
-//    - it is of the form "<x" where x is an integer that is larger than the
-//      argument.
+//   - it is "other" or Other
+//   - it matches the plural form of the argument: "zero", "one", "two", "few",
+//     or "many", or the equivalent Form
+//   - it is of the form "=x" where x is an integer that matches the value of
+//     the argument.
+//   - it is of the form "<x" where x is an integer that is larger than the
+//     argument.
 //
 // The format argument determines the formatting parameters for which to
 // determine the plural form. This is especially relevant for non-integer
diff --git a/feature/plural/plural.go b/feature/plural/plural.go
index 5b521b144..e9f2d42e0 100644
--- a/feature/plural/plural.go
+++ b/feature/plural/plural.go
@@ -20,7 +20,6 @@ import (
 
 // Rules defines the plural rules for all languages for a certain plural type.
 //
-//
 // This package is UNDER CONSTRUCTION and its API may change.
 type Rules struct {
 	rules          []pluralCheck
@@ -54,19 +53,19 @@ var (
 
 // getIntApprox converts the digits in slice digits[start:end] to an integer
 // according to the following rules:
-//	- Let i be asInt(digits[start:end]), where out-of-range digits are assumed
-//	  to be zero.
-//	- Result n is big if i / 10^nMod > 1.
-//	- Otherwise the result is i % 10^nMod.
+//   - Let i be asInt(digits[start:end]), where out-of-range digits are assumed
+//     to be zero.
+//   - Result n is big if i / 10^nMod > 1.
+//   - Otherwise the result is i % 10^nMod.
 //
 // For example, if digits is {1, 2, 3} and start:end is 0:5, then the result
 // for various values of nMod is:
-//	- when nMod == 2, n == big
-//	- when nMod == 3, n == big
-//	- when nMod == 4, n == big
-//	- when nMod == 5, n == 12300
-//	- when nMod == 6, n == 12300
-//	- when nMod == 7, n == 12300
+//   - when nMod == 2, n == big
+//   - when nMod == 3, n == big
+//   - when nMod == 4, n == big
+//   - when nMod == 5, n == 12300
+//   - when nMod == 6, n == 12300
+//   - when nMod == 7, n == 12300
 func getIntApprox(digits []byte, start, end, nMod, big int) (n int) {
 	// Leading 0 digits just result in 0.
 	p := start
@@ -107,12 +106,13 @@ func getIntApprox(digits []byte, start, end, nMod, big int) (n int) {
 //
 // The following table contains examples of possible arguments to represent
 // the given numbers.
-//      decimal    digits              exp    scale
-//      123        []byte{1, 2, 3}     3      0
-//      123.4      []byte{1, 2, 3, 4}  3      1
-//      123.40     []byte{1, 2, 3, 4}  3      2
-//      100000     []byte{1}           6      0
-//      100000.00  []byte{1}           6      3
+//
+//	decimal    digits              exp    scale
+//	123        []byte{1, 2, 3}     3      0
+//	123.4      []byte{1, 2, 3, 4}  3      1
+//	123.40     []byte{1, 2, 3, 4}  3      2
+//	100000     []byte{1}           6      0
+//	100000.00  []byte{1}           6      3
 func (p *Rules) MatchDigits(t language.Tag, digits []byte, exp, scale int) Form {
 	index := tagToID(t)
 
@@ -152,14 +152,15 @@ func (p *Rules) matchComponents(t language.Tag, n, f, scale int) Form {
 // MatchPlural returns the plural form for the given language and plural
 // operands (as defined in
 // https://unicode.org/reports/tr35/tr35-numbers.html#Language_Plural_Rules):
-//  where
-//  	n  absolute value of the source number (integer and decimals)
-//  input
-//  	i  integer digits of n.
-//  	v  number of visible fraction digits in n, with trailing zeros.
-//  	w  number of visible fraction digits in n, without trailing zeros.
-//  	f  visible fractional digits in n, with trailing zeros (f = t * 10^(v-w))
-//  	t  visible fractional digits in n, without trailing zeros.
+//
+//	where
+//		n  absolute value of the source number (integer and decimals)
+//	input
+//		i  integer digits of n.
+//		v  number of visible fraction digits in n, with trailing zeros.
+//		w  number of visible fraction digits in n, without trailing zeros.
+//		f  visible fractional digits in n, with trailing zeros (f = t * 10^(v-w))
+//		t  visible fractional digits in n, without trailing zeros.
 //
 // If any of the operand values is too large to fit in an int, it is okay to
 // pass the value modulo 10,000,000.
diff --git a/internal/catmsg/catmsg.go b/internal/catmsg/catmsg.go
index c0bf86f09..1b257a7b4 100644
--- a/internal/catmsg/catmsg.go
+++ b/internal/catmsg/catmsg.go
@@ -9,8 +9,7 @@
 // own. For instance, the plural package provides functionality for selecting
 // translation strings based on the plural category of substitution arguments.
 //
-//
-// Encoding and Decoding
+// # Encoding and Decoding
 //
 // Catalogs store Messages encoded as a single string. Compiling a message into
 // a string both results in compacter representation and speeds up evaluation.
@@ -25,8 +24,7 @@
 // the message. This decoder takes a Decoder argument which provides the
 // counterparts for the decoding.
 //
-//
-// Renderers
+// # Renderers
 //
 // A Decoder must be initialized with a Renderer implementation. These
 // implementations must be provided by packages that use Catalogs, typically
@@ -38,22 +36,22 @@
 // as sequence of substrings passed to the Renderer. The following snippet shows
 // how to express the above example using the message package.
 //
-//   message.Set(language.English, "You are %d minute(s) late.",
-//       catalog.Var("minutes", plural.Select(1, "one", "minute")),
-//       catalog.String("You are %[1]d ${minutes} late."))
+//	message.Set(language.English, "You are %d minute(s) late.",
+//		catalog.Var("minutes", plural.Select(1, "one", "minute")),
+//		catalog.String("You are %[1]d ${minutes} late."))
 //
-//   p := message.NewPrinter(language.English)
-//   p.Printf("You are %d minute(s) late.", 5) // always 5 minutes late.
+//	p := message.NewPrinter(language.English)
+//	p.Printf("You are %d minute(s) late.", 5) // always 5 minutes late.
 //
 // To evaluate the Printf, package message wraps the arguments in a Renderer
 // that is passed to the catalog for message decoding. The call sequence that
 // results from evaluating the above message, assuming the person is rather
 // tardy, is:
 //
-//   Render("You are %[1]d ")
-//   Arg(1)
-//   Render("minutes")
-//   Render(" late.")
+//	Render("You are %[1]d ")
+//	Arg(1)
+//	Render("minutes")
+//	Render(" late.")
 //
 // The calls to Arg is caused by the plural.Select execution, which evaluates
 // the argument to determine whether the singular or plural message form should
@@ -267,10 +265,12 @@ func (s FirstOf) Compile(e *Encoder) error {
 // Var defines a message that can be substituted for a placeholder of the same
 // name. If an expression does not result in a string after evaluation, Name is
 // used as the substitution. For example:
-//    Var{
-//      Name:    "minutes",
-//      Message: plural.Select(1, "one", "minute"),
-//    }
+//
+//	Var{
+//	  Name:    "minutes",
+//	  Message: plural.Select(1, "one", "minute"),
+//	}
+//
 // will resolve to minute for singular and minutes for plural forms.
 type Var struct {
 	Name    string
@@ -318,13 +318,15 @@ func (r Raw) Compile(e *Encoder) (err error) {
 // calls for each placeholder and interstitial string. For example, for the
 // message: "%[1]v ${invites} %[2]v to ${their} party." The sequence of calls
 // is:
-//   d.Render("%[1]v ")
-//   d.Arg(1)
-//   d.Render(resultOfInvites)
-//   d.Render(" %[2]v to ")
-//   d.Arg(2)
-//   d.Render(resultOfTheir)
-//   d.Render(" party.")
+//
+//	d.Render("%[1]v ")
+//	d.Arg(1)
+//	d.Render(resultOfInvites)
+//	d.Render(" %[2]v to ")
+//	d.Arg(2)
+//	d.Render(resultOfTheir)
+//	d.Render(" party.")
+//
 // where the messages for "invites" and "their" both use a plural.Select
 // referring to the first argument.
 //
diff --git a/internal/cldrtree/cldrtree.go b/internal/cldrtree/cldrtree.go
index 7530831d6..cc2714e99 100644
--- a/internal/cldrtree/cldrtree.go
+++ b/internal/cldrtree/cldrtree.go
@@ -4,7 +4,6 @@
 
 // Package cldrtree builds and generates a CLDR index file, including all
 // inheritance.
-//
 package cldrtree
 
 //go:generate go test -gen
diff --git a/internal/colltab/collelem.go b/internal/colltab/collelem.go
index 396cebda2..0c23c8a48 100644
--- a/internal/colltab/collelem.go
+++ b/internal/colltab/collelem.go
@@ -78,24 +78,27 @@ func (ce Elem) ctype() ceType {
 // For normal collation elements, we assume that a collation element either has
 // a primary or non-default secondary value, not both.
 // Collation elements with a primary value are of the form
-// 01pppppp pppppppp ppppppp0 ssssssss
-//   - p* is primary collation value
-//   - s* is the secondary collation value
-// 00pppppp pppppppp ppppppps sssttttt, where
-//   - p* is primary collation value
-//   - s* offset of secondary from default value.
-//   - t* is the tertiary collation value
-// 100ttttt cccccccc pppppppp pppppppp
-//   - t* is the tertiar collation value
-//   - c* is the canonical combining class
-//   - p* is the primary collation value
+//
+//	01pppppp pppppppp ppppppp0 ssssssss
+//	  - p* is primary collation value
+//	  - s* is the secondary collation value
+//	00pppppp pppppppp ppppppps sssttttt, where
+//	  - p* is primary collation value
+//	  - s* offset of secondary from default value.
+//	  - t* is the tertiary collation value
+//	100ttttt cccccccc pppppppp pppppppp
+//	  - t* is the tertiary collation value
+//	  - c* is the canonical combining class
+//	  - p* is the primary collation value
+//
 // Collation elements with a secondary value are of the form
-// 1010cccc ccccssss ssssssss tttttttt, where
-//   - c* is the canonical combining class
-//   - s* is the secondary collation value
-//   - t* is the tertiary collation value
-// 11qqqqqq qqqqqqqq qqqqqqq0 00000000
-//   - q* quaternary value
+//
+//	1010cccc ccccssss ssssssss tttttttt, where
+//	  - c* is the canonical combining class
+//	  - s* is the secondary collation value
+//	  - t* is the tertiary collation value
+//	11qqqqqq qqqqqqqq qqqqqqq0 00000000
+//	  - q* quaternary value
 const (
 	ceTypeMask              = 0xC0000000
 	ceTypeMaskExt           = 0xE0000000
@@ -296,6 +299,7 @@ func (ce Elem) Weight(l Level) int {
 //   - n* is the size of the first node in the contraction trie.
 //   - i* is the index of the first node in the contraction trie.
 //   - b* is the offset into the contraction collation element table.
+//
 // See contract.go for details on the contraction trie.
 const (
 	maxNBits              = 4
@@ -326,6 +330,7 @@ func splitExpandIndex(ce Elem) (index int) {
 // The Elem, in this case, is of the form 11110000 00000000 wwwwwwww vvvvvvvv, where
 //   - v* is the replacement tertiary weight for the first rune,
 //   - w* is the replacement tertiary weight for the second rune,
+//
 // Tertiary weights of subsequent runes should be replaced with maxTertiary.
 // See https://www.unicode.org/reports/tr10/#Compatibility_Decompositions for more details.
 func splitDecompose(ce Elem) (t1, t2 uint8) {
diff --git a/internal/export/idna/gen_trieval.go b/internal/export/idna/gen_trieval.go
index 9d92407f2..501bfabed 100644
--- a/internal/export/idna/gen_trieval.go
+++ b/internal/export/idna/gen_trieval.go
@@ -22,23 +22,23 @@ package main
 //
 // The per-rune values have the following format:
 //
-//   if mapped {
-//     if inlinedXOR {
-//       15..13 inline XOR marker
-//       12..11 unused
-//       10..3  inline XOR mask
-//     } else {
-//       15..3  index into xor or mapping table
-//     }
-//   } else {
-//       15..14 unused
-//       13     mayNeedNorm
-//       12..11 attributes
-//       10..8  joining type
-//        7..3  category type
-//   }
-//      2  use xor pattern
-//   1..0  mapped category
+//	if mapped {
+//	  if inlinedXOR {
+//	    15..13 inline XOR marker
+//	    12..11 unused
+//	    10..3  inline XOR mask
+//	  } else {
+//	    15..3  index into xor or mapping table
+//	  }
+//	} else {
+//	    15..14 unused
+//	    13     mayNeedNorm
+//	    12..11 attributes
+//	    10..8  joining type
+//	     7..3  category type
+//	}
+//	   2  use xor pattern
+//	1..0  mapped category
 //
 // See the definitions below for a more detailed description of the various
 // bits.
diff --git a/internal/export/idna/trieval.go b/internal/export/idna/trieval.go
index 7a8cf889b..9c070a44b 100644
--- a/internal/export/idna/trieval.go
+++ b/internal/export/idna/trieval.go
@@ -17,23 +17,23 @@ package idna
 //
 // The per-rune values have the following format:
 //
-//   if mapped {
-//     if inlinedXOR {
-//       15..13 inline XOR marker
-//       12..11 unused
-//       10..3  inline XOR mask
-//     } else {
-//       15..3  index into xor or mapping table
-//     }
-//   } else {
-//       15..14 unused
-//       13     mayNeedNorm
-//       12..11 attributes
-//       10..8  joining type
-//        7..3  category type
-//   }
-//      2  use xor pattern
-//   1..0  mapped category
+//	if mapped {
+//	  if inlinedXOR {
+//	    15..13 inline XOR marker
+//	    12..11 unused
+//	    10..3  inline XOR mask
+//	  } else {
+//	    15..3  index into xor or mapping table
+//	  }
+//	} else {
+//	    15..14 unused
+//	    13     mayNeedNorm
+//	    12..11 attributes
+//	    10..8  joining type
+//	     7..3  category type
+//	}
+//	   2  use xor pattern
+//	1..0  mapped category
 //
 // See the definitions below for a more detailed description of the various
 // bits.
diff --git a/internal/language/tables.go b/internal/language/tables.go
index a19480c5b..3552e1afc 100644
--- a/internal/language/tables.go
+++ b/internal/language/tables.go
@@ -121,9 +121,10 @@ const langPrivateEnd = 0x3179
 // lang holds an alphabetically sorted list of ISO-639 language identifiers.
 // All entries are 4 bytes. The index of the identifier (divided by 4) is the language tag.
 // For 2-byte language identifiers, the two successive bytes have the following meaning:
-//     - if the first letter of the 2- and 3-letter ISO codes are the same:
-//       the second and third letter of the 3-letter ISO code.
-//     - otherwise: a 0 and a by 2 bits right-shifted index into altLangISO3.
+//   - if the first letter of the 2- and 3-letter ISO codes are the same:
+//     the second and third letter of the 3-letter ISO code.
+//   - otherwise: a 0 and a by 2 bits right-shifted index into altLangISO3.
+//
 // For 3-byte language identifiers the 4th byte is 0.
 const lang tag.Index = "" + // Size: 5324 bytes
 	"---\x00aaaraai\x00aak\x00aau\x00abbkabi\x00abq\x00abr\x00abt\x00aby\x00a" +
@@ -1086,9 +1087,9 @@ var regionTypes = [358]uint8{
 
 // regionISO holds a list of alphabetically sorted 2-letter ISO region codes.
 // Each 2-letter codes is followed by two bytes with the following meaning:
-//     - [A-Z}{2}: the first letter of the 2-letter code plus these two
-//                 letters form the 3-letter ISO code.
-//     - 0, n:     index into altRegionISO3.
+//   - [A-Z]{2}: the first letter of the 2-letter code plus these two
+//     letters form the 3-letter ISO code.
+//   - 0, n:     index into altRegionISO3.
 const regionISO tag.Index = "" + // Size: 1308 bytes
 	"AAAAACSCADNDAEREAFFGAGTGAIIAALLBAMRMANNTAOGOAQTAARRGASSMATUTAUUSAWBWAXLA" +
 	"AZZEBAIHBBRBBDGDBEELBFFABGGRBHHRBIDIBJENBLLMBMMUBNRNBOOLBQESBRRABSHSBTTN" +
@@ -1206,7 +1207,9 @@ var m49 = [358]int16{
 
 // m49Index gives indexes into fromM49 based on the three most significant bits
 // of a 10-bit UN.M49 code. To search an UN.M49 code in fromM49, search in
-//    fromM49[m49Index[msb39(code)]:m49Index[msb3(code)+1]]
+//
+//	fromM49[m49Index[msb3(code)]:m49Index[msb3(code)+1]]
+//
 // for an entry where the first 7 bits match the 7 lsb of the UN.M49 code.
 // The region code is stored in the 9 lsb of the indexed value.
 // Size: 18 bytes, 9 elements
diff --git a/internal/number/decimal.go b/internal/number/decimal.go
index cb656db6c..37e0c4b98 100644
--- a/internal/number/decimal.go
+++ b/internal/number/decimal.go
@@ -33,13 +33,14 @@ const maxIntDigits = 20
 // may point outside a valid position in Digits.
 //
 // Examples:
-//      Number     Decimal
-//      12345      Digits: [1, 2, 3, 4, 5], Exp: 5
-//      12.345     Digits: [1, 2, 3, 4, 5], Exp: 2
-//      12000      Digits: [1, 2],          Exp: 5
-//      12000.00   Digits: [1, 2],          Exp: 5
-//      0.00123    Digits: [1, 2, 3],       Exp: -2
-//      0          Digits: [],              Exp: 0
+//
+//	Number     Decimal
+//	12345      Digits: [1, 2, 3, 4, 5], Exp: 5
+//	12.345     Digits: [1, 2, 3, 4, 5], Exp: 2
+//	12000      Digits: [1, 2],          Exp: 5
+//	12000.00   Digits: [1, 2],          Exp: 5
+//	0.00123    Digits: [1, 2, 3],       Exp: -2
+//	0          Digits: [],              Exp: 0
 type Decimal struct {
 	digits
 
@@ -60,22 +61,23 @@ type digits struct {
 // engineering notation. Digits must have at least one digit.
 //
 // Examples:
-//      Number     Decimal
-//    decimal
-//      12345      Digits: [1, 2, 3, 4, 5], Exp: 5  End: 5
-//      12.345     Digits: [1, 2, 3, 4, 5], Exp: 2  End: 5
-//      12000      Digits: [1, 2],          Exp: 5  End: 5
-//      12000.00   Digits: [1, 2],          Exp: 5  End: 7
-//      0.00123    Digits: [1, 2, 3],       Exp: -2 End: 3
-//      0          Digits: [],              Exp: 0  End: 1
-//    scientific (actual exp is Exp - Comma)
-//      0e0        Digits: [0],             Exp: 1, End: 1, Comma: 1
-//      .0e0       Digits: [0],             Exp: 0, End: 1, Comma: 0
-//      0.0e0      Digits: [0],             Exp: 1, End: 2, Comma: 1
-//      1.23e4     Digits: [1, 2, 3],       Exp: 5, End: 3, Comma: 1
-//      .123e5     Digits: [1, 2, 3],       Exp: 5, End: 3, Comma: 0
-//    engineering
-//      12.3e3     Digits: [1, 2, 3],       Exp: 5, End: 3, Comma: 2
+//
+//	  Number     Decimal
+//	decimal
+//	  12345      Digits: [1, 2, 3, 4, 5], Exp: 5  End: 5
+//	  12.345     Digits: [1, 2, 3, 4, 5], Exp: 2  End: 5
+//	  12000      Digits: [1, 2],          Exp: 5  End: 5
+//	  12000.00   Digits: [1, 2],          Exp: 5  End: 7
+//	  0.00123    Digits: [1, 2, 3],       Exp: -2 End: 3
+//	  0          Digits: [],              Exp: 0  End: 1
+//	scientific (actual exp is Exp - Comma)
+//	  0e0        Digits: [0],             Exp: 1, End: 1, Comma: 1
+//	  .0e0       Digits: [0],             Exp: 0, End: 1, Comma: 0
+//	  0.0e0      Digits: [0],             Exp: 1, End: 2, Comma: 1
+//	  1.23e4     Digits: [1, 2, 3],       Exp: 5, End: 3, Comma: 1
+//	  .123e5     Digits: [1, 2, 3],       Exp: 5, End: 3, Comma: 0
+//	engineering
+//	  12.3e3     Digits: [1, 2, 3],       Exp: 5, End: 3, Comma: 2
 type Digits struct {
 	digits
 	// End indicates the end position of the number.
diff --git a/internal/testtext/codesize.go b/internal/testtext/codesize.go
index 5fc5eaec7..88df48747 100644
--- a/internal/testtext/codesize.go
+++ b/internal/testtext/codesize.go
@@ -16,11 +16,13 @@ import (
 
 // CodeSize builds the given code sample and returns the binary size or en error
 // if an error occurred. The code sample typically will look like this:
-//     package main
-//     import "golang.org/x/text/somepackage"
-//     func main() {
-//         somepackage.Func() // reference Func to cause it to be linked in.
-//     }
+//
+//	package main
+//	import "golang.org/x/text/somepackage"
+//	func main() {
+//	    somepackage.Func() // reference Func to cause it to be linked in.
+//	}
+//
 // See dict_test.go in the display package for an example.
 func CodeSize(s string) (int, error) {
 	// Write the file.
diff --git a/internal/triegen/triegen.go b/internal/triegen/triegen.go
index 51d218a30..de54a8075 100644
--- a/internal/triegen/triegen.go
+++ b/internal/triegen/triegen.go
@@ -34,23 +34,24 @@
 // triegen generates both tables and code. The code is optimized to use the
 // automatically chosen data types. The following code is generated for a Trie
 // or multiple Tries named "foo":
-//	- type fooTrie
-//		The trie type.
 //
-//	- func newFooTrie(x int) *fooTrie
-//		Trie constructor, where x is the index of the trie passed to Gen.
+//   - type fooTrie
+//     The trie type.
 //
-//	- func (t *fooTrie) lookup(s []byte) (v uintX, sz int)
-//		The lookup method, where uintX is automatically chosen.
+//   - func newFooTrie(x int) *fooTrie
+//     Trie constructor, where x is the index of the trie passed to Gen.
 //
-//	- func lookupString, lookupUnsafe and lookupStringUnsafe
-//		Variants of the above.
+//   - func (t *fooTrie) lookup(s []byte) (v uintX, sz int)
+//     The lookup method, where uintX is automatically chosen.
 //
-//	- var fooValues and fooIndex and any tables generated by Compacters.
-//		The core trie data.
+//   - func lookupString, lookupUnsafe and lookupStringUnsafe
+//     Variants of the above.
 //
-//	- var fooTrieHandles
-//		Indexes of starter blocks in case of multiple trie roots.
+//   - var fooValues and fooIndex and any tables generated by Compacters.
+//     The core trie data.
+//
+//   - var fooTrieHandles
+//     Indexes of starter blocks in case of multiple trie roots.
 //
 // It is recommended that users test the generated trie by checking the returned
 // value for every rune. Such exhaustive tests are possible as the number of
diff --git a/internal/utf8internal/utf8internal.go b/internal/utf8internal/utf8internal.go
index 575cea870..e5c53b1b3 100644
--- a/internal/utf8internal/utf8internal.go
+++ b/internal/utf8internal/utf8internal.go
@@ -74,7 +74,7 @@ type AcceptRange struct {
 
 // AcceptRanges is a slice of AcceptRange values. For a given byte sequence b
 //
-//		AcceptRanges[First[b[0]]>>AcceptShift]
+//	AcceptRanges[First[b[0]]>>AcceptShift]
 //
 // will give the value of AcceptRange for the multi-byte UTF-8 sequence starting
 // at b[0].
diff --git a/language/display/lookup.go b/language/display/lookup.go
index e6dc0e016..88307753d 100644
--- a/language/display/lookup.go
+++ b/language/display/lookup.go
@@ -92,10 +92,10 @@ func nameTag(langN, scrN, regN namer, x interface{}) string {
 // offsets for a string in data. For example, consider a header that defines
 // strings for the languages de, el, en, fi, and nl:
 //
-// 		header{
-// 			data: "GermanGreekEnglishDutch",
-//  		index: []uint16{ 0, 6, 11, 18, 18, 23 },
-// 		}
+//	header{
+//		data: "GermanGreekEnglishDutch",
+//		index: []uint16{0, 6, 11, 18, 18, 23},
+//	}
 //
 // For a language with index i, the string is defined by
 // data[index[i]:index[i+1]]. So the number of elements in index is always one
@@ -204,9 +204,11 @@ func supportedRegions() []language.Region {
 // for each length, which can be used in combination with binary search to get
 // the index associated with a tag.
 // For example, a tagIndex{
-//   "arenesfrruzh",  // 6 2-byte tags.
-//   "barwae",        // 2 3-byte tags.
-//   "",
+//
+//	"arenesfrruzh",  // 6 2-byte tags.
+//	"barwae",        // 2 3-byte tags.
+//	"",
+//
 // }
 // would mean that the 2-byte tag "fr" had an index of 3, and the 3-byte tag
 // "wae" had an index of 7.
diff --git a/language/doc.go b/language/doc.go
index 8afecd50e..212b77c90 100644
--- a/language/doc.go
+++ b/language/doc.go
@@ -10,18 +10,17 @@
 // and provides the user with the best experience
 // (see https://blog.golang.org/matchlang).
 //
-//
-// Matching preferred against supported languages
+// # Matching preferred against supported languages
 //
 // A Matcher for an application that supports English, Australian English,
 // Danish, and standard Mandarin can be created as follows:
 //
-//    var matcher = language.NewMatcher([]language.Tag{
-//        language.English,   // The first language is used as fallback.
-//        language.MustParse("en-AU"),
-//        language.Danish,
-//        language.Chinese,
-//    })
+//	var matcher = language.NewMatcher([]language.Tag{
+//	    language.English,   // The first language is used as fallback.
+//	    language.MustParse("en-AU"),
+//	    language.Danish,
+//	    language.Chinese,
+//	})
 //
 // This list of supported languages is typically implied by the languages for
 // which there exists translations of the user interface.
@@ -30,14 +29,14 @@
 // language tags.
 // The MatchString finds best matches for such strings:
 //
-//    handler(w http.ResponseWriter, r *http.Request) {
-//        lang, _ := r.Cookie("lang")
-//        accept := r.Header.Get("Accept-Language")
-//        tag, _ := language.MatchStrings(matcher, lang.String(), accept)
+//	func handler(w http.ResponseWriter, r *http.Request) {
+//	    lang, _ := r.Cookie("lang")
+//	    accept := r.Header.Get("Accept-Language")
+//	    tag, _ := language.MatchStrings(matcher, lang.String(), accept)
 //
-//        // tag should now be used for the initialization of any
-//        // locale-specific service.
-//    }
+//	    // tag should now be used for the initialization of any
+//	    // locale-specific service.
+//	}
 //
 // The Matcher's Match method can be used to match Tags directly.
 //
@@ -48,8 +47,7 @@
 // For instance, it will know that a reader of Bokmål Danish can read Norwegian
 // and will know that Cantonese ("yue") is a good match for "zh-HK".
 //
-//
-// Using match results
+// # Using match results
 //
 // To guarantee a consistent user experience to the user it is important to
 // use the same language tag for the selection of any locale-specific services.
@@ -58,9 +56,9 @@
 // More subtly confusing is using the wrong sorting order or casing
 // algorithm for a certain language.
 //
-//    All the packages in x/text that provide locale-specific services
-//    (e.g. collate, cases) should be initialized with the tag that was
-//    obtained at the start of an interaction with the user.
+// All the packages in x/text that provide locale-specific services
+// (e.g. collate, cases) should be initialized with the tag that was
+// obtained at the start of an interaction with the user.
 //
 // Note that Tag that is returned by Match and MatchString may differ from any
 // of the supported languages, as it may contain carried over settings from
@@ -70,8 +68,7 @@
 // Match and MatchString both return the index of the matched supported tag
 // to simplify associating such data with the matched tag.
 //
-//
-// Canonicalization
+// # Canonicalization
 //
 // If one uses the Matcher to compare languages one does not need to
 // worry about canonicalization.
@@ -92,10 +89,9 @@
 // equivalence relations. The CanonType type can be used to alter the
 // canonicalization form.
 //
-// References
+// # References
 //
 // BCP 47 - Tags for Identifying Languages http://tools.ietf.org/html/bcp47
-//
 package language // import "golang.org/x/text/language"
 
 // TODO: explanation on how to match languages for your own locale-specific
diff --git a/message/catalog/catalog.go b/message/catalog/catalog.go
index de595b510..96955d075 100644
--- a/message/catalog/catalog.go
+++ b/message/catalog/catalog.go
@@ -13,8 +13,7 @@
 // language. The Loader interface defines a source of dictionaries. A
 // translation of a format string is represented by a Message.
 //
-//
-// Catalogs
+// # Catalogs
 //
 // A Catalog defines a programmatic interface for setting message translations.
 // It maintains a set of per-language dictionaries with translations for a set
@@ -24,8 +23,7 @@
 // the key. For example, a Dictionary for "en-GB" could leave out entries that
 // are identical to those in a dictionary for "en".
 //
-//
-// Messages
+// # Messages
 //
 // A Message is a format string which varies on the value of substitution
 // variables. For instance, to indicate the number of results one could want "no
@@ -39,8 +37,7 @@
 // to selected string. This separation of concerns allows Catalog to be used to
 // store any kind of formatting strings.
 //
-//
-// Selecting messages based on linguistic features of substitution arguments
+// # Selecting messages based on linguistic features of substitution arguments
 //
 // Messages may vary based on any linguistic features of the argument values.
 // The most common one is plural form, but others exist.
@@ -48,10 +45,10 @@
 // Selection messages are provided in packages that provide support for a
 // specific linguistic feature. The following snippet uses plural.Selectf:
 //
-//   catalog.Set(language.English, "You are %d minute(s) late.",
-//       plural.Selectf(1, "",
-//           plural.One, "You are 1 minute late.",
-//           plural.Other, "You are %d minutes late."))
+//	catalog.Set(language.English, "You are %d minute(s) late.",
+//		plural.Selectf(1, "",
+//			plural.One, "You are 1 minute late.",
+//			plural.Other, "You are %d minutes late."))
 //
 // In this example, a message is stored in the Catalog where one of two messages
 // is selected based on the first argument, a number. The first message is
@@ -64,47 +61,46 @@
 // Selects can be nested. This allows selecting sentences based on features of
 // multiple arguments or multiple linguistic properties of a single argument.
 //
-//
-// String interpolation
+// # String interpolation
 //
 // There is often a lot of commonality between the possible variants of a
 // message. For instance, in the example above the word "minute" varies based on
 // the plural catogory of the argument, but the rest of the sentence is
 // identical. Using interpolation the above message can be rewritten as:
 //
-//   catalog.Set(language.English, "You are %d minute(s) late.",
-//       catalog.Var("minutes",
-//           plural.Selectf(1, "", plural.One, "minute", plural.Other, "minutes")),
-//       catalog.String("You are %[1]d ${minutes} late."))
+//	catalog.Set(language.English, "You are %d minute(s) late.",
+//		catalog.Var("minutes",
+//			plural.Selectf(1, "", plural.One, "minute", plural.Other, "minutes")),
+//		catalog.String("You are %[1]d ${minutes} late."))
 //
 // Var is defined to return the variable name if the message does not yield a
 // match. This allows us to further simplify this snippet to
 //
-//   catalog.Set(language.English, "You are %d minute(s) late.",
-//       catalog.Var("minutes", plural.Selectf(1, "", plural.One, "minute")),
-//       catalog.String("You are %d ${minutes} late."))
+//	catalog.Set(language.English, "You are %d minute(s) late.",
+//		catalog.Var("minutes", plural.Selectf(1, "", plural.One, "minute")),
+//		catalog.String("You are %d ${minutes} late."))
 //
 // Overall this is still only a minor improvement, but things can get a lot more
 // unwieldy if more than one linguistic feature is used to determine a message
 // variant. Consider the following example:
 //
-//   // argument 1: list of hosts, argument 2: list of guests
-//   catalog.Set(language.English, "%[1]v invite(s) %[2]v to their party.",
-//     catalog.Var("their",
-//         plural.Selectf(1, ""
-//             plural.One, gender.Select(1, "female", "her", "other", "his"))),
-//     catalog.Var("invites", plural.Selectf(1, "", plural.One, "invite"))
-//     catalog.String("%[1]v ${invites} %[2]v to ${their} party.")),
+//	// argument 1: list of hosts, argument 2: list of guests
+//	catalog.Set(language.English, "%[1]v invite(s) %[2]v to their party.",
+//		catalog.Var("their",
+//			plural.Selectf(1, "",
+//				plural.One, gender.Select(1, "female", "her", "other", "his"))),
+//		catalog.Var("invites", plural.Selectf(1, "", plural.One, "invite")),
+//		catalog.String("%[1]v ${invites} %[2]v to ${their} party."))
 //
 // Without variable substitution, this would have to be written as
 //
-//   // argument 1: list of hosts, argument 2: list of guests
-//   catalog.Set(language.English, "%[1]v invite(s) %[2]v to their party.",
-//     plural.Selectf(1, "",
-//         plural.One, gender.Select(1,
-//             "female", "%[1]v invites %[2]v to her party."
-//             "other", "%[1]v invites %[2]v to his party."),
-//         plural.Other, "%[1]v invites %[2]v to their party.")
+//	// argument 1: list of hosts, argument 2: list of guests
+//	catalog.Set(language.English, "%[1]v invite(s) %[2]v to their party.",
+//		plural.Selectf(1, "",
+//			plural.One, gender.Select(1,
+//				"female", "%[1]v invites %[2]v to her party.",
+//				"other", "%[1]v invites %[2]v to his party."),
+//			plural.Other, "%[1]v invites %[2]v to their party."))
 //
 // Not necessarily shorter, but using variables there is less duplication and
 // the messages are more maintenance friendly. Moreover, languages may have up
@@ -113,33 +109,32 @@
 // Different messages using the same inflections can reuse variables by moving
 // them to macros. Using macros we can rewrite the message as:
 //
-//   // argument 1: list of hosts, argument 2: list of guests
-//   catalog.SetString(language.English, "%[1]v invite(s) %[2]v to their party.",
-//       "%[1]v ${invites(1)} %[2]v to ${their(1)} party.")
+//	// argument 1: list of hosts, argument 2: list of guests
+//	catalog.SetString(language.English, "%[1]v invite(s) %[2]v to their party.",
+//		"%[1]v ${invites(1)} %[2]v to ${their(1)} party.")
 //
 // Where the following macros were defined separately.
 //
-//   catalog.SetMacro(language.English, "invites", plural.Selectf(1, "",
-//      plural.One, "invite"))
-//   catalog.SetMacro(language.English, "their", plural.Selectf(1, "",
-//      plural.One, gender.Select(1, "female", "her", "other", "his"))),
+//	catalog.SetMacro(language.English, "invites", plural.Selectf(1, "",
+//		plural.One, "invite"))
+//	catalog.SetMacro(language.English, "their", plural.Selectf(1, "",
+//		plural.One, gender.Select(1, "female", "her", "other", "his")))
 //
 // Placeholders use parentheses and the arguments to invoke a macro.
 //
-//
-// Looking up messages
+// # Looking up messages
 //
 // Message lookup using Catalogs is typically only done by specialized packages
 // and is not something the user should be concerned with. For instance, to
 // express the tardiness of a user using the related message we defined earlier,
 // the user may use the package message like so:
 //
-//   p := message.NewPrinter(language.English)
-//   p.Printf("You are %d minute(s) late.", 5)
+//	p := message.NewPrinter(language.English)
+//	p.Printf("You are %d minute(s) late.", 5)
 //
 // Which would print:
-//   You are 5 minutes late.
 //
+//	You are 5 minutes late.
 //
 // This package is UNDER CONSTRUCTION and its API may change.
 package catalog // import "golang.org/x/text/message/catalog"
diff --git a/message/doc.go b/message/doc.go
index 72e8fde71..4bf7bdcac 100644
--- a/message/doc.go
+++ b/message/doc.go
@@ -5,22 +5,21 @@
 // Package message implements formatted I/O for localized strings with functions
 // analogous to the fmt's print functions. It is a drop-in replacement for fmt.
 //
-//
-// Localized Formatting
+// # Localized Formatting
 //
 // A format string can be localized by replacing any of the print functions of
 // fmt with an equivalent call to a Printer.
 //
-//    p := message.NewPrinter(message.MatchLanguage("en"))
-//    p.Println(123456.78) // Prints 123,456.78
+//	p := message.NewPrinter(message.MatchLanguage("en"))
+//	p.Println(123456.78) // Prints 123,456.78
 //
-//    p.Printf("%d ducks in a row", 4331) // Prints 4,331 ducks in a row
+//	p.Printf("%d ducks in a row", 4331) // Prints 4,331 ducks in a row
 //
-//    p := message.NewPrinter(message.MatchLanguage("nl"))
-//    p.Printf("Hoogte: %.1f meter", 1244.9) // Prints Hoogte: 1,244.9 meter
+//	p := message.NewPrinter(message.MatchLanguage("nl"))
+//	p.Printf("Hoogte: %.1f meter", 1244.9) // Prints Hoogte: 1.244,9 meter
 //
-//    p := message.NewPrinter(message.MatchLanguage("bn"))
-//    p.Println(123456.78) // Prints ১,২৩,৪৫৬.৭৮
+//	p := message.NewPrinter(message.MatchLanguage("bn"))
+//	p.Println(123456.78) // Prints ১,২৩,৪৫৬.৭৮
 //
 // Printer currently supports numbers and specialized types for which packages
 // exist in x/text. Other builtin types such as time.Time and slices are
@@ -35,8 +34,7 @@
 //
 // See package fmt for more options.
 //
-//
-// Translation
+// # Translation
 //
 // The format strings that are passed to Printf, Sprintf, Fprintf, or Errorf
 // are used as keys to look up translations for the specified languages.
@@ -44,34 +42,36 @@
 //
 // One can use arbitrary keys to distinguish between otherwise ambiguous
 // strings:
-//    p := message.NewPrinter(language.English)
-//    p.Printf("archive(noun)")  // Prints "archive"
-//    p.Printf("archive(verb)")  // Prints "archive"
 //
-//    p := message.NewPrinter(language.German)
-//    p.Printf("archive(noun)")  // Prints "Archiv"
-//    p.Printf("archive(verb)")  // Prints "archivieren"
+//	p := message.NewPrinter(language.English)
+//	p.Printf("archive(noun)")  // Prints "archive"
+//	p.Printf("archive(verb)")  // Prints "archive"
+//
+//	p := message.NewPrinter(language.German)
+//	p.Printf("archive(noun)")  // Prints "Archiv"
+//	p.Printf("archive(verb)")  // Prints "archivieren"
 //
 // To retain the fallback functionality, use Key:
-//    p.Printf(message.Key("archive(noun)", "archive"))
-//    p.Printf(message.Key("archive(verb)", "archive"))
 //
+//	p.Printf(message.Key("archive(noun)", "archive"))
+//	p.Printf(message.Key("archive(verb)", "archive"))
 //
-// Translation Pipeline
+// # Translation Pipeline
 //
 // Format strings that contain text need to be translated to support different
 // locales. The first step is to extract strings that need to be translated.
 //
 // 1. Install gotext
-//    go get -u golang.org/x/text/cmd/gotext
-//    gotext -help
+//
+//	go get -u golang.org/x/text/cmd/gotext
+//	gotext -help
 //
 // 2. Mark strings in your source to be translated by using message.Printer,
 // instead of the functions of the fmt package.
 //
 // 3. Extract the strings from your source
 //
-//    gotext extract
+//	gotext extract
 //
 // The output will be written to the textdata directory.
 //
@@ -89,13 +89,11 @@
 // see also package golang.org/x/text/message/catalog can be used to implement
 // either dynamic or static loading of messages.
 //
-//
-// Plural and Gender Forms
+// # Plural and Gender Forms
 //
 // Translated messages can vary based on the plural and gender forms of
 // substitution values. In general, it is up to the translators to provide
 // alternative translations for such forms. See the packages in
 // golang.org/x/text/feature and golang.org/x/text/message/catalog for more
 // information.
-//
 package message
diff --git a/number/doc.go b/number/doc.go
index 2ad8d431a..876623086 100644
--- a/number/doc.go
+++ b/number/doc.go
@@ -9,19 +9,18 @@
 // builtin Go types and anything that implements the Convert interface
 // (currently internal).
 //
-//    p := message.NewPrinter(language.English)
+//	p := message.NewPrinter(language.English)
 //
-//    p.Printf("%v bottles of beer on the wall.", number.Decimal(1234))
-//    // Prints: 1,234 bottles of beer on the wall.
+//	p.Printf("%v bottles of beer on the wall.", number.Decimal(1234))
+//	// Prints: 1,234 bottles of beer on the wall.
 //
-//    p.Printf("%v of gophers lose too much fur", number.Percent(0.12))
-//    // Prints: 12% of gophers lose too much fur.
+//	p.Printf("%v of gophers lose too much fur", number.Percent(0.12))
+//	// Prints: 12% of gophers lose too much fur.
 //
-//    p := message.NewPrinter(language.Dutch)
-//
-//    p.Printf("There are %v bikes per household.", number.Decimal(1.2))
-//    // Prints: Er zijn 1,2 fietsen per huishouden.
+//	p := message.NewPrinter(language.Dutch)
 //
+//	p.Printf("There are %v bikes per household.", number.Decimal(1.2))
+//	// Prints: Er zijn 1,2 fietsen per huishouden.
 //
 // The width and scale specified in the formatting directives override the
 // configuration of the formatter.
diff --git a/unicode/bidi/core.go b/unicode/bidi/core.go
index fde188a33..9d2ae547b 100644
--- a/unicode/bidi/core.go
+++ b/unicode/bidi/core.go
@@ -193,14 +193,14 @@ func (p *paragraph) run() {
 //
 // At the end of this function:
 //
-//  - The member variable matchingPDI is set to point to the index of the
-//    matching PDI character for each isolate initiator character. If there is
-//    no matching PDI, it is set to the length of the input text. For other
-//    characters, it is set to -1.
-//  - The member variable matchingIsolateInitiator is set to point to the
-//    index of the matching isolate initiator character for each PDI character.
-//    If there is no matching isolate initiator, or the character is not a PDI,
-//    it is set to -1.
+//   - The member variable matchingPDI is set to point to the index of the
+//     matching PDI character for each isolate initiator character. If there is
+//     no matching PDI, it is set to the length of the input text. For other
+//     characters, it is set to -1.
+//   - The member variable matchingIsolateInitiator is set to point to the
+//     index of the matching isolate initiator character for each PDI character.
+//     If there is no matching isolate initiator, or the character is not a PDI,
+//     it is set to -1.
 func (p *paragraph) determineMatchingIsolates() {
 	p.matchingPDI = make([]int, p.Len())
 	p.matchingIsolateInitiator = make([]int, p.Len())
@@ -435,7 +435,7 @@ func maxLevel(a, b level) level {
 }
 
 // Rule X10, second bullet: Determine the start-of-sequence (sos) and end-of-sequence (eos) types,
-// 			 either L or R, for each isolating run sequence.
+// either L or R, for each isolating run sequence.
 func (p *paragraph) isolatingRunSequence(indexes []int) *isolatingRunSequence {
 	length := len(indexes)
 	types := make([]Class, length)
@@ -905,7 +905,7 @@ func (p *paragraph) getLevels(linebreaks []int) []level {
 // Lines are concatenated from left to right. So for example, the fifth
 // character from the left on the third line is
 //
-// 		getReordering(linebreaks)[linebreaks[1] + 4]
+//	getReordering(linebreaks)[linebreaks[1] + 4]
 //
 // (linebreaks[1] is the position after the last character of the second
 // line, which is also the index of the first character on the third line,
diff --git a/unicode/cldr/collate.go b/unicode/cldr/collate.go
index 27c5bac9a..056fe7f7f 100644
--- a/unicode/cldr/collate.go
+++ b/unicode/cldr/collate.go
@@ -98,9 +98,13 @@ func processRules(p RuleProcessor, s string) (err error) {
 }
 
 // parseSpecialAnchor parses the anchor syntax which is either of the form
-//    ['before' <level>] <anchor>
+//
+//	['before' <level>] <anchor>
+//
 // or
-//    [<label>]
+//
+//	[<label>]
+//
 // The starting should already be consumed.
 func parseSpecialAnchor(p RuleProcessor, s string) (tail string, err error) {
 	i := strings.IndexByte(s, ']')
diff --git a/unicode/norm/forminfo.go b/unicode/norm/forminfo.go
index 526c7033a..d69ccb4f9 100644
--- a/unicode/norm/forminfo.go
+++ b/unicode/norm/forminfo.go
@@ -110,10 +110,11 @@ func (p Properties) BoundaryAfter() bool {
 }
 
 // We pack quick check data in 4 bits:
-//   5:    Combines forward  (0 == false, 1 == true)
-//   4..3: NFC_QC Yes(00), No (10), or Maybe (11)
-//   2:    NFD_QC Yes (0) or No (1). No also means there is a decomposition.
-//   1..0: Number of trailing non-starters.
+//
+//	5:    Combines forward  (0 == false, 1 == true)
+//	4..3: NFC_QC Yes(00), No (10), or Maybe (11)
+//	2:    NFD_QC Yes (0) or No (1). No also means there is a decomposition.
+//	1..0: Number of trailing non-starters.
 //
 // When all 4 bits are zero, the character is inert, meaning it is never
 // influenced by normalization.
diff --git a/unicode/norm/maketables.go b/unicode/norm/maketables.go
index 0d24d2117..dd05b6f4a 100644
--- a/unicode/norm/maketables.go
+++ b/unicode/norm/maketables.go
@@ -132,8 +132,10 @@ func (c Char) String() string {
 }
 
 // In UnicodeData.txt, some ranges are marked like this:
+//
 //	3400;<CJK Ideograph Extension A, First>;Lo;0;L;;;;;N;;;;;
 //	4DB5;<CJK Ideograph Extension A, Last>;Lo;0;L;;;;;N;;;;;
+//
 // parseCharacter keeps a state variable indicating the weirdness.
 type State int
 
diff --git a/unicode/norm/normalize.go b/unicode/norm/normalize.go
index 95efcf26e..4747ad07a 100644
--- a/unicode/norm/normalize.go
+++ b/unicode/norm/normalize.go
@@ -18,16 +18,17 @@ import (
 // A Form denotes a canonical representation of Unicode code points.
 // The Unicode-defined normalization and equivalence forms are:
 //
-//   NFC   Unicode Normalization Form C
-//   NFD   Unicode Normalization Form D
-//   NFKC  Unicode Normalization Form KC
-//   NFKD  Unicode Normalization Form KD
+//	NFC   Unicode Normalization Form C
+//	NFD   Unicode Normalization Form D
+//	NFKC  Unicode Normalization Form KC
+//	NFKD  Unicode Normalization Form KD
 //
 // For a Form f, this documentation uses the notation f(x) to mean
 // the bytes or string x converted to the given form.
 // A position n in x is called a boundary if conversion to the form can
 // proceed independently on both sides:
-//   f(x) == append(f(x[0:n]), f(x[n:])...)
+//
+//	f(x) == append(f(x[0:n]), f(x[n:])...)
 //
 // References: https://unicode.org/reports/tr15/ and
 // https://unicode.org/notes/tn5/.
diff --git a/width/tables10.0.0.go b/width/tables10.0.0.go
index 186b1d4ef..cd9d91caf 100644
--- a/width/tables10.0.0.go
+++ b/width/tables10.0.0.go
@@ -1146,21 +1146,31 @@ var widthIndex = [1408]uint8{
 }
 
 // inverseData contains 4-byte entries of the following format:
-//   <length> <modified UTF-8-encoded rune> <0 padding>
+//
+//	<length> <modified UTF-8-encoded rune> <0 padding>
+//
 // The last byte of the UTF-8-encoded rune is xor-ed with the last byte of the
 // UTF-8 encoding of the original rune. Mappings often have the following
 // pattern:
-//   Ａ -> A  (U+FF21 -> U+0041)
-//   Ｂ -> B  (U+FF22 -> U+0042)
-//   ...
+//
+//	Ａ -> A  (U+FF21 -> U+0041)
+//	Ｂ -> B  (U+FF22 -> U+0042)
+//	...
+//
 // By xor-ing the last byte the same entry can be shared by many mappings. This
 // reduces the total number of distinct entries by about two thirds.
 // The resulting entry for the aforementioned mappings is
-//   { 0x01, 0xE0, 0x00, 0x00 }
+//
+//	{ 0x01, 0xE0, 0x00, 0x00 }
+//
 // Using this entry to map U+FF21 (UTF-8 [EF BC A1]), we get
-//   E0 ^ A1 = 41.
+//
+//	E0 ^ A1 = 41.
+//
 // Similarly, for U+FF22 (UTF-8 [EF BC A2]), we get
-//   E0 ^ A2 = 42.
+//
+//	E0 ^ A2 = 42.
+//
 // Note that because of the xor-ing, the byte sequence stored in the entry is
 // not valid UTF-8.
 var inverseData = [150][4]byte{
diff --git a/width/tables11.0.0.go b/width/tables11.0.0.go
index 990f7622f..327eaef9b 100644
--- a/width/tables11.0.0.go
+++ b/width/tables11.0.0.go
@@ -1158,21 +1158,31 @@ var widthIndex = [1408]uint8{
 }
 
 // inverseData contains 4-byte entries of the following format:
-//   <length> <modified UTF-8-encoded rune> <0 padding>
+//
+//	<length> <modified UTF-8-encoded rune> <0 padding>
+//
 // The last byte of the UTF-8-encoded rune is xor-ed with the last byte of the
 // UTF-8 encoding of the original rune. Mappings often have the following
 // pattern:
-//   Ａ -> A  (U+FF21 -> U+0041)
-//   Ｂ -> B  (U+FF22 -> U+0042)
-//   ...
+//
+//	Ａ -> A  (U+FF21 -> U+0041)
+//	Ｂ -> B  (U+FF22 -> U+0042)
+//	...
+//
 // By xor-ing the last byte the same entry can be shared by many mappings. This
 // reduces the total number of distinct entries by about two thirds.
 // The resulting entry for the aforementioned mappings is
-//   { 0x01, 0xE0, 0x00, 0x00 }
+//
+//	{ 0x01, 0xE0, 0x00, 0x00 }
+//
 // Using this entry to map U+FF21 (UTF-8 [EF BC A1]), we get
-//   E0 ^ A1 = 41.
+//
+//	E0 ^ A1 = 41.
+//
 // Similarly, for U+FF22 (UTF-8 [EF BC A2]), we get
-//   E0 ^ A2 = 42.
+//
+//	E0 ^ A2 = 42.
+//
 // Note that because of the xor-ing, the byte sequence stored in the entry is
 // not valid UTF-8.
 var inverseData = [150][4]byte{
diff --git a/width/tables12.0.0.go b/width/tables12.0.0.go
index 85296297e..5c14ade6d 100644
--- a/width/tables12.0.0.go
+++ b/width/tables12.0.0.go
@@ -1178,21 +1178,31 @@ var widthIndex = [1408]uint8{
 }
 
 // inverseData contains 4-byte entries of the following format:
-//   <length> <modified UTF-8-encoded rune> <0 padding>
+//
+//	<length> <modified UTF-8-encoded rune> <0 padding>
+//
 // The last byte of the UTF-8-encoded rune is xor-ed with the last byte of the
 // UTF-8 encoding of the original rune. Mappings often have the following
 // pattern:
-//   Ａ -> A  (U+FF21 -> U+0041)
-//   Ｂ -> B  (U+FF22 -> U+0042)
-//   ...
+//
+//	Ａ -> A  (U+FF21 -> U+0041)
+//	Ｂ -> B  (U+FF22 -> U+0042)
+//	...
+//
 // By xor-ing the last byte the same entry can be shared by many mappings. This
 // reduces the total number of distinct entries by about two thirds.
 // The resulting entry for the aforementioned mappings is
-//   { 0x01, 0xE0, 0x00, 0x00 }
+//
+//	{ 0x01, 0xE0, 0x00, 0x00 }
+//
 // Using this entry to map U+FF21 (UTF-8 [EF BC A1]), we get
-//   E0 ^ A1 = 41.
+//
+//	E0 ^ A1 = 41.
+//
 // Similarly, for U+FF22 (UTF-8 [EF BC A2]), we get
-//   E0 ^ A2 = 42.
+//
+//	E0 ^ A2 = 42.
+//
 // Note that because of the xor-ing, the byte sequence stored in the entry is
 // not valid UTF-8.
 var inverseData = [150][4]byte{
diff --git a/width/tables13.0.0.go b/width/tables13.0.0.go
index bac3f1aee..ab258e384 100644
--- a/width/tables13.0.0.go
+++ b/width/tables13.0.0.go
@@ -1179,21 +1179,31 @@ var widthIndex = [1408]uint8{
 }
 
 // inverseData contains 4-byte entries of the following format:
-//   <length> <modified UTF-8-encoded rune> <0 padding>
+//
+//	<length> <modified UTF-8-encoded rune> <0 padding>
+//
 // The last byte of the UTF-8-encoded rune is xor-ed with the last byte of the
 // UTF-8 encoding of the original rune. Mappings often have the following
 // pattern:
-//   Ａ -> A  (U+FF21 -> U+0041)
-//   Ｂ -> B  (U+FF22 -> U+0042)
-//   ...
+//
+//	Ａ -> A  (U+FF21 -> U+0041)
+//	Ｂ -> B  (U+FF22 -> U+0042)
+//	...
+//
 // By xor-ing the last byte the same entry can be shared by many mappings. This
 // reduces the total number of distinct entries by about two thirds.
 // The resulting entry for the aforementioned mappings is
-//   { 0x01, 0xE0, 0x00, 0x00 }
+//
+//	{ 0x01, 0xE0, 0x00, 0x00 }
+//
 // Using this entry to map U+FF21 (UTF-8 [EF BC A1]), we get
-//   E0 ^ A1 = 41.
+//
+//	E0 ^ A1 = 41.
+//
 // Similarly, for U+FF22 (UTF-8 [EF BC A2]), we get
-//   E0 ^ A2 = 42.
+//
+//	E0 ^ A2 = 42.
+//
 // Note that because of the xor-ing, the byte sequence stored in the entry is
 // not valid UTF-8.
 var inverseData = [150][4]byte{
diff --git a/width/tables9.0.0.go b/width/tables9.0.0.go
index b3db84f6f..6781f3d96 100644
--- a/width/tables9.0.0.go
+++ b/width/tables9.0.0.go
@@ -1114,21 +1114,31 @@ var widthIndex = [1408]uint8{
 }
 
 // inverseData contains 4-byte entries of the following format:
-//   <length> <modified UTF-8-encoded rune> <0 padding>
+//
+//	<length> <modified UTF-8-encoded rune> <0 padding>
+//
 // The last byte of the UTF-8-encoded rune is xor-ed with the last byte of the
 // UTF-8 encoding of the original rune. Mappings often have the following
 // pattern:
-//   Ａ -> A  (U+FF21 -> U+0041)
-//   Ｂ -> B  (U+FF22 -> U+0042)
-//   ...
+//
+//	Ａ -> A  (U+FF21 -> U+0041)
+//	Ｂ -> B  (U+FF22 -> U+0042)
+//	...
+//
 // By xor-ing the last byte the same entry can be shared by many mappings. This
 // reduces the total number of distinct entries by about two thirds.
 // The resulting entry for the aforementioned mappings is
-//   { 0x01, 0xE0, 0x00, 0x00 }
+//
+//	{ 0x01, 0xE0, 0x00, 0x00 }
+//
 // Using this entry to map U+FF21 (UTF-8 [EF BC A1]), we get
-//   E0 ^ A1 = 41.
+//
+//	E0 ^ A1 = 41.
+//
 // Similarly, for U+FF22 (UTF-8 [EF BC A2]), we get
-//   E0 ^ A2 = 42.
+//
+//	E0 ^ A2 = 42.
+//
 // Note that because of the xor-ing, the byte sequence stored in the entry is
 // not valid UTF-8.
 var inverseData = [150][4]byte{

From 78819d01d041a94e055bbaa2d95e5e4d49e8f8a0 Mon Sep 17 00:00:00 2001
From: Ian Lance Taylor <iant@golang.org>
Date: Mon, 25 Apr 2022 15:01:07 -0700
Subject: [PATCH 31/40] go.mod: update to golang.org/x/tools v0.1.10

go get -u golang.org/x/tools
go mod tidy

For golang/go#50558
Fixes golang/go#52552

Change-Id: I233aa90922fc23800563fd05beb4be6f7e87cf5b
Reviewed-on: https://go-review.googlesource.com/c/text/+/402254
Run-TryBot: Ian Lance Taylor <iant@golang.org>
TryBot-Result: Gopher Robot <gobot@golang.org>
Reviewed-by: Robert Findley <rfindley@google.com>
Auto-Submit: Ian Lance Taylor <iant@google.com>
Reviewed-by: Ian Lance Taylor <iant@google.com>
Run-TryBot: Ian Lance Taylor <iant@google.com>
---
 go.mod |  6 +++---
 go.sum | 24 +++++++++++++-----------
 2 files changed, 16 insertions(+), 14 deletions(-)

diff --git a/go.mod b/go.mod
index 32d3aa025..3737e1a8f 100644
--- a/go.mod
+++ b/go.mod
@@ -1,10 +1,10 @@
 module golang.org/x/text
 
-require golang.org/x/tools v0.1.7
+require golang.org/x/tools v0.1.10
 
 require (
-	golang.org/x/mod v0.4.2 // indirect
-	golang.org/x/sys v0.0.0-20210809222454-d867a43fc93e // indirect
+	golang.org/x/mod v0.6.0-dev.0.20220106191415-9b9b3d81d5e3 // indirect
+	golang.org/x/sys v0.0.0-20211019181941-9d821ace8654 // indirect
 	golang.org/x/xerrors v0.0.0-20200804184101-5ec99f83aff1 // indirect
 )
 
diff --git a/go.sum b/go.sum
index 13ba81505..3f735d1c2 100644
--- a/go.sum
+++ b/go.sum
@@ -1,26 +1,28 @@
-github.com/yuin/goldmark v1.4.0/go.mod h1:mwnBkeHKe2W/ZEtQ+71ViKU8L12m81fl3OWwC1Zlc8k=
+github.com/yuin/goldmark v1.4.1/go.mod h1:mwnBkeHKe2W/ZEtQ+71ViKU8L12m81fl3OWwC1Zlc8k=
 golang.org/x/crypto v0.0.0-20190308221718-c2843e01d9a2/go.mod h1:djNgcEr1/C05ACkg1iLfiJU5Ep61QUkGW8qpdssI0+w=
-golang.org/x/crypto v0.0.0-20191011191535-87dc89f01550/go.mod h1:yigFU9vqHzYiE8UmvKecakEJjdnWj3jj499lnFckfCI=
-golang.org/x/mod v0.4.2 h1:Gz96sIWK3OalVv/I/qNygP42zyoKp3xptRVCWRFEBvo=
-golang.org/x/mod v0.4.2/go.mod h1:s0Qsj1ACt9ePp/hMypM3fl4fZqREWJwdYDEqhRiZZUA=
-golang.org/x/net v0.0.0-20190404232315-eb5bcb51f2a3/go.mod h1:t9HGtf8HONx5eT2rtn7q6eTqICYqUVnKs3thJo3Qplg=
+golang.org/x/crypto v0.0.0-20210921155107-089bfa567519/go.mod h1:GvvjBRRGRdwPK5ydBHafDWAxML/pGHZbMvKqRZ5+Abc=
+golang.org/x/mod v0.6.0-dev.0.20220106191415-9b9b3d81d5e3 h1:kQgndtyPBW/JIYERgdxfwMYh3AVStj88WQTlNDi2a+o=
+golang.org/x/mod v0.6.0-dev.0.20220106191415-9b9b3d81d5e3/go.mod h1:3p9vT2HGsQu2K1YbXdKPJLVgG5VJdoTa1poYQBtP1AY=
 golang.org/x/net v0.0.0-20190620200207-3b0461eec859/go.mod h1:z5CRVTTTmAJ677TzLLGU+0bjPO0LkuOLi4/5GtJWs/s=
-golang.org/x/net v0.0.0-20210805182204-aaa1db679c0d/go.mod h1:9nx3DQGgdP8bBQD5qxJ1jj9UTztislL4KSBs9R2vV5Y=
+golang.org/x/net v0.0.0-20210226172049-e18ecbb05110/go.mod h1:m0MpNAwzfU5UDzcl9v0D8zg8gWTRqZa9RBIspLL5mdg=
+golang.org/x/net v0.0.0-20211015210444-4f30a5c0130f/go.mod h1:9nx3DQGgdP8bBQD5qxJ1jj9UTztislL4KSBs9R2vV5Y=
 golang.org/x/sync v0.0.0-20190423024810-112230192c58/go.mod h1:RxMgew5VJxzue5/jJTE5uejpjVlOe/izrB70Jof72aM=
 golang.org/x/sync v0.0.0-20210220032951-036812b2e83c/go.mod h1:RxMgew5VJxzue5/jJTE5uejpjVlOe/izrB70Jof72aM=
 golang.org/x/sys v0.0.0-20190215142949-d0b11bdaac8a/go.mod h1:STP8DvDyc/dI5b8T5hshtkjS+E42TnysNCUPdjciGhY=
-golang.org/x/sys v0.0.0-20190412213103-97732733099d/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs=
 golang.org/x/sys v0.0.0-20201119102817-f84b799fce68/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs=
 golang.org/x/sys v0.0.0-20210423082822-04245dca01da/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs=
-golang.org/x/sys v0.0.0-20210809222454-d867a43fc93e h1:WUoyKPm6nCo1BnNUvPGnFG3T5DUVem42yDJZZ4CNxMA=
-golang.org/x/sys v0.0.0-20210809222454-d867a43fc93e/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
+golang.org/x/sys v0.0.0-20210615035016-665e8c7367d1/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
+golang.org/x/sys v0.0.0-20211019181941-9d821ace8654 h1:id054HUawV2/6IGm2IV8KZQjqtwAOo2CYlOToYqa0d0=
+golang.org/x/sys v0.0.0-20211019181941-9d821ace8654/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
 golang.org/x/term v0.0.0-20201126162022-7de9c90e9dd1/go.mod h1:bj7SfCRtBDWHUb9snDiAeCFNEtKQo2Wmx5Cou7ajbmo=
 golang.org/x/text v0.3.0/go.mod h1:NqM8EUOU14njkJ3fqMW+pc6Ldnwhi/IjpwHt7yyuwOQ=
+golang.org/x/text v0.3.3/go.mod h1:5Zoc/QRtKVWzQhOtBMvqHzDpF6irO9z98xDceosuGiQ=
 golang.org/x/text v0.3.6/go.mod h1:5Zoc/QRtKVWzQhOtBMvqHzDpF6irO9z98xDceosuGiQ=
+golang.org/x/text v0.3.7/go.mod h1:u+2+/6zg+i71rQMx5EYifcz6MCKuco9NR6JIITiCfzQ=
 golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e/go.mod h1:n7NCudcB/nEzxVGmLbDWY5pfWTLqBcC2KZ6jyYvM4mQ=
 golang.org/x/tools v0.0.0-20191119224855-298f0cb1881e/go.mod h1:b+2E5dAYhXwXZwtnZ6UAqBI28+e2cm9otk0dWdXHAEo=
-golang.org/x/tools v0.1.7 h1:6j8CgantCy3yc8JGBqkDLMKWqZ0RDU2g1HVgacojGWQ=
-golang.org/x/tools v0.1.7/go.mod h1:LGqMHiF4EqQNHR1JncWGqT5BVaXmza+X+BDGol+dOxo=
+golang.org/x/tools v0.1.10 h1:QjFRCZxdOhBJ/UNgnBZLbNV13DlbnK0quyivTnXJM20=
+golang.org/x/tools v0.1.10/go.mod h1:Uh6Zz+xoGYZom868N8YTex3t7RhtHDBrE8Gzo9bV56E=
 golang.org/x/xerrors v0.0.0-20190717185122-a985d3407aa7/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=
 golang.org/x/xerrors v0.0.0-20191011141410-1b5146add898/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=
 golang.org/x/xerrors v0.0.0-20200804184101-5ec99f83aff1 h1:go1bK/D/BFZV2I8cIQd1NKEZ+0owSTG1fDTci4IqFcE=

From ea49e3e2d5b3f1518081d8bc53ffefc8bc60ecec Mon Sep 17 00:00:00 2001
From: "Bryan C. Mills" <bcmills@google.com>
Date: Wed, 4 May 2022 14:38:27 -0400
Subject: [PATCH 32/40] go.mod: update x/tools to HEAD

x/tools/go/ssa is used by message/pipeline, and at its latest release
does not support generics. However, x/tools/go/ssa does seem to
support generics at head; upgrade to fix a build break if Go 1.19
ships with generic APIs in any imported packages.

Fixes golang/go#52711.

Change-Id: I75492dbcdfef9024ec2bc324f44c01a4239e1efd
Reviewed-on: https://go-review.googlesource.com/c/text/+/403852
TryBot-Result: Gopher Robot <gobot@golang.org>
Reviewed-by: Ian Lance Taylor <iant@google.com>
Run-TryBot: Bryan Mills <bcmills@google.com>
Auto-Submit: Bryan Mills <bcmills@google.com>
---
 go.mod |  5 ++---
 go.sum | 11 ++++-------
 2 files changed, 6 insertions(+), 10 deletions(-)

diff --git a/go.mod b/go.mod
index 3737e1a8f..21572583a 100644
--- a/go.mod
+++ b/go.mod
@@ -1,11 +1,10 @@
 module golang.org/x/text
 
-require golang.org/x/tools v0.1.10
+require golang.org/x/tools v0.1.11-0.20220504162446-54c7ba520b92
 
 require (
-	golang.org/x/mod v0.6.0-dev.0.20220106191415-9b9b3d81d5e3 // indirect
+	golang.org/x/mod v0.6.0-dev.0.20220419223038-86c51ed26bb4 // indirect
 	golang.org/x/sys v0.0.0-20211019181941-9d821ace8654 // indirect
-	golang.org/x/xerrors v0.0.0-20200804184101-5ec99f83aff1 // indirect
 )
 
 go 1.17
diff --git a/go.sum b/go.sum
index 3f735d1c2..7e13ec7fd 100644
--- a/go.sum
+++ b/go.sum
@@ -1,8 +1,8 @@
 github.com/yuin/goldmark v1.4.1/go.mod h1:mwnBkeHKe2W/ZEtQ+71ViKU8L12m81fl3OWwC1Zlc8k=
 golang.org/x/crypto v0.0.0-20190308221718-c2843e01d9a2/go.mod h1:djNgcEr1/C05ACkg1iLfiJU5Ep61QUkGW8qpdssI0+w=
 golang.org/x/crypto v0.0.0-20210921155107-089bfa567519/go.mod h1:GvvjBRRGRdwPK5ydBHafDWAxML/pGHZbMvKqRZ5+Abc=
-golang.org/x/mod v0.6.0-dev.0.20220106191415-9b9b3d81d5e3 h1:kQgndtyPBW/JIYERgdxfwMYh3AVStj88WQTlNDi2a+o=
-golang.org/x/mod v0.6.0-dev.0.20220106191415-9b9b3d81d5e3/go.mod h1:3p9vT2HGsQu2K1YbXdKPJLVgG5VJdoTa1poYQBtP1AY=
+golang.org/x/mod v0.6.0-dev.0.20220419223038-86c51ed26bb4 h1:6zppjxzCulZykYSLyVDYbneBfbaBIQPYMevg0bEwv2s=
+golang.org/x/mod v0.6.0-dev.0.20220419223038-86c51ed26bb4/go.mod h1:jJ57K6gSWd91VN4djpZkiMVwK6gcyfeH4XE8wZrZaV4=
 golang.org/x/net v0.0.0-20190620200207-3b0461eec859/go.mod h1:z5CRVTTTmAJ677TzLLGU+0bjPO0LkuOLi4/5GtJWs/s=
 golang.org/x/net v0.0.0-20210226172049-e18ecbb05110/go.mod h1:m0MpNAwzfU5UDzcl9v0D8zg8gWTRqZa9RBIspLL5mdg=
 golang.org/x/net v0.0.0-20211015210444-4f30a5c0130f/go.mod h1:9nx3DQGgdP8bBQD5qxJ1jj9UTztislL4KSBs9R2vV5Y=
@@ -21,9 +21,6 @@ golang.org/x/text v0.3.6/go.mod h1:5Zoc/QRtKVWzQhOtBMvqHzDpF6irO9z98xDceosuGiQ=
 golang.org/x/text v0.3.7/go.mod h1:u+2+/6zg+i71rQMx5EYifcz6MCKuco9NR6JIITiCfzQ=
 golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e/go.mod h1:n7NCudcB/nEzxVGmLbDWY5pfWTLqBcC2KZ6jyYvM4mQ=
 golang.org/x/tools v0.0.0-20191119224855-298f0cb1881e/go.mod h1:b+2E5dAYhXwXZwtnZ6UAqBI28+e2cm9otk0dWdXHAEo=
-golang.org/x/tools v0.1.10 h1:QjFRCZxdOhBJ/UNgnBZLbNV13DlbnK0quyivTnXJM20=
-golang.org/x/tools v0.1.10/go.mod h1:Uh6Zz+xoGYZom868N8YTex3t7RhtHDBrE8Gzo9bV56E=
+golang.org/x/tools v0.1.11-0.20220504162446-54c7ba520b92 h1:bKfKpfzAxCZ+/Th2EbSQcaLiq8xDP3n33SlwYkfoOgM=
+golang.org/x/tools v0.1.11-0.20220504162446-54c7ba520b92/go.mod h1:SgwaegtQh8clINPpECJMqnxLv9I09HLqnW3RMqW0CA4=
 golang.org/x/xerrors v0.0.0-20190717185122-a985d3407aa7/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=
-golang.org/x/xerrors v0.0.0-20191011141410-1b5146add898/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=
-golang.org/x/xerrors v0.0.0-20200804184101-5ec99f83aff1 h1:go1bK/D/BFZV2I8cIQd1NKEZ+0owSTG1fDTci4IqFcE=
-golang.org/x/xerrors v0.0.0-20200804184101-5ec99f83aff1/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=

From b4bca84b03619dba00657375259024a7f8ae6712 Mon Sep 17 00:00:00 2001
From: Kevin Smith <ksmith.nop@gmail.com>
Date: Thu, 18 Feb 2021 03:11:56 +0000
Subject: [PATCH 33/40] language/display: fix Tag method comment

Minor fix to comment.

Change-Id: I181de709f02faf433e97f38208039bf789e6b71d
GitHub-Last-Rev: fd7f6501c5c677ba7f1d6779bb88cbf82c9a6f10
GitHub-Pull-Request: golang/text#19
Reviewed-on: https://go-review.googlesource.com/c/text/+/293469
Reviewed-by: Ian Lance Taylor <iant@google.com>
Reviewed-by: Marcel van Lohuizen <mpvl@golang.org>
Run-TryBot: Ian Lance Taylor <iant@google.com>
Auto-Submit: Ian Lance Taylor <iant@google.com>
Run-TryBot: Marcel van Lohuizen <mpvl@golang.org>
Reviewed-by: Carlos Amedee <carlos@golang.org>
TryBot-Result: Gopher Robot <gobot@golang.org>
---
 language/display/display.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/language/display/display.go b/language/display/display.go
index d043da907..31bdd6c6b 100644
--- a/language/display/display.go
+++ b/language/display/display.go
@@ -85,7 +85,7 @@ func Script(script interface{}) Formatter {
 	return Formatter{scriptFunc, script}
 }
 
-// Script returns a Formatter that renders the name for tag in the current
+// Tag returns a Formatter that renders the name for tag in the current
 // language. tag may be a language.Tag.
 // It renders tag in the default language if no translation for the current
 // language is supported.

From d03b41800055b01e3895b1e047af09733c93bf63 Mon Sep 17 00:00:00 2001
From: Russ Cox <rsc@golang.org>
Date: Fri, 22 Jul 2022 11:11:07 -0400
Subject: [PATCH 34/40] A+C: delete AUTHORS and CONTRIBUTORS

In 2009, Google's open-source lawyers asked us to create the AUTHORS
file to define "The Go Authors", and the CONTRIBUTORS file was in
keeping with open source best practices of the time.

Re-reviewing our repos now in 2022, the open-source lawyers are
comfortable with source control history taking the place of the
AUTHORS file, and most open source projects no longer maintain
CONTRIBUTORS files.

To ease maintenance, remove AUTHORS and CONTRIBUTORS from all repos.

For golang/go#53961.

Change-Id: I3abeb5f16d9a9446e16a3a5318d22a9c622db0b6
Reviewed-on: https://go-review.googlesource.com/c/text/+/418923
TryBot-Result: Gopher Robot <gobot@golang.org>
Reviewed-by: David Chase <drchase@google.com>
Run-TryBot: Russ Cox <rsc@golang.org>
---
 AUTHORS      | 3 ---
 CONTRIBUTORS | 3 ---
 2 files changed, 6 deletions(-)
 delete mode 100644 AUTHORS
 delete mode 100644 CONTRIBUTORS

diff --git a/AUTHORS b/AUTHORS
deleted file mode 100644
index 15167cd74..000000000
--- a/AUTHORS
+++ /dev/null
@@ -1,3 +0,0 @@
-# This source code refers to The Go Authors for copyright purposes.
-# The master list of authors is in the main Go distribution,
-# visible at http://tip.golang.org/AUTHORS.
diff --git a/CONTRIBUTORS b/CONTRIBUTORS
deleted file mode 100644
index 1c4577e96..000000000
--- a/CONTRIBUTORS
+++ /dev/null
@@ -1,3 +0,0 @@
-# This source code was written by the Go contributors.
-# The master list of contributors is in the main Go distribution,
-# visible at http://tip.golang.org/CONTRIBUTORS.

From ba9b0e1d4b03523c708709935fbc961124b6967b Mon Sep 17 00:00:00 2001
From: Jaroslavs Samcuks <yarcat@gmail.com>
Date: Fri, 12 Aug 2022 18:16:46 +0000
Subject: [PATCH 35/40] go.mod: update x/tools to HEAD

go get -u golang.org/x/tools
go mod tidy

x/tools/go/ssa is used by message/pipeline. Generics instantiation in
x/tools@0.1.11 could be confused with container index. However,
x/tools/go/ssa does have it fixed in x/tools@0.1.12 (see golang/go#52834).
This change upgrades the required version to ensure that fewer users of
message/pipeline have issues.

Updates golang/go#54086

Change-Id: I03882a7bb2c75a8f16ef376d06f2cf714d39e7a2
GitHub-Last-Rev: 351404b6dbc98236eaba0532290bbd428beabcfd
GitHub-Pull-Request: golang/text#32
Reviewed-on: https://go-review.googlesource.com/c/text/+/422414
TryBot-Result: Gopher Robot <gobot@golang.org>
Run-TryBot: Tim King <taking@google.com>
Reviewed-by: Tim King <taking@google.com>
Reviewed-by: Peter Weinberger <pjw@google.com>
---
 go.mod |  4 ++--
 go.sum | 18 +++++++++---------
 2 files changed, 11 insertions(+), 11 deletions(-)

diff --git a/go.mod b/go.mod
index 21572583a..c47a02995 100644
--- a/go.mod
+++ b/go.mod
@@ -1,10 +1,10 @@
 module golang.org/x/text
 
-require golang.org/x/tools v0.1.11-0.20220504162446-54c7ba520b92
+require golang.org/x/tools v0.1.12
 
 require (
 	golang.org/x/mod v0.6.0-dev.0.20220419223038-86c51ed26bb4 // indirect
-	golang.org/x/sys v0.0.0-20211019181941-9d821ace8654 // indirect
+	golang.org/x/sys v0.0.0-20220722155257-8c9f86f7a55f // indirect
 )
 
 go 1.17
diff --git a/go.sum b/go.sum
index 7e13ec7fd..3ddae732d 100644
--- a/go.sum
+++ b/go.sum
@@ -1,26 +1,26 @@
-github.com/yuin/goldmark v1.4.1/go.mod h1:mwnBkeHKe2W/ZEtQ+71ViKU8L12m81fl3OWwC1Zlc8k=
+github.com/yuin/goldmark v1.4.13/go.mod h1:6yULJ656Px+3vBD8DxQVa3kxgyrAnzto9xy5taEt/CY=
 golang.org/x/crypto v0.0.0-20190308221718-c2843e01d9a2/go.mod h1:djNgcEr1/C05ACkg1iLfiJU5Ep61QUkGW8qpdssI0+w=
 golang.org/x/crypto v0.0.0-20210921155107-089bfa567519/go.mod h1:GvvjBRRGRdwPK5ydBHafDWAxML/pGHZbMvKqRZ5+Abc=
 golang.org/x/mod v0.6.0-dev.0.20220419223038-86c51ed26bb4 h1:6zppjxzCulZykYSLyVDYbneBfbaBIQPYMevg0bEwv2s=
 golang.org/x/mod v0.6.0-dev.0.20220419223038-86c51ed26bb4/go.mod h1:jJ57K6gSWd91VN4djpZkiMVwK6gcyfeH4XE8wZrZaV4=
 golang.org/x/net v0.0.0-20190620200207-3b0461eec859/go.mod h1:z5CRVTTTmAJ677TzLLGU+0bjPO0LkuOLi4/5GtJWs/s=
 golang.org/x/net v0.0.0-20210226172049-e18ecbb05110/go.mod h1:m0MpNAwzfU5UDzcl9v0D8zg8gWTRqZa9RBIspLL5mdg=
-golang.org/x/net v0.0.0-20211015210444-4f30a5c0130f/go.mod h1:9nx3DQGgdP8bBQD5qxJ1jj9UTztislL4KSBs9R2vV5Y=
+golang.org/x/net v0.0.0-20220722155237-a158d28d115b/go.mod h1:XRhObCWvk6IyKnWLug+ECip1KBveYUHfp+8e9klMJ9c=
 golang.org/x/sync v0.0.0-20190423024810-112230192c58/go.mod h1:RxMgew5VJxzue5/jJTE5uejpjVlOe/izrB70Jof72aM=
-golang.org/x/sync v0.0.0-20210220032951-036812b2e83c/go.mod h1:RxMgew5VJxzue5/jJTE5uejpjVlOe/izrB70Jof72aM=
+golang.org/x/sync v0.0.0-20220722155255-886fb9371eb4/go.mod h1:RxMgew5VJxzue5/jJTE5uejpjVlOe/izrB70Jof72aM=
 golang.org/x/sys v0.0.0-20190215142949-d0b11bdaac8a/go.mod h1:STP8DvDyc/dI5b8T5hshtkjS+E42TnysNCUPdjciGhY=
 golang.org/x/sys v0.0.0-20201119102817-f84b799fce68/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs=
-golang.org/x/sys v0.0.0-20210423082822-04245dca01da/go.mod h1:h1NjWce9XRLGQEsW7wpKNCjG9DtNlClVuFLEZdDNbEs=
 golang.org/x/sys v0.0.0-20210615035016-665e8c7367d1/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
-golang.org/x/sys v0.0.0-20211019181941-9d821ace8654 h1:id054HUawV2/6IGm2IV8KZQjqtwAOo2CYlOToYqa0d0=
-golang.org/x/sys v0.0.0-20211019181941-9d821ace8654/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
+golang.org/x/sys v0.0.0-20220520151302-bc2c85ada10a/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
+golang.org/x/sys v0.0.0-20220722155257-8c9f86f7a55f h1:v4INt8xihDGvnrfjMDVXGxw9wrfxYyCjk0KbXjhR55s=
+golang.org/x/sys v0.0.0-20220722155257-8c9f86f7a55f/go.mod h1:oPkhp1MJrh7nUepCBck5+mAzfO9JrbApNNgaTdGDITg=
 golang.org/x/term v0.0.0-20201126162022-7de9c90e9dd1/go.mod h1:bj7SfCRtBDWHUb9snDiAeCFNEtKQo2Wmx5Cou7ajbmo=
+golang.org/x/term v0.0.0-20210927222741-03fcf44c2211/go.mod h1:jbD1KX2456YbFQfuXm/mYQcufACuNUgVhRMnK/tPxf8=
 golang.org/x/text v0.3.0/go.mod h1:NqM8EUOU14njkJ3fqMW+pc6Ldnwhi/IjpwHt7yyuwOQ=
 golang.org/x/text v0.3.3/go.mod h1:5Zoc/QRtKVWzQhOtBMvqHzDpF6irO9z98xDceosuGiQ=
-golang.org/x/text v0.3.6/go.mod h1:5Zoc/QRtKVWzQhOtBMvqHzDpF6irO9z98xDceosuGiQ=
 golang.org/x/text v0.3.7/go.mod h1:u+2+/6zg+i71rQMx5EYifcz6MCKuco9NR6JIITiCfzQ=
 golang.org/x/tools v0.0.0-20180917221912-90fa682c2a6e/go.mod h1:n7NCudcB/nEzxVGmLbDWY5pfWTLqBcC2KZ6jyYvM4mQ=
 golang.org/x/tools v0.0.0-20191119224855-298f0cb1881e/go.mod h1:b+2E5dAYhXwXZwtnZ6UAqBI28+e2cm9otk0dWdXHAEo=
-golang.org/x/tools v0.1.11-0.20220504162446-54c7ba520b92 h1:bKfKpfzAxCZ+/Th2EbSQcaLiq8xDP3n33SlwYkfoOgM=
-golang.org/x/tools v0.1.11-0.20220504162446-54c7ba520b92/go.mod h1:SgwaegtQh8clINPpECJMqnxLv9I09HLqnW3RMqW0CA4=
+golang.org/x/tools v0.1.12 h1:VveCTK38A2rkS8ZqFY25HIDFscX5X9OoEhJd3quQmXU=
+golang.org/x/tools v0.1.12/go.mod h1:hNGJHUnrk76NpqgfD5Aqm5Crs+Hm0VOH/i9J2+nxYbc=
 golang.org/x/xerrors v0.0.0-20190717185122-a985d3407aa7/go.mod h1:I/5z698sn9Ka8TeJc9MKroUUfqBBauWjQqLJ2OPfmY0=

From b0ca10ff35f1325c7d0ac7830fe3f036bd72d8f9 Mon Sep 17 00:00:00 2001
From: Roland Shoemaker <roland@golang.org>
Date: Tue, 23 Mar 2021 09:37:45 -0700
Subject: [PATCH 36/40] internal/language: bump script types to uint16 and
 update registry

The IANA language-subtag-registry now contains more than 256 scripts,
causing the uint8 types to overflow during table generation. The
internal script types are bumped to uint16 which should be more than
enough.

Fixes golang/go#45093

Change-Id: I58184902e6652f488521d084fce6e0b424121825
Reviewed-on: https://go-review.googlesource.com/c/text/+/304029
TryBot-Result: Gopher Robot <gobot@golang.org>
Reviewed-by: Than McIntosh <thanm@google.com>
Run-TryBot: Roland Shoemaker <roland@golang.org>
Reviewed-by: Damien Neil <dneil@google.com>
Auto-Submit: Roland Shoemaker <roland@golang.org>
---
 encoding/htmlindex/tables.go        |   9 +
 encoding/ianaindex/tables.go        |  53 +-
 encoding/internal/identifier/mib.go |   8 +
 internal/language/compact/tables.go |   6 +-
 internal/language/gen.go            |  28 +-
 internal/language/language_test.go  |   4 +-
 internal/language/lookup.go         |   2 +-
 internal/language/tables.go         | 853 ++++++++++++++--------------
 language/tables.go                  |  18 +-
 unicode/norm/tables13.0.0.go        |   4 +-
 10 files changed, 507 insertions(+), 478 deletions(-)

diff --git a/encoding/htmlindex/tables.go b/encoding/htmlindex/tables.go
index f074e2c6d..9e6daa896 100644
--- a/encoding/htmlindex/tables.go
+++ b/encoding/htmlindex/tables.go
@@ -93,8 +93,11 @@ var canonical = [numEncodings]string{
 
 var nameMap = map[string]htmlEncoding{
 	"unicode-1-1-utf-8":   utf8,
+	"unicode11utf8":       utf8,
+	"unicode20utf8":       utf8,
 	"utf-8":               utf8,
 	"utf8":                utf8,
+	"x-unicode20utf8":     utf8,
 	"866":                 ibm866,
 	"cp866":               ibm866,
 	"csibm866":            ibm866,
@@ -307,7 +310,13 @@ var nameMap = map[string]htmlEncoding{
 	"iso-2022-cn-ext":     replacement,
 	"iso-2022-kr":         replacement,
 	"replacement":         replacement,
+	"unicodefffe":         utf16be,
 	"utf-16be":            utf16be,
+	"csunicode":           utf16le,
+	"iso-10646-ucs-2":     utf16le,
+	"ucs-2":               utf16le,
+	"unicode":             utf16le,
+	"unicodefeff":         utf16le,
 	"utf-16":              utf16le,
 	"utf-16le":            utf16le,
 	"x-user-defined":      xUserDefined,
diff --git a/encoding/ianaindex/tables.go b/encoding/ianaindex/tables.go
index cec6a0407..921bb3b4b 100644
--- a/encoding/ianaindex/tables.go
+++ b/encoding/ianaindex/tables.go
@@ -141,6 +141,7 @@ const (
 	enc1018
 	enc1019
 	enc1020
+	enc1021
 	enc2000
 	enc2001
 	enc2002
@@ -265,7 +266,7 @@ const (
 	numIANA
 )
 
-var ianaToMIB = []identifier.MIB{ // 257 elements
+var ianaToMIB = []identifier.MIB{ // 258 elements
 	// Entry 0 - 3F
 	0x0003, 0x0004, 0x0005, 0x0006, 0x0007, 0x0008, 0x0009, 0x000a,
 	0x000b, 0x000c, 0x000d, 0x000e, 0x000f, 0x0010, 0x0011, 0x0012,
@@ -286,27 +287,27 @@ var ianaToMIB = []identifier.MIB{ // 257 elements
 	0x03ed, 0x03ee, 0x03ef, 0x03f0, 0x03f1, 0x03f2, 0x03f3, 0x03f4,
 	// Entry 80 - BF
 	0x03f5, 0x03f6, 0x03f7, 0x03f8, 0x03f9, 0x03fa, 0x03fb, 0x03fc,
-	0x07d0, 0x07d1, 0x07d2, 0x07d3, 0x07d4, 0x07d5, 0x07d6, 0x07d7,
-	0x07d8, 0x07d9, 0x07da, 0x07db, 0x07dc, 0x07dd, 0x07de, 0x07df,
-	0x07e0, 0x07e1, 0x07e2, 0x07e3, 0x07e4, 0x07e5, 0x07e6, 0x07e7,
-	0x07e8, 0x07e9, 0x07ea, 0x07eb, 0x07ec, 0x07ed, 0x07ee, 0x07ef,
-	0x07f0, 0x07f1, 0x07f2, 0x07f3, 0x07f4, 0x07f5, 0x07f6, 0x07f7,
-	0x07f8, 0x07f9, 0x07fa, 0x07fb, 0x07fc, 0x07fd, 0x07fe, 0x07ff,
-	0x0800, 0x0801, 0x0802, 0x0803, 0x0804, 0x0805, 0x0806, 0x0807,
+	0x03fd, 0x07d0, 0x07d1, 0x07d2, 0x07d3, 0x07d4, 0x07d5, 0x07d6,
+	0x07d7, 0x07d8, 0x07d9, 0x07da, 0x07db, 0x07dc, 0x07dd, 0x07de,
+	0x07df, 0x07e0, 0x07e1, 0x07e2, 0x07e3, 0x07e4, 0x07e5, 0x07e6,
+	0x07e7, 0x07e8, 0x07e9, 0x07ea, 0x07eb, 0x07ec, 0x07ed, 0x07ee,
+	0x07ef, 0x07f0, 0x07f1, 0x07f2, 0x07f3, 0x07f4, 0x07f5, 0x07f6,
+	0x07f7, 0x07f8, 0x07f9, 0x07fa, 0x07fb, 0x07fc, 0x07fd, 0x07fe,
+	0x07ff, 0x0800, 0x0801, 0x0802, 0x0803, 0x0804, 0x0805, 0x0806,
 	// Entry C0 - FF
-	0x0808, 0x0809, 0x080a, 0x080b, 0x080c, 0x080d, 0x080e, 0x080f,
-	0x0810, 0x0811, 0x0812, 0x0813, 0x0814, 0x0815, 0x0816, 0x0817,
-	0x0818, 0x0819, 0x081a, 0x081b, 0x081c, 0x081d, 0x081e, 0x081f,
-	0x0820, 0x0821, 0x0822, 0x0823, 0x0824, 0x0825, 0x0826, 0x0827,
-	0x0828, 0x0829, 0x082a, 0x082b, 0x082c, 0x082d, 0x082e, 0x082f,
-	0x0830, 0x0831, 0x0832, 0x0833, 0x0834, 0x0835, 0x0836, 0x0837,
-	0x0838, 0x0839, 0x083a, 0x083b, 0x083c, 0x083d, 0x08ca, 0x08cb,
-	0x08cc, 0x08cd, 0x08ce, 0x08cf, 0x08d0, 0x08d1, 0x08d2, 0x08d3,
+	0x0807, 0x0808, 0x0809, 0x080a, 0x080b, 0x080c, 0x080d, 0x080e,
+	0x080f, 0x0810, 0x0811, 0x0812, 0x0813, 0x0814, 0x0815, 0x0816,
+	0x0817, 0x0818, 0x0819, 0x081a, 0x081b, 0x081c, 0x081d, 0x081e,
+	0x081f, 0x0820, 0x0821, 0x0822, 0x0823, 0x0824, 0x0825, 0x0826,
+	0x0827, 0x0828, 0x0829, 0x082a, 0x082b, 0x082c, 0x082d, 0x082e,
+	0x082f, 0x0830, 0x0831, 0x0832, 0x0833, 0x0834, 0x0835, 0x0836,
+	0x0837, 0x0838, 0x0839, 0x083a, 0x083b, 0x083c, 0x083d, 0x08ca,
+	0x08cb, 0x08cc, 0x08cd, 0x08ce, 0x08cf, 0x08d0, 0x08d1, 0x08d2,
 	// Entry 100 - 13F
-	0x08d4,
-} // Size: 538 bytes
+	0x08d3, 0x08d4,
+} // Size: 540 bytes
 
-var ianaNames = []string{ // 257 elements
+var ianaNames = []string{ // 258 elements
 	"US-ASCII",
 	"\vISO-8859-1ISO_8859-1:1987",
 	"\vISO-8859-2ISO_8859-2:1987",
@@ -443,6 +444,7 @@ var ianaNames = []string{ // 257 elements
 	"UTF-32BE",
 	"UTF-32LE",
 	"BOCU-1",
+	"UTF-7-IMAP",
 	"ISO-8859-1-Windows-3.0-Latin-1",
 	"ISO-8859-1-Windows-3.1-Latin-1",
 	"ISO-8859-2-Windows-Latin-2",
@@ -564,9 +566,9 @@ var ianaNames = []string{ // 257 elements
 	"windows-1258",
 	"TIS-620",
 	"CP50220",
-} // Size: 7088 bytes
+} // Size: 7114 bytes
 
-var mibNames = []string{ // 257 elements
+var mibNames = []string{ // 258 elements
 	"ASCII",
 	"ISOLatin1",
 	"ISOLatin2",
@@ -703,6 +705,7 @@ var mibNames = []string{ // 257 elements
 	"UTF32BE",
 	"UTF32LE",
 	"BOCU-1",
+	"UTF7IMAP",
 	"Windows30Latin1",
 	"Windows31Latin1",
 	"Windows31Latin2",
@@ -824,7 +827,7 @@ var mibNames = []string{ // 257 elements
 	"windows1258",
 	"TIS620",
 	"CP50220",
-} // Size: 6776 bytes
+} // Size: 6800 bytes
 
 // TODO: Instead of using a map, we could use binary search strings doing
 // on-the fly lower-casing per character. This allows to always avoid
@@ -1692,6 +1695,10 @@ var ianaAliases = map[string]int{
 	"csbocu1":                                       enc1020,
 	"csBOCU-1":                                      enc1020,
 	"csbocu-1":                                      enc1020,
+	"UTF-7-IMAP":                                    enc1021,
+	"utf-7-imap":                                    enc1021,
+	"csUTF7IMAP":                                    enc1021,
+	"csutf7imap":                                    enc1021,
 	"ISO-8859-1-Windows-3.0-Latin-1":                enc2000,
 	"iso-8859-1-windows-3.0-latin-1":                enc2000,
 	"csWindows30Latin1":                             enc2000,
@@ -2345,4 +2352,4 @@ var ianaAliases = map[string]int{
 	"cscp50220":                                     enc2260,
 }
 
-// Total table size 14402 bytes (14KiB); checksum: CEBAA10C
+// Total table size 14454 bytes (14KiB); checksum: 9095144D
diff --git a/encoding/internal/identifier/mib.go b/encoding/internal/identifier/mib.go
index fc7df1bc7..351fb86e2 100644
--- a/encoding/internal/identifier/mib.go
+++ b/encoding/internal/identifier/mib.go
@@ -905,6 +905,14 @@ const (
 	// https://www.unicode.org/notes/tn6/
 	BOCU1 MIB = 1020
 
+	// UTF7IMAP is the MIB identifier with IANA name UTF-7-IMAP.
+	//
+	// Note: This charset is used to encode Unicode in IMAP mailbox names;
+	// see section 5.1.3 of rfc3501 . It should never be used
+	// outside this context. A name has been assigned so that charset processing
+	// implementations can refer to it in a consistent way.
+	UTF7IMAP MIB = 1021
+
 	// Windows30Latin1 is the MIB identifier with IANA name ISO-8859-1-Windows-3.0-Latin-1.
 	//
 	// Extended ISO 8859-1 Latin-1 for Windows 3.0.
diff --git a/internal/language/compact/tables.go b/internal/language/compact/tables.go
index fe7ad9ea7..32af9de59 100644
--- a/internal/language/compact/tables.go
+++ b/internal/language/compact/tables.go
@@ -966,7 +966,7 @@ var coreTags = []language.CompactCoreInfo{ // 773 elements
 	0x3fd00000, 0x3fd00072, 0x3fd000da, 0x3fd0010c,
 	0x3ff00000, 0x3ff000d1, 0x40100000, 0x401000c3,
 	0x40200000, 0x4020004c, 0x40700000, 0x40800000,
-	0x4085a000, 0x4085a0ba, 0x408e3000, 0x408e30ba,
+	0x4085a000, 0x4085a0ba, 0x408e8000, 0x408e80ba,
 	0x40c00000, 0x40c000b3, 0x41200000, 0x41200111,
 	0x41600000, 0x4160010f, 0x41c00000, 0x41d00000,
 	// Entry 280 - 29F
@@ -994,7 +994,7 @@ var coreTags = []language.CompactCoreInfo{ // 773 elements
 	0x4ae00130, 0x4b400000, 0x4b400099, 0x4b4000e8,
 	0x4bc00000, 0x4bc05000, 0x4bc05024, 0x4bc20000,
 	0x4bc20137, 0x4bc5a000, 0x4bc5a137, 0x4be00000,
-	0x4be5a000, 0x4be5a0b4, 0x4beeb000, 0x4beeb0b4,
+	0x4be5a000, 0x4be5a0b4, 0x4bef1000, 0x4bef10b4,
 	0x4c000000, 0x4c300000, 0x4c30013e, 0x4c900000,
 	// Entry 2E0 - 2FF
 	0x4c900001, 0x4cc00000, 0x4cc0012f, 0x4ce00000,
@@ -1012,4 +1012,4 @@ var coreTags = []language.CompactCoreInfo{ // 773 elements
 
 const specialTagsStr string = "ca-ES-valencia en-US-u-va-posix"
 
-// Total table size 3147 bytes (3KiB); checksum: BE816D44
+// Total table size 3147 bytes (3KiB); checksum: 6772C83C
diff --git a/internal/language/gen.go b/internal/language/gen.go
index 27c43dc96..95455ecf4 100644
--- a/internal/language/gen.go
+++ b/internal/language/gen.go
@@ -1209,12 +1209,12 @@ func (b *builder) writeLikelyData() {
 	type ( // generated types
 		likelyScriptRegion struct {
 			region uint16
-			script uint8
+			script uint16
 			flags  uint8
 		}
 		likelyLangScript struct {
 			lang   uint16
-			script uint8
+			script uint16
 			flags  uint8
 		}
 		likelyLangRegion struct {
@@ -1226,7 +1226,7 @@ func (b *builder) writeLikelyData() {
 		likelyTag struct {
 			lang   uint16
 			region uint16
-			script uint8
+			script uint16
 		}
 	)
 	var ( // generated variables
@@ -1279,7 +1279,7 @@ func (b *builder) writeLikelyData() {
 					log.Fatalf("region changed unexpectedly: %s -> %s", from, to)
 				}
 				likelyRegionGroup[id].lang = uint16(b.langIndex(to[0]))
-				likelyRegionGroup[id].script = uint8(b.script.index(to[1]))
+				likelyRegionGroup[id].script = uint16(b.script.index(to[1]))
 				likelyRegionGroup[id].region = uint16(b.region.index(to[2]))
 			} else {
 				regionToOther[r] = append(regionToOther[r], fromTo{from, to})
@@ -1293,11 +1293,11 @@ func (b *builder) writeLikelyData() {
 		list := langToOther[id]
 		if len(list) == 1 {
 			likelyLang[id].region = uint16(b.region.index(list[0].to[2]))
-			likelyLang[id].script = uint8(b.script.index(list[0].to[1]))
+			likelyLang[id].script = uint16(b.script.index(list[0].to[1]))
 		} else if len(list) > 1 {
 			likelyLang[id].flags = isList
 			likelyLang[id].region = uint16(len(likelyLangList))
-			likelyLang[id].script = uint8(len(list))
+			likelyLang[id].script = uint16(len(list))
 			for _, x := range list {
 				flags := uint8(0)
 				if len(x.from) > 1 {
@@ -1309,7 +1309,7 @@ func (b *builder) writeLikelyData() {
 				}
 				likelyLangList = append(likelyLangList, likelyScriptRegion{
 					region: uint16(b.region.index(x.to[2])),
-					script: uint8(b.script.index(x.to[1])),
+					script: uint16(b.script.index(x.to[1])),
 					flags:  flags,
 				})
 			}
@@ -1324,21 +1324,21 @@ func (b *builder) writeLikelyData() {
 		list := regionToOther[id]
 		if len(list) == 1 {
 			likelyRegion[id].lang = uint16(b.langIndex(list[0].to[0]))
-			likelyRegion[id].script = uint8(b.script.index(list[0].to[1]))
+			likelyRegion[id].script = uint16(b.script.index(list[0].to[1]))
 			if len(list[0].from) > 2 {
 				likelyRegion[id].flags = scriptInFrom
 			}
 		} else if len(list) > 1 {
 			likelyRegion[id].flags = isList
 			likelyRegion[id].lang = uint16(len(likelyRegionList))
-			likelyRegion[id].script = uint8(len(list))
+			likelyRegion[id].script = uint16(len(list))
 			for i, x := range list {
 				if len(x.from) == 2 && i != 0 || i > 0 && len(x.from) != 3 {
 					log.Fatalf("unspecified script must be first in list: %v at %d", x.from, i)
 				}
 				x := likelyLangScript{
 					lang:   uint16(b.langIndex(x.to[0])),
-					script: uint8(b.script.index(x.to[1])),
+					script: uint16(b.script.index(x.to[1])),
 				}
 				if len(list[0].from) > 2 {
 					x.flags = scriptInFrom
@@ -1453,8 +1453,8 @@ func (b *builder) writeRegionInclusionData() {
 
 type parentRel struct {
 	lang       uint16
-	script     uint8
-	maxScript  uint8
+	script     uint16
+	maxScript  uint16
 	toRegion   uint16
 	fromRegion []uint16
 }
@@ -1477,10 +1477,10 @@ func (b *builder) writeParents() {
 		if len(sub) == 2 {
 			// TODO: check that all undefined scripts are indeed Latn in these
 			// cases.
-			parent.maxScript = uint8(b.script.index("Latn"))
+			parent.maxScript = uint16(b.script.index("Latn"))
 			parent.toRegion = uint16(b.region.index(sub[1]))
 		} else {
-			parent.script = uint8(b.script.index(sub[1]))
+			parent.script = uint16(b.script.index(sub[1]))
 			parent.maxScript = parent.script
 			parent.toRegion = uint16(b.region.index(sub[2]))
 		}
diff --git a/internal/language/language_test.go b/internal/language/language_test.go
index 668034d03..07be42c84 100644
--- a/internal/language/language_test.go
+++ b/internal/language/language_test.go
@@ -14,8 +14,8 @@ import (
 func TestTagSize(t *testing.T) {
 	id := Tag{}
 	typ := reflect.TypeOf(id)
-	if typ.Size() > 24 {
-		t.Errorf("size of Tag was %d; want 24", typ.Size())
+	if typ.Size() > 32 {
+		t.Errorf("size of Tag was %d; want <= 32", typ.Size())
 	}
 }
 
diff --git a/internal/language/lookup.go b/internal/language/lookup.go
index 6294b8152..9309dc276 100644
--- a/internal/language/lookup.go
+++ b/internal/language/lookup.go
@@ -328,7 +328,7 @@ func (r Region) IsPrivateUse() bool {
 	return r.typ()&iso3166UserAssigned != 0
 }
 
-type Script uint8
+type Script uint16
 
 // getScriptID returns the script id for string s. It assumes that s
 // is of the format [A-Z][a-z]{3}.
diff --git a/internal/language/tables.go b/internal/language/tables.go
index 3552e1afc..fb6b58378 100644
--- a/internal/language/tables.go
+++ b/internal/language/tables.go
@@ -7,9 +7,9 @@ import "golang.org/x/text/internal/tag"
 // CLDRVersion is the CLDR version from which the tables in this package are derived.
 const CLDRVersion = "32"
 
-const NumLanguages = 8717
+const NumLanguages = 8752
 
-const NumScripts = 251
+const NumScripts = 258
 
 const NumRegions = 357
 
@@ -266,7 +266,7 @@ var langNoIndex = [2197]uint8{
 	0xad, 0x03, 0xff, 0xff, 0xcf, 0x05, 0x84, 0x62,
 	0xe9, 0xbf, 0xfd, 0xbf, 0xbf, 0xf7, 0xfd, 0x77,
 	0x0f, 0xff, 0xef, 0x6f, 0xff, 0xfb, 0xdf, 0xe2,
-	0xc9, 0xf8, 0x7f, 0x7e, 0x4d, 0xb8, 0x0a, 0x6a,
+	0xc9, 0xf8, 0x7f, 0x7e, 0x4d, 0xbc, 0x0a, 0x6a,
 	0x7c, 0xea, 0xe3, 0xfa, 0x7a, 0xbf, 0x67, 0xff,
 	// Entry 40 - 7F
 	0xff, 0xff, 0xff, 0xdf, 0x2a, 0x54, 0x91, 0xc0,
@@ -278,7 +278,7 @@ var langNoIndex = [2197]uint8{
 	0xa8, 0xff, 0x1f, 0x67, 0x7d, 0xeb, 0xef, 0xce,
 	0xff, 0xff, 0x9f, 0xff, 0xb7, 0xef, 0xfe, 0xcf,
 	// Entry 80 - BF
-	0xdb, 0xff, 0xf3, 0xcd, 0xfb, 0x2f, 0xff, 0xff,
+	0xdb, 0xff, 0xf3, 0xcd, 0xfb, 0x6f, 0xff, 0xff,
 	0xbb, 0xee, 0xf7, 0xbd, 0xdb, 0xff, 0x5f, 0xf7,
 	0xfd, 0xf2, 0xfd, 0xff, 0x5e, 0x2f, 0x3b, 0xba,
 	0x7e, 0xff, 0xff, 0xfe, 0xf7, 0xff, 0xdd, 0xff,
@@ -291,15 +291,15 @@ var langNoIndex = [2197]uint8{
 	0x1b, 0x14, 0x08, 0xf3, 0x2b, 0xe7, 0x17, 0x56,
 	0x05, 0x7d, 0x0e, 0x1c, 0x37, 0x7b, 0xf3, 0xef,
 	0x97, 0xff, 0x5d, 0x38, 0x64, 0x08, 0x00, 0x10,
-	0xbc, 0x85, 0xaf, 0xdf, 0xff, 0xff, 0x73, 0x35,
-	0x3e, 0x87, 0xc7, 0xdf, 0xff, 0x01, 0x81, 0x00,
+	0xbc, 0x85, 0xaf, 0xdf, 0xff, 0xff, 0x7b, 0x35,
+	0x3e, 0xc7, 0xc7, 0xdf, 0xff, 0x01, 0x81, 0x00,
 	0xb0, 0x05, 0x80, 0x00, 0x00, 0x00, 0x00, 0x03,
 	0x40, 0x00, 0x40, 0x92, 0x21, 0x50, 0xb1, 0x5d,
 	// Entry 100 - 13F
 	0xfd, 0xdc, 0xbe, 0x5e, 0x00, 0x00, 0x02, 0x64,
 	0x0d, 0x19, 0x41, 0xdf, 0x79, 0x22, 0x00, 0x00,
 	0x00, 0x5e, 0x64, 0xdc, 0x24, 0xe5, 0xd9, 0xe3,
-	0xfe, 0xff, 0xfd, 0xcb, 0x9f, 0x14, 0x01, 0x0c,
+	0xfe, 0xff, 0xfd, 0xcb, 0x9f, 0x14, 0x41, 0x0c,
 	0x86, 0x00, 0xd1, 0x00, 0xf0, 0xc7, 0x67, 0x5f,
 	0x56, 0x99, 0x5e, 0xb5, 0x6c, 0xaf, 0x03, 0x00,
 	0x02, 0x00, 0x00, 0x00, 0xc0, 0x37, 0xda, 0x56,
@@ -310,9 +310,9 @@ var langNoIndex = [2197]uint8{
 	0x0a, 0x00, 0x01, 0x00, 0x00, 0x10, 0x11, 0x09,
 	0x00, 0x00, 0x60, 0x10, 0x00, 0x00, 0x00, 0x10,
 	0x00, 0x00, 0x44, 0x00, 0x00, 0x10, 0x00, 0x04,
-	0x08, 0x00, 0x00, 0x04, 0x00, 0x80, 0x28, 0x04,
+	0x08, 0x00, 0x00, 0x05, 0x00, 0x80, 0x28, 0x04,
 	0x00, 0x00, 0x40, 0xd5, 0x2d, 0x00, 0x64, 0x35,
-	0x24, 0x52, 0xf4, 0xd4, 0xbd, 0x62, 0xc9, 0x03,
+	0x24, 0x52, 0xf4, 0xd5, 0xbf, 0x62, 0xc9, 0x03,
 	// Entry 180 - 1BF
 	0x00, 0x80, 0x00, 0x40, 0x00, 0x00, 0x00, 0x00,
 	0x00, 0x04, 0x13, 0x39, 0x01, 0xdd, 0x57, 0x98,
@@ -334,20 +334,20 @@ var langNoIndex = [2197]uint8{
 	// Entry 200 - 23F
 	0xdf, 0xc3, 0x83, 0x82, 0xc0, 0xfb, 0x57, 0x27,
 	0xed, 0x55, 0xe7, 0x01, 0x00, 0x20, 0xb2, 0xc5,
-	0xa4, 0x45, 0x25, 0x9b, 0x02, 0xdf, 0xe0, 0xdf,
-	0x03, 0x44, 0x08, 0x90, 0x01, 0x04, 0x01, 0xe3,
+	0xa4, 0x45, 0x25, 0x9b, 0x02, 0xdf, 0xe1, 0xdf,
+	0x03, 0x44, 0x08, 0x90, 0x01, 0x04, 0x81, 0xe3,
 	0x92, 0x54, 0xdb, 0x28, 0xd3, 0x5f, 0xfe, 0x6d,
 	0x79, 0xed, 0x1c, 0x7d, 0x04, 0x08, 0x00, 0x01,
 	0x21, 0x12, 0x64, 0x5f, 0xdd, 0x0e, 0x85, 0x4f,
 	0x40, 0x40, 0x00, 0x04, 0xf1, 0xfd, 0x3d, 0x54,
 	// Entry 240 - 27F
 	0xe8, 0x03, 0xb4, 0x27, 0x23, 0x0d, 0x00, 0x00,
-	0x20, 0x7b, 0x78, 0x02, 0x05, 0x84, 0x00, 0xf0,
+	0x20, 0x7b, 0x78, 0x02, 0x07, 0x84, 0x00, 0xf0,
 	0xbb, 0x7e, 0x5a, 0x00, 0x18, 0x04, 0x81, 0x00,
 	0x00, 0x00, 0x80, 0x10, 0x90, 0x1c, 0x01, 0x00,
 	0x00, 0x00, 0x00, 0x00, 0x10, 0x40, 0x00, 0x04,
 	0x08, 0xa0, 0x70, 0xa5, 0x0c, 0x40, 0x00, 0x00,
-	0x11, 0x24, 0x04, 0x68, 0x00, 0x20, 0x70, 0xff,
+	0x91, 0x24, 0x04, 0x68, 0x00, 0x20, 0x70, 0xff,
 	0x7b, 0x7f, 0x70, 0x00, 0x05, 0x9b, 0xdd, 0x66,
 	// Entry 280 - 2BF
 	0x03, 0x00, 0x11, 0x00, 0x00, 0x00, 0x40, 0x05,
@@ -366,12 +366,12 @@ var langNoIndex = [2197]uint8{
 	0xa7, 0x81, 0x47, 0x97, 0xfb, 0x00, 0x10, 0x00,
 	0x08, 0x00, 0x80, 0x00, 0x40, 0x04, 0x00, 0x01,
 	0x02, 0x00, 0x01, 0x40, 0x80, 0x00, 0x00, 0x08,
-	0xd8, 0xeb, 0xf6, 0x39, 0xc4, 0x89, 0x12, 0x00,
+	0xd8, 0xeb, 0xf6, 0x39, 0xc4, 0x8d, 0x12, 0x00,
 	// Entry 300 - 33F
 	0x00, 0x0c, 0x04, 0x01, 0x20, 0x20, 0xdd, 0xa0,
 	0x01, 0x00, 0x00, 0x00, 0x12, 0x00, 0x00, 0x00,
 	0x04, 0x10, 0xd0, 0x9d, 0x95, 0x13, 0x04, 0x80,
-	0x00, 0x01, 0xd0, 0x12, 0x40, 0x00, 0x10, 0xb0,
+	0x00, 0x01, 0xd0, 0x16, 0x40, 0x00, 0x10, 0xb0,
 	0x10, 0x62, 0x4c, 0xd2, 0x02, 0x01, 0x4a, 0x00,
 	0x46, 0x04, 0x00, 0x08, 0x02, 0x00, 0x20, 0x80,
 	0x00, 0x80, 0x06, 0x00, 0x08, 0x00, 0x00, 0x00,
@@ -398,9 +398,9 @@ var langNoIndex = [2197]uint8{
 	0x02, 0x30, 0x9f, 0x7a, 0x16, 0xbd, 0x7f, 0x57,
 	0xf2, 0xff, 0x31, 0xff, 0xf2, 0x1e, 0x90, 0xf7,
 	0xf1, 0xf9, 0x45, 0x80, 0x01, 0x02, 0x00, 0x00,
-	0x40, 0x54, 0x9f, 0x8a, 0xd9, 0xf9, 0x2e, 0x11,
+	0x40, 0x54, 0x9f, 0x8a, 0xdb, 0xf9, 0x2e, 0x11,
 	0x86, 0x51, 0xc0, 0xf3, 0xfb, 0x47, 0x40, 0x01,
-	0x05, 0xd1, 0x50, 0x5c, 0x00, 0x00, 0x00, 0x10,
+	0x05, 0xd1, 0x50, 0x5c, 0x00, 0x40, 0x00, 0x10,
 	0x04, 0x02, 0x00, 0x00, 0x0a, 0x00, 0x17, 0xd2,
 	0xb9, 0xfd, 0xfc, 0xba, 0xfe, 0xef, 0xc7, 0xbe,
 	// Entry 400 - 43F
@@ -422,19 +422,19 @@ var langNoIndex = [2197]uint8{
 	0xcd, 0xff, 0xfb, 0xff, 0xdf, 0xd7, 0xea, 0xff,
 	0xe5, 0x5f, 0x6d, 0x0f, 0xa7, 0x51, 0x06, 0xc4,
 	// Entry 480 - 4BF
-	0x13, 0x50, 0x5d, 0xaf, 0xa6, 0xff, 0x99, 0xfb,
+	0x93, 0x50, 0x5d, 0xaf, 0xa6, 0xff, 0x99, 0xfb,
 	0x63, 0x1d, 0x53, 0xff, 0xef, 0xb7, 0x35, 0x20,
 	0x14, 0x00, 0x55, 0x51, 0x82, 0x65, 0xf5, 0x41,
 	0xe2, 0xff, 0xfc, 0xdf, 0x02, 0x05, 0xc5, 0x05,
-	0x00, 0x22, 0x00, 0x74, 0x69, 0x10, 0x08, 0x04,
+	0x00, 0x22, 0x00, 0x74, 0x69, 0x10, 0x08, 0x05,
 	0x41, 0x00, 0x01, 0x06, 0x00, 0x00, 0x00, 0x00,
 	0x00, 0x51, 0x20, 0x05, 0x04, 0x01, 0x00, 0x00,
-	0x06, 0x01, 0x20, 0x00, 0x18, 0x01, 0x92, 0xb1,
+	0x06, 0x01, 0x20, 0x00, 0x18, 0x01, 0x92, 0xf1,
 	// Entry 4C0 - 4FF
-	0xfd, 0x47, 0x49, 0x06, 0x95, 0x06, 0x57, 0xed,
-	0xfb, 0x4c, 0x1c, 0x6b, 0x83, 0x04, 0x62, 0x40,
+	0xfd, 0x47, 0x69, 0x06, 0x95, 0x06, 0x57, 0xed,
+	0xfb, 0x4d, 0x1c, 0x6b, 0x83, 0x04, 0x62, 0x40,
 	0x00, 0x11, 0x42, 0x00, 0x00, 0x00, 0x54, 0x83,
-	0xb8, 0x4f, 0x10, 0x8c, 0x89, 0x46, 0xde, 0xf7,
+	0xb8, 0x4f, 0x10, 0x8e, 0x89, 0x46, 0xde, 0xf7,
 	0x13, 0x31, 0x00, 0x20, 0x00, 0x00, 0x00, 0x90,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x0a, 0x10, 0x00,
 	0x01, 0x00, 0x00, 0xf0, 0x5b, 0xf4, 0xbe, 0x3d,
@@ -471,7 +471,7 @@ var langNoIndex = [2197]uint8{
 	0xaa, 0x10, 0x5d, 0x98, 0x52, 0x00, 0x80, 0x20,
 	0x00, 0x00, 0x00, 0x00, 0x40, 0x00, 0x02, 0x02,
 	0x19, 0x00, 0x10, 0x02, 0x10, 0x61, 0x5a, 0x9d,
-	0x31, 0x00, 0x00, 0x00, 0x01, 0x10, 0x02, 0x20,
+	0x31, 0x00, 0x00, 0x00, 0x01, 0x18, 0x02, 0x20,
 	0x00, 0x00, 0x01, 0x00, 0x42, 0x00, 0x20, 0x00,
 	0x00, 0x1f, 0xdf, 0xd2, 0xb9, 0xff, 0xfd, 0x3f,
 	0x1f, 0x98, 0xcf, 0x9c, 0xff, 0xaf, 0x5f, 0xfe,
@@ -480,9 +480,9 @@ var langNoIndex = [2197]uint8{
 	0xb7, 0xf6, 0xfb, 0xb3, 0xc7, 0xff, 0x6f, 0xf1,
 	0x73, 0xb1, 0x7f, 0x9f, 0x7f, 0xbd, 0xfc, 0xb7,
 	0xee, 0x1c, 0xfa, 0xcb, 0xef, 0xdd, 0xf9, 0xbd,
-	0x6e, 0xae, 0x55, 0xfd, 0x6e, 0x81, 0x76, 0x1f,
+	0x6e, 0xae, 0x55, 0xfd, 0x6e, 0x81, 0x76, 0x9f,
 	0xd4, 0x77, 0xf5, 0x7d, 0xfb, 0xff, 0xeb, 0xfe,
-	0xbe, 0x5f, 0x46, 0x1b, 0xe9, 0x5f, 0x50, 0x18,
+	0xbe, 0x5f, 0x46, 0x5b, 0xe9, 0x5f, 0x50, 0x18,
 	0x02, 0xfa, 0xf7, 0x9d, 0x15, 0x97, 0x05, 0x0f,
 	// Entry 640 - 67F
 	0x75, 0xc4, 0x7d, 0x81, 0x92, 0xf5, 0x57, 0x6c,
@@ -496,14 +496,14 @@ var langNoIndex = [2197]uint8{
 	// Entry 680 - 6BF
 	0x97, 0x9d, 0xbf, 0x9f, 0xf7, 0xc7, 0xfd, 0x37,
 	0xce, 0x7f, 0x04, 0x1d, 0x73, 0x7f, 0xf8, 0xda,
-	0x5d, 0xce, 0x7d, 0x06, 0xb9, 0xea, 0x69, 0xa0,
+	0x5d, 0xce, 0x7d, 0x06, 0xb9, 0xea, 0x79, 0xa0,
 	0x1a, 0x20, 0x00, 0x30, 0x02, 0x04, 0x24, 0x08,
 	0x04, 0x00, 0x00, 0x40, 0xd4, 0x02, 0x04, 0x00,
 	0x00, 0x04, 0x00, 0x04, 0x00, 0x20, 0x01, 0x06,
 	0x50, 0x00, 0x08, 0x00, 0x00, 0x00, 0x24, 0x00,
 	0x04, 0x00, 0x10, 0xdc, 0x58, 0xd7, 0x0d, 0x0f,
 	// Entry 6C0 - 6FF
-	0x14, 0x4d, 0xf1, 0x16, 0x44, 0xd1, 0x42, 0x08,
+	0x14, 0x4d, 0xf1, 0x16, 0x44, 0xd5, 0x42, 0x08,
 	0x40, 0x00, 0x00, 0x40, 0x00, 0x08, 0x00, 0x00,
 	0x00, 0xdc, 0xfb, 0xcb, 0x0e, 0x58, 0x48, 0x41,
 	0x24, 0x20, 0x04, 0x00, 0x30, 0x12, 0x40, 0x00,
@@ -514,7 +514,7 @@ var langNoIndex = [2197]uint8{
 	// Entry 700 - 73F
 	0x00, 0x00, 0x00, 0x00, 0x0a, 0x00, 0x00, 0x00,
 	0x80, 0x86, 0xc2, 0x00, 0x00, 0x00, 0x00, 0x01,
-	0xdf, 0x18, 0x00, 0x00, 0x02, 0xf0, 0xfd, 0x79,
+	0xff, 0x18, 0x02, 0x00, 0x02, 0xf0, 0xfd, 0x79,
 	0x3b, 0x00, 0x25, 0x00, 0x00, 0x00, 0x02, 0x00,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x40, 0x00, 0x00,
 	0x03, 0x00, 0x09, 0x20, 0x00, 0x00, 0x01, 0x00,
@@ -526,7 +526,7 @@ var langNoIndex = [2197]uint8{
 	0xcd, 0xf9, 0x5c, 0x00, 0x01, 0x00, 0x30, 0x04,
 	0x04, 0x55, 0x00, 0x01, 0x04, 0xf4, 0x3f, 0x4a,
 	0x01, 0x00, 0x00, 0xb0, 0x80, 0x20, 0x55, 0x75,
-	0x97, 0x7c, 0x9f, 0x31, 0xcc, 0x68, 0xd1, 0x03,
+	0x97, 0x7c, 0xdf, 0x31, 0xcc, 0x68, 0xd1, 0x03,
 	0xd5, 0x57, 0x27, 0x14, 0x01, 0x00, 0x00, 0x00,
 	0x00, 0x00, 0x2c, 0xf7, 0xcb, 0x1f, 0x14, 0x60,
 	// Entry 780 - 7BF
@@ -539,7 +539,7 @@ var langNoIndex = [2197]uint8{
 	0xe8, 0x30, 0x90, 0x6a, 0x92, 0x00, 0x00, 0x02,
 	0xff, 0xef, 0xff, 0x4b, 0x85, 0x53, 0xf4, 0xed,
 	// Entry 7C0 - 7FF
-	0xdd, 0xbf, 0x72, 0x1d, 0xc7, 0x0c, 0xd5, 0x42,
+	0xdd, 0xbf, 0xf2, 0x5d, 0xc7, 0x0c, 0xd5, 0x42,
 	0xfc, 0xff, 0xf7, 0x1f, 0x00, 0x80, 0x40, 0x56,
 	0xcc, 0x16, 0x9e, 0xea, 0x35, 0x7d, 0xef, 0xff,
 	0xbd, 0xa4, 0xaf, 0x01, 0x44, 0x18, 0x01, 0x4d,
@@ -553,15 +553,15 @@ var langNoIndex = [2197]uint8{
 	0x40, 0x9c, 0x44, 0xdf, 0xf5, 0x8f, 0x66, 0xb3,
 	0x55, 0x20, 0xd4, 0xc1, 0xd8, 0x30, 0x3d, 0x80,
 	0x00, 0x00, 0x00, 0x04, 0xd4, 0x11, 0xc5, 0x84,
-	0x2e, 0x50, 0x00, 0x22, 0x50, 0x6e, 0xbd, 0x93,
+	0x2f, 0x50, 0x00, 0x22, 0x50, 0x6e, 0xbd, 0x93,
 	0x07, 0x00, 0x20, 0x10, 0x84, 0xb2, 0x45, 0x10,
 	0x06, 0x44, 0x00, 0x00, 0x12, 0x02, 0x11, 0x00,
 	// Entry 840 - 87F
-	0xf0, 0xfb, 0xfd, 0x7f, 0x05, 0x00, 0x12, 0x81,
+	0xf0, 0xfb, 0xfd, 0x7f, 0x05, 0x00, 0x16, 0x81,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x0c, 0x02,
 	0x00, 0x00, 0x00, 0x00, 0x03, 0x30, 0x02, 0x28,
 	0x84, 0x00, 0x21, 0xc0, 0x23, 0x24, 0x00, 0x00,
-	0x00, 0xcb, 0xe4, 0x3a, 0x42, 0x88, 0x14, 0xf1,
+	0x00, 0xcb, 0xe4, 0x3a, 0x46, 0x88, 0x14, 0xf1,
 	0xef, 0xff, 0x7f, 0x12, 0x01, 0x01, 0x84, 0x50,
 	0x07, 0xfc, 0xff, 0xff, 0x0f, 0x01, 0x00, 0x40,
 	0x10, 0x38, 0x01, 0x01, 0x1c, 0x12, 0x40, 0xe1,
@@ -583,8 +583,8 @@ var altLangIndex = [6]uint16{
 }
 
 // AliasMap maps langIDs to their suggested replacements.
-// Size: 704 bytes, 176 elements
-var AliasMap = [176]FromTo{
+// Size: 716 bytes, 179 elements
+var AliasMap = [179]FromTo{
 	0:   {From: 0x82, To: 0x88},
 	1:   {From: 0x187, To: 0x1ae},
 	2:   {From: 0x1f3, To: 0x1e1},
@@ -613,172 +613,176 @@ var AliasMap = [176]FromTo{
 	25:  {From: 0x80c, To: 0x5a},
 	26:  {From: 0x815, To: 0x8d},
 	27:  {From: 0x87e, To: 0x810},
-	28:  {From: 0x8c3, To: 0xee3},
-	29:  {From: 0x9ef, To: 0x331},
-	30:  {From: 0xa36, To: 0x2c5},
-	31:  {From: 0xa3d, To: 0xbf},
-	32:  {From: 0xabe, To: 0x3322},
-	33:  {From: 0xb38, To: 0x529},
-	34:  {From: 0xb75, To: 0x265a},
-	35:  {From: 0xb7e, To: 0xbc3},
-	36:  {From: 0xb9b, To: 0x44e},
-	37:  {From: 0xbbc, To: 0x4229},
-	38:  {From: 0xbbf, To: 0x529},
-	39:  {From: 0xbfe, To: 0x2da7},
-	40:  {From: 0xc2e, To: 0x3181},
-	41:  {From: 0xcb9, To: 0xf3},
-	42:  {From: 0xd08, To: 0xfa},
-	43:  {From: 0xdc8, To: 0x11a},
-	44:  {From: 0xdd7, To: 0x32d},
-	45:  {From: 0xdf8, To: 0xdfb},
-	46:  {From: 0xdfe, To: 0x531},
-	47:  {From: 0xe01, To: 0xdf3},
-	48:  {From: 0xedf, To: 0x205a},
-	49:  {From: 0xee9, To: 0x222e},
-	50:  {From: 0xeee, To: 0x2e9a},
-	51:  {From: 0xf39, To: 0x367},
-	52:  {From: 0x10d0, To: 0x140},
-	53:  {From: 0x1104, To: 0x2d0},
-	54:  {From: 0x11a0, To: 0x1ec},
-	55:  {From: 0x1279, To: 0x21},
-	56:  {From: 0x1424, To: 0x15e},
-	57:  {From: 0x1470, To: 0x14e},
-	58:  {From: 0x151f, To: 0xd9b},
-	59:  {From: 0x1523, To: 0x390},
-	60:  {From: 0x1532, To: 0x19f},
-	61:  {From: 0x1580, To: 0x210},
-	62:  {From: 0x1583, To: 0x10d},
-	63:  {From: 0x15a3, To: 0x3caf},
-	64:  {From: 0x1630, To: 0x222e},
-	65:  {From: 0x166a, To: 0x19b},
-	66:  {From: 0x16c8, To: 0x136},
-	67:  {From: 0x1700, To: 0x29f8},
-	68:  {From: 0x1718, To: 0x194},
-	69:  {From: 0x1727, To: 0xf3f},
-	70:  {From: 0x177a, To: 0x178},
-	71:  {From: 0x1809, To: 0x17b6},
-	72:  {From: 0x1816, To: 0x18f3},
-	73:  {From: 0x188a, To: 0x436},
-	74:  {From: 0x1979, To: 0x1d01},
-	75:  {From: 0x1a74, To: 0x2bb0},
-	76:  {From: 0x1a8a, To: 0x1f8},
-	77:  {From: 0x1b5a, To: 0x1fa},
-	78:  {From: 0x1b86, To: 0x1515},
-	79:  {From: 0x1d64, To: 0x2c9b},
-	80:  {From: 0x2038, To: 0x37b1},
-	81:  {From: 0x203d, To: 0x20dd},
-	82:  {From: 0x205a, To: 0x30b},
-	83:  {From: 0x20e3, To: 0x274},
-	84:  {From: 0x20ee, To: 0x263},
-	85:  {From: 0x20f2, To: 0x22d},
-	86:  {From: 0x20f9, To: 0x256},
-	87:  {From: 0x210f, To: 0x21eb},
-	88:  {From: 0x2135, To: 0x27d},
-	89:  {From: 0x2160, To: 0x913},
-	90:  {From: 0x2199, To: 0x121},
-	91:  {From: 0x21ce, To: 0x1561},
-	92:  {From: 0x21e6, To: 0x504},
-	93:  {From: 0x21f4, To: 0x49f},
-	94:  {From: 0x21fb, To: 0x269},
-	95:  {From: 0x222d, To: 0x121},
-	96:  {From: 0x2237, To: 0x121},
-	97:  {From: 0x2262, To: 0x92a},
-	98:  {From: 0x2316, To: 0x3226},
-	99:  {From: 0x236a, To: 0x2835},
-	100: {From: 0x2382, To: 0x3365},
-	101: {From: 0x2472, To: 0x2c7},
-	102: {From: 0x24e4, To: 0x2ff},
-	103: {From: 0x24f0, To: 0x2fa},
-	104: {From: 0x24fa, To: 0x31f},
-	105: {From: 0x2550, To: 0xb5b},
-	106: {From: 0x25a9, To: 0xe2},
-	107: {From: 0x263e, To: 0x2d0},
-	108: {From: 0x26c9, To: 0x26b4},
-	109: {From: 0x26f9, To: 0x3c8},
-	110: {From: 0x2727, To: 0x3caf},
-	111: {From: 0x2755, To: 0x6a4},
-	112: {From: 0x2765, To: 0x26b4},
-	113: {From: 0x2789, To: 0x4358},
-	114: {From: 0x27c9, To: 0x2001},
-	115: {From: 0x28ea, To: 0x27b1},
-	116: {From: 0x28ef, To: 0x2837},
-	117: {From: 0x2914, To: 0x351},
-	118: {From: 0x2986, To: 0x2da7},
-	119: {From: 0x29f0, To: 0x96b},
-	120: {From: 0x2b1a, To: 0x38d},
-	121: {From: 0x2bfc, To: 0x395},
-	122: {From: 0x2c3f, To: 0x3caf},
-	123: {From: 0x2cfc, To: 0x3be},
-	124: {From: 0x2d13, To: 0x597},
-	125: {From: 0x2d47, To: 0x148},
-	126: {From: 0x2d48, To: 0x148},
-	127: {From: 0x2dff, To: 0x2f1},
-	128: {From: 0x2e08, To: 0x19cc},
-	129: {From: 0x2e1a, To: 0x2d95},
-	130: {From: 0x2e21, To: 0x292},
-	131: {From: 0x2e54, To: 0x7d},
-	132: {From: 0x2e65, To: 0x2282},
-	133: {From: 0x2ea0, To: 0x2e9b},
-	134: {From: 0x2eef, To: 0x2ed7},
-	135: {From: 0x3193, To: 0x3c4},
-	136: {From: 0x3366, To: 0x338e},
-	137: {From: 0x342a, To: 0x3dc},
-	138: {From: 0x34ee, To: 0x18d0},
-	139: {From: 0x35c8, To: 0x2c9b},
-	140: {From: 0x35e6, To: 0x412},
-	141: {From: 0x3658, To: 0x246},
-	142: {From: 0x3676, To: 0x3f4},
-	143: {From: 0x36fd, To: 0x445},
-	144: {From: 0x37c0, To: 0x121},
-	145: {From: 0x3816, To: 0x38f2},
-	146: {From: 0x382a, To: 0x2b48},
-	147: {From: 0x382b, To: 0x2c9b},
-	148: {From: 0x382f, To: 0xa9},
-	149: {From: 0x3832, To: 0x3228},
-	150: {From: 0x386c, To: 0x39a6},
-	151: {From: 0x3892, To: 0x3fc0},
-	152: {From: 0x38a5, To: 0x39d7},
-	153: {From: 0x38b4, To: 0x1fa4},
-	154: {From: 0x38b5, To: 0x2e9a},
-	155: {From: 0x395c, To: 0x47e},
-	156: {From: 0x3b4e, To: 0xd91},
-	157: {From: 0x3b78, To: 0x137},
-	158: {From: 0x3c99, To: 0x4bc},
-	159: {From: 0x3fbd, To: 0x100},
-	160: {From: 0x4208, To: 0xa91},
-	161: {From: 0x42be, To: 0x573},
-	162: {From: 0x42f9, To: 0x3f60},
-	163: {From: 0x4378, To: 0x25a},
-	164: {From: 0x43b8, To: 0xe6c},
-	165: {From: 0x43cd, To: 0x10f},
-	166: {From: 0x44af, To: 0x3322},
-	167: {From: 0x44e3, To: 0x512},
-	168: {From: 0x45ca, To: 0x2409},
-	169: {From: 0x45dd, To: 0x26dc},
-	170: {From: 0x4610, To: 0x48ae},
-	171: {From: 0x46ae, To: 0x46a0},
-	172: {From: 0x473e, To: 0x4745},
-	173: {From: 0x4817, To: 0x3503},
-	174: {From: 0x4916, To: 0x31f},
-	175: {From: 0x49a7, To: 0x523},
+	28:  {From: 0x8a8, To: 0x8b7},
+	29:  {From: 0x8c3, To: 0xee3},
+	30:  {From: 0x8fa, To: 0x1dc},
+	31:  {From: 0x9ef, To: 0x331},
+	32:  {From: 0xa36, To: 0x2c5},
+	33:  {From: 0xa3d, To: 0xbf},
+	34:  {From: 0xabe, To: 0x3322},
+	35:  {From: 0xb38, To: 0x529},
+	36:  {From: 0xb75, To: 0x265a},
+	37:  {From: 0xb7e, To: 0xbc3},
+	38:  {From: 0xb9b, To: 0x44e},
+	39:  {From: 0xbbc, To: 0x4229},
+	40:  {From: 0xbbf, To: 0x529},
+	41:  {From: 0xbfe, To: 0x2da7},
+	42:  {From: 0xc2e, To: 0x3181},
+	43:  {From: 0xcb9, To: 0xf3},
+	44:  {From: 0xd08, To: 0xfa},
+	45:  {From: 0xdc8, To: 0x11a},
+	46:  {From: 0xdd7, To: 0x32d},
+	47:  {From: 0xdf8, To: 0xdfb},
+	48:  {From: 0xdfe, To: 0x531},
+	49:  {From: 0xe01, To: 0xdf3},
+	50:  {From: 0xedf, To: 0x205a},
+	51:  {From: 0xee9, To: 0x222e},
+	52:  {From: 0xeee, To: 0x2e9a},
+	53:  {From: 0xf39, To: 0x367},
+	54:  {From: 0x10d0, To: 0x140},
+	55:  {From: 0x1104, To: 0x2d0},
+	56:  {From: 0x11a0, To: 0x1ec},
+	57:  {From: 0x1279, To: 0x21},
+	58:  {From: 0x1424, To: 0x15e},
+	59:  {From: 0x1470, To: 0x14e},
+	60:  {From: 0x151f, To: 0xd9b},
+	61:  {From: 0x1523, To: 0x390},
+	62:  {From: 0x1532, To: 0x19f},
+	63:  {From: 0x1580, To: 0x210},
+	64:  {From: 0x1583, To: 0x10d},
+	65:  {From: 0x15a3, To: 0x3caf},
+	66:  {From: 0x1630, To: 0x222e},
+	67:  {From: 0x166a, To: 0x19b},
+	68:  {From: 0x16c8, To: 0x136},
+	69:  {From: 0x1700, To: 0x29f8},
+	70:  {From: 0x1718, To: 0x194},
+	71:  {From: 0x1727, To: 0xf3f},
+	72:  {From: 0x177a, To: 0x178},
+	73:  {From: 0x1809, To: 0x17b6},
+	74:  {From: 0x1816, To: 0x18f3},
+	75:  {From: 0x188a, To: 0x436},
+	76:  {From: 0x1979, To: 0x1d01},
+	77:  {From: 0x1a74, To: 0x2bb0},
+	78:  {From: 0x1a8a, To: 0x1f8},
+	79:  {From: 0x1b5a, To: 0x1fa},
+	80:  {From: 0x1b86, To: 0x1515},
+	81:  {From: 0x1d64, To: 0x2c9b},
+	82:  {From: 0x2038, To: 0x37b1},
+	83:  {From: 0x203d, To: 0x20dd},
+	84:  {From: 0x205a, To: 0x30b},
+	85:  {From: 0x20e3, To: 0x274},
+	86:  {From: 0x20ee, To: 0x263},
+	87:  {From: 0x20f2, To: 0x22d},
+	88:  {From: 0x20f9, To: 0x256},
+	89:  {From: 0x210f, To: 0x21eb},
+	90:  {From: 0x2135, To: 0x27d},
+	91:  {From: 0x2160, To: 0x913},
+	92:  {From: 0x2199, To: 0x121},
+	93:  {From: 0x21ce, To: 0x1561},
+	94:  {From: 0x21e6, To: 0x504},
+	95:  {From: 0x21f4, To: 0x49f},
+	96:  {From: 0x21fb, To: 0x269},
+	97:  {From: 0x222d, To: 0x121},
+	98:  {From: 0x2237, To: 0x121},
+	99:  {From: 0x2262, To: 0x92a},
+	100: {From: 0x2316, To: 0x3226},
+	101: {From: 0x236a, To: 0x2835},
+	102: {From: 0x2382, To: 0x3365},
+	103: {From: 0x2472, To: 0x2c7},
+	104: {From: 0x24e4, To: 0x2ff},
+	105: {From: 0x24f0, To: 0x2fa},
+	106: {From: 0x24fa, To: 0x31f},
+	107: {From: 0x2550, To: 0xb5b},
+	108: {From: 0x25a9, To: 0xe2},
+	109: {From: 0x263e, To: 0x2d0},
+	110: {From: 0x26c9, To: 0x26b4},
+	111: {From: 0x26f9, To: 0x3c8},
+	112: {From: 0x2727, To: 0x3caf},
+	113: {From: 0x2755, To: 0x6a4},
+	114: {From: 0x2765, To: 0x26b4},
+	115: {From: 0x2789, To: 0x4358},
+	116: {From: 0x27c9, To: 0x2001},
+	117: {From: 0x28ea, To: 0x27b1},
+	118: {From: 0x28ef, To: 0x2837},
+	119: {From: 0x2914, To: 0x351},
+	120: {From: 0x2986, To: 0x2da7},
+	121: {From: 0x29f0, To: 0x96b},
+	122: {From: 0x2b1a, To: 0x38d},
+	123: {From: 0x2bfc, To: 0x395},
+	124: {From: 0x2c3f, To: 0x3caf},
+	125: {From: 0x2ce1, To: 0x2201},
+	126: {From: 0x2cfc, To: 0x3be},
+	127: {From: 0x2d13, To: 0x597},
+	128: {From: 0x2d47, To: 0x148},
+	129: {From: 0x2d48, To: 0x148},
+	130: {From: 0x2dff, To: 0x2f1},
+	131: {From: 0x2e08, To: 0x19cc},
+	132: {From: 0x2e1a, To: 0x2d95},
+	133: {From: 0x2e21, To: 0x292},
+	134: {From: 0x2e54, To: 0x7d},
+	135: {From: 0x2e65, To: 0x2282},
+	136: {From: 0x2ea0, To: 0x2e9b},
+	137: {From: 0x2eef, To: 0x2ed7},
+	138: {From: 0x3193, To: 0x3c4},
+	139: {From: 0x3366, To: 0x338e},
+	140: {From: 0x342a, To: 0x3dc},
+	141: {From: 0x34ee, To: 0x18d0},
+	142: {From: 0x35c8, To: 0x2c9b},
+	143: {From: 0x35e6, To: 0x412},
+	144: {From: 0x3658, To: 0x246},
+	145: {From: 0x3676, To: 0x3f4},
+	146: {From: 0x36fd, To: 0x445},
+	147: {From: 0x37c0, To: 0x121},
+	148: {From: 0x3816, To: 0x38f2},
+	149: {From: 0x382a, To: 0x2b48},
+	150: {From: 0x382b, To: 0x2c9b},
+	151: {From: 0x382f, To: 0xa9},
+	152: {From: 0x3832, To: 0x3228},
+	153: {From: 0x386c, To: 0x39a6},
+	154: {From: 0x3892, To: 0x3fc0},
+	155: {From: 0x38a5, To: 0x39d7},
+	156: {From: 0x38b4, To: 0x1fa4},
+	157: {From: 0x38b5, To: 0x2e9a},
+	158: {From: 0x395c, To: 0x47e},
+	159: {From: 0x3b4e, To: 0xd91},
+	160: {From: 0x3b78, To: 0x137},
+	161: {From: 0x3c99, To: 0x4bc},
+	162: {From: 0x3fbd, To: 0x100},
+	163: {From: 0x4208, To: 0xa91},
+	164: {From: 0x42be, To: 0x573},
+	165: {From: 0x42f9, To: 0x3f60},
+	166: {From: 0x4378, To: 0x25a},
+	167: {From: 0x43b8, To: 0xe6c},
+	168: {From: 0x43cd, To: 0x10f},
+	169: {From: 0x44af, To: 0x3322},
+	170: {From: 0x44e3, To: 0x512},
+	171: {From: 0x45ca, To: 0x2409},
+	172: {From: 0x45dd, To: 0x26dc},
+	173: {From: 0x4610, To: 0x48ae},
+	174: {From: 0x46ae, To: 0x46a0},
+	175: {From: 0x473e, To: 0x4745},
+	176: {From: 0x4817, To: 0x3503},
+	177: {From: 0x4916, To: 0x31f},
+	178: {From: 0x49a7, To: 0x523},
 }
 
-// Size: 176 bytes, 176 elements
-var AliasTypes = [176]AliasType{
+// Size: 179 bytes, 179 elements
+var AliasTypes = [179]AliasType{
 	// Entry 0 - 3F
 	1, 0, 0, 0, 0, 0, 0, 1, 2, 2, 0, 1, 0, 0, 1, 2,
-	1, 1, 2, 0, 0, 1, 0, 1, 2, 1, 1, 0, 0, 2, 1, 1,
-	0, 2, 0, 0, 1, 0, 1, 0, 0, 1, 2, 1, 1, 1, 1, 0,
-	0, 0, 0, 2, 1, 1, 1, 1, 2, 1, 0, 1, 1, 2, 2, 0,
+	1, 1, 2, 0, 0, 1, 0, 1, 2, 1, 1, 0, 0, 0, 0, 2,
+	1, 1, 0, 2, 0, 0, 1, 0, 1, 0, 0, 1, 2, 1, 1, 1,
+	1, 0, 0, 0, 0, 2, 1, 1, 1, 1, 2, 1, 0, 1, 1, 2,
 	// Entry 40 - 7F
-	0, 1, 2, 0, 1, 0, 1, 1, 1, 1, 0, 0, 2, 1, 0, 0,
-	0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0, 0, 0,
-	0, 1, 0, 0, 0, 1, 2, 2, 2, 0, 1, 1, 0, 1, 0, 0,
-	0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 1, 0, 2, 1, 1,
+	2, 0, 0, 1, 2, 0, 1, 0, 1, 1, 1, 1, 0, 0, 2, 1,
+	0, 0, 0, 0, 1, 1, 1, 1, 1, 0, 1, 0, 0, 0, 0, 0,
+	0, 0, 0, 1, 0, 0, 0, 1, 2, 2, 2, 0, 1, 1, 0, 1,
+	0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 1, 0, 0, 1, 0,
 	// Entry 80 - BF
-	0, 0, 1, 0, 0, 0, 0, 1, 1, 2, 0, 0, 2, 1, 1, 1,
-	0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 1, 1, 0, 1, 2,
-	0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1, 0, 1, 1,
+	2, 1, 1, 0, 0, 1, 0, 0, 0, 0, 1, 1, 2, 0, 0, 2,
+	1, 1, 1, 0, 0, 0, 0, 2, 0, 0, 0, 0, 0, 0, 1, 1,
+	0, 1, 2, 0, 0, 0, 1, 0, 1, 0, 1, 0, 0, 0, 0, 1,
+	0, 1, 1,
 }
 
 const (
@@ -786,17 +790,17 @@ const (
 	_Hani = 57
 	_Hans = 59
 	_Hant = 60
-	_Qaaa = 143
-	_Qaai = 151
-	_Qabx = 192
-	_Zinh = 245
-	_Zyyy = 250
-	_Zzzz = 251
+	_Qaaa = 147
+	_Qaai = 155
+	_Qabx = 196
+	_Zinh = 252
+	_Zyyy = 257
+	_Zzzz = 258
 )
 
 // script is an alphabetically sorted list of ISO 15924 codes. The index
 // of the script in the string, divided by 4, is the internal scriptID.
-const script tag.Index = "" + // Size: 1012 bytes
+const script tag.Index = "" + // Size: 1040 bytes
 	"----AdlmAfakAghbAhomArabAranArmiArmnAvstBaliBamuBassBatkBengBhksBlisBopo" +
 	"BrahBraiBugiBuhdCakmCansCariChamCherChrsCirtCoptCpmnCprtCyrlCyrsDevaDiak" +
 	"DogrDsrtDuplEgydEgyhEgypElbaElymEthiGeokGeorGlagGongGonmGothGranGrekGujr" +
@@ -804,14 +808,14 @@ const script tag.Index = "" + // Size: 1012 bytes
 	"JavaJpanJurcKaliKanaKharKhmrKhojKitlKitsKndaKoreKpelKthiLanaLaooLatfLatg" +
 	"LatnLekeLepcLimbLinaLinbLisuLomaLyciLydiMahjMakaMandManiMarcMayaMedfMend" +
 	"MercMeroMlymModiMongMoonMrooMteiMultMymrNandNarbNbatNewaNkdbNkgbNkooNshu" +
-	"OgamOlckOrkhOryaOsgeOsmaPalmPaucPermPhagPhliPhlpPhlvPhnxPiqdPlrdPrtiQaaa" +
-	"QaabQaacQaadQaaeQaafQaagQaahQaaiQaajQaakQaalQaamQaanQaaoQaapQaaqQaarQaas" +
-	"QaatQaauQaavQaawQaaxQaayQaazQabaQabbQabcQabdQabeQabfQabgQabhQabiQabjQabk" +
-	"QablQabmQabnQaboQabpQabqQabrQabsQabtQabuQabvQabwQabxRjngRohgRoroRunrSamr" +
-	"SaraSarbSaurSgnwShawShrdShuiSiddSindSinhSogdSogoSoraSoyoSundSyloSyrcSyre" +
-	"SyrjSyrnTagbTakrTaleTaluTamlTangTavtTeluTengTfngTglgThaaThaiTibtTirhToto" +
-	"UgarVaiiVispWaraWchoWoleXpeoXsuxYeziYiiiZanbZinhZmthZsyeZsymZxxxZyyyZzzz" +
-	"\xff\xff\xff\xff"
+	"OgamOlckOrkhOryaOsgeOsmaOugrPalmPaucPcunPelmPermPhagPhliPhlpPhlvPhnxPiqd" +
+	"PlrdPrtiPsinQaaaQaabQaacQaadQaaeQaafQaagQaahQaaiQaajQaakQaalQaamQaanQaao" +
+	"QaapQaaqQaarQaasQaatQaauQaavQaawQaaxQaayQaazQabaQabbQabcQabdQabeQabfQabg" +
+	"QabhQabiQabjQabkQablQabmQabnQaboQabpQabqQabrQabsQabtQabuQabvQabwQabxRanj" +
+	"RjngRohgRoroRunrSamrSaraSarbSaurSgnwShawShrdShuiSiddSindSinhSogdSogoSora" +
+	"SoyoSundSyloSyrcSyreSyrjSyrnTagbTakrTaleTaluTamlTangTavtTeluTengTfngTglg" +
+	"ThaaThaiTibtTirhTnsaTotoUgarVaiiVispVithWaraWchoWoleXpeoXsuxYeziYiiiZanb" +
+	"ZinhZmthZsyeZsymZxxxZyyyZzzz\xff\xff\xff\xff"
 
 // suppressScript is an index from langID to the dominant script for that language,
 // if it exists.  If a script is given, it should be suppressed from the language tag.
@@ -859,7 +863,7 @@ var suppressScript = [1330]uint8{
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x5a,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
-	0xe5, 0x00, 0x00, 0x00, 0x00, 0xe7, 0x00, 0x00,
+	0xea, 0x00, 0x00, 0x00, 0x00, 0xec, 0x00, 0x00,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x34, 0x00,
 	0x00, 0x5a, 0x00, 0x00, 0x5a, 0x00, 0x5a, 0x00,
 	// Entry 140 - 17F
@@ -963,7 +967,7 @@ var suppressScript = [1330]uint8{
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 	// Entry 400 - 43F
 	0x00, 0x00, 0x5a, 0x00, 0x00, 0x00, 0x00, 0x00,
-	0x00, 0x00, 0x00, 0x00, 0xcf, 0x00, 0x00, 0x00,
+	0x00, 0x00, 0x00, 0x00, 0xd4, 0x00, 0x00, 0x00,
 	0x00, 0x00, 0x5a, 0x00, 0x00, 0x00, 0x5a, 0x00,
 	0x00, 0x00, 0x00, 0x5a, 0x00, 0x00, 0x00, 0x00,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
@@ -973,10 +977,10 @@ var suppressScript = [1330]uint8{
 	// Entry 440 - 47F
 	0x00, 0x00, 0x00, 0x00, 0x5a, 0x5a, 0x00, 0x00,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
-	0xde, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
+	0xe3, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
-	0x00, 0xe1, 0x00, 0x5a, 0x00, 0x00, 0x00, 0x00,
-	0x00, 0x00, 0x00, 0xe6, 0x00, 0x00, 0x00, 0x2c,
+	0x00, 0xe6, 0x00, 0x5a, 0x00, 0x00, 0x00, 0x00,
+	0x00, 0x00, 0x00, 0xeb, 0x00, 0x00, 0x00, 0x2c,
 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x5a,
 	0x00, 0x00, 0x5a, 0x00, 0x00, 0x00, 0x5a, 0x00,
 	// Entry 480 - 4BF
@@ -1087,7 +1091,7 @@ var regionTypes = [358]uint8{
 
 // regionISO holds a list of alphabetically sorted 2-letter ISO region codes.
 // Each 2-letter codes is followed by two bytes with the following meaning:
-//   - [A-Z]{2}: the first letter of the 2-letter code plus these two
+//   - [A-Z]{2}: the first letter of the 2-letter code plus these two
 //     letters form the 3-letter ISO code.
 //   - 0, n:     index into altRegionISO3.
 const regionISO tag.Index = "" + // Size: 1308 bytes
@@ -1271,117 +1275,118 @@ var fromM49 = [333]uint16{
 	0xc759, 0xc95a, 0xcb5b, 0xcd5c, 0xcf65,
 }
 
-// Size: 1995 bytes
+// Size: 2014 bytes
 var variantIndex = map[string]uint8{
 	"1606nict": 0x0,
 	"1694acad": 0x1,
 	"1901":     0x2,
 	"1959acad": 0x3,
-	"1994":     0x60,
+	"1994":     0x61,
 	"1996":     0x4,
 	"abl1943":  0x5,
 	"akuapem":  0x6,
-	"alalc97":  0x62,
+	"alalc97":  0x63,
 	"aluku":    0x7,
 	"ao1990":   0x8,
 	"aranes":   0x9,
 	"arevela":  0xa,
 	"arevmda":  0xb,
-	"asante":   0xc,
-	"auvern":   0xd,
-	"baku1926": 0xe,
-	"balanka":  0xf,
-	"barla":    0x10,
-	"basiceng": 0x11,
-	"bauddha":  0x12,
-	"biscayan": 0x13,
-	"biske":    0x5b,
-	"bohoric":  0x14,
-	"boont":    0x15,
-	"bornholm": 0x16,
-	"cisaup":   0x17,
-	"colb1945": 0x18,
-	"cornu":    0x19,
-	"creiss":   0x1a,
-	"dajnko":   0x1b,
-	"ekavsk":   0x1c,
-	"emodeng":  0x1d,
-	"fonipa":   0x63,
-	"fonkirsh": 0x64,
-	"fonnapa":  0x65,
-	"fonupa":   0x66,
-	"fonxsamp": 0x67,
-	"gascon":   0x1e,
-	"grclass":  0x1f,
-	"grital":   0x20,
-	"grmistr":  0x21,
-	"hepburn":  0x22,
-	"heploc":   0x61,
-	"hognorsk": 0x23,
-	"hsistemo": 0x24,
-	"ijekavsk": 0x25,
-	"itihasa":  0x26,
-	"ivanchov": 0x27,
-	"jauer":    0x28,
-	"jyutping": 0x29,
-	"kkcor":    0x2a,
-	"kociewie": 0x2b,
-	"kscor":    0x2c,
-	"laukika":  0x2d,
-	"lemosin":  0x2e,
-	"lengadoc": 0x2f,
-	"lipaw":    0x5c,
-	"luna1918": 0x30,
-	"metelko":  0x31,
-	"monoton":  0x32,
-	"ndyuka":   0x33,
-	"nedis":    0x34,
-	"newfound": 0x35,
-	"nicard":   0x36,
-	"njiva":    0x5d,
-	"nulik":    0x37,
-	"osojs":    0x5e,
-	"oxendict": 0x38,
-	"pahawh2":  0x39,
-	"pahawh3":  0x3a,
-	"pahawh4":  0x3b,
-	"pamaka":   0x3c,
-	"peano":    0x3d,
-	"petr1708": 0x3e,
-	"pinyin":   0x3f,
-	"polyton":  0x40,
-	"provenc":  0x41,
-	"puter":    0x42,
-	"rigik":    0x43,
-	"rozaj":    0x44,
-	"rumgr":    0x45,
-	"scotland": 0x46,
-	"scouse":   0x47,
-	"simple":   0x68,
-	"solba":    0x5f,
-	"sotav":    0x48,
-	"spanglis": 0x49,
-	"surmiran": 0x4a,
-	"sursilv":  0x4b,
-	"sutsilv":  0x4c,
-	"tarask":   0x4d,
-	"tongyong": 0x4e,
-	"tunumiit": 0x4f,
-	"uccor":    0x50,
-	"ucrcor":   0x51,
-	"ulster":   0x52,
-	"unifon":   0x53,
-	"vaidika":  0x54,
-	"valencia": 0x55,
-	"vallader": 0x56,
-	"vecdruka": 0x57,
-	"vivaraup": 0x58,
-	"wadegile": 0x59,
-	"xsistemo": 0x5a,
+	"arkaika":  0xc,
+	"asante":   0xd,
+	"auvern":   0xe,
+	"baku1926": 0xf,
+	"balanka":  0x10,
+	"barla":    0x11,
+	"basiceng": 0x12,
+	"bauddha":  0x13,
+	"biscayan": 0x14,
+	"biske":    0x5c,
+	"bohoric":  0x15,
+	"boont":    0x16,
+	"bornholm": 0x17,
+	"cisaup":   0x18,
+	"colb1945": 0x19,
+	"cornu":    0x1a,
+	"creiss":   0x1b,
+	"dajnko":   0x1c,
+	"ekavsk":   0x1d,
+	"emodeng":  0x1e,
+	"fonipa":   0x64,
+	"fonkirsh": 0x65,
+	"fonnapa":  0x66,
+	"fonupa":   0x67,
+	"fonxsamp": 0x68,
+	"gascon":   0x1f,
+	"grclass":  0x20,
+	"grital":   0x21,
+	"grmistr":  0x22,
+	"hepburn":  0x23,
+	"heploc":   0x62,
+	"hognorsk": 0x24,
+	"hsistemo": 0x25,
+	"ijekavsk": 0x26,
+	"itihasa":  0x27,
+	"ivanchov": 0x28,
+	"jauer":    0x29,
+	"jyutping": 0x2a,
+	"kkcor":    0x2b,
+	"kociewie": 0x2c,
+	"kscor":    0x2d,
+	"laukika":  0x2e,
+	"lemosin":  0x2f,
+	"lengadoc": 0x30,
+	"lipaw":    0x5d,
+	"luna1918": 0x31,
+	"metelko":  0x32,
+	"monoton":  0x33,
+	"ndyuka":   0x34,
+	"nedis":    0x35,
+	"newfound": 0x36,
+	"nicard":   0x37,
+	"njiva":    0x5e,
+	"nulik":    0x38,
+	"osojs":    0x5f,
+	"oxendict": 0x39,
+	"pahawh2":  0x3a,
+	"pahawh3":  0x3b,
+	"pahawh4":  0x3c,
+	"pamaka":   0x3d,
+	"peano":    0x3e,
+	"petr1708": 0x3f,
+	"pinyin":   0x40,
+	"polyton":  0x41,
+	"provenc":  0x42,
+	"puter":    0x43,
+	"rigik":    0x44,
+	"rozaj":    0x45,
+	"rumgr":    0x46,
+	"scotland": 0x47,
+	"scouse":   0x48,
+	"simple":   0x69,
+	"solba":    0x60,
+	"sotav":    0x49,
+	"spanglis": 0x4a,
+	"surmiran": 0x4b,
+	"sursilv":  0x4c,
+	"sutsilv":  0x4d,
+	"tarask":   0x4e,
+	"tongyong": 0x4f,
+	"tunumiit": 0x50,
+	"uccor":    0x51,
+	"ucrcor":   0x52,
+	"ulster":   0x53,
+	"unifon":   0x54,
+	"vaidika":  0x55,
+	"valencia": 0x56,
+	"vallader": 0x57,
+	"vecdruka": 0x58,
+	"vivaraup": 0x59,
+	"wadegile": 0x5a,
+	"xsistemo": 0x5b,
 }
 
 // variantNumSpecialized is the number of specialized variants in variants.
-const variantNumSpecialized = 98
+const variantNumSpecialized = 99
 
 // nRegionGroups is the number of region groups.
 const nRegionGroups = 33
@@ -1393,8 +1398,8 @@ type likelyLangRegion struct {
 
 // likelyScript is a lookup table, indexed by scriptID, for the most likely
 // languages and regions given a script.
-// Size: 1012 bytes, 253 elements
-var likelyScript = [253]likelyLangRegion{
+// Size: 1040 bytes, 260 elements
+var likelyScript = [260]likelyLangRegion{
 	1:   {lang: 0x14e, region: 0x84},
 	3:   {lang: 0x2a2, region: 0x106},
 	4:   {lang: 0x1f, region: 0x99},
@@ -1492,57 +1497,57 @@ var likelyScript = [253]likelyLangRegion{
 	129: {lang: 0x395, region: 0x99},
 	130: {lang: 0x399, region: 0x135},
 	131: {lang: 0x429, region: 0x115},
-	132: {lang: 0x3b, region: 0x11c},
-	133: {lang: 0xfd, region: 0xc4},
-	134: {lang: 0x27d, region: 0x106},
-	135: {lang: 0x2c9, region: 0x53},
-	136: {lang: 0x39f, region: 0x9c},
-	137: {lang: 0x39f, region: 0x53},
-	139: {lang: 0x3ad, region: 0xb0},
-	141: {lang: 0x1c6, region: 0x53},
-	142: {lang: 0x4fd, region: 0x9c},
-	193: {lang: 0x3cb, region: 0x95},
-	196: {lang: 0x372, region: 0x10c},
-	197: {lang: 0x420, region: 0x97},
-	199: {lang: 0x4ff, region: 0x15e},
-	200: {lang: 0x3f0, region: 0x99},
-	201: {lang: 0x45, region: 0x135},
-	202: {lang: 0x139, region: 0x7b},
-	203: {lang: 0x3e9, region: 0x99},
-	205: {lang: 0x3e9, region: 0x99},
-	206: {lang: 0x3fa, region: 0x99},
-	207: {lang: 0x40c, region: 0xb3},
-	210: {lang: 0x433, region: 0x99},
-	211: {lang: 0xef, region: 0xc5},
-	212: {lang: 0x43e, region: 0x95},
-	213: {lang: 0x44d, region: 0x35},
-	214: {lang: 0x44e, region: 0x9b},
-	218: {lang: 0x45a, region: 0xe7},
-	219: {lang: 0x11a, region: 0x99},
-	220: {lang: 0x45e, region: 0x53},
-	221: {lang: 0x232, region: 0x53},
-	222: {lang: 0x450, region: 0x99},
-	223: {lang: 0x4a5, region: 0x53},
-	224: {lang: 0x9f, region: 0x13e},
-	225: {lang: 0x461, region: 0x99},
-	227: {lang: 0x528, region: 0xba},
-	228: {lang: 0x153, region: 0xe7},
-	229: {lang: 0x128, region: 0xcd},
-	230: {lang: 0x46b, region: 0x123},
-	231: {lang: 0xa9, region: 0x53},
-	232: {lang: 0x2ce, region: 0x99},
-	234: {lang: 0x4ad, region: 0x11c},
-	235: {lang: 0x4be, region: 0xb4},
-	237: {lang: 0x1ce, region: 0x99},
-	240: {lang: 0x3a9, region: 0x9c},
-	241: {lang: 0x22, region: 0x9b},
-	243: {lang: 0x1ea, region: 0x53},
-	244: {lang: 0xef, region: 0xc5},
+	133: {lang: 0x3b, region: 0x11c},
+	134: {lang: 0xfd, region: 0xc4},
+	137: {lang: 0x27d, region: 0x106},
+	138: {lang: 0x2c9, region: 0x53},
+	139: {lang: 0x39f, region: 0x9c},
+	140: {lang: 0x39f, region: 0x53},
+	142: {lang: 0x3ad, region: 0xb0},
+	144: {lang: 0x1c6, region: 0x53},
+	145: {lang: 0x4fd, region: 0x9c},
+	198: {lang: 0x3cb, region: 0x95},
+	201: {lang: 0x372, region: 0x10c},
+	202: {lang: 0x420, region: 0x97},
+	204: {lang: 0x4ff, region: 0x15e},
+	205: {lang: 0x3f0, region: 0x99},
+	206: {lang: 0x45, region: 0x135},
+	207: {lang: 0x139, region: 0x7b},
+	208: {lang: 0x3e9, region: 0x99},
+	210: {lang: 0x3e9, region: 0x99},
+	211: {lang: 0x3fa, region: 0x99},
+	212: {lang: 0x40c, region: 0xb3},
+	215: {lang: 0x433, region: 0x99},
+	216: {lang: 0xef, region: 0xc5},
+	217: {lang: 0x43e, region: 0x95},
+	218: {lang: 0x44d, region: 0x35},
+	219: {lang: 0x44e, region: 0x9b},
+	223: {lang: 0x45a, region: 0xe7},
+	224: {lang: 0x11a, region: 0x99},
+	225: {lang: 0x45e, region: 0x53},
+	226: {lang: 0x232, region: 0x53},
+	227: {lang: 0x450, region: 0x99},
+	228: {lang: 0x4a5, region: 0x53},
+	229: {lang: 0x9f, region: 0x13e},
+	230: {lang: 0x461, region: 0x99},
+	232: {lang: 0x528, region: 0xba},
+	233: {lang: 0x153, region: 0xe7},
+	234: {lang: 0x128, region: 0xcd},
+	235: {lang: 0x46b, region: 0x123},
+	236: {lang: 0xa9, region: 0x53},
+	237: {lang: 0x2ce, region: 0x99},
+	240: {lang: 0x4ad, region: 0x11c},
+	241: {lang: 0x4be, region: 0xb4},
+	244: {lang: 0x1ce, region: 0x99},
+	247: {lang: 0x3a9, region: 0x9c},
+	248: {lang: 0x22, region: 0x9b},
+	250: {lang: 0x1ea, region: 0x53},
+	251: {lang: 0xef, region: 0xc5},
 }
 
 type likelyScriptRegion struct {
 	region uint16
-	script uint8
+	script uint16
 	flags  uint8
 }
 
@@ -1550,7 +1555,7 @@ type likelyScriptRegion struct {
 // scripts and regions given incomplete information. If more entries exist for a
 // given language, region and script are the index and size respectively
 // of the list in likelyLangList.
-// Size: 5320 bytes, 1330 elements
+// Size: 7980 bytes, 1330 elements
 var likelyLang = [1330]likelyScriptRegion{
 	0:    {region: 0x135, script: 0x5a, flags: 0x0},
 	1:    {region: 0x6f, script: 0x5a, flags: 0x0},
@@ -1586,7 +1591,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	31:   {region: 0x99, script: 0x4, flags: 0x0},
 	32:   {region: 0x165, script: 0x5a, flags: 0x0},
 	33:   {region: 0x80, script: 0x5a, flags: 0x0},
-	34:   {region: 0x9b, script: 0xf1, flags: 0x0},
+	34:   {region: 0x9b, script: 0xf8, flags: 0x0},
 	35:   {region: 0x165, script: 0x5a, flags: 0x0},
 	36:   {region: 0x165, script: 0x5a, flags: 0x0},
 	37:   {region: 0x14d, script: 0x5a, flags: 0x0},
@@ -1619,7 +1624,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	66:   {region: 0x6b, script: 0x5, flags: 0x0},
 	67:   {region: 0x99, script: 0xe, flags: 0x0},
 	68:   {region: 0x12f, script: 0x5a, flags: 0x0},
-	69:   {region: 0x135, script: 0xc9, flags: 0x0},
+	69:   {region: 0x135, script: 0xce, flags: 0x0},
 	70:   {region: 0x165, script: 0x5a, flags: 0x0},
 	71:   {region: 0x165, script: 0x5a, flags: 0x0},
 	72:   {region: 0x6e, script: 0x5a, flags: 0x0},
@@ -1673,7 +1678,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	120:  {region: 0x165, script: 0x5a, flags: 0x0},
 	121:  {region: 0x12f, script: 0x5a, flags: 0x0},
 	122:  {region: 0x52, script: 0x5a, flags: 0x0},
-	123:  {region: 0x99, script: 0xde, flags: 0x0},
+	123:  {region: 0x99, script: 0xe3, flags: 0x0},
 	124:  {region: 0xe8, script: 0x5, flags: 0x0},
 	125:  {region: 0x99, script: 0x22, flags: 0x0},
 	126:  {region: 0x38, script: 0x20, flags: 0x0},
@@ -1708,7 +1713,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	156:  {region: 0x165, script: 0x5a, flags: 0x0},
 	157:  {region: 0xe7, script: 0x5a, flags: 0x0},
 	158:  {region: 0x165, script: 0x5a, flags: 0x0},
-	159:  {region: 0x13e, script: 0xe0, flags: 0x0},
+	159:  {region: 0x13e, script: 0xe5, flags: 0x0},
 	160:  {region: 0xc3, script: 0x5a, flags: 0x0},
 	161:  {region: 0x165, script: 0x5a, flags: 0x0},
 	162:  {region: 0x165, script: 0x5a, flags: 0x0},
@@ -1718,7 +1723,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	166:  {region: 0x165, script: 0x5a, flags: 0x0},
 	167:  {region: 0x165, script: 0x5a, flags: 0x0},
 	168:  {region: 0x165, script: 0x5a, flags: 0x0},
-	169:  {region: 0x53, script: 0xe7, flags: 0x0},
+	169:  {region: 0x53, script: 0xec, flags: 0x0},
 	170:  {region: 0x165, script: 0x5a, flags: 0x0},
 	171:  {region: 0x165, script: 0x5a, flags: 0x0},
 	172:  {region: 0x165, script: 0x5a, flags: 0x0},
@@ -1788,7 +1793,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	236:  {region: 0x165, script: 0x5a, flags: 0x0},
 	237:  {region: 0x165, script: 0x5a, flags: 0x0},
 	238:  {region: 0x165, script: 0x5a, flags: 0x0},
-	239:  {region: 0xc5, script: 0xd3, flags: 0x0},
+	239:  {region: 0xc5, script: 0xd8, flags: 0x0},
 	240:  {region: 0x78, script: 0x5a, flags: 0x0},
 	241:  {region: 0x6b, script: 0x1d, flags: 0x0},
 	242:  {region: 0xe7, script: 0x5a, flags: 0x0},
@@ -1802,7 +1807,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	250:  {region: 0x5e, script: 0x5a, flags: 0x0},
 	251:  {region: 0xe9, script: 0x5a, flags: 0x0},
 	252:  {region: 0x49, script: 0x17, flags: 0x0},
-	253:  {region: 0xc4, script: 0x85, flags: 0x0},
+	253:  {region: 0xc4, script: 0x86, flags: 0x0},
 	254:  {region: 0x8, script: 0x2, flags: 0x1},
 	255:  {region: 0x106, script: 0x20, flags: 0x0},
 	256:  {region: 0x7b, script: 0x5a, flags: 0x0},
@@ -1845,12 +1850,12 @@ var likelyLang = [1330]likelyScriptRegion{
 	293:  {region: 0x165, script: 0x5a, flags: 0x0},
 	294:  {region: 0x165, script: 0x5a, flags: 0x0},
 	295:  {region: 0x165, script: 0x5a, flags: 0x0},
-	296:  {region: 0xcd, script: 0xe5, flags: 0x0},
+	296:  {region: 0xcd, script: 0xea, flags: 0x0},
 	297:  {region: 0x165, script: 0x5a, flags: 0x0},
 	298:  {region: 0x165, script: 0x5a, flags: 0x0},
 	299:  {region: 0x114, script: 0x5a, flags: 0x0},
 	300:  {region: 0x37, script: 0x5a, flags: 0x0},
-	301:  {region: 0x43, script: 0xe7, flags: 0x0},
+	301:  {region: 0x43, script: 0xec, flags: 0x0},
 	302:  {region: 0x165, script: 0x5a, flags: 0x0},
 	303:  {region: 0xa4, script: 0x5a, flags: 0x0},
 	304:  {region: 0x80, script: 0x5a, flags: 0x0},
@@ -1960,7 +1965,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	408:  {region: 0x165, script: 0x2c, flags: 0x0},
 	409:  {region: 0x165, script: 0x5a, flags: 0x0},
 	410:  {region: 0x99, script: 0x22, flags: 0x0},
-	411:  {region: 0x99, script: 0xe1, flags: 0x0},
+	411:  {region: 0x99, script: 0xe6, flags: 0x0},
 	412:  {region: 0x95, script: 0x5a, flags: 0x0},
 	413:  {region: 0xd9, script: 0x5a, flags: 0x0},
 	414:  {region: 0x130, script: 0x32, flags: 0x0},
@@ -2003,7 +2008,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	451:  {region: 0xe7, script: 0x5a, flags: 0x0},
 	452:  {region: 0x165, script: 0x5a, flags: 0x0},
 	453:  {region: 0x12b, script: 0x40, flags: 0x0},
-	454:  {region: 0x53, script: 0x8d, flags: 0x0},
+	454:  {region: 0x53, script: 0x90, flags: 0x0},
 	455:  {region: 0x165, script: 0x5a, flags: 0x0},
 	456:  {region: 0xe8, script: 0x5, flags: 0x0},
 	457:  {region: 0x99, script: 0x22, flags: 0x0},
@@ -2038,7 +2043,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	487:  {region: 0xd6, script: 0x5a, flags: 0x0},
 	488:  {region: 0x165, script: 0x5a, flags: 0x0},
 	489:  {region: 0x165, script: 0x5a, flags: 0x0},
-	490:  {region: 0x53, script: 0xf3, flags: 0x0},
+	490:  {region: 0x53, script: 0xfa, flags: 0x0},
 	491:  {region: 0x165, script: 0x5a, flags: 0x0},
 	492:  {region: 0x135, script: 0x5a, flags: 0x0},
 	493:  {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2098,7 +2103,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	547:  {region: 0x12f, script: 0x5a, flags: 0x0},
 	548:  {region: 0x122, script: 0x5, flags: 0x0},
 	549:  {region: 0x165, script: 0x5a, flags: 0x0},
-	550:  {region: 0x123, script: 0xe6, flags: 0x0},
+	550:  {region: 0x123, script: 0xeb, flags: 0x0},
 	551:  {region: 0x5a, script: 0x5a, flags: 0x0},
 	552:  {region: 0x52, script: 0x5a, flags: 0x0},
 	553:  {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2110,7 +2115,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	559:  {region: 0x165, script: 0x5a, flags: 0x0},
 	560:  {region: 0x41, script: 0x5a, flags: 0x0},
 	561:  {region: 0x99, script: 0x5a, flags: 0x0},
-	562:  {region: 0x53, script: 0xdd, flags: 0x0},
+	562:  {region: 0x53, script: 0xe2, flags: 0x0},
 	563:  {region: 0x99, script: 0x22, flags: 0x0},
 	564:  {region: 0xc3, script: 0x5a, flags: 0x0},
 	565:  {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2194,7 +2199,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	643:  {region: 0x165, script: 0x5a, flags: 0x0},
 	644:  {region: 0x165, script: 0x5a, flags: 0x0},
 	645:  {region: 0x165, script: 0x2c, flags: 0x0},
-	646:  {region: 0x123, script: 0xe6, flags: 0x0},
+	646:  {region: 0x123, script: 0xeb, flags: 0x0},
 	647:  {region: 0xe8, script: 0x5, flags: 0x0},
 	648:  {region: 0x165, script: 0x5a, flags: 0x0},
 	649:  {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2214,7 +2219,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	663:  {region: 0x165, script: 0x5a, flags: 0x0},
 	664:  {region: 0x95, script: 0x5a, flags: 0x0},
 	665:  {region: 0x165, script: 0x5a, flags: 0x0},
-	666:  {region: 0x53, script: 0xe6, flags: 0x0},
+	666:  {region: 0x53, script: 0xeb, flags: 0x0},
 	667:  {region: 0x165, script: 0x5a, flags: 0x0},
 	668:  {region: 0x165, script: 0x5a, flags: 0x0},
 	669:  {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2238,7 +2243,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	687:  {region: 0x135, script: 0x5a, flags: 0x0},
 	688:  {region: 0x165, script: 0x5a, flags: 0x0},
 	689:  {region: 0x165, script: 0x5a, flags: 0x0},
-	690:  {region: 0x99, script: 0xe1, flags: 0x0},
+	690:  {region: 0x99, script: 0xe6, flags: 0x0},
 	691:  {region: 0x9e, script: 0x5a, flags: 0x0},
 	692:  {region: 0x165, script: 0x5a, flags: 0x0},
 	693:  {region: 0x4b, script: 0x5a, flags: 0x0},
@@ -2260,7 +2265,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	709:  {region: 0xa4, script: 0x5a, flags: 0x0},
 	710:  {region: 0x9c, script: 0x5, flags: 0x0},
 	711:  {region: 0xb8, script: 0x5a, flags: 0x0},
-	712:  {region: 0x123, script: 0xe6, flags: 0x0},
+	712:  {region: 0x123, script: 0xeb, flags: 0x0},
 	713:  {region: 0x53, script: 0x3b, flags: 0x0},
 	714:  {region: 0x12b, script: 0x5a, flags: 0x0},
 	715:  {region: 0x95, script: 0x5a, flags: 0x0},
@@ -2427,7 +2432,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	879:  {region: 0xda, script: 0x5a, flags: 0x0},
 	880:  {region: 0x123, script: 0x56, flags: 0x0},
 	881:  {region: 0x99, script: 0x22, flags: 0x0},
-	882:  {region: 0x10c, script: 0xc4, flags: 0x0},
+	882:  {region: 0x10c, script: 0xc9, flags: 0x0},
 	883:  {region: 0x165, script: 0x5a, flags: 0x0},
 	884:  {region: 0x165, script: 0x5a, flags: 0x0},
 	885:  {region: 0x84, script: 0x7c, flags: 0x0},
@@ -2481,11 +2486,11 @@ var likelyLang = [1330]likelyScriptRegion{
 	934:  {region: 0x135, script: 0x5a, flags: 0x0},
 	935:  {region: 0x49, script: 0x5a, flags: 0x0},
 	936:  {region: 0x165, script: 0x5a, flags: 0x0},
-	937:  {region: 0x9c, script: 0xf0, flags: 0x0},
+	937:  {region: 0x9c, script: 0xf7, flags: 0x0},
 	938:  {region: 0x165, script: 0x5a, flags: 0x0},
 	939:  {region: 0x60, script: 0x5a, flags: 0x0},
 	940:  {region: 0x165, script: 0x5, flags: 0x0},
-	941:  {region: 0xb0, script: 0x8b, flags: 0x0},
+	941:  {region: 0xb0, script: 0x8e, flags: 0x0},
 	943:  {region: 0x165, script: 0x5a, flags: 0x0},
 	944:  {region: 0x165, script: 0x5a, flags: 0x0},
 	945:  {region: 0x99, script: 0x12, flags: 0x0},
@@ -2551,7 +2556,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	1005: {region: 0x95, script: 0x5a, flags: 0x0},
 	1006: {region: 0x99, script: 0x5a, flags: 0x0},
 	1007: {region: 0x114, script: 0x5a, flags: 0x0},
-	1008: {region: 0x99, script: 0xc8, flags: 0x0},
+	1008: {region: 0x99, script: 0xcd, flags: 0x0},
 	1009: {region: 0x165, script: 0x5a, flags: 0x0},
 	1010: {region: 0x165, script: 0x5a, flags: 0x0},
 	1011: {region: 0x12f, script: 0x5a, flags: 0x0},
@@ -2574,11 +2579,11 @@ var likelyLang = [1330]likelyScriptRegion{
 	1028: {region: 0xb6, script: 0x5a, flags: 0x0},
 	1029: {region: 0x165, script: 0x2c, flags: 0x0},
 	1030: {region: 0x165, script: 0x5a, flags: 0x0},
-	1032: {region: 0xba, script: 0xe3, flags: 0x0},
+	1032: {region: 0xba, script: 0xe8, flags: 0x0},
 	1033: {region: 0x165, script: 0x5a, flags: 0x0},
 	1034: {region: 0xc4, script: 0x75, flags: 0x0},
 	1035: {region: 0x165, script: 0x5, flags: 0x0},
-	1036: {region: 0xb3, script: 0xcf, flags: 0x0},
+	1036: {region: 0xb3, script: 0xd4, flags: 0x0},
 	1037: {region: 0x6f, script: 0x5a, flags: 0x0},
 	1038: {region: 0x165, script: 0x5a, flags: 0x0},
 	1039: {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2597,7 +2602,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	1052: {region: 0x10c, script: 0x5a, flags: 0x0},
 	1054: {region: 0x10c, script: 0x5a, flags: 0x0},
 	1055: {region: 0x72, script: 0x5a, flags: 0x0},
-	1056: {region: 0x97, script: 0xc5, flags: 0x0},
+	1056: {region: 0x97, script: 0xca, flags: 0x0},
 	1057: {region: 0x165, script: 0x5a, flags: 0x0},
 	1058: {region: 0x72, script: 0x5a, flags: 0x0},
 	1059: {region: 0x164, script: 0x5a, flags: 0x0},
@@ -2609,14 +2614,14 @@ var likelyLang = [1330]likelyScriptRegion{
 	1065: {region: 0x115, script: 0x5a, flags: 0x0},
 	1066: {region: 0x165, script: 0x5a, flags: 0x0},
 	1067: {region: 0x165, script: 0x5a, flags: 0x0},
-	1068: {region: 0x123, script: 0xe6, flags: 0x0},
+	1068: {region: 0x123, script: 0xeb, flags: 0x0},
 	1069: {region: 0x165, script: 0x5a, flags: 0x0},
 	1070: {region: 0x165, script: 0x5a, flags: 0x0},
 	1071: {region: 0x165, script: 0x5a, flags: 0x0},
 	1072: {region: 0x165, script: 0x5a, flags: 0x0},
 	1073: {region: 0x27, script: 0x5a, flags: 0x0},
 	1074: {region: 0x37, script: 0x5, flags: 0x1},
-	1075: {region: 0x99, script: 0xd2, flags: 0x0},
+	1075: {region: 0x99, script: 0xd7, flags: 0x0},
 	1076: {region: 0x116, script: 0x5a, flags: 0x0},
 	1077: {region: 0x114, script: 0x5a, flags: 0x0},
 	1078: {region: 0x99, script: 0x22, flags: 0x0},
@@ -2643,9 +2648,9 @@ var likelyLang = [1330]likelyScriptRegion{
 	1099: {region: 0x95, script: 0x5a, flags: 0x0},
 	1100: {region: 0x165, script: 0x5a, flags: 0x0},
 	1101: {region: 0x35, script: 0xe, flags: 0x0},
-	1102: {region: 0x9b, script: 0xd6, flags: 0x0},
+	1102: {region: 0x9b, script: 0xdb, flags: 0x0},
 	1103: {region: 0xe9, script: 0x5a, flags: 0x0},
-	1104: {region: 0x99, script: 0xde, flags: 0x0},
+	1104: {region: 0x99, script: 0xe3, flags: 0x0},
 	1105: {region: 0xdb, script: 0x22, flags: 0x0},
 	1106: {region: 0x165, script: 0x5a, flags: 0x0},
 	1107: {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2659,10 +2664,10 @@ var likelyLang = [1330]likelyScriptRegion{
 	1115: {region: 0x165, script: 0x5a, flags: 0x0},
 	1116: {region: 0x165, script: 0x5a, flags: 0x0},
 	1117: {region: 0x99, script: 0x52, flags: 0x0},
-	1118: {region: 0x53, script: 0xdc, flags: 0x0},
+	1118: {region: 0x53, script: 0xe1, flags: 0x0},
 	1119: {region: 0xdb, script: 0x22, flags: 0x0},
 	1120: {region: 0xdb, script: 0x22, flags: 0x0},
-	1121: {region: 0x99, script: 0xe1, flags: 0x0},
+	1121: {region: 0x99, script: 0xe6, flags: 0x0},
 	1122: {region: 0x165, script: 0x5a, flags: 0x0},
 	1123: {region: 0x112, script: 0x5a, flags: 0x0},
 	1124: {region: 0x131, script: 0x5a, flags: 0x0},
@@ -2672,7 +2677,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	1128: {region: 0x165, script: 0x5a, flags: 0x0},
 	1129: {region: 0x165, script: 0x5a, flags: 0x0},
 	1130: {region: 0x165, script: 0x5a, flags: 0x0},
-	1131: {region: 0x123, script: 0xe6, flags: 0x0},
+	1131: {region: 0x123, script: 0xeb, flags: 0x0},
 	1132: {region: 0xdb, script: 0x22, flags: 0x0},
 	1133: {region: 0xdb, script: 0x22, flags: 0x0},
 	1134: {region: 0xdb, script: 0x22, flags: 0x0},
@@ -2711,14 +2716,14 @@ var likelyLang = [1330]likelyScriptRegion{
 	1167: {region: 0x87, script: 0x34, flags: 0x0},
 	1168: {region: 0xdb, script: 0x22, flags: 0x0},
 	1169: {region: 0xe7, script: 0x5a, flags: 0x0},
-	1170: {region: 0x43, script: 0xe7, flags: 0x0},
+	1170: {region: 0x43, script: 0xec, flags: 0x0},
 	1171: {region: 0x165, script: 0x5a, flags: 0x0},
 	1172: {region: 0x106, script: 0x20, flags: 0x0},
 	1173: {region: 0x165, script: 0x5a, flags: 0x0},
 	1174: {region: 0x165, script: 0x5a, flags: 0x0},
 	1175: {region: 0x131, script: 0x5a, flags: 0x0},
 	1176: {region: 0x165, script: 0x5a, flags: 0x0},
-	1177: {region: 0x123, script: 0xe6, flags: 0x0},
+	1177: {region: 0x123, script: 0xeb, flags: 0x0},
 	1178: {region: 0x32, script: 0x5a, flags: 0x0},
 	1179: {region: 0x165, script: 0x5a, flags: 0x0},
 	1180: {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2729,7 +2734,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	1185: {region: 0x165, script: 0x5a, flags: 0x0},
 	1187: {region: 0x165, script: 0x5a, flags: 0x0},
 	1188: {region: 0xd4, script: 0x5a, flags: 0x0},
-	1189: {region: 0x53, script: 0xdf, flags: 0x0},
+	1189: {region: 0x53, script: 0xe4, flags: 0x0},
 	1190: {region: 0xe5, script: 0x5a, flags: 0x0},
 	1191: {region: 0x165, script: 0x5a, flags: 0x0},
 	1192: {region: 0x106, script: 0x20, flags: 0x0},
@@ -2737,7 +2742,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	1194: {region: 0x165, script: 0x5a, flags: 0x0},
 	1195: {region: 0x106, script: 0x20, flags: 0x0},
 	1196: {region: 0x3f, script: 0x4, flags: 0x1},
-	1197: {region: 0x11c, script: 0xea, flags: 0x0},
+	1197: {region: 0x11c, script: 0xf0, flags: 0x0},
 	1198: {region: 0x130, script: 0x20, flags: 0x0},
 	1199: {region: 0x75, script: 0x5a, flags: 0x0},
 	1200: {region: 0x2a, script: 0x5a, flags: 0x0},
@@ -2753,7 +2758,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	1211: {region: 0x165, script: 0x5a, flags: 0x0},
 	1212: {region: 0x46, script: 0x4, flags: 0x1},
 	1213: {region: 0x165, script: 0x5a, flags: 0x0},
-	1214: {region: 0xb4, script: 0xeb, flags: 0x0},
+	1214: {region: 0xb4, script: 0xf1, flags: 0x0},
 	1215: {region: 0x165, script: 0x5a, flags: 0x0},
 	1216: {region: 0x161, script: 0x5a, flags: 0x0},
 	1217: {region: 0x9e, script: 0x5a, flags: 0x0},
@@ -2776,7 +2781,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	1234: {region: 0x165, script: 0x5a, flags: 0x0},
 	1235: {region: 0xe7, script: 0x5a, flags: 0x0},
 	1236: {region: 0x2f, script: 0x5a, flags: 0x0},
-	1237: {region: 0x99, script: 0xe1, flags: 0x0},
+	1237: {region: 0x99, script: 0xe6, flags: 0x0},
 	1238: {region: 0x99, script: 0x22, flags: 0x0},
 	1239: {region: 0x165, script: 0x5a, flags: 0x0},
 	1240: {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2816,9 +2821,9 @@ var likelyLang = [1330]likelyScriptRegion{
 	1274: {region: 0x99, script: 0x22, flags: 0x0},
 	1275: {region: 0x131, script: 0x5a, flags: 0x0},
 	1276: {region: 0x165, script: 0x5a, flags: 0x0},
-	1277: {region: 0x9c, script: 0x8e, flags: 0x0},
+	1277: {region: 0x9c, script: 0x91, flags: 0x0},
 	1278: {region: 0x165, script: 0x5a, flags: 0x0},
-	1279: {region: 0x15e, script: 0xc7, flags: 0x0},
+	1279: {region: 0x15e, script: 0xcc, flags: 0x0},
 	1280: {region: 0x165, script: 0x5a, flags: 0x0},
 	1281: {region: 0x165, script: 0x5a, flags: 0x0},
 	1282: {region: 0xdb, script: 0x22, flags: 0x0},
@@ -2858,7 +2863,7 @@ var likelyLang = [1330]likelyScriptRegion{
 	1316: {region: 0x10b, script: 0x5a, flags: 0x0},
 	1318: {region: 0xa8, script: 0x5, flags: 0x0},
 	1319: {region: 0xd9, script: 0x5a, flags: 0x0},
-	1320: {region: 0xba, script: 0xe3, flags: 0x0},
+	1320: {region: 0xba, script: 0xe8, flags: 0x0},
 	1321: {region: 0x4d, script: 0x14, flags: 0x1},
 	1322: {region: 0x53, script: 0x7d, flags: 0x0},
 	1323: {region: 0x165, script: 0x5a, flags: 0x0},
@@ -2870,11 +2875,11 @@ var likelyLang = [1330]likelyScriptRegion{
 }
 
 // likelyLangList holds lists info associated with likelyLang.
-// Size: 388 bytes, 97 elements
+// Size: 582 bytes, 97 elements
 var likelyLangList = [97]likelyScriptRegion{
 	0:  {region: 0x9c, script: 0x7, flags: 0x0},
 	1:  {region: 0xa1, script: 0x78, flags: 0x2},
-	2:  {region: 0x11c, script: 0x84, flags: 0x2},
+	2:  {region: 0x11c, script: 0x85, flags: 0x2},
 	3:  {region: 0x32, script: 0x5a, flags: 0x0},
 	4:  {region: 0x9b, script: 0x5, flags: 0x4},
 	5:  {region: 0x9c, script: 0x5, flags: 0x4},
@@ -2883,7 +2888,7 @@ var likelyLangList = [97]likelyScriptRegion{
 	8:  {region: 0x106, script: 0x20, flags: 0x0},
 	9:  {region: 0x38, script: 0x2f, flags: 0x2},
 	10: {region: 0x135, script: 0x5a, flags: 0x0},
-	11: {region: 0x7b, script: 0xca, flags: 0x2},
+	11: {region: 0x7b, script: 0xcf, flags: 0x2},
 	12: {region: 0x114, script: 0x5a, flags: 0x0},
 	13: {region: 0x84, script: 0x1, flags: 0x2},
 	14: {region: 0x5d, script: 0x1f, flags: 0x0},
@@ -2919,14 +2924,14 @@ var likelyLangList = [97]likelyScriptRegion{
 	44: {region: 0x99, script: 0x36, flags: 0x0},
 	45: {region: 0xe8, script: 0x5, flags: 0x4},
 	46: {region: 0xe8, script: 0x5, flags: 0x2},
-	47: {region: 0x9c, script: 0x88, flags: 0x0},
-	48: {region: 0x53, script: 0x89, flags: 0x2},
-	49: {region: 0xba, script: 0xe3, flags: 0x0},
+	47: {region: 0x9c, script: 0x8b, flags: 0x0},
+	48: {region: 0x53, script: 0x8c, flags: 0x2},
+	49: {region: 0xba, script: 0xe8, flags: 0x0},
 	50: {region: 0xd9, script: 0x5a, flags: 0x4},
 	51: {region: 0xe8, script: 0x5, flags: 0x0},
 	52: {region: 0x99, script: 0x22, flags: 0x2},
 	53: {region: 0x99, script: 0x4f, flags: 0x2},
-	54: {region: 0x99, script: 0xce, flags: 0x2},
+	54: {region: 0x99, script: 0xd3, flags: 0x2},
 	55: {region: 0x105, script: 0x20, flags: 0x0},
 	56: {region: 0xbd, script: 0x5a, flags: 0x4},
 	57: {region: 0x104, script: 0x5a, flags: 0x4},
@@ -2973,7 +2978,7 @@ var likelyLangList = [97]likelyScriptRegion{
 
 type likelyLangScript struct {
 	lang   uint16
-	script uint8
+	script uint16
 	flags  uint8
 }
 
@@ -2982,7 +2987,7 @@ type likelyLangScript struct {
 // for a given regionID, lang and script are the index and size respectively
 // of the list in likelyRegionList.
 // TODO: exclude containers and user-definable regions from the list.
-// Size: 1432 bytes, 358 elements
+// Size: 2148 bytes, 358 elements
 var likelyRegion = [358]likelyLangScript{
 	34:  {lang: 0xd7, script: 0x5a, flags: 0x0},
 	35:  {lang: 0x3a, script: 0x5, flags: 0x0},
@@ -3089,7 +3094,7 @@ var likelyRegion = [358]likelyLangScript{
 	175: {lang: 0x27, script: 0x2, flags: 0x1},
 	176: {lang: 0x3a, script: 0x5, flags: 0x0},
 	178: {lang: 0x10d, script: 0x5a, flags: 0x0},
-	179: {lang: 0x40c, script: 0xcf, flags: 0x0},
+	179: {lang: 0x40c, script: 0xd4, flags: 0x0},
 	181: {lang: 0x43b, script: 0x5a, flags: 0x0},
 	182: {lang: 0x2c0, script: 0x5a, flags: 0x0},
 	183: {lang: 0x15e, script: 0x5a, flags: 0x0},
@@ -3110,7 +3115,7 @@ var likelyRegion = [358]likelyLangScript{
 	201: {lang: 0x35, script: 0x2, flags: 0x1},
 	203: {lang: 0x320, script: 0x5a, flags: 0x0},
 	204: {lang: 0x37, script: 0x3, flags: 0x1},
-	205: {lang: 0x128, script: 0xe5, flags: 0x0},
+	205: {lang: 0x128, script: 0xea, flags: 0x0},
 	207: {lang: 0x13e, script: 0x5a, flags: 0x0},
 	208: {lang: 0x31f, script: 0x5a, flags: 0x0},
 	209: {lang: 0x3c0, script: 0x5a, flags: 0x0},
@@ -3188,7 +3193,7 @@ var likelyRegion = [358]likelyLangScript{
 }
 
 // likelyRegionList holds lists info associated with likelyRegion.
-// Size: 372 bytes, 93 elements
+// Size: 558 bytes, 93 elements
 var likelyRegionList = [93]likelyLangScript{
 	0:  {lang: 0x148, script: 0x5, flags: 0x0},
 	1:  {lang: 0x476, script: 0x5a, flags: 0x0},
@@ -3198,12 +3203,12 @@ var likelyRegionList = [93]likelyLangScript{
 	5:  {lang: 0x274, script: 0x5a, flags: 0x0},
 	6:  {lang: 0xb7, script: 0x5a, flags: 0x0},
 	7:  {lang: 0x432, script: 0x20, flags: 0x0},
-	8:  {lang: 0x12d, script: 0xe7, flags: 0x0},
+	8:  {lang: 0x12d, script: 0xec, flags: 0x0},
 	9:  {lang: 0x351, script: 0x22, flags: 0x0},
 	10: {lang: 0x529, script: 0x3b, flags: 0x0},
 	11: {lang: 0x4ac, script: 0x5, flags: 0x0},
 	12: {lang: 0x523, script: 0x5a, flags: 0x0},
-	13: {lang: 0x29a, script: 0xe6, flags: 0x0},
+	13: {lang: 0x29a, script: 0xeb, flags: 0x0},
 	14: {lang: 0x136, script: 0x34, flags: 0x0},
 	15: {lang: 0x48a, script: 0x5a, flags: 0x0},
 	16: {lang: 0x3a, script: 0x5, flags: 0x0},
@@ -3226,11 +3231,11 @@ var likelyRegionList = [93]likelyLangScript{
 	33: {lang: 0x476, script: 0x5a, flags: 0x0},
 	34: {lang: 0x24a, script: 0x4e, flags: 0x0},
 	35: {lang: 0xe6, script: 0x5, flags: 0x0},
-	36: {lang: 0x226, script: 0xe6, flags: 0x0},
+	36: {lang: 0x226, script: 0xeb, flags: 0x0},
 	37: {lang: 0x3a, script: 0x5, flags: 0x0},
 	38: {lang: 0x15e, script: 0x5a, flags: 0x0},
 	39: {lang: 0x2b8, script: 0x57, flags: 0x0},
-	40: {lang: 0x226, script: 0xe6, flags: 0x0},
+	40: {lang: 0x226, script: 0xeb, flags: 0x0},
 	41: {lang: 0x3a, script: 0x5, flags: 0x0},
 	42: {lang: 0x15e, script: 0x5a, flags: 0x0},
 	43: {lang: 0x3dc, script: 0x5a, flags: 0x0},
@@ -3263,7 +3268,7 @@ var likelyRegionList = [93]likelyLangScript{
 	70: {lang: 0x15e, script: 0x5a, flags: 0x0},
 	71: {lang: 0x15e, script: 0x5a, flags: 0x0},
 	72: {lang: 0x35, script: 0x5, flags: 0x0},
-	73: {lang: 0x46b, script: 0xe6, flags: 0x0},
+	73: {lang: 0x46b, script: 0xeb, flags: 0x0},
 	74: {lang: 0x2ec, script: 0x5, flags: 0x0},
 	75: {lang: 0x30f, script: 0x75, flags: 0x0},
 	76: {lang: 0x467, script: 0x20, flags: 0x0},
@@ -3288,7 +3293,7 @@ var likelyRegionList = [93]likelyLangScript{
 type likelyTag struct {
 	lang   uint16
 	region uint16
-	script uint8
+	script uint16
 }
 
 // Size: 198 bytes, 33 elements
@@ -3449,8 +3454,8 @@ var regionInclusionNext = [73]uint8{
 
 type parentRel struct {
 	lang       uint16
-	script     uint8
-	maxScript  uint8
+	script     uint16
+	maxScript  uint16
 	toRegion   uint16
 	fromRegion []uint16
 }
@@ -3464,4 +3469,4 @@ var parents = [5]parentRel{
 	4: {lang: 0x529, script: 0x3c, maxScript: 0x3c, toRegion: 0x8d, fromRegion: []uint16{0xc6}},
 }
 
-// Total table size 26398 bytes (25KiB); checksum: 1C859EA7
+// Total table size 30244 bytes (29KiB); checksum: B6B15F30
diff --git a/language/tables.go b/language/tables.go
index 96b57f610..34a732b69 100644
--- a/language/tables.go
+++ b/language/tables.go
@@ -39,12 +39,12 @@ const (
 	_Hani = 57
 	_Hans = 59
 	_Hant = 60
-	_Qaaa = 143
-	_Qaai = 151
-	_Qabx = 192
-	_Zinh = 245
-	_Zyyy = 250
-	_Zzzz = 251
+	_Qaaa = 147
+	_Qaai = 155
+	_Qabx = 196
+	_Zinh = 252
+	_Zyyy = 257
+	_Zzzz = 258
 )
 
 var regionToGroups = []uint8{ // 358 elements
@@ -265,9 +265,9 @@ var matchScript = []scriptIntelligibility{ // 26 elements
 	13: {wantLang: 0x39d, haveLang: 0x139, wantScript: 0x36, haveScript: 0x5a, distance: 0xa},
 	14: {wantLang: 0x3be, haveLang: 0x139, wantScript: 0x5, haveScript: 0x5a, distance: 0xa},
 	15: {wantLang: 0x3fa, haveLang: 0x139, wantScript: 0x5, haveScript: 0x5a, distance: 0xa},
-	16: {wantLang: 0x40c, haveLang: 0x139, wantScript: 0xcf, haveScript: 0x5a, distance: 0xa},
-	17: {wantLang: 0x450, haveLang: 0x139, wantScript: 0xde, haveScript: 0x5a, distance: 0xa},
-	18: {wantLang: 0x461, haveLang: 0x139, wantScript: 0xe1, haveScript: 0x5a, distance: 0xa},
+	16: {wantLang: 0x40c, haveLang: 0x139, wantScript: 0xd4, haveScript: 0x5a, distance: 0xa},
+	17: {wantLang: 0x450, haveLang: 0x139, wantScript: 0xe3, haveScript: 0x5a, distance: 0xa},
+	18: {wantLang: 0x461, haveLang: 0x139, wantScript: 0xe6, haveScript: 0x5a, distance: 0xa},
 	19: {wantLang: 0x46f, haveLang: 0x139, wantScript: 0x2c, haveScript: 0x5a, distance: 0xa},
 	20: {wantLang: 0x476, haveLang: 0x3e2, wantScript: 0x5a, haveScript: 0x20, distance: 0xa},
 	21: {wantLang: 0x4b4, haveLang: 0x139, wantScript: 0x5, haveScript: 0x5a, distance: 0xa},
diff --git a/unicode/norm/tables13.0.0.go b/unicode/norm/tables13.0.0.go
index 96a130d30..9115ef257 100644
--- a/unicode/norm/tables13.0.0.go
+++ b/unicode/norm/tables13.0.0.go
@@ -7315,7 +7315,7 @@ const recompMapPacked = "" +
 	"\x00V\x03\x03\x00\x00\x1e|" + // 0x00560303: 0x00001E7C
 	"\x00v\x03\x03\x00\x00\x1e}" + // 0x00760303: 0x00001E7D
 	"\x00V\x03#\x00\x00\x1e~" + // 0x00560323: 0x00001E7E
-	"\x00v\x03#\x00\x00\x1e\u007f" + // 0x00760323: 0x00001E7F
+	"\x00v\x03#\x00\x00\x1e\x7f" + // 0x00760323: 0x00001E7F
 	"\x00W\x03\x00\x00\x00\x1e\x80" + // 0x00570300: 0x00001E80
 	"\x00w\x03\x00\x00\x00\x1e\x81" + // 0x00770300: 0x00001E81
 	"\x00W\x03\x01\x00\x00\x1e\x82" + // 0x00570301: 0x00001E82
@@ -7342,7 +7342,7 @@ const recompMapPacked = "" +
 	"\x00t\x03\b\x00\x00\x1e\x97" + // 0x00740308: 0x00001E97
 	"\x00w\x03\n\x00\x00\x1e\x98" + // 0x0077030A: 0x00001E98
 	"\x00y\x03\n\x00\x00\x1e\x99" + // 0x0079030A: 0x00001E99
-	"\x01\u007f\x03\a\x00\x00\x1e\x9b" + // 0x017F0307: 0x00001E9B
+	"\x01\x7f\x03\a\x00\x00\x1e\x9b" + // 0x017F0307: 0x00001E9B
 	"\x00A\x03#\x00\x00\x1e\xa0" + // 0x00410323: 0x00001EA0
 	"\x00a\x03#\x00\x00\x1e\xa1" + // 0x00610323: 0x00001EA1
 	"\x00A\x03\t\x00\x00\x1e\xa2" + // 0x00410309: 0x00001EA2

From 795e854ff348c9cac4fd0033ce04c417705dd0bb Mon Sep 17 00:00:00 2001
From: cui fliter <imcusg@gmail.com>
Date: Fri, 16 Sep 2022 02:08:40 +0000
Subject: [PATCH 37/40] all: replace io/ioutil with io and os package

For golang/go#45557

Change-Id: Ibf78d87cc94baa0d1696e5abc2edad3d2723e42b
GitHub-Last-Rev: ad314caaff6e51edb51a63d183c0ff906cf6b2ad
GitHub-Pull-Request: golang/text#34
Reviewed-on: https://go-review.googlesource.com/c/text/+/430815
Reviewed-by: Cherry Mui <cherryyz@google.com>
TryBot-Result: Gopher Robot <gobot@golang.org>
Reviewed-by: Ian Lance Taylor <iant@google.com>
Reviewed-by: Meng Zhuo <mzh@golangcn.org>
Run-TryBot: Ian Lance Taylor <iant@google.com>
Run-TryBot: Meng Zhuo <mzh@golangcn.org>
Auto-Submit: Ian Lance Taylor <iant@google.com>
---
 cases/gen.go                             |  7 +++----
 cmd/gotext/main.go                       |  3 +--
 collate/maketables.go                    |  3 +--
 collate/reg_test.go                      |  3 +--
 encoding/encoding_test.go                |  4 ++--
 encoding/internal/enctest/enctest.go     | 12 ++++++------
 encoding/traditionalchinese/all_test.go  |  4 ++--
 feature/plural/message.go                |  4 ++--
 gen.go                                   |  5 ++---
 internal/cldrtree/cldrtree_test.go       |  6 +++---
 internal/gen/bitfield/bitfield_test.go   |  4 ++--
 internal/gen/gen.go                      | 15 +++++++--------
 internal/language/gen.go                 |  3 +--
 internal/testtext/codesize.go            |  5 ++---
 internal/triegen/example_compact_test.go |  5 ++---
 internal/triegen/example_test.go         |  4 ++--
 message/pipeline/pipeline_test.go        | 23 +++++++++++------------
 transform/transform_test.go              |  4 ++--
 unicode/cldr/decode.go                   |  3 +--
 unicode/cldr/makexml.go                  |  3 +--
 unicode/norm/normalize_test.go           |  5 ++---
 21 files changed, 56 insertions(+), 69 deletions(-)

diff --git a/cases/gen.go b/cases/gen.go
index a041fede1..2e1d95cc5 100644
--- a/cases/gen.go
+++ b/cases/gen.go
@@ -16,7 +16,6 @@ import (
 	"bytes"
 	"fmt"
 	"io"
-	"io/ioutil"
 	"log"
 	"reflect"
 	"strconv"
@@ -635,9 +634,9 @@ func genTablesTest() {
 
 	// We discard the output as we know we have perfect functions. We run them
 	// just to verify the properties are correct.
-	n := printProperties(ioutil.Discard, "DerivedCoreProperties.txt", "Cased", verifyCased)
-	n += printProperties(ioutil.Discard, "DerivedCoreProperties.txt", "Lowercase", verifyLower)
-	n += printProperties(ioutil.Discard, "DerivedCoreProperties.txt", "Uppercase", verifyUpper)
+	n := printProperties(io.Discard, "DerivedCoreProperties.txt", "Cased", verifyCased)
+	n += printProperties(io.Discard, "DerivedCoreProperties.txt", "Lowercase", verifyLower)
+	n += printProperties(io.Discard, "DerivedCoreProperties.txt", "Uppercase", verifyUpper)
 	if n > 0 {
 		log.Fatalf("One of the discarded properties does not have a perfect filter.")
 	}
diff --git a/cmd/gotext/main.go b/cmd/gotext/main.go
index c8dc7990a..aad1d4a14 100644
--- a/cmd/gotext/main.go
+++ b/cmd/gotext/main.go
@@ -16,7 +16,6 @@ import (
 	"go/build"
 	"go/format"
 	"io"
-	"io/ioutil"
 	"log"
 	"os"
 	"strings"
@@ -310,7 +309,7 @@ func help(args []string) {
 			if err != nil {
 				logf("Could not format generated docs: %v\n", err)
 			}
-			if err := ioutil.WriteFile("doc.go", b, 0666); err != nil {
+			if err := os.WriteFile("doc.go", b, 0666); err != nil {
 				logf("Could not create file alldocs.go: %v\n", err)
 			}
 		} else {
diff --git a/collate/maketables.go b/collate/maketables.go
index 59afeb9c2..4175143e3 100644
--- a/collate/maketables.go
+++ b/collate/maketables.go
@@ -17,7 +17,6 @@ import (
 	"flag"
 	"fmt"
 	"io"
-	"io/ioutil"
 	"log"
 	"os"
 	"regexp"
@@ -187,7 +186,7 @@ func failOnError(e error) {
 
 func openArchive() *zip.Reader {
 	f := gen.OpenCLDRCoreZip()
-	buffer, err := ioutil.ReadAll(f)
+	buffer, err := io.ReadAll(f)
 	f.Close()
 	failOnError(err)
 	archive, err := zip.NewReader(bytes.NewReader(buffer), int64(len(buffer)))
diff --git a/collate/reg_test.go b/collate/reg_test.go
index 4d3598485..f9c192cb3 100644
--- a/collate/reg_test.go
+++ b/collate/reg_test.go
@@ -10,7 +10,6 @@ import (
 	"bytes"
 	"flag"
 	"io"
-	"io/ioutil"
 	"log"
 	"path"
 	"regexp"
@@ -133,7 +132,7 @@ func convHex(line int, s string) int {
 
 func loadTestData() []Test {
 	f := gen.OpenUnicodeFile("UCA", "", "CollationTest.zip")
-	buffer, err := ioutil.ReadAll(f)
+	buffer, err := io.ReadAll(f)
 	f.Close()
 	Error(err)
 	archive, err := zip.NewReader(bytes.NewReader(buffer), int64(len(buffer)))
diff --git a/encoding/encoding_test.go b/encoding/encoding_test.go
index 173814762..e459fa230 100644
--- a/encoding/encoding_test.go
+++ b/encoding/encoding_test.go
@@ -5,7 +5,7 @@
 package encoding_test
 
 import (
-	"io/ioutil"
+	"io"
 	"strings"
 	"testing"
 
@@ -62,7 +62,7 @@ func TestReplacement(t *testing.T) {
 			want = "AB\x00CD\ufffdYZ"
 		}
 		sr := strings.NewReader("AB\x00CD\x80YZ")
-		g, err := ioutil.ReadAll(transform.NewReader(sr, enc))
+		g, err := io.ReadAll(transform.NewReader(sr, enc))
 		if err != nil {
 			t.Errorf("%s: ReadAll: %v", direction, err)
 			continue
diff --git a/encoding/internal/enctest/enctest.go b/encoding/internal/enctest/enctest.go
index 0cccae044..cf5da2675 100644
--- a/encoding/internal/enctest/enctest.go
+++ b/encoding/internal/enctest/enctest.go
@@ -8,7 +8,7 @@ import (
 	"bytes"
 	"fmt"
 	"io"
-	"io/ioutil"
+	"os"
 	"strings"
 	"testing"
 
@@ -105,7 +105,7 @@ func Benchmark(b *testing.B, enc encoding.Encoding) {
 			b.ResetTimer()
 			for i := 0; i < b.N; i++ {
 				r := transform.NewReader(bytes.NewReader(src), transformer)
-				io.Copy(ioutil.Discard, r)
+				io.Copy(io.Discard, r)
 			}
 		})
 	}
@@ -157,15 +157,15 @@ func load(direction string, enc encoding.Encoding) ([]byte, []byte, Transcoder,
 		dstFile, srcFile = srcFile, dstFile
 		coder = enc.NewDecoder()
 	}
-	dst, err := ioutil.ReadFile(dstFile)
+	dst, err := os.ReadFile(dstFile)
 	if err != nil {
-		if dst, err = ioutil.ReadFile("../" + dstFile); err != nil {
+		if dst, err = os.ReadFile("../" + dstFile); err != nil {
 			return nil, nil, nil, err
 		}
 	}
-	src, err := ioutil.ReadFile(srcFile)
+	src, err := os.ReadFile(srcFile)
 	if err != nil {
-		if src, err = ioutil.ReadFile("../" + srcFile); err != nil {
+		if src, err = os.ReadFile("../" + srcFile); err != nil {
 			return nil, nil, nil, err
 		}
 	}
diff --git a/encoding/traditionalchinese/all_test.go b/encoding/traditionalchinese/all_test.go
index 3825c7672..f804e83e1 100644
--- a/encoding/traditionalchinese/all_test.go
+++ b/encoding/traditionalchinese/all_test.go
@@ -6,7 +6,7 @@ package traditionalchinese
 
 import (
 	"fmt"
-	"io/ioutil"
+	"io"
 	"strings"
 	"testing"
 
@@ -103,7 +103,7 @@ func TestBig5CircumflexAndMacron(t *testing.T) {
 		"\x88\xa2\x88\xa3\x88\xa4\x88\xa5\x88\xa6"
 	want := "ÓǑÒ\u00ca\u0304Ế\u00ca\u030cỀÊ " +
 		"ü\u00ea\u0304ế\u00ea\u030cề"
-	dst, err := ioutil.ReadAll(transform.NewReader(
+	dst, err := io.ReadAll(transform.NewReader(
 		strings.NewReader(src), Big5.NewDecoder()))
 	if err != nil {
 		t.Fatal(err)
diff --git a/feature/plural/message.go b/feature/plural/message.go
index 6248d01cc..56d518cc3 100644
--- a/feature/plural/message.go
+++ b/feature/plural/message.go
@@ -6,7 +6,7 @@ package plural
 
 import (
 	"fmt"
-	"io/ioutil"
+	"io"
 	"reflect"
 	"strconv"
 
@@ -56,7 +56,7 @@ type Interface interface {
 func Selectf(arg int, format string, cases ...interface{}) catalog.Message {
 	var p parser
 	// Intercept the formatting parameters of format by doing a dummy print.
-	fmt.Fprintf(ioutil.Discard, format, &p)
+	fmt.Fprintf(io.Discard, format, &p)
 	m := &message{arg, kindDefault, 0, cases}
 	switch p.verb {
 	case 'g':
diff --git a/gen.go b/gen.go
index fb2fb94a7..566a30355 100644
--- a/gen.go
+++ b/gen.go
@@ -14,7 +14,6 @@ import (
 	"flag"
 	"fmt"
 	"go/format"
-	"io/ioutil"
 	"os"
 	"os/exec"
 	"path"
@@ -256,7 +255,7 @@ func copyPackage(dirSrc, dirDst, search, replace string) {
 			filepath.Dir(file) != dirSrc {
 			return nil
 		}
-		b, err := ioutil.ReadFile(file)
+		b, err := os.ReadFile(file)
 		if err != nil || bytes.Contains(b, []byte("\n// +build ignore")) {
 			return err
 		}
@@ -275,7 +274,7 @@ func copyPackage(dirSrc, dirDst, search, replace string) {
 		}
 		file = filepath.Join(dirDst, base)
 		vprintf("=== COPY %s\n", file)
-		return ioutil.WriteFile(file, b, 0666)
+		return os.WriteFile(file, b, 0666)
 	})
 	if err != nil {
 		fmt.Println("Copying exported files failed:", err)
diff --git a/internal/cldrtree/cldrtree_test.go b/internal/cldrtree/cldrtree_test.go
index 06c366a05..c42eba30a 100644
--- a/internal/cldrtree/cldrtree_test.go
+++ b/internal/cldrtree/cldrtree_test.go
@@ -7,9 +7,9 @@ package cldrtree
 import (
 	"bytes"
 	"flag"
-	"io/ioutil"
 	"log"
 	"math/rand"
+	"os"
 	"path/filepath"
 	"reflect"
 	"regexp"
@@ -303,11 +303,11 @@ func TestGen(t *testing.T) {
 
 			file := filepath.Join("testdata", tc, "output.go")
 			if *genOutput {
-				ioutil.WriteFile(file, got, 0700)
+				os.WriteFile(file, got, 0700)
 				t.SkipNow()
 			}
 
-			b, err := ioutil.ReadFile(file)
+			b, err := os.ReadFile(file)
 			if err != nil {
 				t.Fatalf("failed to open file: %v", err)
 			}
diff --git a/internal/gen/bitfield/bitfield_test.go b/internal/gen/bitfield/bitfield_test.go
index 789f86d1a..a43dda962 100644
--- a/internal/gen/bitfield/bitfield_test.go
+++ b/internal/gen/bitfield/bitfield_test.go
@@ -7,7 +7,7 @@ package bitfield
 import (
 	"bytes"
 	"fmt"
-	"io/ioutil"
+	"os"
 	"testing"
 )
 
@@ -222,7 +222,7 @@ func (t test1) Baz() int8 {
 `
 
 func mustRead(filename string) string {
-	b, err := ioutil.ReadFile(filename)
+	b, err := os.ReadFile(filename)
 	if err != nil {
 		panic(err)
 	}
diff --git a/internal/gen/gen.go b/internal/gen/gen.go
index fa289534a..268258dd3 100644
--- a/internal/gen/gen.go
+++ b/internal/gen/gen.go
@@ -25,7 +25,6 @@ import (
 	"go/build"
 	"go/format"
 	"io"
-	"io/ioutil"
 	"log"
 	"net/http"
 	"os"
@@ -175,7 +174,7 @@ func getLocalDir() string {
 		if err := os.MkdirAll(dir, permissions); err != nil {
 			log.Fatalf("Could not create directory: %v", err)
 		}
-		ioutil.WriteFile(readme, []byte(readmeTxt), permissions)
+		os.WriteFile(readme, []byte(readmeTxt), permissions)
 	}
 	return dir
 }
@@ -213,15 +212,15 @@ func open(file, urlRoot, path string) io.ReadCloser {
 	}
 	r := get(urlRoot, path)
 	defer r.Close()
-	b, err := ioutil.ReadAll(r)
+	b, err := io.ReadAll(r)
 	if err != nil {
 		log.Fatalf("Could not download file: %v", err)
 	}
 	os.MkdirAll(filepath.Dir(file), permissions)
-	if err := ioutil.WriteFile(file, b, permissions); err != nil {
+	if err := os.WriteFile(file, b, permissions); err != nil {
 		log.Fatalf("Could not create file: %v", err)
 	}
-	return ioutil.NopCloser(bytes.NewReader(b))
+	return io.NopCloser(bytes.NewReader(b))
 }
 
 func get(root, path string) io.ReadCloser {
@@ -280,13 +279,13 @@ func fileToPattern(filename string) string {
 func updateBuildTags(pattern string) {
 	for _, t := range tags {
 		oldFile := fmt.Sprintf(pattern, t.version)
-		b, err := ioutil.ReadFile(oldFile)
+		b, err := os.ReadFile(oldFile)
 		if err != nil {
 			continue
 		}
 		build := fmt.Sprintf("// +build %s", t.buildTags)
 		b = regexp.MustCompile(`// \+build .*`).ReplaceAll(b, []byte(build))
-		err = ioutil.WriteFile(oldFile, b, 0644)
+		err = os.WriteFile(oldFile, b, 0644)
 		if err != nil {
 			log.Fatal(err)
 		}
@@ -334,7 +333,7 @@ func WriteGo(w io.Writer, pkg, tags string, b []byte) (n int, err error) {
 // Repackage rewrites a Go file from belonging to package main to belonging to
 // the given package.
 func Repackage(inFile, outFile, pkg string) {
-	src, err := ioutil.ReadFile(inFile)
+	src, err := os.ReadFile(inFile)
 	if err != nil {
 		log.Fatalf("reading %s: %v", inFile, err)
 	}
diff --git a/internal/language/gen.go b/internal/language/gen.go
index 95455ecf4..520f1596f 100644
--- a/internal/language/gen.go
+++ b/internal/language/gen.go
@@ -15,7 +15,6 @@ import (
 	"flag"
 	"fmt"
 	"io"
-	"io/ioutil"
 	"log"
 	"math"
 	"reflect"
@@ -921,7 +920,7 @@ func (b *builder) writeRegion() {
 	r := gen.OpenIANAFile("domains/root/db")
 	defer r.Close()
 
-	buf, err := ioutil.ReadAll(r)
+	buf, err := io.ReadAll(r)
 	failOnError(err)
 	re := regexp.MustCompile(`"/domains/root/db/([a-z]{2}).html"`)
 	for _, m := range re.FindAllSubmatch(buf, -1) {
diff --git a/internal/testtext/codesize.go b/internal/testtext/codesize.go
index 88df48747..cdaed81d5 100644
--- a/internal/testtext/codesize.go
+++ b/internal/testtext/codesize.go
@@ -7,7 +7,6 @@ package testtext
 import (
 	"bytes"
 	"fmt"
-	"io/ioutil"
 	"os"
 	"os/exec"
 	"path/filepath"
@@ -26,13 +25,13 @@ import (
 // See dict_test.go in the display package for an example.
 func CodeSize(s string) (int, error) {
 	// Write the file.
-	tmpdir, err := ioutil.TempDir(os.TempDir(), "testtext")
+	tmpdir, err := os.MkdirTemp(os.TempDir(), "testtext")
 	if err != nil {
 		return 0, fmt.Errorf("testtext: failed to create tmpdir: %v", err)
 	}
 	defer os.RemoveAll(tmpdir)
 	filename := filepath.Join(tmpdir, "main.go")
-	if err := ioutil.WriteFile(filename, []byte(s), 0644); err != nil {
+	if err := os.WriteFile(filename, []byte(s), 0644); err != nil {
 		return 0, fmt.Errorf("testtext: failed to write main.go: %v", err)
 	}
 
diff --git a/internal/triegen/example_compact_test.go b/internal/triegen/example_compact_test.go
index 7cf604ca4..95486d1ff 100644
--- a/internal/triegen/example_compact_test.go
+++ b/internal/triegen/example_compact_test.go
@@ -7,7 +7,6 @@ package triegen_test
 import (
 	"fmt"
 	"io"
-	"io/ioutil"
 
 	"golang.org/x/text/internal/triegen"
 )
@@ -17,12 +16,12 @@ func ExampleCompacter() {
 	for r := rune(0); r < 10000; r += 64 {
 		t.Insert(r, 0x9015BADA55^uint64(r))
 	}
-	sz, _ := t.Gen(ioutil.Discard)
+	sz, _ := t.Gen(io.Discard)
 
 	fmt.Printf("Size normal:    %5d\n", sz)
 
 	var c myCompacter
-	sz, _ = t.Gen(ioutil.Discard, triegen.Compact(&c))
+	sz, _ = t.Gen(io.Discard, triegen.Compact(&c))
 
 	fmt.Printf("Size compacted: %5d\n", sz)
 
diff --git a/internal/triegen/example_test.go b/internal/triegen/example_test.go
index 557a152e7..5823a2c34 100644
--- a/internal/triegen/example_test.go
+++ b/internal/triegen/example_test.go
@@ -6,7 +6,7 @@ package triegen_test
 
 import (
 	"fmt"
-	"io/ioutil"
+	"io"
 	"math/rand"
 	"unicode"
 
@@ -15,7 +15,7 @@ import (
 
 const seed = 0x12345
 
-var genWriter = ioutil.Discard
+var genWriter = io.Discard
 
 func randomRunes() map[rune]uint8 {
 	rnd := rand.New(rand.NewSource(seed))
diff --git a/message/pipeline/pipeline_test.go b/message/pipeline/pipeline_test.go
index 2adb11fd2..f4cd42a69 100644
--- a/message/pipeline/pipeline_test.go
+++ b/message/pipeline/pipeline_test.go
@@ -11,7 +11,6 @@ import (
 	"flag"
 	"fmt"
 	"go/build"
-	"io/ioutil"
 	"os"
 	"os/exec"
 	"path"
@@ -40,7 +39,7 @@ func TestFullCycle(t *testing.T) {
 		t.Skipf("skipping because 'go' command is unavailable: %v", err)
 	}
 
-	GOPATH, err := ioutil.TempDir("", "pipeline_test")
+	GOPATH, err := os.MkdirTemp("", "pipeline_test")
 	if err != nil {
 		t.Fatal(err)
 	}
@@ -66,7 +65,7 @@ func TestFullCycle(t *testing.T) {
 	wd, _ := os.Getwd()
 	defer os.Chdir(wd)
 
-	dirs, err := ioutil.ReadDir(testdata)
+	dirs, err := os.ReadDir(testdata)
 	if err != nil {
 		t.Fatal(err)
 	}
@@ -124,11 +123,11 @@ func copyTestdata(t *testing.T, dst string) {
 			return os.MkdirAll(filepath.Join(dst, rel), 0755)
 		}
 
-		data, err := ioutil.ReadFile(p)
+		data, err := os.ReadFile(p)
 		if err != nil {
 			return err
 		}
-		return ioutil.WriteFile(filepath.Join(dst, rel), data, 0644)
+		return os.WriteFile(filepath.Join(dst, rel), data, 0644)
 	})
 	if err != nil {
 		t.Fatal(err)
@@ -145,17 +144,17 @@ func initTestdataModule(t *testing.T, dst string) {
 
 replace golang.org/x/text => %s
 `, xTextDir)
-	if err := ioutil.WriteFile(filepath.Join(dst, "go.mod"), []byte(goMod), 0644); err != nil {
+	if err := os.WriteFile(filepath.Join(dst, "go.mod"), []byte(goMod), 0644); err != nil {
 		t.Fatal(err)
 	}
 
 	// Copy in the checksums from the parent module so that we won't
 	// need to re-fetch them from the checksum database.
-	data, err := ioutil.ReadFile(filepath.Join(xTextDir, "go.sum"))
+	data, err := os.ReadFile(filepath.Join(xTextDir, "go.sum"))
 	if err != nil {
 		t.Fatal(err)
 	}
-	if err := ioutil.WriteFile(filepath.Join(dst, "go.sum"), data, 0644); err != nil {
+	if err := os.WriteFile(filepath.Join(dst, "go.sum"), data, 0644); err != nil {
 		t.Fatal(err)
 	}
 
@@ -194,17 +193,17 @@ func checkOutput(t *testing.T, gen string, testdataDir string) {
 			return nil
 		}
 
-		got, err := ioutil.ReadFile(gotFile)
+		got, err := os.ReadFile(gotFile)
 		if err != nil {
 			t.Errorf("failed to read %q", gotFile)
 			return nil
 		}
 		if *genFiles {
-			if err := ioutil.WriteFile(wantFile, got, 0644); err != nil {
+			if err := os.WriteFile(wantFile, got, 0644); err != nil {
 				t.Fatal(err)
 			}
 		}
-		want, err := ioutil.ReadFile(wantFile)
+		want, err := os.ReadFile(wantFile)
 		if err != nil {
 			t.Errorf("failed to read %q", wantFile)
 		} else {
@@ -242,7 +241,7 @@ func writeJSON(t *testing.T, path string, x interface{}) {
 	if err != nil {
 		t.Fatal(err)
 	}
-	if err := ioutil.WriteFile(path, data, 0644); err != nil {
+	if err := os.WriteFile(path, data, 0644); err != nil {
 		t.Fatal(err)
 	}
 }
diff --git a/transform/transform_test.go b/transform/transform_test.go
index 273abfa52..62fad2bc9 100644
--- a/transform/transform_test.go
+++ b/transform/transform_test.go
@@ -8,7 +8,7 @@ import (
 	"bytes"
 	"errors"
 	"fmt"
-	"io/ioutil"
+	"io"
 	"strconv"
 	"strings"
 	"testing"
@@ -648,7 +648,7 @@ func TestReader(t *testing.T) {
 			// exported API. We override them manually.
 			r.dst = make([]byte, tc.dstSize)
 			r.src = make([]byte, tc.srcSize)
-			got, err := ioutil.ReadAll(r)
+			got, err := io.ReadAll(r)
 			str := string(got)
 			if str != tc.wantStr || err != tc.wantErr {
 				t.Errorf("\ngot  %q, %v\nwant %q, %v", str, err, tc.wantStr, tc.wantErr)
diff --git a/unicode/cldr/decode.go b/unicode/cldr/decode.go
index 48f6bd629..1abcb9e1f 100644
--- a/unicode/cldr/decode.go
+++ b/unicode/cldr/decode.go
@@ -10,7 +10,6 @@ import (
 	"encoding/xml"
 	"fmt"
 	"io"
-	"io/ioutil"
 	"log"
 	"os"
 	"path/filepath"
@@ -160,7 +159,7 @@ func (zl zipLoader) Reader(i int) (io.ReadCloser, error) {
 
 // DecodeZip loads CLDR data from the zip archive for which r is the source.
 func (d *Decoder) DecodeZip(r io.Reader) (cldr *CLDR, err error) {
-	buffer, err := ioutil.ReadAll(r)
+	buffer, err := io.ReadAll(r)
 	if err != nil {
 		return nil, err
 	}
diff --git a/unicode/cldr/makexml.go b/unicode/cldr/makexml.go
index 3c1fd26ea..528f2c48d 100644
--- a/unicode/cldr/makexml.go
+++ b/unicode/cldr/makexml.go
@@ -15,7 +15,6 @@ import (
 	"flag"
 	"fmt"
 	"io"
-	"io/ioutil"
 	"log"
 	"os"
 	"regexp"
@@ -30,7 +29,7 @@ func main() {
 	flag.Parse()
 
 	r := gen.OpenCLDRCoreZip()
-	buffer, err := ioutil.ReadAll(r)
+	buffer, err := io.ReadAll(r)
 	if err != nil {
 		log.Fatal("Could not read zip file")
 	}
diff --git a/unicode/norm/normalize_test.go b/unicode/norm/normalize_test.go
index 8387d4e03..678ca403d 100644
--- a/unicode/norm/normalize_test.go
+++ b/unicode/norm/normalize_test.go
@@ -9,7 +9,6 @@ import (
 	"flag"
 	"fmt"
 	"io"
-	"io/ioutil"
 	"log"
 	"os"
 	"os/exec"
@@ -927,14 +926,14 @@ func TestString(t *testing.T) {
 
 func runNM(code string) (string, error) {
 	// Write the file.
-	tmpdir, err := ioutil.TempDir(os.TempDir(), "normalize_test")
+	tmpdir, err := os.MkdirTemp(os.TempDir(), "normalize_test")
 	if err != nil {
 		return "", fmt.Errorf("failed to create tmpdir: %v", err)
 	}
 	defer os.RemoveAll(tmpdir)
 	goTool := filepath.Join(runtime.GOROOT(), "bin", "go")
 	filename := filepath.Join(tmpdir, "main.go")
-	if err := ioutil.WriteFile(filename, []byte(code), 0644); err != nil {
+	if err := os.WriteFile(filename, []byte(code), 0644); err != nil {
 		return "", fmt.Errorf("failed to write main.go: %v", err)
 	}
 	outputFile := filepath.Join(tmpdir, "main")

From b18d3dd8a4b426ebedcf279b593e85ac4985b9d3 Mon Sep 17 00:00:00 2001
From: cui fliter <imcusg@gmail.com>
Date: Tue, 4 Oct 2022 14:50:44 +0000
Subject: [PATCH 38/40] secure/precis: replace bytes.Compare with bytes.Equal

Change-Id: Ifa6ba05253b38e1cb3d5791e62b36a523fb68e52
GitHub-Last-Rev: 2d7de01c3d93285224e3c65f55845a316da8f4d0
GitHub-Pull-Request: golang/text#36
Reviewed-on: https://go-review.googlesource.com/c/text/+/438559
Run-TryBot: Dmitri Shuralyov <dmitshur@golang.org>
Reviewed-by: Ian Lance Taylor <iant@google.com>
Reviewed-by: Dmitri Shuralyov <dmitshur@google.com>
TryBot-Result: Gopher Robot <gobot@golang.org>
Run-TryBot: Ian Lance Taylor <iant@google.com>
Auto-Submit: Ian Lance Taylor <iant@google.com>
Reviewed-by: Dmitri Shuralyov <dmitshur@golang.org>
Auto-Submit: Dmitri Shuralyov <dmitshur@golang.org>
---
 secure/precis/profile.go | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/secure/precis/profile.go b/secure/precis/profile.go
index 35bd6f0a5..bdd991bb9 100644
--- a/secure/precis/profile.go
+++ b/secure/precis/profile.go
@@ -316,7 +316,7 @@ func (p *Profile) Compare(a, b string) bool {
 		return false
 	}
 
-	return bytes.Compare(akey, bkey) == 0
+	return bytes.Equal(akey, bkey)
 }
 
 // Allowed returns a runes.Set containing every rune that is a member of the

From 23407e72ed5b895a2dfd230aec777f4fbe026d6a Mon Sep 17 00:00:00 2001
From: Heschi Kreinick <heschi@google.com>
Date: Wed, 5 Oct 2022 16:07:52 -0400
Subject: [PATCH 39/40] go.mod: ignore cyclic dependency for tagging

tools and text have a cyclic dependency, which needs to be broken during
the upgrading/tagging process. This direction is due to
message/pipeline, which is marked as "IN DEVELOPMENT", so I think it's
less important to keep it up to date.

For golang/go#48523.

Change-Id: Ic4cdfd05628649035eee8a37e662cf22827c705b
Reviewed-on: https://go-review.googlesource.com/c/text/+/439295
Run-TryBot: Heschi Kreinick <heschi@google.com>
Reviewed-by: Bryan Mills <bcmills@google.com>
TryBot-Result: Gopher Robot <gobot@golang.org>
---
 go.mod | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/go.mod b/go.mod
index c47a02995..7afa1eb19 100644
--- a/go.mod
+++ b/go.mod
@@ -1,6 +1,6 @@
 module golang.org/x/text
 
-require golang.org/x/tools v0.1.12
+require golang.org/x/tools v0.1.12 // tagx:ignore
 
 require (
 	golang.org/x/mod v0.6.0-dev.0.20220419223038-86c51ed26bb4 // indirect

From 434eadcdbc3b0256971992e8c70027278364c72c Mon Sep 17 00:00:00 2001
From: Roland Shoemaker <bracewell@google.com>
Date: Fri, 2 Sep 2022 09:35:37 -0700
Subject: [PATCH 40/40] language: reject excessively large Accept-Language
 strings

The BCP 47 tag parser has quadratic time complexity due to inherent
aspects of its design. Since the parser is, by design, exposed to
untrusted user input, this can be leveraged to force a program to
consume significant time parsing Accept-Language headers.

The parser cannot be easily rewritten to fix this behavior for
various reasons. Instead the solution implemented in this CL is to
limit the total complexity of tags passed into ParseAcceptLanguage
by limiting the number of dashes in the string to 1000. This should
be more than enough for the majority of real world use cases, where
the number of tags being sent is likely to be in the single digits.

Thanks to the OSS-Fuzz project for discovering this issue and to Adam
Korczynski (ADA Logics) for writing the fuzz case and for reporting the
issue.

Fixes CVE-2022-32149
Fixes golang/go#56152

Change-Id: I7bda1d84cee2b945039c203f26869d58ee9374ae
Reviewed-on: https://team-review.git.corp.google.com/c/golang/go-private/+/1565112
Reviewed-by: Damien Neil <dneil@google.com>
Reviewed-by: Tatiana Bradley <tatianabradley@google.com>
Reviewed-on: https://go-review.googlesource.com/c/text/+/442235
TryBot-Result: Gopher Robot <gobot@golang.org>
Auto-Submit: Roland Shoemaker <roland@golang.org>
Run-TryBot: Roland Shoemaker <roland@golang.org>
---
 language/parse.go      |  5 +++++
 language/parse_test.go | 13 +++++++++++++
 2 files changed, 18 insertions(+)

diff --git a/language/parse.go b/language/parse.go
index 59b041008..b982d9e42 100644
--- a/language/parse.go
+++ b/language/parse.go
@@ -147,6 +147,7 @@ func update(b *language.Builder, part ...interface{}) (err error) {
 }
 
 var errInvalidWeight = errors.New("ParseAcceptLanguage: invalid weight")
+var errTagListTooLarge = errors.New("tag list exceeds max length")
 
 // ParseAcceptLanguage parses the contents of an Accept-Language header as
 // defined in http://www.ietf.org/rfc/rfc2616.txt and returns a list of Tags and
@@ -164,6 +165,10 @@ func ParseAcceptLanguage(s string) (tag []Tag, q []float32, err error) {
 		}
 	}()
 
+	if strings.Count(s, "-") > 1000 {
+		return nil, nil, errTagListTooLarge
+	}
+
 	var entry string
 	for s != "" {
 		if entry, s = split(s, ','); entry == "" {
diff --git a/language/parse_test.go b/language/parse_test.go
index e1e5653ad..0eee033e6 100644
--- a/language/parse_test.go
+++ b/language/parse_test.go
@@ -394,3 +394,16 @@ func TestParseAcceptLanguage(t *testing.T) {
 		}
 	}
 }
+
+func TestParseAcceptLanguageTooBig(t *testing.T) {
+	s := strings.Repeat("en-x-a-", 333)
+	_, _, err := ParseAcceptLanguage(s)
+	if err != language.ErrSyntax {
+		t.Errorf("ParseAcceptLanguage() unexpected error: got %v, want %v", err, language.ErrSyntax)
+	}
+	s += "en-x-a"
+	_, _, err = ParseAcceptLanguage(s)
+	if err != errTagListTooLarge {
+		t.Errorf("ParseAcceptLanguage() unexpected error: got %v, want %v", err, errTagListTooLarge)
+	}
+}