// Copyright 2012 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file. // +build ignore // // usage: // // go run makeisprint.go -output isprint.go // package main import ( "bytes" "flag" "fmt" "go/format" "log" "os" "unicode" ) var filename = flag.String("output", "isprint.go", "output file name") var ( range16 []uint16 except16 []uint16 range32 []uint32 except32 []uint32 ) // bsearch16 returns the smallest i such that a[i] >= x. // If there is no such i, bsearch16 returns len(a). func bsearch16(a []uint16, x uint16) int { i, j := 0, len(a) for i < j { h := i + (j-i)/2 if a[h] < x { i = h + 1 } else { j = h } } return i } // bsearch32 returns the smallest i such that a[i] >= x. // If there is no such i, bsearch32 returns len(a). func bsearch32(a []uint32, x uint32) int { i, j := 0, len(a) for i < j { h := i + (j-i)/2 if a[h] < x { i = h + 1 } else { j = h } } return i } func isPrint(r rune) bool { // Same algorithm, either on uint16 or uint32 value. // First, find first i such that rang[i] >= x. // This is the index of either the start or end of a pair that might span x. // The start is even (rang[i&^1]) and the end is odd (rang[i|1]). // If we find x in a range, make sure x is not in exception list. if 0 <= r && r < 1<<16 { rr, rang, except := uint16(r), range16, except16 i := bsearch16(rang, rr) if i >= len(rang) || rr < rang[i&^1] || rang[i|1] < rr { return false } j := bsearch16(except, rr) return j >= len(except) || except[j] != rr } rr, rang, except := uint32(r), range32, except32 i := bsearch32(rang, rr) if i >= len(rang) || rr < rang[i&^1] || rang[i|1] < rr { return false } j := bsearch32(except, rr) return j >= len(except) || except[j] != rr } func scan(min, max rune) (rang, except []uint32) { lo := rune(-1) for i := min; ; i++ { if (i > max || !unicode.IsPrint(i)) && lo >= 0 { // End range, but avoid flip flop. if i+1 <= max && unicode.IsPrint(i+1) { except = append(except, uint32(i)) continue } rang = append(rang, uint32(lo), uint32(i-1)) lo = -1 } if i > max { break } if lo < 0 && unicode.IsPrint(i) { lo = i } } return } func to16(x []uint32) []uint16 { var y []uint16 for _, v := range x { if uint32(uint16(v)) != v { panic("bad 32->16 conversion") } y = append(y, uint16(v)) } return y } func main() { flag.Parse() rang, except := scan(0, 0xFFFF) range16 = to16(rang) except16 = to16(except) range32, except32 = scan(0x10000, unicode.MaxRune) for i := rune(0); i <= unicode.MaxRune; i++ { if isPrint(i) != unicode.IsPrint(i) { log.Fatalf("%U: isPrint=%v, want %v\n", i, isPrint(i), unicode.IsPrint(i)) } } var buf bytes.Buffer fmt.Fprintf(&buf, `// Copyright 2013 The Go Authors. All rights reserved. // Use of this source code is governed by a BSD-style // license that can be found in the LICENSE file.`+"\n\n") fmt.Fprintf(&buf, "// Code generated by go run makeisprint.go -output isprint.go; DO NOT EDIT.\n\n") fmt.Fprintf(&buf, "package strconv\n\n") fmt.Fprintf(&buf, "// (%d+%d+%d)*2 + (%d)*4 = %d bytes\n\n", len(range16), len(except16), len(except32), len(range32), (len(range16)+len(except16)+len(except32))*2+ (len(range32))*4) fmt.Fprintf(&buf, "var isPrint16 = []uint16{\n") for i := 0; i < len(range16); i += 2 { fmt.Fprintf(&buf, "\t%#04x, %#04x,\n", range16[i], range16[i+1]) } fmt.Fprintf(&buf, "}\n\n") fmt.Fprintf(&buf, "var isNotPrint16 = []uint16{\n") for _, r := range except16 { fmt.Fprintf(&buf, "\t%#04x,\n", r) } fmt.Fprintf(&buf, "}\n\n") fmt.Fprintf(&buf, "var isPrint32 = []uint32{\n") for i := 0; i < len(range32); i += 2 { fmt.Fprintf(&buf, "\t%#06x, %#06x,\n", range32[i], range32[i+1]) } fmt.Fprintf(&buf, "}\n\n") fmt.Fprintf(&buf, "var isNotPrint32 = []uint16{ // add 0x10000 to each entry\n") for _, r := range except32 { if r >= 0x20000 { log.Fatalf("%U too big for isNotPrint32\n", r) } fmt.Fprintf(&buf, "\t%#04x,\n", r-0x10000) } fmt.Fprintf(&buf, "}\n\n") // The list of graphic but not "printable" runes is short. Just make one easy table. fmt.Fprintf(&buf, "// isGraphic lists the graphic runes not matched by IsPrint.\n") fmt.Fprintf(&buf, "var isGraphic = []uint16{\n") for r := rune(0); r <= unicode.MaxRune; r++ { if unicode.IsPrint(r) != unicode.IsGraphic(r) { // Sanity check. if !unicode.IsGraphic(r) { log.Fatalf("%U is printable but not graphic\n", r) } if r > 0xFFFF { // We expect only 16-bit values. log.Fatalf("%U too big for isGraphic\n", r) } fmt.Fprintf(&buf, "\t%#04x,\n", r) } } fmt.Fprintf(&buf, "}\n") data, err := format.Source(buf.Bytes()) if err != nil { log.Fatal(err) } err = os.WriteFile(*filename, data, 0644) if err != nil { log.Fatal(err) } }