40 lines
734 B
Go
40 lines
734 B
Go
// Package bom is used to clean up UTF-8 Byte Order Marks.
|
|
package bom
|
|
|
|
import (
|
|
"bufio"
|
|
"io"
|
|
)
|
|
|
|
const (
|
|
bom0 = 0xef
|
|
bom1 = 0xbb
|
|
bom2 = 0xbf
|
|
)
|
|
|
|
// Clean returns b with the 3 byte BOM stripped off the front if it is present.
|
|
// If the BOM is not present, then b is returned.
|
|
func Clean(b []byte) []byte {
|
|
if len(b) >= 3 &&
|
|
b[0] == bom0 &&
|
|
b[1] == bom1 &&
|
|
b[2] == bom2 {
|
|
return b[3:]
|
|
}
|
|
return b
|
|
}
|
|
|
|
// NewReader returns an io.Reader that will skip over initial UTF-8 byte order marks.
|
|
func NewReader(r io.Reader) io.Reader {
|
|
buf := bufio.NewReader(r)
|
|
b, err := buf.Peek(3)
|
|
if err != nil {
|
|
// not enough bytes
|
|
return buf
|
|
}
|
|
if b[0] == bom0 && b[1] == bom1 && b[2] == bom2 {
|
|
discardBytes(buf, 3)
|
|
}
|
|
return buf
|
|
}
|