Source file
src/bytes/bytes.go
1
2
3
4
5
6
7 package bytes
8
9 import (
10 "internal/bytealg"
11 "math/bits"
12 "unicode"
13 "unicode/utf8"
14 _ "unsafe"
15 )
16
17
18
19
20 func Equal(a, b []byte) bool {
21
22 return string(a) == string(b)
23 }
24
25
26
27
28 func Compare(a, b []byte) int {
29 return bytealg.Compare(a, b)
30 }
31
32
33
34 func explode(s []byte, n int) [][]byte {
35 if n <= 0 || n > len(s) {
36 n = len(s)
37 }
38 a := make([][]byte, n)
39 var size int
40 na := 0
41 for len(s) > 0 {
42 if na+1 >= n {
43 a[na] = s
44 na++
45 break
46 }
47 _, size = utf8.DecodeRune(s)
48 a[na] = s[0:size:size]
49 s = s[size:]
50 na++
51 }
52 return a[0:na]
53 }
54
55
56
57 func Count(s, sep []byte) int {
58
59 if len(sep) == 0 {
60 return utf8.RuneCount(s) + 1
61 }
62 if len(sep) == 1 {
63 return bytealg.Count(s, sep[0])
64 }
65 n := 0
66 for {
67 i := Index(s, sep)
68 if i == -1 {
69 return n
70 }
71 n++
72 s = s[i+len(sep):]
73 }
74 }
75
76
77 func Contains(b, subslice []byte) bool {
78 return Index(b, subslice) != -1
79 }
80
81
82 func ContainsAny(b []byte, chars string) bool {
83 return IndexAny(b, chars) >= 0
84 }
85
86
87 func ContainsRune(b []byte, r rune) bool {
88 return IndexRune(b, r) >= 0
89 }
90
91
92 func ContainsFunc(b []byte, f func(rune) bool) bool {
93 return IndexFunc(b, f) >= 0
94 }
95
96
97 func IndexByte(b []byte, c byte) int {
98 return bytealg.IndexByte(b, c)
99 }
100
101 func indexBytePortable(s []byte, c byte) int {
102 for i, b := range s {
103 if b == c {
104 return i
105 }
106 }
107 return -1
108 }
109
110
111 func LastIndex(s, sep []byte) int {
112 n := len(sep)
113 switch {
114 case n == 0:
115 return len(s)
116 case n == 1:
117 return bytealg.LastIndexByte(s, sep[0])
118 case n == len(s):
119 if Equal(s, sep) {
120 return 0
121 }
122 return -1
123 case n > len(s):
124 return -1
125 }
126 return bytealg.LastIndexRabinKarp(s, sep)
127 }
128
129
130 func LastIndexByte(s []byte, c byte) int {
131 return bytealg.LastIndexByte(s, c)
132 }
133
134
135
136
137
138
139 func IndexRune(s []byte, r rune) int {
140 const haveFastIndex = bytealg.MaxBruteForce > 0
141 switch {
142 case 0 <= r && r < utf8.RuneSelf:
143 return IndexByte(s, byte(r))
144 case r == utf8.RuneError:
145 for i := 0; i < len(s); {
146 r1, n := utf8.DecodeRune(s[i:])
147 if r1 == utf8.RuneError {
148 return i
149 }
150 i += n
151 }
152 return -1
153 case !utf8.ValidRune(r):
154 return -1
155 default:
156
157
158
159 var b [utf8.UTFMax]byte
160 n := utf8.EncodeRune(b[:], r)
161 last := n - 1
162 i := last
163 fails := 0
164 for i < len(s) {
165 if s[i] != b[last] {
166 o := IndexByte(s[i+1:], b[last])
167 if o < 0 {
168 return -1
169 }
170 i += o + 1
171 }
172
173 for j := 1; j < n; j++ {
174 if s[i-j] != b[last-j] {
175 goto next
176 }
177 }
178 return i - last
179 next:
180 fails++
181 i++
182 if (haveFastIndex && fails > bytealg.Cutover(i)) && i < len(s) ||
183 (!haveFastIndex && fails >= 4+i>>4 && i < len(s)) {
184 goto fallback
185 }
186 }
187 return -1
188
189 fallback:
190
191
192 if haveFastIndex {
193 if j := bytealg.Index(s[i-last:], b[:n]); j >= 0 {
194 return i + j - last
195 }
196 } else {
197
198
199 c0 := b[last]
200 c1 := b[last-1]
201 loop:
202 for ; i < len(s); i++ {
203 if s[i] == c0 && s[i-1] == c1 {
204 for k := 2; k < n; k++ {
205 if s[i-k] != b[last-k] {
206 continue loop
207 }
208 }
209 return i - last
210 }
211 }
212 }
213 return -1
214 }
215 }
216
217
218
219
220
221 func IndexAny(s []byte, chars string) int {
222 if chars == "" {
223
224 return -1
225 }
226 if len(s) == 1 {
227 r := rune(s[0])
228 if r >= utf8.RuneSelf {
229
230 for _, r = range chars {
231 if r == utf8.RuneError {
232 return 0
233 }
234 }
235 return -1
236 }
237 if bytealg.IndexByteString(chars, s[0]) >= 0 {
238 return 0
239 }
240 return -1
241 }
242 if len(chars) == 1 {
243 r := rune(chars[0])
244 if r >= utf8.RuneSelf {
245 r = utf8.RuneError
246 }
247 return IndexRune(s, r)
248 }
249 if len(s) > 8 {
250 if as, isASCII := makeASCIISet(chars); isASCII {
251 for i, c := range s {
252 if as.contains(c) {
253 return i
254 }
255 }
256 return -1
257 }
258 }
259 var width int
260 for i := 0; i < len(s); i += width {
261 r := rune(s[i])
262 if r < utf8.RuneSelf {
263 if bytealg.IndexByteString(chars, s[i]) >= 0 {
264 return i
265 }
266 width = 1
267 continue
268 }
269 r, width = utf8.DecodeRune(s[i:])
270 if r != utf8.RuneError {
271
272 if len(chars) == width {
273 if chars == string(r) {
274 return i
275 }
276 continue
277 }
278
279 if bytealg.MaxLen >= width {
280 if bytealg.IndexString(chars, string(r)) >= 0 {
281 return i
282 }
283 continue
284 }
285 }
286 for _, ch := range chars {
287 if r == ch {
288 return i
289 }
290 }
291 }
292 return -1
293 }
294
295
296
297
298
299 func LastIndexAny(s []byte, chars string) int {
300 if chars == "" {
301
302 return -1
303 }
304 if len(s) > 8 {
305 if as, isASCII := makeASCIISet(chars); isASCII {
306 for i := len(s) - 1; i >= 0; i-- {
307 if as.contains(s[i]) {
308 return i
309 }
310 }
311 return -1
312 }
313 }
314 if len(s) == 1 {
315 r := rune(s[0])
316 if r >= utf8.RuneSelf {
317 for _, r = range chars {
318 if r == utf8.RuneError {
319 return 0
320 }
321 }
322 return -1
323 }
324 if bytealg.IndexByteString(chars, s[0]) >= 0 {
325 return 0
326 }
327 return -1
328 }
329 if len(chars) == 1 {
330 cr := rune(chars[0])
331 if cr >= utf8.RuneSelf {
332 cr = utf8.RuneError
333 }
334 for i := len(s); i > 0; {
335 r, size := utf8.DecodeLastRune(s[:i])
336 i -= size
337 if r == cr {
338 return i
339 }
340 }
341 return -1
342 }
343 for i := len(s); i > 0; {
344 r := rune(s[i-1])
345 if r < utf8.RuneSelf {
346 if bytealg.IndexByteString(chars, s[i-1]) >= 0 {
347 return i - 1
348 }
349 i--
350 continue
351 }
352 r, size := utf8.DecodeLastRune(s[:i])
353 i -= size
354 if r != utf8.RuneError {
355
356 if len(chars) == size {
357 if chars == string(r) {
358 return i
359 }
360 continue
361 }
362
363 if bytealg.MaxLen >= size {
364 if bytealg.IndexString(chars, string(r)) >= 0 {
365 return i
366 }
367 continue
368 }
369 }
370 for _, ch := range chars {
371 if r == ch {
372 return i
373 }
374 }
375 }
376 return -1
377 }
378
379
380
381 func genSplit(s, sep []byte, sepSave, n int) [][]byte {
382 if n == 0 {
383 return nil
384 }
385 if len(sep) == 0 {
386 return explode(s, n)
387 }
388 if n < 0 {
389 n = Count(s, sep) + 1
390 }
391 if n > len(s)+1 {
392 n = len(s) + 1
393 }
394
395 a := make([][]byte, n)
396 n--
397 i := 0
398 for i < n {
399 m := Index(s, sep)
400 if m < 0 {
401 break
402 }
403 a[i] = s[: m+sepSave : m+sepSave]
404 s = s[m+len(sep):]
405 i++
406 }
407 a[i] = s
408 return a[:i+1]
409 }
410
411
412
413
414
415
416
417
418
419
420 func SplitN(s, sep []byte, n int) [][]byte { return genSplit(s, sep, 0, n) }
421
422
423
424
425
426
427
428
429 func SplitAfterN(s, sep []byte, n int) [][]byte {
430 return genSplit(s, sep, len(sep), n)
431 }
432
433
434
435
436
437
438
439 func Split(s, sep []byte) [][]byte { return genSplit(s, sep, 0, -1) }
440
441
442
443
444
445 func SplitAfter(s, sep []byte) [][]byte {
446 return genSplit(s, sep, len(sep), -1)
447 }
448
449 var asciiSpace = [256]uint8{'\t': 1, '\n': 1, '\v': 1, '\f': 1, '\r': 1, ' ': 1}
450
451
452
453
454
455
456
457 func Fields(s []byte) [][]byte {
458
459
460 n := 0
461 wasSpace := 1
462
463 setBits := uint8(0)
464 for i := 0; i < len(s); i++ {
465 r := s[i]
466 setBits |= r
467 isSpace := int(asciiSpace[r])
468 n += wasSpace & ^isSpace
469 wasSpace = isSpace
470 }
471
472 if setBits >= utf8.RuneSelf {
473
474 return FieldsFunc(s, unicode.IsSpace)
475 }
476
477
478 a := make([][]byte, n)
479 na := 0
480 fieldStart := 0
481 i := 0
482
483 for i < len(s) && asciiSpace[s[i]] != 0 {
484 i++
485 }
486 fieldStart = i
487 for i < len(s) {
488 if asciiSpace[s[i]] == 0 {
489 i++
490 continue
491 }
492 a[na] = s[fieldStart:i:i]
493 na++
494 i++
495
496 for i < len(s) && asciiSpace[s[i]] != 0 {
497 i++
498 }
499 fieldStart = i
500 }
501 if fieldStart < len(s) {
502 a[na] = s[fieldStart:len(s):len(s)]
503 }
504 return a
505 }
506
507
508
509
510
511
512
513
514
515
516 func FieldsFunc(s []byte, f func(rune) bool) [][]byte {
517
518
519 type span struct {
520 start int
521 end int
522 }
523 spans := make([]span, 0, 32)
524
525
526
527
528
529 start := -1
530 for i := 0; i < len(s); {
531 size := 1
532 r := rune(s[i])
533 if r >= utf8.RuneSelf {
534 r, size = utf8.DecodeRune(s[i:])
535 }
536 if f(r) {
537 if start >= 0 {
538 spans = append(spans, span{start, i})
539 start = -1
540 }
541 } else {
542 if start < 0 {
543 start = i
544 }
545 }
546 i += size
547 }
548
549
550 if start >= 0 {
551 spans = append(spans, span{start, len(s)})
552 }
553
554
555 a := make([][]byte, len(spans))
556 for i, span := range spans {
557 a[i] = s[span.start:span.end:span.end]
558 }
559
560 return a
561 }
562
563
564
565 func Join(s [][]byte, sep []byte) []byte {
566 if len(s) == 0 {
567 return []byte{}
568 }
569 if len(s) == 1 {
570
571 return append([]byte(nil), s[0]...)
572 }
573
574 var n int
575 if len(sep) > 0 {
576 if len(sep) >= maxInt/(len(s)-1) {
577 panic("bytes: Join output length overflow")
578 }
579 n += len(sep) * (len(s) - 1)
580 }
581 for _, v := range s {
582 if len(v) > maxInt-n {
583 panic("bytes: Join output length overflow")
584 }
585 n += len(v)
586 }
587
588 b := bytealg.MakeNoZero(n)[:n:n]
589 bp := copy(b, s[0])
590 for _, v := range s[1:] {
591 bp += copy(b[bp:], sep)
592 bp += copy(b[bp:], v)
593 }
594 return b
595 }
596
597
598 func HasPrefix(s, prefix []byte) bool {
599 return len(s) >= len(prefix) && Equal(s[:len(prefix)], prefix)
600 }
601
602
603 func HasSuffix(s, suffix []byte) bool {
604 return len(s) >= len(suffix) && Equal(s[len(s)-len(suffix):], suffix)
605 }
606
607
608
609
610
611 func Map(mapping func(r rune) rune, s []byte) []byte {
612
613
614
615 b := make([]byte, 0, len(s))
616 for i := 0; i < len(s); {
617 wid := 1
618 r := rune(s[i])
619 if r >= utf8.RuneSelf {
620 r, wid = utf8.DecodeRune(s[i:])
621 }
622 r = mapping(r)
623 if r >= 0 {
624 b = utf8.AppendRune(b, r)
625 }
626 i += wid
627 }
628 return b
629 }
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647 func Repeat(b []byte, count int) []byte {
648 if count == 0 {
649 return []byte{}
650 }
651
652
653
654
655 if count < 0 {
656 panic("bytes: negative Repeat count")
657 }
658 hi, lo := bits.Mul(uint(len(b)), uint(count))
659 if hi > 0 || lo > uint(maxInt) {
660 panic("bytes: Repeat output length overflow")
661 }
662 n := int(lo)
663
664 if len(b) == 0 {
665 return []byte{}
666 }
667
668
669
670
671
672
673
674
675
676
677
678 const chunkLimit = 8 * 1024
679 chunkMax := n
680 if chunkMax > chunkLimit {
681 chunkMax = chunkLimit / len(b) * len(b)
682 if chunkMax == 0 {
683 chunkMax = len(b)
684 }
685 }
686 nb := bytealg.MakeNoZero(n)[:n:n]
687 bp := copy(nb, b)
688 for bp < n {
689 chunk := min(bp, chunkMax)
690 bp += copy(nb[bp:], nb[:chunk])
691 }
692 return nb
693 }
694
695
696
697 func ToUpper(s []byte) []byte {
698 isASCII, hasLower := true, false
699 for i := 0; i < len(s); i++ {
700 c := s[i]
701 if c >= utf8.RuneSelf {
702 isASCII = false
703 break
704 }
705 hasLower = hasLower || ('a' <= c && c <= 'z')
706 }
707
708 if isASCII {
709 if !hasLower {
710
711 return append([]byte(""), s...)
712 }
713 b := bytealg.MakeNoZero(len(s))[:len(s):len(s)]
714 for i := 0; i < len(s); i++ {
715 c := s[i]
716 if 'a' <= c && c <= 'z' {
717 c -= 'a' - 'A'
718 }
719 b[i] = c
720 }
721 return b
722 }
723 return Map(unicode.ToUpper, s)
724 }
725
726
727
728 func ToLower(s []byte) []byte {
729 isASCII, hasUpper := true, false
730 for i := 0; i < len(s); i++ {
731 c := s[i]
732 if c >= utf8.RuneSelf {
733 isASCII = false
734 break
735 }
736 hasUpper = hasUpper || ('A' <= c && c <= 'Z')
737 }
738
739 if isASCII {
740 if !hasUpper {
741 return append([]byte(""), s...)
742 }
743 b := bytealg.MakeNoZero(len(s))[:len(s):len(s)]
744 for i := 0; i < len(s); i++ {
745 c := s[i]
746 if 'A' <= c && c <= 'Z' {
747 c += 'a' - 'A'
748 }
749 b[i] = c
750 }
751 return b
752 }
753 return Map(unicode.ToLower, s)
754 }
755
756
757 func ToTitle(s []byte) []byte { return Map(unicode.ToTitle, s) }
758
759
760
761 func ToUpperSpecial(c unicode.SpecialCase, s []byte) []byte {
762 return Map(c.ToUpper, s)
763 }
764
765
766
767 func ToLowerSpecial(c unicode.SpecialCase, s []byte) []byte {
768 return Map(c.ToLower, s)
769 }
770
771
772
773 func ToTitleSpecial(c unicode.SpecialCase, s []byte) []byte {
774 return Map(c.ToTitle, s)
775 }
776
777
778
779 func ToValidUTF8(s, replacement []byte) []byte {
780 b := make([]byte, 0, len(s)+len(replacement))
781 invalid := false
782 for i := 0; i < len(s); {
783 c := s[i]
784 if c < utf8.RuneSelf {
785 i++
786 invalid = false
787 b = append(b, c)
788 continue
789 }
790 _, wid := utf8.DecodeRune(s[i:])
791 if wid == 1 {
792 i++
793 if !invalid {
794 invalid = true
795 b = append(b, replacement...)
796 }
797 continue
798 }
799 invalid = false
800 b = append(b, s[i:i+wid]...)
801 i += wid
802 }
803 return b
804 }
805
806
807
808 func isSeparator(r rune) bool {
809
810 if r <= 0x7F {
811 switch {
812 case '0' <= r && r <= '9':
813 return false
814 case 'a' <= r && r <= 'z':
815 return false
816 case 'A' <= r && r <= 'Z':
817 return false
818 case r == '_':
819 return false
820 }
821 return true
822 }
823
824 if unicode.IsLetter(r) || unicode.IsDigit(r) {
825 return false
826 }
827
828 return unicode.IsSpace(r)
829 }
830
831
832
833
834
835
836 func Title(s []byte) []byte {
837
838
839
840 prev := ' '
841 return Map(
842 func(r rune) rune {
843 if isSeparator(prev) {
844 prev = r
845 return unicode.ToTitle(r)
846 }
847 prev = r
848 return r
849 },
850 s)
851 }
852
853
854
855 func TrimLeftFunc(s []byte, f func(r rune) bool) []byte {
856 i := indexFunc(s, f, false)
857 if i == -1 {
858 return nil
859 }
860 return s[i:]
861 }
862
863
864
865 func TrimRightFunc(s []byte, f func(r rune) bool) []byte {
866 i := lastIndexFunc(s, f, false)
867 if i >= 0 && s[i] >= utf8.RuneSelf {
868 _, wid := utf8.DecodeRune(s[i:])
869 i += wid
870 } else {
871 i++
872 }
873 return s[0:i]
874 }
875
876
877
878 func TrimFunc(s []byte, f func(r rune) bool) []byte {
879 return TrimRightFunc(TrimLeftFunc(s, f), f)
880 }
881
882
883
884 func TrimPrefix(s, prefix []byte) []byte {
885 if HasPrefix(s, prefix) {
886 return s[len(prefix):]
887 }
888 return s
889 }
890
891
892
893 func TrimSuffix(s, suffix []byte) []byte {
894 if HasSuffix(s, suffix) {
895 return s[:len(s)-len(suffix)]
896 }
897 return s
898 }
899
900
901
902
903 func IndexFunc(s []byte, f func(r rune) bool) int {
904 return indexFunc(s, f, true)
905 }
906
907
908
909
910 func LastIndexFunc(s []byte, f func(r rune) bool) int {
911 return lastIndexFunc(s, f, true)
912 }
913
914
915
916
917 func indexFunc(s []byte, f func(r rune) bool, truth bool) int {
918 start := 0
919 for start < len(s) {
920 wid := 1
921 r := rune(s[start])
922 if r >= utf8.RuneSelf {
923 r, wid = utf8.DecodeRune(s[start:])
924 }
925 if f(r) == truth {
926 return start
927 }
928 start += wid
929 }
930 return -1
931 }
932
933
934
935
936 func lastIndexFunc(s []byte, f func(r rune) bool, truth bool) int {
937 for i := len(s); i > 0; {
938 r, size := rune(s[i-1]), 1
939 if r >= utf8.RuneSelf {
940 r, size = utf8.DecodeLastRune(s[0:i])
941 }
942 i -= size
943 if f(r) == truth {
944 return i
945 }
946 }
947 return -1
948 }
949
950
951
952
953
954
955
956
957
958 type asciiSet [8]uint32
959
960
961
962 func makeASCIISet(chars string) (as asciiSet, ok bool) {
963 for i := 0; i < len(chars); i++ {
964 c := chars[i]
965 if c >= utf8.RuneSelf {
966 return as, false
967 }
968 as[c/32] |= 1 << (c % 32)
969 }
970 return as, true
971 }
972
973
974 func (as *asciiSet) contains(c byte) bool {
975 return (as[c/32] & (1 << (c % 32))) != 0
976 }
977
978
979
980
981 func containsRune(s string, r rune) bool {
982 for _, c := range s {
983 if c == r {
984 return true
985 }
986 }
987 return false
988 }
989
990
991
992 func Trim(s []byte, cutset string) []byte {
993 if len(s) == 0 {
994
995 return nil
996 }
997 if cutset == "" {
998 return s
999 }
1000 if len(cutset) == 1 && cutset[0] < utf8.RuneSelf {
1001 return trimLeftByte(trimRightByte(s, cutset[0]), cutset[0])
1002 }
1003 if as, ok := makeASCIISet(cutset); ok {
1004 return trimLeftASCII(trimRightASCII(s, &as), &as)
1005 }
1006 return trimLeftUnicode(trimRightUnicode(s, cutset), cutset)
1007 }
1008
1009
1010
1011 func TrimLeft(s []byte, cutset string) []byte {
1012 if len(s) == 0 {
1013
1014 return nil
1015 }
1016 if cutset == "" {
1017 return s
1018 }
1019 if len(cutset) == 1 && cutset[0] < utf8.RuneSelf {
1020 return trimLeftByte(s, cutset[0])
1021 }
1022 if as, ok := makeASCIISet(cutset); ok {
1023 return trimLeftASCII(s, &as)
1024 }
1025 return trimLeftUnicode(s, cutset)
1026 }
1027
1028 func trimLeftByte(s []byte, c byte) []byte {
1029 for len(s) > 0 && s[0] == c {
1030 s = s[1:]
1031 }
1032 if len(s) == 0 {
1033
1034 return nil
1035 }
1036 return s
1037 }
1038
1039 func trimLeftASCII(s []byte, as *asciiSet) []byte {
1040 for len(s) > 0 {
1041 if !as.contains(s[0]) {
1042 break
1043 }
1044 s = s[1:]
1045 }
1046 if len(s) == 0 {
1047
1048 return nil
1049 }
1050 return s
1051 }
1052
1053 func trimLeftUnicode(s []byte, cutset string) []byte {
1054 for len(s) > 0 {
1055 r, n := rune(s[0]), 1
1056 if r >= utf8.RuneSelf {
1057 r, n = utf8.DecodeRune(s)
1058 }
1059 if !containsRune(cutset, r) {
1060 break
1061 }
1062 s = s[n:]
1063 }
1064 if len(s) == 0 {
1065
1066 return nil
1067 }
1068 return s
1069 }
1070
1071
1072
1073 func TrimRight(s []byte, cutset string) []byte {
1074 if len(s) == 0 || cutset == "" {
1075 return s
1076 }
1077 if len(cutset) == 1 && cutset[0] < utf8.RuneSelf {
1078 return trimRightByte(s, cutset[0])
1079 }
1080 if as, ok := makeASCIISet(cutset); ok {
1081 return trimRightASCII(s, &as)
1082 }
1083 return trimRightUnicode(s, cutset)
1084 }
1085
1086 func trimRightByte(s []byte, c byte) []byte {
1087 for len(s) > 0 && s[len(s)-1] == c {
1088 s = s[:len(s)-1]
1089 }
1090 return s
1091 }
1092
1093 func trimRightASCII(s []byte, as *asciiSet) []byte {
1094 for len(s) > 0 {
1095 if !as.contains(s[len(s)-1]) {
1096 break
1097 }
1098 s = s[:len(s)-1]
1099 }
1100 return s
1101 }
1102
1103 func trimRightUnicode(s []byte, cutset string) []byte {
1104 for len(s) > 0 {
1105 r, n := rune(s[len(s)-1]), 1
1106 if r >= utf8.RuneSelf {
1107 r, n = utf8.DecodeLastRune(s)
1108 }
1109 if !containsRune(cutset, r) {
1110 break
1111 }
1112 s = s[:len(s)-n]
1113 }
1114 return s
1115 }
1116
1117
1118
1119 func TrimSpace(s []byte) []byte {
1120
1121 start := 0
1122 for ; start < len(s); start++ {
1123 c := s[start]
1124 if c >= utf8.RuneSelf {
1125
1126
1127 return TrimFunc(s[start:], unicode.IsSpace)
1128 }
1129 if asciiSpace[c] == 0 {
1130 break
1131 }
1132 }
1133
1134
1135 stop := len(s)
1136 for ; stop > start; stop-- {
1137 c := s[stop-1]
1138 if c >= utf8.RuneSelf {
1139 return TrimFunc(s[start:stop], unicode.IsSpace)
1140 }
1141 if asciiSpace[c] == 0 {
1142 break
1143 }
1144 }
1145
1146
1147
1148
1149 if start == stop {
1150
1151
1152 return nil
1153 }
1154 return s[start:stop]
1155 }
1156
1157
1158
1159 func Runes(s []byte) []rune {
1160 t := make([]rune, utf8.RuneCount(s))
1161 i := 0
1162 for len(s) > 0 {
1163 r, l := utf8.DecodeRune(s)
1164 t[i] = r
1165 i++
1166 s = s[l:]
1167 }
1168 return t
1169 }
1170
1171
1172
1173
1174
1175
1176
1177 func Replace(s, old, new []byte, n int) []byte {
1178 m := 0
1179 if n != 0 {
1180
1181 m = Count(s, old)
1182 }
1183 if m == 0 {
1184
1185 return append([]byte(nil), s...)
1186 }
1187 if n < 0 || m < n {
1188 n = m
1189 }
1190
1191
1192 t := make([]byte, len(s)+n*(len(new)-len(old)))
1193 w := 0
1194 start := 0
1195 if len(old) > 0 {
1196 for range n {
1197 j := start + Index(s[start:], old)
1198 w += copy(t[w:], s[start:j])
1199 w += copy(t[w:], new)
1200 start = j + len(old)
1201 }
1202 } else {
1203 w += copy(t[w:], new)
1204 for range n - 1 {
1205 _, wid := utf8.DecodeRune(s[start:])
1206 j := start + wid
1207 w += copy(t[w:], s[start:j])
1208 w += copy(t[w:], new)
1209 start = j
1210 }
1211 }
1212 w += copy(t[w:], s[start:])
1213 return t[0:w]
1214 }
1215
1216
1217
1218
1219
1220
1221 func ReplaceAll(s, old, new []byte) []byte {
1222 return Replace(s, old, new, -1)
1223 }
1224
1225
1226
1227
1228 func EqualFold(s, t []byte) bool {
1229
1230 i := 0
1231 for ; i < len(s) && i < len(t); i++ {
1232 sr := s[i]
1233 tr := t[i]
1234 if sr|tr >= utf8.RuneSelf {
1235 goto hasUnicode
1236 }
1237
1238
1239 if tr == sr {
1240 continue
1241 }
1242
1243
1244 if tr < sr {
1245 tr, sr = sr, tr
1246 }
1247
1248 if 'A' <= sr && sr <= 'Z' && tr == sr+'a'-'A' {
1249 continue
1250 }
1251 return false
1252 }
1253
1254 return len(s) == len(t)
1255
1256 hasUnicode:
1257 s = s[i:]
1258 t = t[i:]
1259 for len(s) != 0 && len(t) != 0 {
1260
1261 var sr, tr rune
1262 if s[0] < utf8.RuneSelf {
1263 sr, s = rune(s[0]), s[1:]
1264 } else {
1265 r, size := utf8.DecodeRune(s)
1266 sr, s = r, s[size:]
1267 }
1268 if t[0] < utf8.RuneSelf {
1269 tr, t = rune(t[0]), t[1:]
1270 } else {
1271 r, size := utf8.DecodeRune(t)
1272 tr, t = r, t[size:]
1273 }
1274
1275
1276
1277
1278 if tr == sr {
1279 continue
1280 }
1281
1282
1283 if tr < sr {
1284 tr, sr = sr, tr
1285 }
1286
1287 if tr < utf8.RuneSelf {
1288
1289 if 'A' <= sr && sr <= 'Z' && tr == sr+'a'-'A' {
1290 continue
1291 }
1292 return false
1293 }
1294
1295
1296
1297 r := unicode.SimpleFold(sr)
1298 for r != sr && r < tr {
1299 r = unicode.SimpleFold(r)
1300 }
1301 if r == tr {
1302 continue
1303 }
1304 return false
1305 }
1306
1307
1308 return len(s) == len(t)
1309 }
1310
1311
1312 func Index(s, sep []byte) int {
1313 n := len(sep)
1314 switch {
1315 case n == 0:
1316 return 0
1317 case n == 1:
1318 return IndexByte(s, sep[0])
1319 case n == len(s):
1320 if Equal(sep, s) {
1321 return 0
1322 }
1323 return -1
1324 case n > len(s):
1325 return -1
1326 case n <= bytealg.MaxLen:
1327
1328 if len(s) <= bytealg.MaxBruteForce {
1329 return bytealg.Index(s, sep)
1330 }
1331 c0 := sep[0]
1332 c1 := sep[1]
1333 i := 0
1334 t := len(s) - n + 1
1335 fails := 0
1336 for i < t {
1337 if s[i] != c0 {
1338
1339
1340 o := IndexByte(s[i+1:t], c0)
1341 if o < 0 {
1342 return -1
1343 }
1344 i += o + 1
1345 }
1346 if s[i+1] == c1 && Equal(s[i:i+n], sep) {
1347 return i
1348 }
1349 fails++
1350 i++
1351
1352 if fails > bytealg.Cutover(i) {
1353 r := bytealg.Index(s[i:], sep)
1354 if r >= 0 {
1355 return r + i
1356 }
1357 return -1
1358 }
1359 }
1360 return -1
1361 }
1362 c0 := sep[0]
1363 c1 := sep[1]
1364 i := 0
1365 fails := 0
1366 t := len(s) - n + 1
1367 for i < t {
1368 if s[i] != c0 {
1369 o := IndexByte(s[i+1:t], c0)
1370 if o < 0 {
1371 break
1372 }
1373 i += o + 1
1374 }
1375 if s[i+1] == c1 && Equal(s[i:i+n], sep) {
1376 return i
1377 }
1378 i++
1379 fails++
1380 if fails >= 4+i>>4 && i < t {
1381
1382
1383
1384
1385
1386
1387
1388
1389 j := bytealg.IndexRabinKarp(s[i:], sep)
1390 if j < 0 {
1391 return -1
1392 }
1393 return i + j
1394 }
1395 }
1396 return -1
1397 }
1398
1399
1400
1401
1402
1403
1404
1405 func Cut(s, sep []byte) (before, after []byte, found bool) {
1406 if i := Index(s, sep); i >= 0 {
1407 return s[:i], s[i+len(sep):], true
1408 }
1409 return s, nil, false
1410 }
1411
1412
1413
1414
1415 func Clone(b []byte) []byte {
1416 if b == nil {
1417 return nil
1418 }
1419 return append([]byte{}, b...)
1420 }
1421
1422
1423
1424
1425
1426
1427
1428 func CutPrefix(s, prefix []byte) (after []byte, found bool) {
1429 if !HasPrefix(s, prefix) {
1430 return s, false
1431 }
1432 return s[len(prefix):], true
1433 }
1434
1435
1436
1437
1438
1439
1440
1441 func CutSuffix(s, suffix []byte) (before []byte, found bool) {
1442 if !HasSuffix(s, suffix) {
1443 return s, false
1444 }
1445 return s[:len(s)-len(suffix)], true
1446 }
1447
View as plain text