github.com/matrixorigin/matrixone@v1.2.0/pkg/vectorize/lengthutf8/length_utf8_test.go (about)

     1  // Copyright 2021 Matrix Origin
     2  //
     3  // Licensed under the Apache License, Version 2.0 (the "License");
     4  // you may not use this file except in compliance with the License.
     5  // You may obtain a copy of the License at
     6  //
     7  //      http://www.apache.org/licenses/LICENSE-2.0
     8  //
     9  // Unless required by applicable law or agreed to in writing, software
    10  // distributed under the License is distributed on an "AS IS" BASIS,
    11  // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    12  // See the License for the specific language governing permissions and
    13  // limitations under the License.
    14  
    15  package lengthutf8
    16  
    17  import (
    18  	"testing"
    19  
    20  	"github.com/stretchr/testify/require"
    21  )
    22  
    23  func TestCountUTF8CodePoints(t *testing.T) {
    24  	cases := map[string]uint64{
    25  		"abc":   3,
    26  		"":      0,
    27  		"   ":   3,
    28  		"中国123": 5,
    29  		"abc😄":  4,
    30  		"中国中国中国中国中国中国中国中国中国中国1234":      24,
    31  		"中国中国中国中国中国中国中国中国中国中国1234😄ggg!": 29,
    32  	}
    33  
    34  	for input, expected := range cases {
    35  		actual := CountUTF8CodePoints([]byte(input))
    36  		require.Equal(t, expected, actual)
    37  	}
    38  }