valid UTF String - Java java.lang

Java examples for java.lang:String UTF

Description

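Checks whether a string is valid UTF-16, i.e. every high surrogate is immediately followed by a low surrogate and no low surrogate appears on its own.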

Demo Code

/**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
//package com.java2s;

public class Main {
    /** First code unit of the high (leading) surrogate range. */
    public static final int UNI_SUR_HIGH_START = 0xD800;
    /** Last code unit of the high (leading) surrogate range. */
    public static final int UNI_SUR_HIGH_END = 0xDBFF;
    /** First code unit of the low (trailing) surrogate range. */
    public static final int UNI_SUR_LOW_START = 0xDC00;
    /** Last code unit of the low (trailing) surrogate range. */
    public static final int UNI_SUR_LOW_END = 0xDFFF;

    /**
     * Reports whether the given character sequence is well-formed UTF-16.
     *
     * <p>A sequence is accepted when each high surrogate is directly followed
     * by a low surrogate and no low surrogate occurs without a preceding high
     * surrogate. An empty sequence is accepted.
     *
     * @param s the sequence to inspect; must not be {@code null}
     * @return {@code true} if all surrogates are correctly paired,
     *         {@code false} on the first unpaired surrogate
     * @throws NullPointerException if {@code s} is {@code null}
     */
    public static boolean validUTF16String(CharSequence s) {
        final int length = s.length();
        int pos = 0;
        while (pos < length) {
            final char unit = s.charAt(pos++);

            if (isLowSurrogate(unit)) {
                // A trailing surrogate with no leading surrogate before it.
                return false;
            }
            if (!isHighSurrogate(unit)) {
                // Ordinary BMP code unit; nothing to pair.
                continue;
            }

            // A leading surrogate must have a successor, and that successor
            // must be a trailing surrogate; it is consumed together with it.
            if (pos >= length || !isLowSurrogate(s.charAt(pos++))) {
                return false;
            }
        }
        return true;
    }

    /** Tells whether {@code unit} lies in the high (leading) surrogate range. */
    private static boolean isHighSurrogate(char unit) {
        return unit >= UNI_SUR_HIGH_START && unit <= UNI_SUR_HIGH_END;
    }

    /** Tells whether {@code unit} lies in the low (trailing) surrogate range. */
    private static boolean isLowSurrogate(char unit) {
        return unit >= UNI_SUR_LOW_START && unit <= UNI_SUR_LOW_END;
    }
}

Related Tutorials