Remove Non-UTF-8-Compliant Characters from a String - Android XML

Android examples for XML:XML String

Description

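Replaces characters in a String that are not UTF-8 compliant, as well as control characters other than tab, newline, and carriage return, with spaces.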

Demo Code

/********************************************************************************
 *
 *   Copyright (C) 2005  Svyatoslav Urbanovych
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.

 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.

 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301, USA.
 *********************************************************************************/
//package com.java2s;

public class Main {
    /**
     * Demo entry point: sanitizes a sample string and prints the result to
     * standard output.
     *
     * @param argv command-line arguments (unused)
     * @throws Exception declared for compatibility; not thrown by this demo
     */
    public static void main(String[] argv) throws Exception {
        String inString = "java2s.com";
        System.out.println(removeNonUtf8CompliantCharacters(inString));
    }

    /**
     * Replaces every character that cannot be encoded in UTF-8, and every
     * control character below U+0020 other than tab, line feed and carriage
     * return, with a single space.
     *
     * <p>The check is performed on the string's UTF-16 chars rather than on
     * its encoded bytes, so the result does not depend on the platform default
     * charset and valid non-ASCII text (accented letters, CJK, emoji encoded as
     * surrogate pairs) is left untouched. The only chars a Java {@code String}
     * can hold that have no UTF-8 encoding are unpaired surrogates; each of
     * those is replaced by a space. Characters at or above U+0020, including
     * DEL (U+007F), are kept.
     *
     * @param inString the text to sanitize; may be {@code null}
     * @return the sanitized text with the same number of chars as the input,
     *         or {@code null} if {@code inString} is {@code null}
     */
    public static String removeNonUtf8CompliantCharacters(
            final String inString) {
        if (null == inString) {
            return null;
        }
        final char[] chars = inString.toCharArray();
        for (int i = 0; i < chars.length; i++) {
            final char ch = chars[i];
            // A high surrogate immediately followed by a low surrogate is one
            // valid supplementary code point: keep both chars and move past them.
            if (Character.isHighSurrogate(ch)
                    && i + 1 < chars.length
                    && Character.isLowSurrogate(chars[i + 1])) {
                i++;
                continue;
            }
            // Any surrogate reaching this point is unpaired and therefore has
            // no UTF-8 encoding.
            if (Character.isSurrogate(ch) || isDisallowedControl(ch)) {
                chars[i] = ' ';
            }
        }
        return new String(chars);
    }

    /** Returns true for control characters below U+0020 other than tab, LF and CR. */
    private static boolean isDisallowedControl(final char ch) {
        return ch < 32 && ch != '\t' && ch != '\n' && ch != '\r';
    }
}

Related Tutorials