Package com.caucho.quercus.lib.i18n

Source Code of com.caucho.quercus.lib.i18n.Utf8Encoder

/*
* Copyright (c) 1998-2008 Caucho Technology -- all rights reserved
*
* This file is part of Resin(R) Open Source
*
* Each copy or derived work must preserve the copyright notice and this
* notice unmodified.
*
* Resin Open Source is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* Resin Open Source is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE, or any warranty
* of NON-INFRINGEMENT.  See the GNU General Public License for more
* details.
*
* You should have received a copy of the GNU General Public License
* along with Resin Open Source; if not, write to the
*
*   Free Software Foundation, Inc.
*   59 Temple Place, Suite 330
*   Boston, MA 02111-1307  USA
*
* @author Nam Nguyen
*/

package com.caucho.quercus.lib.i18n;

import com.caucho.quercus.env.Env;
import com.caucho.quercus.env.StringValue;

public class Utf8Encoder
  extends Encoder
{
  public Utf8Encoder(String charset)
  {
    super(charset);
  }
 
  @Override
  public boolean isUtf8()
  {
    return true;
  }

  public boolean isEncodable(Env env, StringValue str)
  {
    int len = str.length();
    for (int i = 0; i < len; i++) {
      char ch = str.charAt(i);
     
      if (ch <= 0x7F)
        continue;
     
      if ('\uD800' <= ch && ch <= '\uDBFF') {
        char ch2;
       
        if (i + 1 < len
            && '\uDC00' <= (ch2 = str.charAt(i + 1)) && ch2 <= '\uDFFF') {
          i++;
        }
        else
          return false;
      }
    }
   
    return true;
  }
 
  @Override
  public StringValue encode(Env env, CharSequence str)
  {
    StringValue sb = env.createBinaryBuilder();
   
    int len = str.length();
    for (int i = 0; i < len; i++) {
      char ch = str.charAt(i);
     
      if (ch <= 0x7F) {
        sb.appendByte(ch);
        continue;
      }
     
      int code = ch;
     
      if ('\uD800' <= ch && ch <= '\uDBFF') {
        char ch2;
       
        if (i + 1 < len
            && '\uDC00' <= (ch2 = str.charAt(i + 1)) && ch2 <= '\uDFFF') {
          i++;
         
          code = 0x10000 + ((code & 0xFF) << 8);
          code = code + (ch2 & 0xFF);
        }
        else {
          if (_isIgnore) {
          }
          else if (_replacement != null)
            sb.append(_replacement);
          else
            return sb;
         
          continue;
        }
      }
     
      if (0x80 <= code && code <= 0x7FF) {
        sb.appendByte(0xC0 | (code >> 6));
        sb.appendByte(0x80 | (code & 0x3F));
      }
      else if (0x800 <= code && code <= 0xFFFF) {
        sb.appendByte(0xE0 | (code >> 12));
        sb.appendByte(0x80 | ((code >> 6) & 0x3F));
        sb.appendByte(0x80 | (code & 0x3F));
      }
      else {
        sb.appendByte(0xF0 | (code >> 18));
        sb.appendByte(0x80 | ((code >> 12) & 0x3F));
        sb.appendByte(0x80 | ((code >> 6) & 0x3F));
        sb.appendByte(0x80 | (code & 0x3F));
      }
    }
   
    return sb;
  }
 
}
TOP

Related Classes of com.caucho.quercus.lib.i18n.Utf8Encoder

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code are property of their respective owners. Java is a trademark of Sun Microsystems, Inc and owned by ORACLE Inc. Contact coftware#gmail.com.