org.glassfish.grizzly/grizzly-websockets-server/3.0.0 : org/glassfish/grizzly/http/util/UEncoder.java

UEncoder
https://projects.eclipse.org/projects/ee4j.grizzly/grizzly-websockets-server: Grizzly Bill of Materials (BOM) (Oracle Corporation)
EPL-2.0
/*
 * Copyright (c) 2010, 2020 Oracle and/or its affiliates. All rights reserved.
 * Copyright 2004 The Apache Software Foundation
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.glassfish.grizzly.http.util;

import java.io.CharArrayWriter;
import java.io.IOException;
import java.io.Writer;
import java.util.BitSet;
import java.util.logging.Level;
import java.util.logging.Logger;

import org.glassfish.grizzly.Grizzly;

Efficient implementation for encoders. This class is not thread safe - you need one encoder per thread. The encoder
will save and recycle the internal objects, avoiding garbage.

You can add extra characters that you want preserved, for example while encoding a URL you can add "/".
Author: Costin Manolache/**
 * Efficient implementation for encoders. This class is not thread safe - you need one encoder per thread. The encoder
 * will save and recycle the internal objects, avoiding garbage.
 * <p/>
 * You can add extra characters that you want preserved, for example while encoding a URL you can add "/".
 *
 * @author Costin Manolache
 */
public final class UEncoder {

    private final static Logger logger = Grizzly.logger(UEncoder.class);

    private static final BitSet initialSafeChars = new BitSet(128);
    static {
        initSafeChars();
    }

    // Not static - the set may differ ( it's better than adding
    // an extra check for "/", "+", etc
    private final BitSet safeChars;
    private C2BConverter c2b;
    private ByteChunk bb;

    private String encoding = "UTF8";
    private static final int debug = 0;

    public UEncoder() {
        safeChars = (BitSet) initialSafeChars.clone();
    }

    public void setEncoding(String s) {
        encoding = s;
    }

    public void addSafeCharacter(char c) {
        safeChars.set(c);
    }

    URL Encode string, using a specified encoding.
Params: buf – the Writer to write the encoded result to.
s – the String to encode./**
     * URL Encode string, using a specified encoding.
     *
     * @param buf the {@link Writer} to write the encoded result to.
     * @param s the String to encode.
     */
    public void urlEncode(Writer buf, String s) throws IOException {
        urlEncode(buf, s, false);
    }

    URL Encode string, using a specified encoding.
Params: buf – the Writer to write the encoded result to.
s – the String to encode.
toHexUpperCase – the hex string will be in upper case/**
     * URL Encode string, using a specified encoding.
     *
     * @param buf the {@link Writer} to write the encoded result to.
     * @param s the String to encode.
     * @param toHexUpperCase the hex string will be in upper case
     */
    public void urlEncode(Writer buf, String s, boolean toHexUpperCase) throws IOException {
        if (c2b == null) {
            bb = new ByteChunk(16); // small enough.
            c2b = C2BConverter.getInstance(bb, encoding);
        }

        for (int i = 0; i < s.length(); i++) {
            int c = s.charAt(i);
            if (safeChars.get(c)) {
                if (debug > 0) {
                    log("Safe: " + (char) c);
                }
                buf.write((char) c);
            } else {
                if (debug > 0) {
                    log("Unsafe:  " + (char) c);
                }
                c2b.convert((char) c);

                // "surrogate" - UTF is _not_ 16 bit, but 21 !!!!
                // ( while UCS is 31 ). Amazing...
                if (c >= 0xD800 && c <= 0xDBFF) {
                    if (i + 1 < s.length()) {
                        int d = s.charAt(i + 1);
                        if (d >= 0xDC00 && d <= 0xDFFF) {
                            if (debug > 0) {
                                log("Unsafe:  " + c);
                            }
                            c2b.convert((char) d);
                            i++;
                        }
                    }
                }

                urlEncode(buf, bb.getBuffer(), bb.getStart(), bb.getLength(), toHexUpperCase);
                bb.recycle();
            }
        }
    }

    /**
     */
    public void urlEncode(Writer buf, byte bytes[], int off, int len) throws IOException {
        urlEncode(buf, bytes, off, len, false);
    }

    /**
     */
    public void urlEncode(Writer buf, byte bytes[], int off, int len, boolean toHexUpperCase) throws IOException {
        for (int j = off; j < len; j++) {
            buf.write('%');
            char ch = Character.forDigit(bytes[j] >> 4 & 0xF, 16);
            if (toHexUpperCase) {
                ch = Character.toUpperCase(ch);
            }
            if (debug > 0) {
                log("Encode:  " + ch);
            }
            buf.write(ch);
            ch = Character.forDigit(bytes[j] & 0xF, 16);
            if (toHexUpperCase) {
                ch = Character.toUpperCase(ch);
            }
            if (debug > 0) {
                log("Encode:  " + ch);
            }
            buf.write(ch);
        }
    }

    Utility funtion to re-encode the URL. Still has problems with charset, since UEncoder mostly ignores it.
Params: url – /**
     * Utility funtion to re-encode the URL. Still has problems with charset, since UEncoder mostly ignores it.
     *
     * @param url
     */
    public String encodeURL(String url) {
        return encodeURL(url, false);
    }

    Utility function to re-encode the URL. Still has problems with charset, since UEncoder mostly ignores it.
Params: uri – the URI to encode.
toHexUpperCase – the hex string will be in upper case/**
     * Utility function to re-encode the URL. Still has problems with charset, since UEncoder mostly ignores it.
     *
     * @param uri the URI to encode.
     * @param toHexUpperCase the hex string will be in upper case
     */
    public String encodeURL(String uri, boolean toHexUpperCase) {
        String outUri = null;
        try {
            // XXX optimize - recycle, etc
            CharArrayWriter out = new CharArrayWriter();
            urlEncode(out, uri, toHexUpperCase);
            outUri = out.toString();
        } catch (IOException ignore) {
        }
        return outUri;
    }

    // -------------------- Internal implementation --------------------

    private static void initSafeChars() {
        int i;
        for (i = 'a'; i <= 'z'; i++) {
            initialSafeChars.set(i);
        }
        for (i = 'A'; i <= 'Z'; i++) {
            initialSafeChars.set(i);
        }
        for (i = '0'; i <= '9'; i++) {
            initialSafeChars.set(i);
        }
        // safe
        initialSafeChars.set('$');
        initialSafeChars.set('-');
        initialSafeChars.set('_');
        initialSafeChars.set('.');

        // Dangerous: someone may treat this as " "
        // RFC1738 does allow it, it's not reserved
        // initialSafeChars.set('+');
        // extra
        initialSafeChars.set('!');
        initialSafeChars.set('*');
        initialSafeChars.set('\'');
        initialSafeChars.set('(');
        initialSafeChars.set(')');
        initialSafeChars.set(',');
    }

    private static void log(String s) {
        if (logger.isLoggable(Level.FINE)) {
            logger.fine(s);
        }
    }
}
/

org.glassfish.grizzly/ grizzly-websockets-server/ 3.0.0/ org/glassfish/grizzly/http/util/UEncoder.java