/*
* Copyright (c) 2010, 2020 Oracle and/or its affiliates. All rights reserved.
* Copyright 2004 The Apache Software Foundation
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.glassfish.grizzly.http.util;
import java.io.CharArrayWriter;
import java.io.IOException;
import java.io.Writer;
import java.util.BitSet;
import java.util.logging.Level;
import java.util.logging.Logger;
import org.glassfish.grizzly.Grizzly;
Efficient implementation for encoders. This class is not thread safe - you need one encoder per thread. The encoder
will save and recycle the internal objects, avoiding garbage.
You can add extra characters that you want preserved, for example while encoding a URL you can add "/".
Author: Costin Manolache
/**
* Efficient implementation for encoders. This class is not thread safe - you need one encoder per thread. The encoder
* will save and recycle the internal objects, avoiding garbage.
* <p/>
* You can add extra characters that you want preserved, for example while encoding a URL you can add "/".
*
* @author Costin Manolache
*/
public final class UEncoder {
private final static Logger logger = Grizzly.logger(UEncoder.class);
private static final BitSet initialSafeChars = new BitSet(128);
static {
initSafeChars();
}
// Not static - the set may differ ( it's better than adding
// an extra check for "/", "+", etc
private final BitSet safeChars;
private C2BConverter c2b;
private ByteChunk bb;
private String encoding = "UTF8";
private static final int debug = 0;
public UEncoder() {
safeChars = (BitSet) initialSafeChars.clone();
}
public void setEncoding(String s) {
encoding = s;
}
public void addSafeCharacter(char c) {
safeChars.set(c);
}
URL Encode string, using a specified encoding.
Params: - buf – the
Writer
to write the encoded result to. - s – the String to encode.
/**
* URL Encode string, using a specified encoding.
*
* @param buf the {@link Writer} to write the encoded result to.
* @param s the String to encode.
*/
public void urlEncode(Writer buf, String s) throws IOException {
urlEncode(buf, s, false);
}
URL Encode string, using a specified encoding.
Params: - buf – the
Writer
to write the encoded result to. - s – the String to encode.
- toHexUpperCase – the hex string will be in upper case
/**
* URL Encode string, using a specified encoding.
*
* @param buf the {@link Writer} to write the encoded result to.
* @param s the String to encode.
* @param toHexUpperCase the hex string will be in upper case
*/
public void urlEncode(Writer buf, String s, boolean toHexUpperCase) throws IOException {
if (c2b == null) {
bb = new ByteChunk(16); // small enough.
c2b = C2BConverter.getInstance(bb, encoding);
}
for (int i = 0; i < s.length(); i++) {
int c = s.charAt(i);
if (safeChars.get(c)) {
if (debug > 0) {
log("Safe: " + (char) c);
}
buf.write((char) c);
} else {
if (debug > 0) {
log("Unsafe: " + (char) c);
}
c2b.convert((char) c);
// "surrogate" - UTF is _not_ 16 bit, but 21 !!!!
// ( while UCS is 31 ). Amazing...
if (c >= 0xD800 && c <= 0xDBFF) {
if (i + 1 < s.length()) {
int d = s.charAt(i + 1);
if (d >= 0xDC00 && d <= 0xDFFF) {
if (debug > 0) {
log("Unsafe: " + c);
}
c2b.convert((char) d);
i++;
}
}
}
urlEncode(buf, bb.getBuffer(), bb.getStart(), bb.getLength(), toHexUpperCase);
bb.recycle();
}
}
}
/**
*/
public void urlEncode(Writer buf, byte bytes[], int off, int len) throws IOException {
urlEncode(buf, bytes, off, len, false);
}
/**
*/
public void urlEncode(Writer buf, byte bytes[], int off, int len, boolean toHexUpperCase) throws IOException {
for (int j = off; j < len; j++) {
buf.write('%');
char ch = Character.forDigit(bytes[j] >> 4 & 0xF, 16);
if (toHexUpperCase) {
ch = Character.toUpperCase(ch);
}
if (debug > 0) {
log("Encode: " + ch);
}
buf.write(ch);
ch = Character.forDigit(bytes[j] & 0xF, 16);
if (toHexUpperCase) {
ch = Character.toUpperCase(ch);
}
if (debug > 0) {
log("Encode: " + ch);
}
buf.write(ch);
}
}
Utility funtion to re-encode the URL. Still has problems with charset, since UEncoder mostly ignores it.
Params: - url –
/**
* Utility funtion to re-encode the URL. Still has problems with charset, since UEncoder mostly ignores it.
*
* @param url
*/
public String encodeURL(String url) {
return encodeURL(url, false);
}
Utility function to re-encode the URL. Still has problems with charset, since UEncoder mostly ignores it.
Params: - uri – the URI to encode.
- toHexUpperCase – the hex string will be in upper case
/**
* Utility function to re-encode the URL. Still has problems with charset, since UEncoder mostly ignores it.
*
* @param uri the URI to encode.
* @param toHexUpperCase the hex string will be in upper case
*/
public String encodeURL(String uri, boolean toHexUpperCase) {
String outUri = null;
try {
// XXX optimize - recycle, etc
CharArrayWriter out = new CharArrayWriter();
urlEncode(out, uri, toHexUpperCase);
outUri = out.toString();
} catch (IOException ignore) {
}
return outUri;
}
// -------------------- Internal implementation --------------------
private static void initSafeChars() {
int i;
for (i = 'a'; i <= 'z'; i++) {
initialSafeChars.set(i);
}
for (i = 'A'; i <= 'Z'; i++) {
initialSafeChars.set(i);
}
for (i = '0'; i <= '9'; i++) {
initialSafeChars.set(i);
}
// safe
initialSafeChars.set('$');
initialSafeChars.set('-');
initialSafeChars.set('_');
initialSafeChars.set('.');
// Dangerous: someone may treat this as " "
// RFC1738 does allow it, it's not reserved
// initialSafeChars.set('+');
// extra
initialSafeChars.set('!');
initialSafeChars.set('*');
initialSafeChars.set('\'');
initialSafeChars.set('(');
initialSafeChars.set(')');
initialSafeChars.set(',');
}
private static void log(String s) {
if (logger.isLoggable(Level.FINE)) {
logger.fine(s);
}
}
}