TestPercentCodec.java
/*
* ====================================================================
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
* ====================================================================
*
* This software consists of voluntary contributions made by many
* individuals on behalf of the Apache Software Foundation. For more
* information on the Apache Software Foundation, please see
* <http://www.apache.org/>.
*
*/
package org.apache.hc.core5.net;
import static org.junit.jupiter.api.Assertions.assertEquals;
import java.nio.charset.StandardCharsets;
import java.util.stream.Stream;
import org.junit.jupiter.api.Test;
import org.junit.jupiter.params.ParameterizedTest;
import org.junit.jupiter.params.provider.MethodSource;
/**
* Unit tests for {@link PercentCodec}.
*/
class TestPercentCodec {
@Test
void testCoding() {
final StringBuilder buf = new StringBuilder();
PercentCodec.encode(buf, "blah!", StandardCharsets.UTF_8);
PercentCodec.encode(buf, " ~ ", StandardCharsets.UTF_8);
PercentCodec.encode(buf, "huh?", StandardCharsets.UTF_8);
assertEquals("blah%21%20~%20huh%3F", buf.toString());
}
@Test
void testDecoding() {
assertEquals("blah! ~ huh?", PercentCodec.decode("blah%21%20~%20huh%3F", StandardCharsets.UTF_8));
assertEquals("blah!+~ huh?", PercentCodec.decode("blah%21+~%20huh%3F", StandardCharsets.UTF_8));
assertEquals("blah! ~ huh?", PercentCodec.decode("blah%21+~%20huh%3F", StandardCharsets.UTF_8, true));
}
@Test
void testDecodingPartialContent() {
assertEquals("blah! %", PercentCodec.decode("blah%21%20%", StandardCharsets.UTF_8));
assertEquals("blah! %a", PercentCodec.decode("blah%21%20%a", StandardCharsets.UTF_8));
assertEquals("blah! %wa", PercentCodec.decode("blah%21%20%wa", StandardCharsets.UTF_8));
}
@ParameterizedTest
@MethodSource("params")
void testRfc5987EncodingDecoding(final String input, final String expected) {
assertEquals(expected, PercentCodec.RFC5987.encode(input));
assertEquals(input, PercentCodec.RFC5987.decode(expected));
}
static Stream<Object[]> params() {
return Stream.of(
new Object[]{"foo-��-���.html", "foo-%C3%A4-%E2%82%AC.html"},
new Object[]{"��������������������� 2.jpg", "%E4%B8%96%E7%95%8C%E3%83%BC%E3%83%95%E3%82%A1%E3%82%A4%E3%83%AB%202.jpg"},
new Object[]{"foo.jpg", "foo.jpg"},
new Object[]{"simple", "simple"}, // Unreserved characters
new Object[]{"reserved/chars?", "reserved%2Fchars%3F"}, // Reserved characters
new Object[]{"", ""}, // Empty string
new Object[]{"space test", "space%20test"}, // String with space
new Object[]{"��mlaut", "%C3%BCmlaut"} // Non-ASCII characters
);
}
@Test
void verifyRfc5987EncodingandDecoding() {
final String s = "!\"$��%^&*()_-+={[}]:@~;'#,./<>?\\|���������������";
assertEquals(s, PercentCodec.RFC5987.decode(PercentCodec.RFC5987.encode(s)));
}
@Test
void testRfc7639CanonicalAlpnTokenEncoding() {
// RFC 7639 requires protocol-id to be a token and applies additional canonical constraints:
// - Octets not allowed in tokens MUST be percent-encoded (RFC 3986).
// - '%' MUST be percent-encoded.
// - Octets that are valid token characters MUST NOT be percent-encoded (except '%').
// - Uppercase hex digits MUST be used.
assertEquals("h2", PercentCodec.HTTP_TOKEN.encode("h2"));
assertEquals("http%2F1.1", PercentCodec.HTTP_TOKEN.encode("http/1.1"));
assertEquals("%25", PercentCodec.HTTP_TOKEN.encode("%"));
assertEquals("foo+bar", PercentCodec.HTTP_TOKEN.encode("foo+bar"));
assertEquals("!#$&'*+-.^_`|~", PercentCodec.HTTP_TOKEN.encode("!#$&'*+-.^_`|~"));
assertEquals("foo bar", PercentCodec.HTTP_TOKEN.decode("foo%20bar"));
assertEquals("ws/��", PercentCodec.HTTP_TOKEN.decode("ws%2F%C3%A9"));
}
@Test
void testPercentCodecEncodeIsNotRfc7639Canonical() {
// PercentCodec.encode(..) uses RFC 3986 UNRESERVED as the safe set.
// This percent-encodes valid RFC 7230 tchar like '+', '*', '!', '|', which RFC 7639 forbids.
assertEquals("foo%2Bbar", PercentCodec.encode("foo+bar", StandardCharsets.UTF_8));
assertEquals("%2A", PercentCodec.encode("*", StandardCharsets.UTF_8));
assertEquals("%21", PercentCodec.encode("!", StandardCharsets.UTF_8));
assertEquals("%7C", PercentCodec.encode("|", StandardCharsets.UTF_8));
}
}