MalformedInputException test functions are added

This commit is contained in:
Afshin 2019-09-29 18:30:31 +02:00
parent e8f83431b3
commit 230b2db438
2 changed files with 70 additions and 5 deletions

View File

@ -1,10 +1,9 @@
package com.baeldung.encoding;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.io.UnsupportedEncodingException;
import java.io.*;
import java.nio.charset.Charset;
import java.nio.charset.CharsetDecoder;
import java.nio.charset.CodingErrorAction;
public class CharacterEncodingExamples {
@ -29,4 +28,15 @@ public class CharacterEncodingExamples {
}
return buffer.toString();
}
/**
 * Encodes {@code input} as UTF-8 bytes, decodes those bytes with {@code charset},
 * and returns the first decoded line.
 *
 * @param input             the text to encode and then decode
 * @param charset           the charset whose decoder is used to read the bytes back
 * @param codingErrorAction how the decoder reacts to malformed input
 *                          (for example {@code IGNORE}, {@code REPLACE} or {@code REPORT})
 * @return the first line of the decoded text, or {@code null} if there is nothing to read
 * @throws IOException if reading fails; with {@code CodingErrorAction.REPORT} a byte sequence
 *                     that is malformed for {@code charset} surfaces as an {@code IOException}
 *                     subtype raised by the decoder
 */
static String decodeText(String input, Charset charset, CodingErrorAction codingErrorAction) throws IOException {
    CharsetDecoder charsetDecoder = charset.newDecoder();
    charsetDecoder.onMalformedInput(codingErrorAction);

    // Encode explicitly as UTF-8: the no-arg getBytes() uses the platform default charset,
    // which would make the result depend on the machine the code runs on.
    byte[] utf8Bytes = input.getBytes(java.nio.charset.StandardCharsets.UTF_8);

    // try-with-resources closes the whole reader chain even when decoding fails.
    try (BufferedReader reader = new BufferedReader(
            new InputStreamReader(new ByteArrayInputStream(utf8Bytes), charsetDecoder))) {
        return reader.readLine();
    }
}
}

View File

@ -1,9 +1,21 @@
package com.baeldung.encoding;
import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.io.Reader;
import java.nio.charset.*;
import java.nio.file.Path;
import java.nio.file.Paths;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import org.junit.Assert;
import org.junit.Test;
import org.junit.jupiter.api.Assertions;
import static java.nio.file.Files.newInputStream;
public class CharacterEncodingExamplesUnitTest {
@ -58,4 +70,47 @@ public class CharacterEncodingExamplesUnitTest {
"0 0 10001010 10011110 ");
}
/**
 * Decoding the text with US-ASCII and {@code CodingErrorAction.REPLACE} is expected to
 * substitute U+FFFD for each of the two bytes that encode 'ç' in UTF-8.
 */
@Test
public void givenUTF8String_decodeByUS_ASCII_ReplaceMalformedInputSequence() throws IOException {
    String input = "The façade pattern is a software design pattern.";
    // Unicode escapes keep the expected replacement characters intact regardless of
    // how this source file is stored or transcoded.
    String expected = "The fa\uFFFD\uFFFDade pattern is a software design pattern.";

    String decoded = CharacterEncodingExamples.decodeText(input, StandardCharsets.US_ASCII, CodingErrorAction.REPLACE);

    // JUnit convention: expected value first, actual value second.
    Assertions.assertEquals(expected, decoded);
}
/**
 * Decoding the text with US-ASCII and {@code CodingErrorAction.IGNORE} is expected to
 * drop the bytes of 'ç' silently, leaving "faade".
 */
@Test
public void givenUTF8String_decodeByUS_ASCII_IgnoreMalformedInputSequence() throws IOException {
    String input = "The façade pattern is a software design pattern.";
    String expected = "The faade pattern is a software design pattern.";

    String decoded = CharacterEncodingExamples.decodeText(input, StandardCharsets.US_ASCII, CodingErrorAction.IGNORE);

    // JUnit convention: expected value first, actual value second.
    Assertions.assertEquals(expected, decoded);
}
/**
 * Decoding the text with US-ASCII and {@code CodingErrorAction.REPORT} is expected to
 * fail with a {@link MalformedInputException}.
 */
@Test
public void givenUTF8String_decodeByUS_ASCII_ReportMalformedInputSequence() {
    final String utf8Text = "The façade pattern is a software design pattern.";

    Assertions.assertThrows(MalformedInputException.class, () -> {
        CharacterEncodingExamples.decodeText(utf8Text, StandardCharsets.US_ASCII, CodingErrorAction.REPORT);
    });
}
/**
 * Reads the sample file once per candidate charset with a decoder set to report malformed
 * input, and keeps the charsets that read the whole file without a
 * {@link MalformedInputException}.
 *
 * @throws IOException if the file cannot be opened or read for a reason other than
 *                     malformed input, so an I/O problem fails the test with its real cause
 */
@Test
public void givenTextFile_FindSuitableCandidateEncodings() throws IOException {
    Path path = Paths.get("src/test/resources/encoding.txt");
    List<Charset> allCandidateCharSets = Arrays.asList(StandardCharsets.US_ASCII, StandardCharsets.UTF_8, StandardCharsets.ISO_8859_1);
    List<Charset> suitableCharsets = new ArrayList<>();

    for (Charset charset : allCandidateCharSets) {
        CharsetDecoder charsetDecoder = charset.newDecoder().onMalformedInput(CodingErrorAction.REPORT);
        // try-with-resources releases the file handle for every candidate,
        // including the ones rejected by the decoder.
        try (Reader reader = new InputStreamReader(newInputStream(path), charsetDecoder);
             BufferedReader bufferedReader = new BufferedReader(reader)) {
            while (bufferedReader.readLine() != null) {
                // Drain the file; only whether decoding succeeds matters here.
            }
            suitableCharsets.add(charset);
        } catch (MalformedInputException ignored) {
            // This charset cannot decode the file, so it is not a candidate.
        }
    }

    // JUnit convention: expected value first, actual value second.
    Assertions.assertEquals(Arrays.asList(StandardCharsets.UTF_8, StandardCharsets.ISO_8859_1), suitableCharsets);
}
}