-
Notifications
You must be signed in to change notification settings - Fork 56
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
test: add DocumentInputStreamTest test case
- Loading branch information
Showing
7 changed files
with
177 additions
and
7 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -33,6 +33,7 @@ jobs: | |
revert | ||
perf | ||
style | ||
test | ||
scopes: | | ||
core | ||
deps | ||
|
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
163 changes: 163 additions & 0 deletions
163
...tests/src/main/java/org/eclipse/tm4e/ui/tests/internal/utils/DocumentInputStreamTest.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,163 @@ | ||
/******************************************************************************* | ||
* Copyright (c) 2024 Sebastian Thomschke and others. | ||
* This program and the accompanying materials are made | ||
* available under the terms of the Eclipse Public License 2.0 | ||
* which is available at https://www.eclipse.org/legal/epl-2.0/ | ||
* | ||
* SPDX-License-Identifier: EPL-2.0 | ||
* | ||
* Contributors: | ||
* Sebastian Thomschke - initial implementation | ||
*******************************************************************************/ | ||
package org.eclipse.tm4e.ui.tests.internal.utils; | ||
|
||
import static java.nio.charset.StandardCharsets.UTF_8; | ||
import static org.junit.Assert.*; | ||
|
||
import java.io.ByteArrayInputStream; | ||
import java.io.IOException; | ||
import java.util.ArrayList; | ||
|
||
import org.eclipse.core.resources.IFile; | ||
import org.eclipse.core.resources.IProject; | ||
import org.eclipse.core.resources.ResourcesPlugin; | ||
import org.eclipse.core.runtime.CoreException; | ||
import org.eclipse.jface.text.IDocument; | ||
import org.eclipse.tm4e.ui.internal.utils.DocumentInputStream; | ||
import org.eclipse.ui.editors.text.FileDocumentProvider; | ||
import org.eclipse.ui.part.FileEditorInput; | ||
import org.eclipse.ui.texteditor.IDocumentProvider; | ||
import org.junit.Before; | ||
import org.junit.Test; | ||
|
||
class DocumentInputStreamTest { | ||
|
||
private static final String TEST_ASCII = "Hello, World!"; | ||
|
||
private static final String EMOJI = "😊"; | ||
private static final int EMOJI_BYTES_LEN = EMOJI.getBytes(UTF_8).length; | ||
private static final String JAPANESE = "こんにちは"; | ||
private static final String TEST_UNICODE = EMOJI + JAPANESE; | ||
private static final int TEST_UNICODE_BYTES_LEN = TEST_UNICODE.getBytes(UTF_8).length; | ||
|
||
private final IDocumentProvider documentProvider = new FileDocumentProvider(); | ||
private IDocument document; | ||
|
||
@Before | ||
public void setUp() throws CoreException { | ||
final IProject p = ResourcesPlugin.getWorkspace().getRoot().getProject(getClass().getName() + System.currentTimeMillis()); | ||
p.create(null); | ||
p.open(null); | ||
|
||
IFile testFile = p.getFile("testfile"); | ||
testFile.create(new ByteArrayInputStream(TEST_UNICODE.getBytes()), true, null); | ||
final var editorInput = new FileEditorInput(testFile); | ||
documentProvider.connect(editorInput); | ||
document = documentProvider.getDocument(editorInput); | ||
} | ||
|
||
@Test | ||
public void testAvailable() throws IOException { | ||
document.set(TEST_ASCII); | ||
try (var is = new DocumentInputStream(document)) { | ||
assertEquals(UTF_8, is.getCharset()); | ||
assertEquals(TEST_ASCII.length(), is.available()); | ||
final byte[] buffer = new byte[4]; | ||
is.read(buffer); | ||
assertEquals(TEST_ASCII.length() - 4, is.available()); | ||
is.readAllBytes(); | ||
assertEquals(0, is.available()); | ||
} | ||
|
||
document.set(TEST_UNICODE); | ||
try (var is = new DocumentInputStream(document)) { | ||
assertEquals(UTF_8, is.getCharset()); | ||
assertTrue(is.available() > 0); | ||
is.read(new byte[10]); | ||
assertTrue(is.available() > 0); | ||
is.readAllBytes(); | ||
assertEquals(0, is.available()); | ||
} | ||
} | ||
|
||
@Test | ||
public void testEndOfStream() throws IOException { | ||
try (var is = new DocumentInputStream(document)) { | ||
assertEquals(UTF_8, is.getCharset()); | ||
is.skip(Long.MAX_VALUE); | ||
assertEquals(-1, is.read()); | ||
} | ||
} | ||
|
||
@Test | ||
public void testReadEachByte() throws IOException { | ||
try (var is = new DocumentInputStream(document)) { | ||
assertEquals(UTF_8, is.getCharset()); | ||
final var bytesRead = new ArrayList<Byte>(); | ||
int b; | ||
while ((b = is.read()) != -1) { | ||
bytesRead.add((byte) b); | ||
} | ||
|
||
final byte[] byteArray = new byte[bytesRead.size()]; | ||
for (int i = 0; i < bytesRead.size(); i++) { | ||
byteArray[i] = bytesRead.get(i); | ||
} | ||
assertEquals(TEST_UNICODE, new String(byteArray, UTF_8)); | ||
} | ||
} | ||
|
||
@Test | ||
public void testReadIntoByteArray() throws IOException { | ||
final byte[] buffer = new byte[1024]; // Buffer to read a portion of the text | ||
|
||
try (var is = new DocumentInputStream(document)) { | ||
assertEquals(UTF_8, is.getCharset()); | ||
final int bytesRead = is.read(buffer, 0, buffer.length); | ||
|
||
assertEquals(TEST_UNICODE, new String(buffer, 0, bytesRead, UTF_8)); | ||
} | ||
} | ||
|
||
@Test | ||
public void testSkip() throws IOException { | ||
try (var is = new DocumentInputStream(document)) { | ||
assertEquals(UTF_8, is.getCharset()); | ||
// skip emoji | ||
final long skipped = is.skip(EMOJI_BYTES_LEN); | ||
assertEquals(EMOJI_BYTES_LEN, skipped); | ||
|
||
final byte[] japanese = new byte[TEST_UNICODE_BYTES_LEN]; | ||
final int bytesRead = is.read(japanese); | ||
|
||
assertEquals(JAPANESE, new String(japanese, 0, bytesRead, UTF_8)); | ||
} | ||
} | ||
|
||
@Test | ||
public void testHighSurrogateAtEndOfInput() throws IOException { | ||
document.set(new String(new char[] { 'A', '\uD800' })); // valid char followed by an isolated high surrogate | ||
try (var is = new DocumentInputStream(document)) { | ||
assertEquals(UTF_8, is.getCharset()); | ||
final byte[] result = is.readAllBytes(); | ||
final String output = new String(result, UTF_8); | ||
|
||
// the high surrogate at the end should be replaced by the | ||
// Unicode replacement char | ||
assertEquals("A\uFFFD", output); | ||
} | ||
} | ||
|
||
@Test | ||
public void testHighSurrogateWithoutLowSurrogate() throws IOException { | ||
document.set(new String(new char[] { '\uD800', 'A' })); // \uD800 is a high surrogate, followed by 'A' | ||
try (var is = new DocumentInputStream(document)) { | ||
assertEquals(UTF_8, is.getCharset()); | ||
final byte[] result = is.readAllBytes(); | ||
final String output = new String(result, UTF_8); | ||
|
||
// the invalid surrogate pair should be replaced by the Unicode replacement char | ||
assertEquals("\uFFFD" + "A", output); | ||
} | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters