diff --git a/src/main/resources/us_uk/stemmer b/src/main/resources/us_uk/stemmer
index 598b93b..ed2fd32 100644
--- a/src/main/resources/us_uk/stemmer
+++ b/src/main/resources/us_uk/stemmer
@@ -9523,7 +9523,7 @@ piddle   piddles piddling piddled
 pidgin   pidgins
 pie   pies
 piece   pieces piecing pieced
-pied-à-terre   pieds-à-terre
+pied-a-terre   pieds-a-terre
 pier   piers
 pierce   pierces piercing pierced
 pierrot   pierrots
diff --git a/src/test/java/org/egothor/stemmer/CompileIntegrationTest.java b/src/test/java/org/egothor/stemmer/CompileIntegrationTest.java
new file mode 100644
index 0000000..2dd68bc
--- /dev/null
+++ b/src/test/java/org/egothor/stemmer/CompileIntegrationTest.java
@@ -0,0 +1,518 @@
+package org.egothor.stemmer;
+
+import static org.junit.jupiter.api.Assertions.assertAll;
+import static org.junit.jupiter.api.Assertions.assertEquals;
+import static org.junit.jupiter.api.Assertions.assertFalse;
+import static org.junit.jupiter.api.Assertions.assertNotNull;
+import static org.junit.jupiter.api.Assertions.assertTrue;
+
+import java.io.BufferedReader;
+import java.io.ByteArrayOutputStream;
+import java.io.IOException;
+import java.io.InputStream;
+import java.io.InputStreamReader;
+import java.io.PrintStream;
+import java.nio.charset.Charset;
+import java.nio.charset.StandardCharsets;
+import java.nio.file.Files;
+import java.nio.file.Path;
+import java.util.LinkedHashMap;
+import java.util.LinkedHashSet;
+import java.util.Map;
+import java.util.Set;
+import java.util.stream.Stream;
+
+import org.junit.jupiter.api.DisplayName;
+import org.junit.jupiter.api.Nested;
+import org.junit.jupiter.api.Tag;
+import org.junit.jupiter.api.Test;
+import org.junit.jupiter.api.TestInstance;
+import org.junit.jupiter.api.io.TempDir;
+import org.junit.jupiter.params.ParameterizedTest;
+import org.junit.jupiter.params.provider.Arguments;
+import org.junit.jupiter.params.provider.MethodSource;
+
+/**
+ * Integration tests for the {@link Compile} CLI.
+ *
+ * <p>
+ * This suite validates the command end to end through real filesystem-based
+ * execution:
+ * </p>
+ *
+ * <ol>
+ * <li>copying a source dictionary resource to a temporary input file</li>
+ * <li>running the CLI against that input file</li>
+ * <li>writing a GZip-compressed binary artifact</li>
+ * <li>reloading the artifact through {@link StemmerPatchTrieBinaryIO}</li>
+ * <li>verifying representative stemming behavior</li>
+ * </ol>
+ *
+ * <p>
+ * The suite intentionally has two layers:
+ * </p>
+ *
+ * <ul>
+ * <li>a focused fixture dictionary that validates remarks, UTF-8, nested output
+ * paths, and {@code --store-original}</li>
+ * <li>real bundled project dictionaries that validate multidictionary CLI
+ * compilation against shipped resources</li>
+ * </ul>
+ */
+@Tag("integration")
+@Tag("cli")
+@Tag("stemmer")
+@TestInstance(TestInstance.Lifecycle.PER_CLASS)
+@DisplayName("Compile integration")
+final class CompileIntegrationTest {
+
+    /**
+     * Dedicated fixture dictionary used for deterministic parser-oriented CLI
+     * integration checks.
+     */
+    private static final String REMARK_AWARE_DICTIONARY_RESOURCE = "org/egothor/stemmer/compile/remark-aware-dictionary.txt";
+
+    /**
+     * Reduction mode used by integration scenarios.
+     */
+    private static final ReductionMode DEFAULT_REDUCTION_MODE = ReductionMode.MERGE_SUBTREES_WITH_EQUIVALENT_RANKED_GET_ALL_RESULTS;
+
+    /**
+     * Reader charset used for robust extraction of ASCII-safe representative probes
+     * from bundled project dictionaries.
+     *
+     * <p>
+     * ISO-8859-1 is intentionally used here as a byte-preserving single-byte
+     * decoder so that the test can safely scan heterogeneous dictionary resources
+     * and then select only ASCII-safe representative terms for semantic assertions.
+     * </p>
+     */
+    private static final Charset BUNDLED_PROBE_SCAN_CHARSET = StandardCharsets.ISO_8859_1;
+
+    /**
+     * Maximum number of representative bundled variants asserted per dictionary.
+     */
+    private static final int REPRESENTATIVE_VARIANT_LIMIT = 32;
+
+    /**
+     * Temporary directory used for filesystem-based command execution.
+     */
+    @TempDir
+    private Path tempDir;
+
+    /**
+     * Provides bundled project dictionary scenarios.
+     *
+     * @return parameter stream
+     */
+    static Stream<Arguments> bundledDictionaryCases() {
+        return Stream.of(Arguments.of("da_dk", "da_dk/stemmer"), Arguments.of("de_de", "de_de/stemmer"),
+                Arguments.of("es_es", "es_es/stemmer"), Arguments.of("fr_fr", "fr_fr/stemmer"),
+                Arguments.of("it_it", "it_it/stemmer"), Arguments.of("nl_nl", "nl_nl/stemmer"),
+                Arguments.of("no_no", "no_no/stemmer"), Arguments.of("pt_pt", "pt_pt/stemmer"),
+                Arguments.of("ru_ru", "ru_ru/stemmer"), Arguments.of("sv_se", "sv_se/stemmer"),
+                Arguments.of("us_uk", "us_uk/stemmer"), Arguments.of("us_uk.profi", "us_uk.profi/stemmer"));
+    }
+
+    @Nested
+    @DisplayName("Remark-aware fixture workflow")
+    final class RemarkAwareFixtureWorkflow {
+
+        /**
+         * Verifies that the CLI can compile the dedicated remark-aware test dictionary,
+         * create nested output directories, preserve expected lookup behavior, and
+         * store canonical stems when {@code --store-original} is enabled.
+         *
+         * @throws IOException if reading or writing fails
+         */
+        @Test
+        @DisplayName("CLI should compile the remark-aware fixture and preserve expected lookups")
+        void shouldCompileRemarkAwareFixtureAndPreserveExpectedLookups() throws IOException {
+            final Path inputFile = copyResourceToTemporaryFile(REMARK_AWARE_DICTIONARY_RESOURCE,
+                    "remark-aware-dictionary.txt");
+            final Path outputFile = tempDir.resolve("fixture").resolve("nested").resolve("fixture.dat.gz");
+
+            final CommandResult result = runWithCapturedStandardError("--input", inputFile.toString(), "--output",
+                    outputFile.toString(), "--reduction-mode", DEFAULT_REDUCTION_MODE.name(), "--store-original");
+
+            assertEquals(0, result.exitCode(), "Fixture compilation must succeed. stderr:\n" + result.standardError());
+            assertTrue(Files.exists(outputFile), "The CLI must create the nested output artifact.");
+            assertTrue(Files.isDirectory(outputFile.getParent()), "The CLI must create missing parent directories.");
+            assertTrue(Files.size(outputFile) > 0L, "The compiled output artifact must not be empty.");
+            assertGzipCompressed(outputFile);
+
+            final FrequencyTrie<String> trie = StemmerPatchTrieBinaryIO.read(outputFile);
+
+            assertVariantResolvesToExpectedStem(trie, "running", Set.of("run"));
+            assertVariantResolvesToExpectedStem(trie, "walked", Set.of("walk"));
+            assertVariantResolvesToExpectedStem(trie, "cities", Set.of("city"));
+            assertVariantResolvesToExpectedStem(trie, "cafÃ©s", Set.of("cafÃ©"));
+            assertVariantResolvesToExpectedStem(trie, "played", Set.of("play"));
+
+            assertAll(
+                    () -> assertEquals(PatchCommandEncoder.NOOP_PATCH, trie.get("run"),
+                            "Stored canonical stem 'run' must resolve through the no-op patch."),
+                    () -> assertEquals(PatchCommandEncoder.NOOP_PATCH, trie.get("walk"),
+                            "Stored canonical stem 'walk' must resolve through the no-op patch."),
+                    () -> assertEquals(PatchCommandEncoder.NOOP_PATCH, trie.get("city"),
+                            "Stored canonical stem 'city' must resolve through the no-op patch."),
+                    () -> assertEquals(PatchCommandEncoder.NOOP_PATCH, trie.get("cafÃ©"),
+                            "Stored canonical stem 'cafÃ©' must resolve through the no-op patch."),
+                    () -> assertEquals("run", PatchCommandEncoder.apply("run", trie.get("run")),
+                            "Stored canonical stem 'run' must reconstruct to itself."),
+                    () -> assertEquals("cafÃ©", PatchCommandEncoder.apply("cafÃ©", trie.get("cafÃ©")),
+                            "Stored canonical stem 'cafÃ©' must reconstruct to itself."));
+        }
+
+        /**
+         * Verifies that the CLI rejects an already existing output path unless
+         * overwrite is explicitly enabled.
+         *
+         * @throws IOException if reading or writing fails
+         */
+        @Test
+        @DisplayName("CLI should require overwrite before replacing an existing output artifact")
+        void shouldRequireOverwriteForExistingOutput() throws IOException {
+            final Path inputFile = copyResourceToTemporaryFile(REMARK_AWARE_DICTIONARY_RESOURCE,
+                    "remark-aware-dictionary-overwrite.txt");
+            final Path outputFile = tempDir.resolve("fixture").resolve("overwrite").resolve("fixture.dat.gz");
+
+            final CommandResult firstRun = runWithCapturedStandardError("--input", inputFile.toString(), "--output",
+                    outputFile.toString(), "--reduction-mode", DEFAULT_REDUCTION_MODE.name());
+
+            assertEquals(0, firstRun.exitCode(),
+                    "Initial fixture compilation must succeed. stderr:\n" + firstRun.standardError());
+            assertTrue(Files.exists(outputFile), "The initial compilation must create the output artifact.");
+            assertTrue(Files.size(outputFile) > 0L, "The initial output artifact must not be empty.");
+
+            final CommandResult secondRunWithoutOverwrite = runWithCapturedStandardError("--input",
+                    inputFile.toString(), "--output", outputFile.toString(), "--reduction-mode",
+                    DEFAULT_REDUCTION_MODE.name());
+
+            assertEquals(1, secondRunWithoutOverwrite.exitCode(),
+                    "Compilation without overwrite must fail when the output file already exists.");
+            assertFalse(secondRunWithoutOverwrite.standardError().isBlank(),
+                    "The CLI must report a meaningful error when overwrite is not enabled.");
+
+            final CommandResult thirdRunWithOverwrite = runWithCapturedStandardError("--input", inputFile.toString(),
+                    "--output", outputFile.toString(), "--reduction-mode", DEFAULT_REDUCTION_MODE.name(),
+                    "--overwrite");
+
+            assertEquals(0, thirdRunWithOverwrite.exitCode(),
+                    "Compilation with overwrite must succeed. stderr:\n" + thirdRunWithOverwrite.standardError());
+            assertTrue(Files.exists(outputFile), "Overwrite compilation must preserve the output artifact.");
+            assertTrue(Files.size(outputFile) > 0L, "Overwrite compilation must produce a non-empty artifact.");
+            assertGzipCompressed(outputFile);
+
+            final FrequencyTrie<String> trie = StemmerPatchTrieBinaryIO.read(outputFile);
+            assertVariantResolvesToExpectedStem(trie, "running", Set.of("run"));
+            assertVariantResolvesToExpectedStem(trie, "walked", Set.of("walk"));
+        }
+
+        /**
+         * Verifies one representative fixture word end to end.
+         *
+         * @param trie          compiled and reloaded trie
+         * @param word          probe word
+         * @param expectedStems acceptable expected stems
+         */
+        private void assertVariantResolvesToExpectedStem(final FrequencyTrie<String> trie, final String word,
+                final Set<String> expectedStems) {
+            final String preferredPatch = trie.get(word);
+            final Set<String> actualStems = reconstructAllStemCandidates(trie, word);
+
+            assertAll(
+                    () -> assertNotNull(preferredPatch,
+                            "A preferred patch must be available for fixture word '" + word + "'."),
+                    () -> assertEquals(expectedStems, actualStems,
+                            "Fixture word '" + word + "' must preserve all expected stem candidates."),
+                    () -> assertTrue(expectedStems.contains(PatchCommandEncoder.apply(word, preferredPatch)),
+                            "The preferred stem must be one of the acceptable stems for fixture word '" + word + "'."));
+        }
+    }
+
+    @Nested
+    @DisplayName("Bundled project dictionary workflows")
+    final class BundledProjectDictionaryWorkflows {
+
+        /**
+         * Verifies that the CLI can compile each bundled project dictionary, create a
+         * compressed artifact, reload it, and preserve representative variant lookup
+         * behavior derived from the source dictionary itself.
+         *
+         * <p>
+         * The representative assertions intentionally target only variant terms, not
+         * canonical stems, because direct lookup of the canonical stem is not part of
+         * the default non-{@code --store-original} contract.
+         * </p>
+         *
+         * @param scenario     scenario identifier
+         * @param resourcePath bundled dictionary resource path
+         * @throws IOException if reading or writing fails
+         */
+        @ParameterizedTest(name = "[{index}] {0}")
+        @MethodSource("org.egothor.stemmer.CompileIntegrationTest#bundledDictionaryCases")
+        @DisplayName("CLI should compile bundled project dictionaries and preserve representative variant semantics")
+        void shouldCompileBundledProjectDictionaryAndPreserveRepresentativeVariantSemantics(final String scenario,
+                final String resourcePath) throws IOException {
+            final Path inputFile = copyResourceToTemporaryFile(resourcePath, scenario + "-stemmer.txt");
+            final Path outputFile = tempDir.resolve("bundled").resolve(scenario).resolve("compiled.dat.gz");
+
+            final CommandResult result = runWithCapturedStandardError("--input", inputFile.toString(), "--output",
+                    outputFile.toString(), "--reduction-mode", DEFAULT_REDUCTION_MODE.name());
+
+            assertEquals(0, result.exitCode(), "Bundled dictionary compilation must succeed for " + scenario
+                    + ". stderr:\n" + result.standardError());
+            assertTrue(Files.exists(outputFile), "The CLI must create the output artifact for " + scenario + '.');
+            assertTrue(Files.size(outputFile) > 0L, "The output artifact must not be empty for " + scenario + '.');
+            assertGzipCompressed(outputFile);
+
+            final FrequencyTrie<String> trie = StemmerPatchTrieBinaryIO.read(outputFile);
+            final Map<String, Set<String>> representativeStemsByVariant = readRepresentativeVariantExpectations(
+                    resourcePath, REPRESENTATIVE_VARIANT_LIMIT);
+
+            assertFalse(representativeStemsByVariant.isEmpty(),
+                    "The bundled dictionary must provide at least one representative variant for " + scenario + '.');
+
+            for (Map.Entry<String, Set<String>> entry : representativeStemsByVariant.entrySet()) {
+                final String variant = entry.getKey();
+                final Set<String> expectedStems = entry.getValue();
+                final String preferredPatch = trie.get(variant);
+                final Set<String> actualStems = reconstructAllStemCandidates(trie, variant);
+
+                assertAll(
+                        () -> assertNotNull(preferredPatch,
+                                "A preferred patch must be available for representative variant '" + variant + "' in "
+                                        + scenario + '.'),
+                        () -> assertFalse(actualStems.isEmpty(),
+                                "At least one stem candidate must be returned for representative variant '" + variant
+                                        + "' in " + scenario + '.'),
+                        () -> assertTrue(actualStems.containsAll(expectedStems),
+                                "All acceptable stems must be preserved for representative variant '" + variant
+                                        + "' in " + scenario + ". Expected=" + expectedStems + ", actual="
+                                        + actualStems),
+                        () -> assertTrue(expectedStems.contains(PatchCommandEncoder.apply(variant, preferredPatch)),
+                                "The preferred stem must be one of the acceptable stems for representative variant '"
+                                        + variant + "' in " + scenario + '.'));
+            }
+        }
+    }
+
+    /**
+     * Copies one classpath resource to a temporary file so that the CLI is
+     * exercised through its real file-based contract.
+     *
+     * @param resourcePath classpath resource path
+     * @param fileName     target temporary file name
+     * @return copied temporary file
+     * @throws IOException if the resource cannot be found or copied
+     */
+    private Path copyResourceToTemporaryFile(final String resourcePath, final String fileName) throws IOException {
+        final Path targetFile = tempDir.resolve(fileName);
+        final Path parentDirectory = targetFile.toAbsolutePath().getParent();
+
+        if (parentDirectory != null) {
+            Files.createDirectories(parentDirectory);
+        }
+
+        try (InputStream inputStream = openResource(resourcePath)) {
+            Files.copy(inputStream, targetFile);
+        }
+
+        return targetFile;
+    }
+
+    /**
+     * Opens one classpath resource.
+     *
+     * @param resourcePath classpath resource path
+     * @return opened input stream
+     * @throws IOException if the resource cannot be found
+     */
+    private static InputStream openResource(final String resourcePath) throws IOException {
+        final InputStream inputStream = CompileIntegrationTest.class.getClassLoader().getResourceAsStream(resourcePath);
+        if (inputStream == null) {
+            throw new IOException("Classpath resource not found: " + resourcePath);
+        }
+        return inputStream;
+    }
+
+    /**
+     * Reads representative variant expectations from a bundled project dictionary.
+     *
+     * <p>
+     * This helper scans the source dictionary in a byte-preserving single-byte
+     * charset and selects only ASCII-safe probe terms. That keeps the
+     * multidictionary integration assertions stable even when the bundled resources
+     * use heterogeneous encodings, while still validating the CLI against the real
+     * shipped dictionaries.
+     * </p>
+     *
+     * <p>
+     * The dictionary format is expected to be:
+     * </p>
+     *
+     * <pre>
+     * stem variant1 variant2 ...
+     * </pre>
+     *
+     * <p>
+     * Lines beginning with comment prefixes or blank lines are ignored. Canonical
+     * stems are intentionally excluded from the expectation map unless they also
+     * appear as distinct variants on a source line.
+     * </p>
+     *
+     * @param resourcePath bundled dictionary resource path
+     * @param limit        maximum number of representative variants to collect
+     * @return representative variants mapped to their acceptable stems
+     * @throws IOException if reading fails
+     */
+    private static Map<String, Set<String>> readRepresentativeVariantExpectations(final String resourcePath,
+            final int limit) throws IOException {
+        final Map<String, Set<String>> expectations = new LinkedHashMap<String, Set<String>>();
+
+        try (InputStream inputStream = openResource(resourcePath);
+                BufferedReader reader = new BufferedReader(
+                        new InputStreamReader(inputStream, BUNDLED_PROBE_SCAN_CHARSET))) {
+            for (String line = reader.readLine(); line != null; line = reader.readLine()) {
+                if (expectations.size() >= limit) {
+                    break;
+                }
+
+                final String trimmedLine = line.trim();
+                if (trimmedLine.isEmpty() || trimmedLine.startsWith("#") || trimmedLine.startsWith("//")) {
+                    continue;
+                }
+
+                final String[] tokens = trimmedLine.split("\\s+");
+                if (tokens.length < 2) {
+                    continue;
+                }
+
+                final String stem = tokens[0];
+                if (!isAsciiProbeToken(stem)) {
+                    continue;
+                }
+
+                for (int index = 1; index < tokens.length && expectations.size() < limit; index++) {
+                    final String variant = tokens[index];
+
+                    if (!isAsciiProbeToken(variant) || variant.equals(stem)) {
+                        continue;
+                    }
+
+                    registerExpectedStem(expectations, variant, stem);
+                }
+            }
+        }
+
+        return expectations;
+    }
+
+    /**
+     * Determines whether one token is suitable for stable ASCII-safe bundled
+     * multidictionary probing.
+     *
+     * @param token token to inspect
+     * @return {@code true} when the token is a non-empty lower-case ASCII letter
+     *         sequence
+     */
+    private static boolean isAsciiProbeToken(final String token) {
+        if (token == null || token.isEmpty()) {
+            return false;
+        }
+
+        for (int index = 0; index < token.length(); index++) {
+            final char character = token.charAt(index);
+            if (character < 'a' || character > 'z') {
+                return false;
+            }
+        }
+
+        return true;
+    }
+
+    /**
+     * Registers one acceptable stem for one input word.
+     *
+     * @param expectedStemsByWord expectation map
+     * @param word                input word
+     * @param stem                acceptable stem
+     */
+    private static void registerExpectedStem(final Map<String, Set<String>> expectedStemsByWord, final String word,
+            final String stem) {
+        Set<String> stems = expectedStemsByWord.get(word);
+        if (stems == null) {
+            stems = new LinkedHashSet<String>();
+            expectedStemsByWord.put(word, stems);
+        }
+        stems.add(stem);
+    }
+
+    /**
+     * Reconstructs all stem candidates returned by the trie for one input word.
+     *
+     * @param trie compiled trie
+     * @param word input word
+     * @return reconstructed stem candidates
+     */
+    private static Set<String> reconstructAllStemCandidates(final FrequencyTrie<String> trie, final String word) {
+        final String[] patchCommands = trie.getAll(word);
+        final Set<String> stems = new LinkedHashSet<String>();
+
+        if (patchCommands == null) {
+            return stems;
+        }
+
+        for (String patchCommand : patchCommands) {
+            stems.add(PatchCommandEncoder.apply(word, patchCommand));
+        }
+
+        return stems;
+    }
+
+    /**
+     * Verifies that one compiled artifact starts with the standard GZip magic
+     * header.
+     *
+     * @param artifactFile compiled artifact file
+     * @throws IOException if the file cannot be read
+     */
+    private static void assertGzipCompressed(final Path artifactFile) throws IOException {
+        final byte[] bytes = Files.readAllBytes(artifactFile);
+
+        assertTrue(bytes.length >= 2, "A GZip artifact must contain at least the two magic header bytes.");
+        assertEquals(0x1F, bytes[0] & 0xFF, "The first GZip magic byte must match.");
+        assertEquals(0x8B, bytes[1] & 0xFF, "The second GZip magic byte must match.");
+    }
+
+    /**
+     * Executes {@link Compile#run(String...)} while capturing {@code System.err}.
+     *
+     * @param arguments CLI arguments
+     * @return captured command result
+     */
+    private static CommandResult runWithCapturedStandardError(final String... arguments) {
+        final PrintStream originalStandardError = System.err;
+        final ByteArrayOutputStream capturedStandardError = new ByteArrayOutputStream();
+
+        try (PrintStream replacementStandardError = new PrintStream(capturedStandardError, true,
+                StandardCharsets.UTF_8)) {
+            System.setErr(replacementStandardError);
+            final int exitCode = Compile.run(arguments);
+            replacementStandardError.flush();
+            return new CommandResult(exitCode, capturedStandardError.toString(StandardCharsets.UTF_8));
+        } finally {
+            System.setErr(originalStandardError);
+        }
+    }
+
+    /**
+     * Captured CLI result.
+     *
+     * @param exitCode      process exit code
+     * @param standardError captured standard error
+     */
+    private record CommandResult(int exitCode, String standardError) {
+    }
+}
\ No newline at end of file
diff --git a/src/test/java/org/egothor/stemmer/CompileTest.java b/src/test/java/org/egothor/stemmer/CompileTest.java
index dd08426..a240776 100644
--- a/src/test/java/org/egothor/stemmer/CompileTest.java
+++ b/src/test/java/org/egothor/stemmer/CompileTest.java
@@ -37,7 +37,6 @@ import org.junit.jupiter.api.io.TempDir;
  * </p>
  */
 @Tag("unit")
-@Tag("cli")
 @DisplayName("Compile")
 class CompileTest {
 
diff --git a/src/test/resources/org/egothor/stemmer/compile/remark-aware-dictionary.txt b/src/test/resources/org/egothor/stemmer/compile/remark-aware-dictionary.txt
new file mode 100644
index 0000000..3a8a9a3
--- /dev/null
+++ b/src/test/resources/org/egothor/stemmer/compile/remark-aware-dictionary.txt
@@ -0,0 +1,8 @@
+# full-line remark
+// full-line slash remark
+
+run running runs runner // trailing remark
+walk walking walks walked
+city cities
+cafÃ© cafÃ©s
+play playing played # trailing remark
\ No newline at end of file