diff --git a/pyproject.toml b/pyproject.toml
index 9f7c870f..82d0b689 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "dolma"
-version = "1.0.10"
+version = "1.0.11"
 description = "Data filters"
 license = { text = "Apache-2.0" }
 readme = "README.md"
diff --git a/python/dolma/cli/__main__.py b/python/dolma/cli/__main__.py
index 3b4ea842..55f14f44 100644
--- a/python/dolma/cli/__main__.py
+++ b/python/dolma/cli/__main__.py
@@ -1,93 +1,4 @@
-import multiprocessing
-from argparse import ArgumentParser
-from pathlib import Path
-from typing import Any, Dict, List, Optional, Union
+from dolma.cli.main import main
 
-import smart_open
-from yaml import safe_load
-
-from ..core.paths import exists
-from .analyzer import AnalyzerCli
-from .deduper import DeduperCli
-from .mixer import MixerCli
-
-# must import these to register the resolvers
-from .resolvers import *  # noqa: F401,F403,W0401
-from .tagger import ListTaggerCli, TaggerCli
-from .tokenizer import TokenizerCli
-from .warc import WarcExtractorCli
-
-AVAILABLE_COMMANDS = {
-    "dedupe": DeduperCli,
-    "mix": MixerCli,
-    "tag": TaggerCli,
-    "list": ListTaggerCli,
-    "stat": AnalyzerCli,
-    "tokens": TokenizerCli,
-    "warc": WarcExtractorCli,
-    # following functionality is not yet implemented
-    # "train-ft": None,
-    # "train-lm": None,
-}
-
-
-def read_config(path: Union[None, str]) -> Dict[str, Any]:
-    """Read a configuration file if it exists"""
-    if path is None:
-        return {}
-
-    if not exists(path):
-        raise FileNotFoundError(f"Config file {path} does not exist")
-
-    with smart_open.open(path, mode="rt") as f:
-        return dict(safe_load(f))
-
-
-def main(argv: Optional[List[str]] = None):
-    """Main entry point for the CLI"""
-
-    try:
-        # attempting to set start method to spawn in case it is not set
-        multiprocessing.set_start_method("spawn")
-    except RuntimeError as ex:
-        # method already set, check if it is set to spawn
-        if multiprocessing.get_start_method() != "spawn":
-            raise RuntimeError("Multiprocessing start method must be set to spawn") from ex
-
-    parser = ArgumentParser(
-        prog="dolma",
-        usage="dolma {global options} [command] {command options}",
-        description="Command line interface for the Dolma processing toolkit",
-    )
-    parser.add_argument(
-        "-c",
-        "--config",
-        help="Path to configuration optional file",
-        type=Path,
-        default=None,
-    )
-
-    # Continue by adding subparsers and parsing the arguments
-    subparsers = parser.add_subparsers(dest="command")
-    subparsers.required = True
-    subparsers.choices = AVAILABLE_COMMANDS.keys()  # type: ignore
-    for command, cli in AVAILABLE_COMMANDS.items():
-        cli.make_parser(subparsers.add_parser(command, help=cli.DESCRIPTION))
-
-    # parse the arguments
-    args = parser.parse_args(argv)
-
-    # first, get the command and config path to run
-    command = args.__dict__.pop("command")
-    config_path = args.__dict__.pop("config", None) or None
-
-    # remove the other optional arguments from the top level parser
-    args.__dict__.pop("dolma_version", None)
-    args.__dict__.pop("dolma_commands", None)
-
-    # read the config file if one was provided
-    config = read_config(config_path)
-
-    # get the cli for the command and run it with the config we just loaded + the args
-    cli = AVAILABLE_COMMANDS[command]
-    return cli.run_from_args(args=args, config=config)
+if __name__ == "__main__":  # true when this file is run as a script, e.g. `python -m dolma.cli`
+    main()
diff --git a/python/dolma/cli/main.py b/python/dolma/cli/main.py
new file mode 100644
index 00000000..3b4ea842
--- /dev/null
+++ b/python/dolma/cli/main.py
@@ -0,0 +1,93 @@
+import multiprocessing
+from argparse import ArgumentParser
+from pathlib import Path
+from typing import Any, Dict, List, Optional, Union
+
+import smart_open
+from yaml import safe_load
+
+from ..core.paths import exists
+from .analyzer import AnalyzerCli
+from .deduper import DeduperCli
+from .mixer import MixerCli
+
+# must import these to register the resolvers
+from .resolvers import *  # noqa: F401,F403,W0401
+from .tagger import ListTaggerCli, TaggerCli
+from .tokenizer import TokenizerCli
+from .warc import WarcExtractorCli
+
+AVAILABLE_COMMANDS = {  # sub-command name -> CLI handler (main() uses DESCRIPTION, make_parser, run_from_args)
+    "dedupe": DeduperCli,
+    "mix": MixerCli,
+    "tag": TaggerCli,
+    "list": ListTaggerCli,
+    "stat": AnalyzerCli,
+    "tokens": TokenizerCli,
+    "warc": WarcExtractorCli,
+    # placeholders: the following functionality is not yet implemented
+    # "train-ft": None,
+    # "train-lm": None,
+}
+
+
+def read_config(path: Union[None, str]) -> Dict[str, Any]:
+    """Load the YAML config at `path`; return {} when `path` is None or the file is empty."""
+    if path is None:
+        return {}
+    if not exists(path):
+        # Raise rather than silently ignore a config location that was explicitly supplied.
+        raise FileNotFoundError(f"Config file {path} does not exist")
+    with smart_open.open(path, mode="rt") as f:
+        # safe_load returns None for an empty document; fall back to an empty mapping.
+        return dict(safe_load(f) or {})
+
+
+def main(argv: Optional[List[str]] = None):
+    """Parse the command line, load the optional config file, and run the selected command.
+
+    `argv` is handed to `ArgumentParser.parse_args` (None means `sys.argv[1:]`); returns the value
+    of the command's `run_from_args`. Raises RuntimeError if the start method cannot be "spawn".
+    """
+    try:
+        # attempting to set start method to spawn in case it is not set
+        multiprocessing.set_start_method("spawn")
+    except RuntimeError as ex:
+        # method already set, check if it is set to spawn
+        if multiprocessing.get_start_method() != "spawn":
+            raise RuntimeError("Multiprocessing start method must be set to spawn") from ex
+
+    parser = ArgumentParser(
+        prog="dolma",
+        usage="dolma {global options} [command] {command options}",
+        description="Command line interface for the Dolma processing toolkit",
+    )
+    # Keep the config location a plain string: pathlib collapses the "//" in URLs such as
+    # "s3://bucket/config.yaml", and read_config (typed to take str) opens it via smart_open.
+    parser.add_argument(
+        "-c",
+        "--config",
+        help="Path to configuration optional file",
+        type=str,
+        default=None,
+    )
+
+    # register one sub-parser per entry of AVAILABLE_COMMANDS; choosing a command is mandatory
+    subparsers = parser.add_subparsers(dest="command")
+    subparsers.required = True
+    subparsers.choices = AVAILABLE_COMMANDS.keys()  # type: ignore
+    for command, cli in AVAILABLE_COMMANDS.items():
+        cli.make_parser(subparsers.add_parser(command, help=cli.DESCRIPTION))
+    args = parser.parse_args(argv)
+
+    # first, get the command and config path to run
+    command = args.__dict__.pop("command")
+    config_path = args.__dict__.pop("config", None) or None
+    # remove the other optional arguments from the top level parser
+    args.__dict__.pop("dolma_version", None)
+    args.__dict__.pop("dolma_commands", None)
+
+    # read the config file if one was provided, then run the command's CLI with config + args
+    config = read_config(config_path)
+    cli = AVAILABLE_COMMANDS[command]
+    return cli.run_from_args(args=args, config=config)