From 79977cdf4b9a2fcac4c47b458cccca101686da63 Mon Sep 17 00:00:00 2001 From: Mirek Kratochvil Date: Mon, 14 Jul 2025 10:33:22 +0200 Subject: clean up, support external tokenizers --- Opts.hs | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) (limited to 'Opts.hs') diff --git a/Opts.hs b/Opts.hs index 761bda0..bc81aad 100644 --- a/Opts.hs +++ b/Opts.hs @@ -9,32 +9,32 @@ import Options.Applicative import Paths_werge (version) data Tokenizer - = TokenizerFilter String - | TokenizeCharClass - | TokenizeCharClassSimple + = TokenizeFilter String + | TokenizeCharCategory + | TokenizeCharCategorySimple deriving (Show) tokenizer = asum - [ TokenizerFilter + [ TokenizeFilter <$> strOption (long "tok-filter" <> short 'F' <> metavar "FILTER" <> help "external program to separate the text to tokens") , flag' - TokenizeCharClassSimple + TokenizeCharCategorySimple (long "simple-tokens" <> short 'i' <> help "use wider character class to separate the tokens (results in larger tokens and ignores case)") , flag' - TokenizeCharClass + TokenizeCharCategory (long "full-tokens" <> short 'I' <> help "separate characters by all known character classes (default)") - , pure TokenizeCharClass + , pure TokenizeCharCategory ] data Spaces -- cgit v1.2.3