diff --git a/CHANGES.txt b/CHANGES.txt
index e576138..ad0f053 100644
--- a/CHANGES.txt
+++ b/CHANGES.txt
@@ -1,5 +1,14 @@
 # CHANGELOG #
 
+## Version 2.2.0, 2022-01-18 ##
+
+- New feature: Prune XML tags and their contents from the input before
+  tokenization (via the command line option --prune TAGNAME1 --prune
+  TAGNAME2 … or by passing prune_tags=["TAGNAME1", "TAGNAME2", …] to
+  tokenize_xml or tokenize_xml_file). This can be useful when
+  processing HTML files, e.g. for removing any