diff --git a/HISTORY b/HISTORY.md similarity index 76% rename from HISTORY rename to HISTORY.md index 44e0583c..b0830703 100644 --- a/HISTORY +++ b/HISTORY.md @@ -1,3 +1,21 @@ +0.6.0a1 +======= + +* Preprocessing of code inputs has changed, and code tokens are no longer treated specially. + Instead, they are treated as normal words and preprocessed using BPE. This allows using any + Huggingface tokenizer without changes. Tasks can still define certain tokens that should be + treated as special tokens. These are either added as new tokens, or further preprocessed + into non-ambiguous sequences of words. +* Old models (MQAN and baselines) were removed. The GloVe vectors and other non-contextual + word embeddings were also removed. Old training options that were ineffective or unused + were removed. +* The internals of the library have been refactored to simplify development and allow using any + Huggingface Seq2Seq or MLM model. As a result, the names of the models have changed: `Seq2Seq` + is now `TransformerLSTM` and `Bart` is now `TransformerSeq2Seq`. Command-line flags changed as well. + +NOTE: due to the change in model names and command-line flags, this release is not backward +compatible with models trained with genienlp <= 0.5.0. + 0.5.0 ===== diff --git a/setup.py b/setup.py index 939175eb..89e0d584 100644 --- a/setup.py +++ b/setup.py @@ -34,7 +34,7 @@ with open("README.md", "r") as fh: setuptools.setup( name='genienlp', - version='0.5.0', + version='0.6.0a1', packages=setuptools.find_packages(exclude=['tests']), entry_points= {