diff --git a/website/assets/img/docs/architecture.svg b/website/assets/img/docs/architecture.svg new file mode 100644 index 000000000..d62d08f88 --- /dev/null +++ b/website/assets/img/docs/architecture.svg @@ -0,0 +1,128 @@ + + + + Language + + + + MAKES + + + + nlp.vocab.morphology + + Vocab + + + + nlp.vocab + + StringStore + + + + nlp.vocab.strings + + + + nlp.tokenizer.vocab + + Tokenizer + + + + nlp.make_doc() + + + + nlp.pipeline + + + + nlp.pipeline[i].vocab + + pt + + en + + de + + fr + + es + + it + + nl + + sv + + fi + + nb + + hu + + he + + bn + + ja + + zh + + + + + + doc.vocab + + + + MAKES + + Doc + + + + MAKES + + + + token.doc + + Token + + Span + + + + lexeme.vocab + + Lexeme + + + + MAKES + + + + span.doc + + Dependency Parser + + Entity Recognizer + + Tagger + + Matcher + + Lemmatizer + + Morphology + diff --git a/website/assets/img/docs/language_data.svg b/website/assets/img/docs/language_data.svg new file mode 100644 index 000000000..e32c070ce --- /dev/null +++ b/website/assets/img/docs/language_data.svg @@ -0,0 +1,82 @@ + + + + + + Tokenizer + + + + + + + + + + Base data + + + + + + + + + + + + + + + + Language data + + + + stop words + + + + lexical attributes + + + + + + tokenizer exceptions + + + + + + prefixes, suffixes, infixes + + + + + lemma data + + + + Lemmatizer + + + + char classes + + Token + + + + morph rules + + + + tag map + + Morphology +