Add Tokenwiser to Projects (#7541)

* Add tokenwiser

* Update universe.json
Author: vincent d warmerdam, 2021-04-01 14:39:36 +02:00, committed by GitHub
parent 59c2069eb1
commit 8b3eec6e62

@@ -231,6 +231,49 @@
"website": "https://koaning.io" "website": "https://koaning.io"
} }
}, },
{
"id": "tokenwiser",
"title": "tokenwiser",
"slogan": "Connect vowpal-wabbit & scikit-learn models to spaCy to run simple classification benchmarks. Comes with many utility functions for spaCy pipelines.",
"github": "koaning/tokenwiser",
"pip": "tokenwiser",
"thumb": "https://koaning.github.io/tokenwiser/token.png",
"image": "https://koaning.github.io/tokenwiser/logo-tokw.png",
"code_example": [
"import spacy",
"",
"from sklearn.pipeline import make_pipeline",
"from sklearn.feature_extraction.text import CountVectorizer",
"from sklearn.linear_model import LogisticRegression",
"",
"from tokenwiser.component import attach_sklearn_categoriser",
"",
"X = [",
" 'i really like this post',",
" 'thanks for that comment',",
" 'i enjoy this friendly forum',",
" 'this is a bad post',",
" 'i dislike this article',",
" 'this is not well written'",
"]",
"",
"y = ['pos', 'pos', 'pos', 'neg', 'neg', 'neg']",
"",
"# Note that we're training a pipeline here via a single-batch `.fit()` method",
"pipe = make_pipeline(CountVectorizer(), LogisticRegression()).fit(X, y)",
"",
"nlp = spacy.load('en_core_web_sm')",
"# This is where we attach our pre-trained model as a pipeline step.",
"attach_sklearn_categoriser(nlp, pipe_name='silly_sentiment', estimator=pipe)"
],
"category": ["pipeline", "training"],
"author": "Vincent D. Warmerdam",
"author_links": {
"twitter": "fishnets88",
"github": "koaning",
"website": "https://koaning.io"
}
},
{
"id": "spacy-stanza",
"title": "spacy-stanza",