Rename section and add wrapper docs

2026-01-04 07:53:24 +03:00 · 2017-11-06 02:40:34 +01:00 · 2017-11-06 02:40:34 +01:00 · 68b7e3a33a
commit 68b7e3a33a
parent e62c4a034e
4 changed files with 131 additions and 70 deletions
--- a/website/usage/_data.json
+++ b/website/usage/_data.json
@ -128,7 +128,7 @@
        "next": "training",
        "menu": {
            "Pre-processing Text": "pre-processing",
-            "spaCy and Thinc": "thinc",
+            "Wrapping Models": "wrapping",
            "TensorFlow / Keras": "tensorflow-keras",
            "scikit-learn": "scikit-learn",
            "PyTorch": "pytorch",
--- a/website/usage/_deep-learning/_thinc.jade
+++ b/website/usage/_deep-learning/_thinc.jade
@ -1,66 +0,0 @@
-//- 💫 DOCS > USAGE > DEEP LEARNING > THINC
-
-p
-    |  #[+a(gh("thinc")) Thinc] is the machine learning library powering spaCy.
-    |  It's a practical toolkit for implementing models that follow the
-    |  #[+a("https://explosion.ai/blog/deep-learning-formula-nlp", true) "Embed, encode, attend, predict"]
-    |  architecture. It's designed to be easy to install, efficient for CPU
-    |  usage and optimised for NLP and deep learning with text – in particular,
-    |  hierarchically structured input and variable-length sequences.
-
-p
-    |  spaCy's built-in pipeline components can all be powered by any object
-    |  that follows Thinc's #[code Model] API. If a wrapper is not yet available
-    |  for the library you're using, you should create a
-    |  #[code thinc.neural.Model] subclass that implements a #[code begin_update]
-    |  method. You'll also want to implement #[code to_bytes], #[code from_bytes],
-    |  #[code to_disk] and #[code from_disk] methods, to save and load your
-    |  model. Here's the tempate you'll need to fill in:
-
-    +code("Thinc Model API").
-        class ThincModel(thinc.neural.Model):
-            def __init__(self, *args, **kwargs):
-                pass
-
-            def begin_update(self, X, drop=0.):
-                def backprop(dY, sgd=None):
-                    return dX
-                return Y, backprop
-
-            def to_disk(self, path, **exclude):
-                return None
-
-            def from_disk(self, path, **exclude):
-                return self
-
-            def to_bytes(self, **exclude):
-                return bytes
-
-            def from_bytes(self, msgpacked_bytes, **exclude):
-                return self
-
-p
-    |  The #[code begin_update] method should return a callback, that takes the
-    |  gradient with respect to the output, and returns the gradient with
-    |  respect to the input.  It's usually convenient to implement the callback
-    |  as a nested function, so you can refer to any intermediate variables from
-    |  the forward computation in the enclosing scope.
-
-+h(3, "how-thinc-works") How Thinc works
-
-p
-    |  Neural networks are all about composing small functions that we know how
-    |  to differentiate into larger functions that we know how to differentiate.
-    |  To differentiate a function efficiently, you usually need to store
-    |  intermediate results, computed during the "forward pass", to reuse them
-    |  during the backward pass. Most libraries require the data passed through
-    |  the network to accumulate these intermediate result. This is the "tape"
-    |  in tape-based differentiation.
-
-p
-    |  In Thinc, a model that computes #[code y = f(x)] is required to also
-    |  return a callback that computes #[code dx = f&apos;(dy)]. The same
-    |  intermediate state needs to be tracked, but this becomes an
-    |  implementation detail for the model to take care of – usually, the
-    |  callback is implemented as a closure, so the intermediate results can be
-    |  read from the enclosing scope.
--- a/website/usage/_deep-learning/_wrapping.jade
+++ b/website/usage/_deep-learning/_wrapping.jade
@ -0,0 +1,127 @@
+//- 💫 DOCS > USAGE > DEEP LEARNING > WRAPPING MODELS
+
+p
+    |  #[+a(gh("thinc")) Thinc] is the machine learning library powering spaCy.
+    |  It's a practical toolkit for implementing models that follow the
+    |  #[+a("https://explosion.ai/blog/deep-learning-formula-nlp", true) "Embed, encode, attend, predict"]
+    |  architecture. It's designed to be easy to install, efficient for CPU
+    |  usage and optimised for NLP and deep learning with text – in particular,
+    |  hierarchically structured input and variable-length sequences.
+
+aside("How Thinc works")
+    |  To differentiate a function efficiently, you usually need to store
+    |  intermediate results, computed during the "forward pass", to reuse them
+    |  during the backward pass. Most libraries require the data passed through
+    |  the network to accumulate these intermediate result. In
+    |  #[+a(gh("thinc")) Thinc], a model
+    |  that computes #[code y = f(x)] is required to also
+    |  return a callback that computes #[code dx = f&apos;(dy)]. Usually, the
+    |  callback is implemented as a closure, so the intermediate results can be
+    |  read from the enclosing scope.
+
+p
+    |  spaCy's built-in pipeline components can all be powered by any object
+    |  that follows Thinc's #[code Model] API. If a wrapper is not yet available
+    |  for the library you're using, you should create a
+    |  #[code thinc.neural.Model] subclass that implements a #[code begin_update]
+    |  method. You'll also want to implement #[code to_bytes], #[code from_bytes],
+    |  #[code to_disk] and #[code from_disk] methods, to save and load your
+    |  model.
+
+code("Thinc Model API").
+    class ThincModel(thinc.neural.Model):
+        def __init__(self, *args, **kwargs):
+            pass
+
+        def begin_update(self, X, drop=0.):
+            def backprop(dY, sgd=None):
+                return dX
+            return Y, backprop
+
+        def to_disk(self, path, **exclude):
+            return None
+
+        def from_disk(self, path, **exclude):
+            return self
+
+        def to_bytes(self, **exclude):
+            return bytes
+
+        def from_bytes(self, msgpacked_bytes, **exclude):
+            return self
+
+        def to_gpu(self, device_num):
+            return None
+
+        def to_cpu(self):
+            return None
+
+        def resize_output(self, new_size):
+            return None
+
+        def resize_input(self):
+            return None
+
+        @contextlib.contextmanager
+        def use_params(self, params):
+            return None
+
+table(["Method", "Description"])
+    +row
+        +cell #[code __init__]
+        +cell Initialise the model.
+
+    +row
+        +cell #[code begin_update]
+        +cell Return the output of the wrapped PyTorch model for the given input, along with a callback to handle the backward pass.
+
+    +row
+        +cell #[code to_disk]
+        +cell Save the model's weights to disk.
+
+    +row
+        +cell #[code from_disk]
+        +cell Read the model's weights from disk.
+
+    +row
+        +cell #[code to_bytes]
+        +cell Serialize the model's weights to bytes.
+
+    +row
+        +cell #[code from_bytes]
+        +cell Load the model's weights from bytes.
+
+    +row
+        +cell #[code to_gpu]
+        +cell
+            |  Ensure the model's weights are on the specified GPU device. If
+            |  already on that device, no action is taken.
+
+    +row
+        +cell #[code to_cpu]
+        +cell
+            |  Ensure the model's weights are on CPU. If already on CPU, no
+            |  action is taken.
+
+    +row
+        +cell #[code resize_output]
+        +cell
+            |  Resize the model such that the model's output vector has a new
+            |  size. If #[code new_size] is larger, weights corresponding to
+            |  the new output neurons are zero-initialized. If #[code new_size]
+            |  is smaller, neurons are dropped from the end of the vector.
+
+    +row
+        +cell #[code resize_input]
+        +cell
+            |  Resize the model such that the expects input vectors of a
+            |  different size. If #[code new_size] is larger, weights
+            |  corresponding to the new input neurons are zero-initialized. If
+            |  #[code new_size] is smaller, weights are dropped from the end of
+            |  the vector.
+
+    +row
+        +cell #[code use_params]
+        +cell
+            |  Use the given parameters, for the scope of the contextmanager.
+            |  At the end of the block, the weights are restored.
--- a/website/usage/deep-learning.jade
+++ b/website/usage/deep-learning.jade
@ -8,9 +8,9 @@ include ../_includes/_mixins
    +h(2, "pre-processing") Pre-processing text for deep learning
    include _deep-learning/_pre-processing

-+section("thinc")
-    +h(2, "thinc") spaCy and Thinc
-    include _deep-learning/_thinc
+section("wrapping")
+    +h(2, "wrapping") Wrapping models
+    include _deep-learning/_wrapping

 +section("tensorflow-keras")
    +h(2, "tensorflow-keras") Using spaCy with TensorFlow / Keras