Skip to content
GitLab
Menu
Projects
Groups
Snippets
Loading...
Help
Help
Support
Community forum
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
Menu
Open sidebar
ModelZoo
ResNet50_tensorflow
Commits
a4bb31d0
Commit
a4bb31d0
authored
May 02, 2018
by
Terry Koo
Browse files
Export @195097388.
parent
dea7ecf6
Changes
294
Hide whitespace changes
Inline
Side-by-side
Showing
20 changed files
with
3438 additions
and
0 deletions
+3438
-0
research/syntaxnet/dragnn/runtime/feed_forward_network_kernel_test.cc
...taxnet/dragnn/runtime/feed_forward_network_kernel_test.cc
+300
-0
research/syntaxnet/dragnn/runtime/feed_forward_network_layer.cc
...ch/syntaxnet/dragnn/runtime/feed_forward_network_layer.cc
+108
-0
research/syntaxnet/dragnn/runtime/feed_forward_network_layer.h
...rch/syntaxnet/dragnn/runtime/feed_forward_network_layer.h
+112
-0
research/syntaxnet/dragnn/runtime/feed_forward_network_layer_test.cc
...ntaxnet/dragnn/runtime/feed_forward_network_layer_test.cc
+226
-0
research/syntaxnet/dragnn/runtime/feed_forward_network_test.cc
...rch/syntaxnet/dragnn/runtime/feed_forward_network_test.cc
+386
-0
research/syntaxnet/dragnn/runtime/file_array_variable_store.cc
...rch/syntaxnet/dragnn/runtime/file_array_variable_store.cc
+46
-0
research/syntaxnet/dragnn/runtime/file_array_variable_store.h
...arch/syntaxnet/dragnn/runtime/file_array_variable_store.h
+51
-0
research/syntaxnet/dragnn/runtime/fixed_embeddings.cc
research/syntaxnet/dragnn/runtime/fixed_embeddings.cc
+268
-0
research/syntaxnet/dragnn/runtime/fixed_embeddings.h
research/syntaxnet/dragnn/runtime/fixed_embeddings.h
+229
-0
research/syntaxnet/dragnn/runtime/fixed_embeddings_test.cc
research/syntaxnet/dragnn/runtime/fixed_embeddings_test.cc
+570
-0
research/syntaxnet/dragnn/runtime/flexible_matrix_kernel.cc
research/syntaxnet/dragnn/runtime/flexible_matrix_kernel.cc
+145
-0
research/syntaxnet/dragnn/runtime/flexible_matrix_kernel.h
research/syntaxnet/dragnn/runtime/flexible_matrix_kernel.h
+195
-0
research/syntaxnet/dragnn/runtime/flexible_matrix_kernel_test.cc
...h/syntaxnet/dragnn/runtime/flexible_matrix_kernel_test.cc
+132
-0
research/syntaxnet/dragnn/runtime/fml_parsing.cc
research/syntaxnet/dragnn/runtime/fml_parsing.cc
+71
-0
research/syntaxnet/dragnn/runtime/fml_parsing.h
research/syntaxnet/dragnn/runtime/fml_parsing.h
+52
-0
research/syntaxnet/dragnn/runtime/fml_parsing_test.cc
research/syntaxnet/dragnn/runtime/fml_parsing_test.cc
+128
-0
research/syntaxnet/dragnn/runtime/head_selection_component_base.cc
...syntaxnet/dragnn/runtime/head_selection_component_base.cc
+79
-0
research/syntaxnet/dragnn/runtime/head_selection_component_base.h
.../syntaxnet/dragnn/runtime/head_selection_component_base.h
+80
-0
research/syntaxnet/dragnn/runtime/head_selection_component_base_test.cc
...xnet/dragnn/runtime/head_selection_component_base_test.cc
+186
-0
research/syntaxnet/dragnn/runtime/identity_sequence_linker.cc
...arch/syntaxnet/dragnn/runtime/identity_sequence_linker.cc
+74
-0
No files found.
Too many changes to show.
To preserve performance only
294 of 294+
files are displayed.
Plain diff
Email patch
research/syntaxnet/dragnn/runtime/feed_forward_network_kernel_test.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/feed_forward_network_kernel.h"
#include <stddef.h>
#include <algorithm>
#include <memory>
#include <string>
#include "dragnn/core/test/generic.h"
#include "dragnn/protos/spec.pb.h"
#include "dragnn/runtime/flexible_matrix_kernel.h"
#include "dragnn/runtime/math/types.h"
#include "dragnn/runtime/network_states.h"
#include "dragnn/runtime/test/network_test_base.h"
#include "dragnn/runtime/variable_store.h"
#include "syntaxnet/base.h"
#include "tensorflow/core/lib/core/errors.h"
#include "tensorflow/core/lib/core/status.h"
#include "tensorflow/core/lib/core/status_test_util.h"
#include "tensorflow/core/lib/strings/strcat.h"
#include "tensorflow/core/platform/test.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
namespace
{
// Test fixture for FeedForwardNetworkKernel.  Provides helpers that register
// fake trained variables and initialize the kernel from a ComponentSpec.
class FeedForwardNetworkKernelTest : public NetworkTestBase {
 protected:
  // Adds a weight matrix with the |name_suffix| with the given dimensions and
  // |fill_value|.
  void AddWeights(const string &name_suffix, size_t num_rows,
                  size_t num_columns, float fill_value) {
    const string weights_name = tensorflow::strings::StrCat(
        kTestComponentName, "/weights_", name_suffix,
        FlexibleMatrixKernel::kSuffix);
    // Note: the variable is registered with [num_columns, num_rows] —
    // presumably the kernel stores the transposed matrix; confirm against
    // FlexibleMatrixKernel.
    AddMatrixVariable(weights_name, num_columns, num_rows, fill_value);
  }

  // Adds a bias vector with the |name_suffix| with the given dimensions and
  // |fill_value|.
  void AddBiases(const string &name_suffix, size_t dimension,
                 float fill_value) {
    const string biases_name =
        tensorflow::strings::StrCat(kTestComponentName, "/bias_", name_suffix);
    AddVectorVariable(biases_name, dimension, fill_value);
  }

  // Initializes the |kernel_| based on the |component_spec_text|.  On error,
  // returns non-OK.
  tensorflow::Status Initialize(const string &component_spec_text) {
    ComponentSpec component_spec;
    CHECK(TextFormat::ParseFromString(component_spec_text, &component_spec));
    component_spec.set_name(kTestComponentName);

    // Since FeedForwardNetwork uses the concatenated input, it is insensitive
    // to the particular fixed or linked embedding inputs.  For simplicity, the
    // tests use a trivial network structure and a single fixed embedding.
    AddComponent(kTestComponentName);
    TF_RETURN_IF_ERROR(kernel_.Initialize(component_spec, &variable_store_,
                                          &network_state_manager_));

    // The kernel's expected input width is the sum of the fixed-feature
    // embedding dimensions declared in the spec.
    size_t input_dimension = 0;
    for (const FixedFeatureChannel &channel : component_spec.fixed_feature()) {
      input_dimension += channel.embedding_dim();
    }
    return kernel_.ValidateInputDimension(input_dimension);
  }

  FeedForwardNetworkKernel kernel_;
};
// Tests that FeedForwardNetworkKernel fails when a weight matrix does not match
// the dimension of its output activations.
TEST_F(FeedForwardNetworkKernelTest, BadWeightRows) {
  const size_t kInputDim = 5;
  const size_t kLogitsDim = 3;
  const string kBadSpec = R"(fixed_feature {
vocabulary_size: 50
embedding_dim: 5
size: 1
}
num_actions: 3)";

  // The weight matrix is one row short of the logits dimension.
  AddWeights("softmax", kInputDim, kLogitsDim - 1 /* bad */, 1.0);
  AddBiases("softmax", kLogitsDim, 1.0);

  EXPECT_THAT(
      Initialize(kBadSpec),
      test::IsErrorWithSubstr(
          "Weight matrix shape should be output dimension plus padding"));
}
// Tests that FeedForwardNetworkKernel fails when a weight matrix does not match
// the dimension of its input activations.
TEST_F(FeedForwardNetworkKernelTest, BadWeightColumns) {
  const size_t kInputDim = 5;
  const size_t kLogitsDim = 3;
  const string kBadSpec = R"(fixed_feature {
vocabulary_size: 50
embedding_dim: 5
size: 1
}
num_actions: 3)";

  // The weight matrix expects one more input column than the spec provides.
  AddWeights("softmax", kInputDim + 1 /* bad */, kLogitsDim, 1.0);
  AddBiases("softmax", kLogitsDim, 1.0);

  EXPECT_THAT(Initialize(kBadSpec),
              test::IsErrorWithSubstr(
                  "Weight matrix shape does not match input dimension"));
}
// Tests that FeedForwardNetworkKernel fails when a bias vector does not match
// the dimension of its output activations.
TEST_F(FeedForwardNetworkKernelTest, BadBiasDimension) {
  const size_t kInputDim = 5;
  const size_t kLogitsDim = 3;
  const string kBadSpec = R"(fixed_feature {
vocabulary_size: 50
embedding_dim: 5
size: 1
}
num_actions: 3)";

  AddWeights("softmax", kInputDim, kLogitsDim, 1.0);
  // The bias vector is one element too long for the logits dimension.
  AddBiases("softmax", kLogitsDim + 1 /* bad */, 1.0);

  EXPECT_THAT(Initialize(kBadSpec),
              test::IsErrorWithSubstr(
                  "Bias vector shape does not match output dimension"));
}
// Tests that FeedForwardNetworkKernel fails when the value of the
// "layer_norm_input" option is not false.
TEST_F(FeedForwardNetworkKernelTest, UnsupportedLayerNormInputOption) {
  const string kBadSpec = R"(network_unit {
parameters {
key: 'layer_norm_input'
value: 'true'
}
})";

  EXPECT_THAT(Initialize(kBadSpec),
              test::IsErrorWithSubstr("Layer norm is not supported"));
}
// Tests that FeedForwardNetworkKernel fails when the value of the
// "layer_norm_hidden" option is not false.
TEST_F(FeedForwardNetworkKernelTest, UnsupportedLayerNormHiddenOption) {
  const string kBadSpec = R"(network_unit {
parameters {
key: 'layer_norm_hidden'
value: 'true'
}
})";

  EXPECT_THAT(Initialize(kBadSpec),
              test::IsErrorWithSubstr("Layer norm is not supported"));
}
// Tests that FeedForwardNetworkKernel fails when the value of the
// "nonlinearity" option is not "relu".
TEST_F(FeedForwardNetworkKernelTest, UnsupportedNonlinearityOption) {
  const string kBadSpec = R"(network_unit {
parameters {
key: 'nonlinearity'
value: 'elu'
}
})";

  EXPECT_THAT(Initialize(kBadSpec),
              test::IsErrorWithSubstr("Non-linearity is not supported"));
}
// Tests that the FeedForwardNetworkKernel works when there are no hidden
// layers, just a softmax that computes logits.
TEST_F(FeedForwardNetworkKernelTest, JustLogits) {
  const size_t kInputDim = 5;
  const size_t kLogitsDim = 3;
  const string kSpec = R"(fixed_feature {
vocabulary_size: 50
embedding_dim: 5
size: 1
}
num_actions: 3)";

  AddWeights("softmax", kInputDim, kLogitsDim, 0.0);
  AddBiases("softmax", kLogitsDim, 0.0);

  TF_ASSERT_OK(Initialize(kSpec));

  // A single layer: the softmax/logits layer.
  EXPECT_EQ(kernel_.logits_name(), "logits");
  EXPECT_EQ(kernel_.layers().size(), 1);
}
// Tests that the FeedForwardNetworkKernel works with multiple hidden layers as
// well as a softmax that computes logits.
TEST_F(FeedForwardNetworkKernelTest, MultiLayer) {
  // Input dim, two hidden dims, and the logits dim, in network order.
  const size_t kDims[] = {5, 4, 3, 2};
  const string kSpec = R"(fixed_feature {
vocabulary_size: 50
embedding_dim: 5
size: 1
}
network_unit {
parameters {
key: 'hidden_layer_sizes'
value: '4,3'
}
}
num_actions: 2)";

  // One weight/bias pair per hidden layer, plus the softmax pair.
  AddWeights("0", kDims[0], kDims[1], 0.0);
  AddBiases("0", kDims[1], 0.0);
  AddWeights("1", kDims[1], kDims[2], 0.0);
  AddBiases("1", kDims[2], 0.0);
  AddWeights("softmax", kDims[2], kDims[3], 0.0);
  AddBiases("softmax", kDims[3], 0.0);

  TF_ASSERT_OK(Initialize(kSpec));

  // Two hidden layers plus the logits layer.
  EXPECT_EQ(kernel_.logits_name(), "logits");
  EXPECT_EQ(kernel_.layers().size(), 3);
}
// Tests that the FeedForwardNetworkKernel does not produce logits and does not
// use the softmax variables when the component is deterministic.
TEST_F(FeedForwardNetworkKernelTest, NoLogitsOrSoftmaxWhenDeterministic) {
  const size_t kDims[] = {5, 4};
  // num_actions=1 makes the component deterministic.
  const string kSpec = R"(num_actions: 1
fixed_feature {
vocabulary_size: 50
embedding_dim: 5
size: 1
}
network_unit {
parameters {
key: 'hidden_layer_sizes'
value: '4'
}
})";

  // No "softmax" weights or biases.
  AddWeights("0", kDims[0], kDims[1], 0.0);
  AddBiases("0", kDims[1], 0.0);

  TF_ASSERT_OK(Initialize(kSpec));

  // No specified logits layer.
  EXPECT_TRUE(kernel_.logits_name().empty());
  EXPECT_EQ(kernel_.layers().size(), 1);
}
// Tests that the FeedForwardNetworkKernel does not produce logits when
// omit_logits is true, even if there are actions.
TEST_F(FeedForwardNetworkKernelTest, NoLogitsOrSoftmaxWhenOmitLogitsTrue) {
  const size_t kDims[] = {5, 4};
  const string kSpec = R"(fixed_feature {
vocabulary_size: 50
embedding_dim: 5
size: 1
}
network_unit {
parameters {
key: 'hidden_layer_sizes'
value: '4'
}
parameters {
key: 'omit_logits'
value: 'true'
}
}
num_actions: 10)";

  // No "softmax" weights or biases.
  AddWeights("0", kDims[0], kDims[1], 0.0);
  AddBiases("0", kDims[1], 0.0);

  TF_ASSERT_OK(Initialize(kSpec));

  // No specified logits layer.
  EXPECT_TRUE(kernel_.logits_name().empty());
  EXPECT_EQ(kernel_.layers().size(), 1);
}
}
// namespace
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/feed_forward_network_layer.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/feed_forward_network_layer.h"
#include "tensorflow/core/lib/core/errors.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// Out-of-class definition required for ODR-use of the constexpr member.
constexpr char FeedForwardNetworkLayer::kLogitsName[];

// Initializes this layer: looks up the trained weights and biases in the
// |variable_store|, registers the output layer with the
// |network_state_manager|, and validates the variable shapes against
// |output_dimension|.  Returns non-OK on shape mismatch or lookup failure.
tensorflow::Status FeedForwardNetworkLayer::Initialize(
    const string &component_name, const string &layer_name,
    size_t output_dimension, ActivationFunction activation_function,
    const string &variable_suffix, VariableStore *variable_store,
    NetworkStateManager *network_state_manager) {
  debug_name_ = tensorflow::strings::StrCat(component_name, "/", layer_name);
  activation_function_ = activation_function;

  const string weights_name =
      tensorflow::strings::StrCat(component_name, "/weights_", variable_suffix);
  const string biases_name =
      tensorflow::strings::StrCat(component_name, "/bias_", variable_suffix);

  TF_RETURN_IF_ERROR(variable_store->Lookup(biases_name, &biases_));
  TF_RETURN_IF_ERROR(matrix_kernel_.Initialize(debug_name_, weights_name,
                                               output_dimension,
                                               variable_store));
  TF_RETURN_IF_ERROR(
      network_state_manager->AddLayer(layer_name, output_dimension, &handle_));

  // The kernel may pad rows, so require compatibility rather than equality.
  if (!matrix_kernel_.MatchesOutputDimension(output_dimension)) {
    return tensorflow::errors::InvalidArgument(
        "Weight matrix shape should be output dimension plus padding. ",
        debug_name_, ": weights=[", matrix_kernel_.NumPaddedRows(), ", ",
        matrix_kernel_.NumColumns(), "] vs output=", output_dimension);
  }

  // NOTE(gatoatigrado): Do we need to pad the bias vector?
  if (biases_.size() != output_dimension) {
    return tensorflow::errors::InvalidArgument(
        "Bias vector shape does not match output dimension in ", debug_name_,
        ": biases=[", biases_.size(), "] vs output=", output_dimension);
  }

  return tensorflow::Status::OK();
}
// Convenience wrapper: configures this layer as the softmax for
// |component_spec|.  The output layer is named |kLogitsName|, sized to
// num_actions(), uses identity activations, and reads "softmax"-suffixed
// variables.
tensorflow::Status FeedForwardNetworkLayer::InitializeSoftmax(
    const ComponentSpec &component_spec, VariableStore *variable_store,
    NetworkStateManager *network_state_manager) {
  return Initialize(component_spec.name(), kLogitsName,
                    component_spec.num_actions(), ActivationFunction::kIdentity,
                    "softmax", variable_store, network_state_manager);
}
// Verifies that the weight matrix accepts inputs of size |input_dim| and
// reports the (possibly padded) output dimension via |output_dim|.
tensorflow::Status FeedForwardNetworkLayer::CheckInputDimAndGetOutputDim(
    size_t input_dim, size_t *output_dim) const {
  if (matrix_kernel_.NumColumns() != input_dim) {
    return tensorflow::errors::InvalidArgument(
        "Weight matrix shape does not match input dimension in ", debug_name_,
        ": weights=[", matrix_kernel_.NumPaddedRows(), ", ",
        matrix_kernel_.NumColumns(), "] vs input=", input_dim);
  }
  // Report the padded row count as the effective output dimension.
  *output_dim = matrix_kernel_.NumPaddedRows();
  return tensorflow::Status::OK();
}
// Applies the layer to every row of |inputs|, writing into the layer's matrix
// in |network_states| and returning that matrix.  Rows are processed in pairs
// via MatrixVectorVectorProduct (SGEMVV-style), with a single-row tail for odd
// counts.
MutableMatrix<float> FeedForwardNetworkLayer::Apply(
    Matrix<float> inputs, const NetworkStates &network_states) const {
  const MutableMatrix<float> outputs = network_states.GetLayer(handle_);

  // Main loop: consume two rows at a time while a full pair remains.
  size_t row = 0;
  for (; row + 1 < inputs.num_rows(); row += 2) {
    matrix_kernel_.MatrixVectorVectorProduct(
        inputs.row(row), inputs.row(row + 1), biases_, biases_,
        outputs.row(row), outputs.row(row + 1));
    ApplyActivationFunction(activation_function_, outputs.row(row));
    ApplyActivationFunction(activation_function_, outputs.row(row + 1));
  }

  // Tail: at most one unpaired row is left over.
  if (row < inputs.num_rows()) {
    Vector<float> input_row = inputs.row(row);
    MutableVector<float> output_row = outputs.row(row);
    matrix_kernel_.MatrixVectorProduct(input_row, biases_, output_row);
    ApplyActivationFunction(activation_function_, output_row);
  }

  return outputs;
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/feed_forward_network_layer.h
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#ifndef DRAGNN_RUNTIME_FEED_FORWARD_NETWORK_LAYER_H_
#define DRAGNN_RUNTIME_FEED_FORWARD_NETWORK_LAYER_H_
#include <stddef.h>
#include <string>
#include "dragnn/protos/spec.pb.h"
#include "dragnn/runtime/activation_functions.h"
#include "dragnn/runtime/flexible_matrix_kernel.h"
#include "dragnn/runtime/math/types.h"
#include "dragnn/runtime/network_states.h"
#include "dragnn/runtime/variable_store.h"
#include "syntaxnet/base.h"
#include "tensorflow/core/lib/core/status.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// Configuration and parameters of some layer of a multi-layer perceptron.
class FeedForwardNetworkLayer {
 public:
  // Name of the logits layer produced by a softmax.
  static constexpr char kLogitsName[] = "logits";

  // Creates an uninitialized layer.  Call Initialize() before use.
  FeedForwardNetworkLayer() = default;

  // Initializes this as a layer named |layer_name| of the component named
  // |component_name| that produces activations of size |output_dimension|,
  // and applies the |activation_function| to the output.  Adds this layer to
  // the |network_state_manager| and retrieves trained parameters from the
  // |variable_store| using the |variable_suffix|.  On error, returns non-OK.
  tensorflow::Status Initialize(const string &component_name,
                                const string &layer_name,
                                size_t output_dimension,
                                ActivationFunction activation_function,
                                const string &variable_suffix,
                                VariableStore *variable_store,
                                NetworkStateManager *network_state_manager);

  // For convenience, initializes this as a softmax that produces a layer named
  // |kLogitsName|.
  tensorflow::Status InitializeSoftmax(
      const ComponentSpec &component_spec, VariableStore *variable_store,
      NetworkStateManager *network_state_manager);

  // Returns OK iff this is compatible with input activation vectors of size
  // |input_dim| and sets |output_dim| to the output dimension of this layer.
  tensorflow::Status CheckInputDimAndGetOutputDim(size_t input_dim,
                                                  size_t *output_dim) const;

  // Applies the weights and biases of this layer to the |input| activations,
  // writes the resulting output activations into the |step_index|'th row of
  // the relevant output layer in the |network_states|, and returns the row.
  MutableVector<float> Apply(Vector<float> input,
                             const NetworkStates &network_states,
                             size_t step_index) const;

  // As above, but applies to a step-wise matrix of |inputs|.
  MutableMatrix<float> Apply(Matrix<float> inputs,
                             const NetworkStates &network_states) const;

 private:
  // Name of the layer, for debug purposes.
  string debug_name_;

  // Handle of the layer in the network states.
  LayerHandle<float> handle_;

  // Weight matrix and bias vector for computing the layer activations.
  FlexibleMatrixKernel matrix_kernel_;
  Vector<float> biases_;

  // The activation function to apply to the output.
  ActivationFunction activation_function_ = ActivationFunction::kIdentity;
};
// Implementation details below.

// Single-step application: multiply, add bias, apply the activation function,
// all into the |step_index|'th row of this layer's output matrix.
inline MutableVector<float> FeedForwardNetworkLayer::Apply(
    Vector<float> input, const NetworkStates &network_states,
    size_t step_index) const {
  const MutableVector<float> output =
      network_states.GetLayer(handle_).row(step_index);
  matrix_kernel_.MatrixVectorProduct(input, biases_, output);
  ApplyActivationFunction(activation_function_, output);
  return output;
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
#endif // DRAGNN_RUNTIME_FEED_FORWARD_NETWORK_LAYER_H_
research/syntaxnet/dragnn/runtime/feed_forward_network_layer_test.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/feed_forward_network_layer.h"
#include <stddef.h>
#include <algorithm>
#include <string>
#include "dragnn/core/test/generic.h"
#include "dragnn/runtime/activation_functions.h"
#include "dragnn/runtime/flexible_matrix_kernel.h"
#include "dragnn/runtime/math/types.h"
#include "dragnn/runtime/network_states.h"
#include "dragnn/runtime/test/helpers.h"
#include "dragnn/runtime/test/network_test_base.h"
#include "dragnn/runtime/variable_store.h"
#include "syntaxnet/base.h"
#include "tensorflow/core/lib/core/errors.h"
#include "tensorflow/core/lib/core/status.h"
#include "tensorflow/core/lib/core/status_test_util.h"
#include "tensorflow/core/lib/strings/strcat.h"
#include "tensorflow/core/platform/test.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
namespace
{
// Names used for the layer under test and its trained variables.
constexpr char kLayerName[] = "layer";
constexpr char kVariableSuffix[] = "suffix";

// Dimensions of the test layer and the default number of steps.
constexpr size_t kInputDim = 5;
constexpr size_t kLogitsDim = 3;
constexpr size_t kNumSteps = 4;
// Test fixture for FeedForwardNetworkLayer.  Registers fake variables,
// initializes the layer once, and applies it to vector or matrix inputs.
class FeedForwardNetworkLayerTest : public NetworkTestBase {
 protected:
  // Adds a weight matrix with the given dimensions and |fill_value|.
  void AddWeights(size_t num_rows, size_t num_columns, float fill_value) {
    const string weights_name = tensorflow::strings::StrCat(
        kTestComponentName, "/weights_", kVariableSuffix,
        FlexibleMatrixKernel::kSuffix);
    // Dimensions are passed transposed; presumably matches the kernel's
    // storage layout — confirm against FlexibleMatrixKernel.
    AddMatrixVariable(weights_name, num_columns, num_rows, fill_value);
  }

  // Adds a bias vector with the given dimensions and |fill_value|.
  void AddBiases(size_t dimension, float fill_value) {
    const string biases_name = tensorflow::strings::StrCat(
        kTestComponentName, "/bias_", kVariableSuffix);
    AddVectorVariable(biases_name, dimension, fill_value);
  }

  // Returns the result of initializing the |layer_| with the arguments.
  // Initialization happens at most once; later calls only reset the network
  // states and restart the component with |num_steps| steps.
  tensorflow::Status Initialize(
      ActivationFunction activation_function = ActivationFunction::kIdentity,
      size_t num_steps = kNumSteps) {
    if (!initialized_) {
      AddComponent(kTestComponentName);
      TF_RETURN_IF_ERROR(layer_.Initialize(
          kTestComponentName, kLayerName, kLogitsDim, activation_function,
          kVariableSuffix, &variable_store_, &network_state_manager_));
      initialized_ = true;
    }
    network_states_.Reset(&network_state_manager_);
    StartComponent(num_steps);
    return tensorflow::Status::OK();
  }

  // Applies the |layer_| to the |input| and returns the result.
  Vector<float> Apply(const std::vector<float> &input) {
    UniqueVector<float> input_vector(input);
    layer_.Apply(Vector<float>(*input_vector), network_states_,
                 /*step_index=*/0);
    return Vector<float>(GetLayer(kTestComponentName, kLayerName).row(0));
  }

  // Applies the |layer_| to the |inputs| and returns the result.
  Matrix<float> Apply(const std::vector<std::vector<float>> &inputs) {
    UniqueMatrix<float> input_matrix(inputs);
    layer_.Apply(Matrix<float>(*input_matrix), network_states_);
    return Matrix<float>(GetLayer(kTestComponentName, kLayerName));
  }

  // Whether |layer_| has been initialized yet.
  bool initialized_ = false;
  FeedForwardNetworkLayer layer_;
};
// Tests that FeedForwardNetworkLayer fails when a weight matrix does not match
// the dimension of its output activations.
TEST_F(FeedForwardNetworkLayerTest, BadWeightRows) {
  AddWeights(kInputDim, kLogitsDim - 1 /* bad */, 1.0);
  AddBiases(kLogitsDim, 1.0);

  EXPECT_THAT(
      Initialize(),
      test::IsErrorWithSubstr(
          "Weight matrix shape should be output dimension plus padding"));
}
// Tests that FeedForwardNetworkLayer fails when a weight matrix does not match
// the dimension of its input activations.
TEST_F(FeedForwardNetworkLayerTest, BadWeightColumns) {
  AddWeights(kInputDim + 1 /* bad */, kLogitsDim, 1.0);
  AddBiases(kLogitsDim, 1.0);

  // Initialization itself succeeds; the mismatch surfaces when the input
  // dimension is checked afterwards.
  TF_ASSERT_OK(Initialize());

  size_t output_dim = 0;
  EXPECT_THAT(layer_.CheckInputDimAndGetOutputDim(kInputDim, &output_dim),
              test::IsErrorWithSubstr(
                  "Weight matrix shape does not match input dimension"));
}
// Tests that FeedForwardNetworkLayer fails when a bias vector does not match
// the dimension of its output activations.
TEST_F(FeedForwardNetworkLayerTest, BadBiasDimension) {
  AddWeights(kInputDim, kLogitsDim, 1.0);
  AddBiases(kLogitsDim + 1 /* bad */, 1.0);

  EXPECT_THAT(Initialize(),
              test::IsErrorWithSubstr(
                  "Bias vector shape does not match output dimension"));
}
// Tests that FeedForwardNetworkLayer can be used with identity activations.
TEST_F(FeedForwardNetworkLayerTest, IdentityActivations) {
  AddWeights(kInputDim, kLogitsDim, 1.0);
  AddBiases(kLogitsDim, 0.5);
  TF_ASSERT_OK(Initialize());

  size_t output_dim = 0;
  TF_ASSERT_OK(layer_.CheckInputDimAndGetOutputDim(kInputDim, &output_dim));
  EXPECT_EQ(output_dim, kLogitsDim);

  // With all-ones weights and 0.5 biases: 0.5 + 1 + 2 + 3 + 4 + 5 = 15.5
  std::vector<float> row = {1.0, 2.0, 3.0, 4.0, 5.0};
  ExpectVector(Apply(row), kLogitsDim, 15.5);
  ExpectMatrix(Apply(std::vector<std::vector<float>>(kNumSteps, row)),
               kNumSteps, kLogitsDim, 15.5);

  // Identity activations pass negatives through: 0.5 - 1 - 2 - 3 - 4 - 5 = -14.5
  row = {-1.0, -2.0, -3.0, -4.0, -5.0};
  ExpectVector(Apply(row), kLogitsDim, -14.5);
  ExpectMatrix(Apply(std::vector<std::vector<float>>(kNumSteps, row)),
               kNumSteps, kLogitsDim, -14.5);
}
// Tests that FeedForwardNetworkLayer can be used with ReLU activations.
TEST_F(FeedForwardNetworkLayerTest, ReluActivations) {
  AddWeights(kInputDim, kLogitsDim, 1.0);
  AddBiases(kLogitsDim, 0.5);
  TF_ASSERT_OK(Initialize(ActivationFunction::kRelu));

  size_t output_dim = 0;
  TF_ASSERT_OK(layer_.CheckInputDimAndGetOutputDim(kInputDim, &output_dim));
  EXPECT_EQ(output_dim, kLogitsDim);

  // Positive pre-activation passes through: max(0.0, 0.5 + 1 + 2 + 3 + 4 + 5) = 15.5
  std::vector<float> row = {1.0, 2.0, 3.0, 4.0, 5.0};
  ExpectVector(Apply(row), kLogitsDim, 15.5);
  ExpectMatrix(Apply(std::vector<std::vector<float>>(kNumSteps, row)),
               kNumSteps, kLogitsDim, 15.5);

  // Negative pre-activation clamps to zero: max(0.0, 0.5 - 1 - 2 - 3 - 4 - 5) = 0.0
  row = {-1.0, -2.0, -3.0, -4.0, -5.0};
  ExpectVector(Apply(row), kLogitsDim, 0.0);
  ExpectMatrix(Apply(std::vector<std::vector<float>>(kNumSteps, row)),
               kNumSteps, kLogitsDim, 0.0);
}
// Make sure SGEMVV implementation is correct.  Exercises 0-3 rows so both the
// paired-row path and the odd-row tail of the matrix Apply() are covered.
TEST_F(FeedForwardNetworkLayerTest, VaryingSizes) {
  AddWeights(kInputDim, kLogitsDim, 1.0);
  AddBiases(kLogitsDim, 0.5);

  std::vector<float> row1 = {1.0, 2.0, 3.0, 4.0, 5.0};      // relu(sum + b) = 15.5
  std::vector<float> row2 = {-1.0, -2.0, -3.0, -4.0, -5.0};  // result: 0
  std::vector<float> row3 = {1.0, -2.0, 3.0, -4.0, 5.0};     // result: 3.5

  // Zero-row computation.
  TF_ASSERT_OK(Initialize(ActivationFunction::kRelu, 0));
  Matrix<float> result = Apply(std::vector<std::vector<float>>());
  EXPECT_EQ(result.num_rows(), 0);

  // One-row computation.
  TF_ASSERT_OK(Initialize(ActivationFunction::kRelu, 1));
  result = Apply(std::vector<std::vector<float>>{row1});
  EXPECT_EQ(result.num_rows(), 1);
  ExpectVector(result.row(0), kLogitsDim, 15.5);

  // Two-row computation.
  TF_ASSERT_OK(Initialize(ActivationFunction::kRelu, 2));
  result = Apply({row1, row2});
  EXPECT_EQ(result.num_rows(), 2);
  ExpectVector(result.row(0), kLogitsDim, 15.5);
  ExpectVector(result.row(1), kLogitsDim, 0.0);

  // Three-row computation.
  TF_ASSERT_OK(Initialize(ActivationFunction::kRelu, 3));
  result = Apply({row1, row2, row3});
  EXPECT_EQ(result.num_rows(), 3);
  ExpectVector(result.row(0), kLogitsDim, 15.5);
  ExpectVector(result.row(1), kLogitsDim, 0.0);
  ExpectVector(result.row(2), kLogitsDim, 3.5);
}
}
// namespace
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/feed_forward_network_test.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include <stddef.h>
#include <algorithm>
#include <memory>
#include <string>
#include "dragnn/core/test/generic.h"
#include "dragnn/protos/spec.pb.h"
#include "dragnn/runtime/flexible_matrix_kernel.h"
#include "dragnn/runtime/math/types.h"
#include "dragnn/runtime/network_states.h"
#include "dragnn/runtime/network_unit.h"
#include "dragnn/runtime/test/network_test_base.h"
#include "dragnn/runtime/variable_store.h"
#include "syntaxnet/base.h"
#include <gmock/gmock.h>
#include "tensorflow/core/lib/core/errors.h"
#include "tensorflow/core/lib/core/status.h"
#include "tensorflow/core/lib/core/status_test_util.h"
#include "tensorflow/core/lib/strings/strcat.h"
#include "tensorflow/core/platform/test.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
namespace
{
using
::
testing
::
_
;
using
::
testing
::
Invoke
;
// Applies the ReLU activation to the |value|: negative inputs clamp to zero,
// non-negative inputs pass through unchanged.
float Relu(float value) { return value > 0.0f ? value : 0.0f; }
// Test fixture for the full FeedForwardNetwork network unit.  Builds the unit
// from a ComponentSpec and evaluates a single step.
class FeedForwardNetworkTest : public NetworkTestBase {
 protected:
  // Adds a weight matrix with the |name_suffix| with the given dimensions and
  // |fill_value|.
  void AddWeights(const string &name_suffix, size_t num_rows,
                  size_t num_columns, float fill_value) {
    const string weights_name = tensorflow::strings::StrCat(
        kTestComponentName, "/weights_", name_suffix,
        FlexibleMatrixKernel::kSuffix);
    AddMatrixVariable(weights_name, num_columns, num_rows, fill_value);
  }

  // Adds a bias vector with the |name_suffix| with the given dimensions and
  // |fill_value|.
  void AddBiases(const string &name_suffix, size_t dimension,
                 float fill_value) {
    const string biases_name =
        tensorflow::strings::StrCat(kTestComponentName, "/bias_", name_suffix);
    AddVectorVariable(biases_name, dimension, fill_value);
  }

  // Creates a network unit, initializes it based on the |component_spec_text|,
  // and evaluates it.  On error, returns non-OK.
  tensorflow::Status Run(const string &component_spec_text) {
    ComponentSpec component_spec;
    CHECK(TextFormat::ParseFromString(component_spec_text, &component_spec));
    component_spec.set_name(kTestComponentName);

    // Since FeedForwardNetwork uses the concatenated input, it is insensitive
    // to the particular fixed or linked embedding inputs.  For simplicity, the
    // tests use a trivial network structure and a single fixed embedding.
    AddComponent(kTestComponentName);
    TF_RETURN_IF_ERROR(
        NetworkUnit::CreateOrError("FeedForwardNetwork", &network_unit_));
    TF_RETURN_IF_ERROR(network_unit_->Initialize(component_spec,
                                                 &variable_store_,
                                                 &network_state_manager_,
                                                 &extension_manager_));

    network_states_.Reset(&network_state_manager_);
    StartComponent(1);  // only evaluate the first step
    session_state_.extensions.Reset(&extension_manager_);

    TF_RETURN_IF_ERROR(
        network_unit_->Evaluate(0, &session_state_, &compute_session_));
    return tensorflow::Status::OK();
  }

  // Returns the activation vector of the first step of layer named
  // |layer_name| in the current component.
  Vector<float> GetActivations(const string &layer_name) const {
    Matrix<float> layer(GetLayer(kTestComponentName, layer_name));
    return layer.row(0);
  }

  std::unique_ptr<NetworkUnit> network_unit_;
};
// Tests that FeedForwardNetwork fails when a weight matrix does not match the
// dimension of its output activations.
TEST_F(FeedForwardNetworkTest, BadWeightRows) {
  const size_t kEmbeddingDim = 5;  // matches embedding_dim in the spec
  const size_t kNumActions = 3;    // matches num_actions in the spec
  const string kBadSpec = R"(fixed_feature {
                               vocabulary_size: 50
                               embedding_dim: 5
                               size: 1
                             }
                             num_actions: 3)";
  AddFixedEmbeddingMatrix(0, 50, kEmbeddingDim, 1.0);

  // The softmax weight matrix has one output column too few.
  AddWeights("softmax", kEmbeddingDim, kNumActions - 1 /* bad */, 1.0);
  AddBiases("softmax", kNumActions, 1.0);

  EXPECT_THAT(Run(kBadSpec),
              test::IsErrorWithSubstr(
                  "Weight matrix shape should be output dimension plus "
                  "padding"));
}
// Tests that FeedForwardNetwork fails when a weight matrix does not match the
// dimension of its input activations.
TEST_F(FeedForwardNetworkTest, BadWeightColumns) {
  const size_t kEmbeddingDim = 5;  // matches embedding_dim in the spec
  const size_t kNumActions = 3;    // matches num_actions in the spec
  const string kBadSpec = R"(fixed_feature {
                               vocabulary_size: 50
                               embedding_dim: 5
                               size: 1
                             }
                             num_actions: 3)";
  AddFixedEmbeddingMatrix(0, 50, kEmbeddingDim, 1.0);

  // The softmax weight matrix has one input row too many.
  AddWeights("softmax", kEmbeddingDim + 1 /* bad */, kNumActions, 1.0);
  AddBiases("softmax", kNumActions, 1.0);

  EXPECT_THAT(Run(kBadSpec),
              test::IsErrorWithSubstr(
                  "Weight matrix shape does not match input dimension"));
}
// Tests that FeedForwardNetwork fails when a bias vector does not match the
// dimension of its output activations.
TEST_F(FeedForwardNetworkTest, BadBiasDimension) {
  const size_t kEmbeddingDim = 5;  // matches embedding_dim in the spec
  const size_t kNumActions = 3;    // matches num_actions in the spec
  const string kBadSpec = R"(fixed_feature {
                               vocabulary_size: 50
                               embedding_dim: 5
                               size: 1
                             }
                             num_actions: 3)";
  AddFixedEmbeddingMatrix(0, 50, kEmbeddingDim, 1.0);
  AddWeights("softmax", kEmbeddingDim, kNumActions, 1.0);

  // The softmax bias vector has one element too many.
  AddBiases("softmax", kNumActions + 1 /* bad */, 1.0);

  EXPECT_THAT(Run(kBadSpec),
              test::IsErrorWithSubstr(
                  "Bias vector shape does not match output dimension"));
}
// Tests that FeedForwardNetwork fails when the value of the "layer_norm_input"
// option is not false.
TEST_F(FeedForwardNetworkTest, UnsupportedLayerNormInputOption) {
  const string kBadSpec = R"(network_unit {
                               parameters {
                                 key: 'layer_norm_input'
                                 value: 'true'
                               }
                             })";

  // The runtime implementation rejects layer normalization outright.
  EXPECT_THAT(Run(kBadSpec),
              test::IsErrorWithSubstr("Layer norm is not supported"));
}
// Tests that FeedForwardNetwork fails when the value of the "layer_norm_hidden"
// option is not false.
TEST_F(FeedForwardNetworkTest, UnsupportedLayerNormHiddenOption) {
  const string kBadSpec = R"(network_unit {
                               parameters {
                                 key: 'layer_norm_hidden'
                                 value: 'true'
                               }
                             })";

  // The runtime implementation rejects layer normalization outright.
  EXPECT_THAT(Run(kBadSpec),
              test::IsErrorWithSubstr("Layer norm is not supported"));
}
// Tests that FeedForwardNetwork fails when the value of the "nonlinearity"
// option is not "relu".
TEST_F(FeedForwardNetworkTest, UnsupportedNonlinearityOption) {
  const string kBadSpec = R"(network_unit {
                               parameters {
                                 key: 'nonlinearity'
                                 value: 'elu'
                               }
                             })";

  // Only ReLU is supported; any other activation is an error.
  EXPECT_THAT(Run(kBadSpec),
              test::IsErrorWithSubstr("Non-linearity is not supported"));
}
// Tests that the FeedForwardNetwork works when there are no hidden layers, just
// a softmax that computes logits.
TEST_F(FeedForwardNetworkTest, JustLogits) {
  const size_t kInputDim = 5;
  const size_t kLogitsDim = 3;
  const string kSpec = R"(fixed_feature {
                            vocabulary_size: 50
                            embedding_dim: 5
                            size: 1
                          }
                          num_actions: 3)";

  // Constant fill values, so the expected output is easy to compute.
  const float kEmbedding = 1.25;
  const float kFeature = 0.5;
  const float kWeight = 1.5;
  const float kBias = 0.75;
  AddFixedEmbeddingMatrix(0, 50, kInputDim, kEmbedding);
  AddWeights("softmax", kInputDim, kLogitsDim, kWeight);
  AddBiases("softmax", kLogitsDim, kBias);

  // Extract a single feature with ID 1 and weight |kFeature|.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{1, kFeature}})));

  TF_ASSERT_OK(Run(kSpec));
  EXPECT_EQ("logits", network_unit_->GetLogitsName());

  // Every logit is the dot product of the weighted input embedding with a
  // column of constant weights, plus the constant bias.
  const float kExpectedLogit =
      kInputDim * kEmbedding * kFeature * kWeight + kBias;
  ExpectVector(GetActivations("logits"), kLogitsDim, kExpectedLogit);
}
// Tests that the FeedForwardNetwork works with multiple hidden layers as well
// as a softmax that computes logits.
TEST_F(FeedForwardNetworkTest, MultiLayer) {
  // Layer dimensions: input, hidden 0, hidden 1, logits.
  const size_t kDims[] = {5, 4, 3, 2};
  const string kSpec = R"(fixed_feature {
                            vocabulary_size: 50
                            embedding_dim: 5
                            size: 1
                          }
                          network_unit {
                            parameters {
                              key: 'hidden_layer_sizes'
                              value: '4,3'
                            }
                          }
                          num_actions: 2)";

  // Per-layer constant fill values for weights and biases, so the expected
  // activations can be computed in closed form below.
  const float kWeights[] = {-1.5, 1.0, 0.5};
  const float kBiases[] = {0.75, -0.5, -1.0};
  AddFixedEmbeddingMatrix(0, 50, 5, 1.0);
  AddWeights("0", kDims[0], kDims[1], kWeights[0]);
  AddBiases("0", kDims[1], kBiases[0]);
  AddWeights("1", kDims[1], kDims[2], kWeights[1]);
  AddBiases("1", kDims[2], kBiases[1]);
  AddWeights("softmax", kDims[2], kDims[3], kWeights[2]);
  AddBiases("softmax", kDims[3], kBiases[2]);

  // Extract a single feature with ID 1 and weight 1.0.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{1, 1.0}})));
  TF_ASSERT_OK(Run(kSpec));
  EXPECT_EQ("logits", network_unit_->GetLogitsName());

  // With constant inputs and weights, every unit of a layer has the same
  // activation: dot product of the previous layer (dimension times constant
  // value) with constant weights, plus bias, passed through ReLU.
  float expected = Relu(kDims[0] * kWeights[0] + kBiases[0]);
  ExpectVector(GetActivations("layer_0"), kDims[1], expected);
  expected = Relu(kDims[1] * expected * kWeights[1] + kBiases[1]);
  ExpectVector(GetActivations("layer_1"), kDims[2], expected);

  // "last_layer" aliases the final hidden layer.
  ExpectVector(GetActivations("last_layer"), kDims[2], expected);

  // The logits layer has no ReLU.
  expected = kDims[2] * expected * kWeights[2] + kBiases[2];
  ExpectVector(GetActivations("logits"), kDims[3], expected);
}
// Tests that the FeedForwardNetwork does not produce logits and does not use
// the softmax variables when the component is deterministic.
TEST_F(FeedForwardNetworkTest, NoLogitsOrSoftmaxWhenDeterministic) {
  // Layer dimensions: input and single hidden layer.  num_actions=1 makes the
  // component deterministic.
  const size_t kDims[] = {5, 4};
  const string kSpec = R"(num_actions: 1
                          fixed_feature {
                            vocabulary_size: 50
                            embedding_dim: 5
                            size: 1
                          }
                          network_unit {
                            parameters {
                              key: 'hidden_layer_sizes'
                              value: '4'
                            }
                          })";

  // Constant fill values, so the expected output is easy to compute.
  const float kEmbedding = 1.25;
  const float kFeature = 0.5;
  const float kWeight = -1.5;
  const float kBias = 0.75;
  AddFixedEmbeddingMatrix(0, 50, kDims[0], kEmbedding);

  // No "softmax" weights or biases.  If the network unit tried to use them,
  // initialization would fail on the missing variables.
  AddWeights("0", kDims[0], kDims[1], kWeight);
  AddBiases("0", kDims[1], kBias);

  // Extract a single feature with ID 1 and weight |kFeature|.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{1, kFeature}})));
  TF_ASSERT_OK(Run(kSpec));

  // No specified logits layer.
  EXPECT_TRUE(network_unit_->GetLogitsName().empty());

  // No "logits" layer.
  size_t unused_dimension = 0;
  LayerHandle<float> unused_handle;
  EXPECT_THAT(network_state_manager_.LookupLayer(kTestComponentName, "logits",
                                                 &unused_dimension,
                                                 &unused_handle),
              test::IsErrorWithSubstr(
                  "Unknown layer 'logits' in component 'test_component'"));

  // Hidden layer is still produced.
  const float kExpected =
      Relu(kDims[0] * kEmbedding * kFeature * kWeight + kBias);
  ExpectVector(GetActivations("layer_0"), kDims[1], kExpected);
  ExpectVector(GetActivations("last_layer"), kDims[1], kExpected);
}
// Tests that the FeedForwardNetwork does not produce logits when omit_logits is
// true, even if there are actions.
TEST_F(FeedForwardNetworkTest, NoLogitsOrSoftmaxWhenOmitLogitsTrue) {
  // Layer dimensions: input and single hidden layer.  num_actions=10 would
  // normally produce logits, but omit_logits=true suppresses them.
  const size_t kDims[] = {5, 4};
  const string kSpec = R"(fixed_feature {
                            vocabulary_size: 50
                            embedding_dim: 5
                            size: 1
                          }
                          network_unit {
                            parameters {
                              key: 'hidden_layer_sizes'
                              value: '4'
                            }
                            parameters {
                              key: 'omit_logits'
                              value: 'true'
                            }
                          }
                          num_actions: 10)";

  // Constant fill values, so the expected output is easy to compute.
  const float kEmbedding = 1.25;
  const float kFeature = 0.5;
  const float kWeight = 1.5;
  const float kBias = 0.75;
  AddFixedEmbeddingMatrix(0, 50, kDims[0], kEmbedding);

  // No "softmax" weights or biases.  If the network unit tried to use them,
  // initialization would fail on the missing variables.
  AddWeights("0", kDims[0], kDims[1], kWeight);
  AddBiases("0", kDims[1], kBias);

  // Extract a single feature with ID 1 and weight |kFeature|.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{1, kFeature}})));
  TF_ASSERT_OK(Run(kSpec));

  // No specified logits layer.
  EXPECT_TRUE(network_unit_->GetLogitsName().empty());

  // No "logits" layer.
  size_t unused_dimension = 0;
  LayerHandle<float> unused_handle;
  EXPECT_THAT(network_state_manager_.LookupLayer(kTestComponentName, "logits",
                                                 &unused_dimension,
                                                 &unused_handle),
              test::IsErrorWithSubstr(
                  "Unknown layer 'logits' in component 'test_component'"));

  // Hidden layer is still produced.  NOTE(review): unlike the deterministic
  // test above, the expected value here is not wrapped in Relu(); with these
  // all-positive fill values the pre-activation is positive, so the result is
  // the same either way.
  const float kExpected = kDims[0] * kEmbedding * kFeature * kWeight + kBias;
  ExpectVector(GetActivations("layer_0"), kDims[1], kExpected);
  ExpectVector(GetActivations("last_layer"), kDims[1], kExpected);
}
}
// namespace
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/file_array_variable_store.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/file_array_variable_store.h"
#include <string.h>
#include <utility>
#include "tensorflow/core/lib/core/errors.h"
#include "tensorflow/core/platform/env.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
tensorflow::Status FileArrayVariableStore::Reset(
    const ArrayVariableStoreSpec &spec, const string &path) {
  // Slurp the entire variable file into memory.
  string file_contents;
  TF_RETURN_IF_ERROR(tensorflow::ReadFileToString(tensorflow::Env::Default(),
                                                  path, &file_contents));

  // Copy the bytes into an aligned allocation, then hand the base class a view
  // of that allocation.
  UniqueAlignedArray aligned_bytes;
  aligned_bytes.Reset(file_contents.size());
  memcpy(aligned_bytes.view().data(), file_contents.data(),
         file_contents.size());
  TF_RETURN_IF_ERROR(
      ArrayVariableStore::Reset(spec, AlignedView(aligned_bytes.view())));

  // Success; make modifications.  The base class holds views into this array,
  // so take ownership of it only after everything else succeeded.
  data_ = std::move(aligned_bytes);
  return tensorflow::Status::OK();
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/file_array_variable_store.h
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#ifndef DRAGNN_RUNTIME_FILE_ARRAY_VARIABLE_STORE_H_
#define DRAGNN_RUNTIME_FILE_ARRAY_VARIABLE_STORE_H_
#include <string>
#include "dragnn/protos/runtime.pb.h"
#include "dragnn/runtime/alignment.h"
#include "dragnn/runtime/array_variable_store.h"
#include "syntaxnet/base.h"
#include "tensorflow/core/lib/core/status.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// An ArrayVariableStore subclass that reads a file into a new-allocated array.
class FileArrayVariableStore : public ArrayVariableStore {
 public:
  // Creates an uninitialized store.
  FileArrayVariableStore() = default;

  // Resets this to represent the variables defined by the |spec|, loading the
  // byte array from the |path|.  On error, returns non-OK and modifies nothing.
  tensorflow::Status Reset(const ArrayVariableStoreSpec &spec,
                           const string &path);

 private:
  // The byte array containing the variables.  The base class is Reset() with a
  // view into this array, so it must remain alive while the store is in use.
  UniqueAlignedArray data_;
};
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
#endif // DRAGNN_RUNTIME_FILE_ARRAY_VARIABLE_STORE_H_
research/syntaxnet/dragnn/runtime/fixed_embeddings.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/fixed_embeddings.h"
#include <string.h>
#include <algorithm>
#include <limits>
#include <utility>
#include "dragnn/runtime/math/arithmetic.h"
#include "tensorflow/core/lib/core/errors.h"
#include "tensorflow/core/lib/gtl/array_slice.h"
#include "tensorflow/core/lib/strings/strcat.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
namespace
{
// Returns the name of the embedding matrix variable for the |channel_id|'th
// fixed feature channel of the |component_spec|.
string FixedEmbeddingMatrixVariableName(const ComponentSpec &component_spec,
                                        int channel_id) {
  // Cf. _add_hooks_for_fixed_embedding_matrix() in runtime_support.py.
  const string &component_name = component_spec.name();
  return tensorflow::strings::StrCat(
      component_name, "/fixed_embedding_matrix_", channel_id, "/trimmed");
}
// Resizes the |buffer| to hold |size| elements and returns a pointer to its
// underlying array.  Helper for the allocator functors used by
// ComputeSession::GetInputFeatures().
template <class T>
T *Alloc(int size, std::vector<T> *buffer) {
  buffer->resize(size);
  T *const array = buffer->data();
  return array;
}
// Returns true if the two pointers refer to the same address.
bool SameAddress(const void *lhs, const void *rhs) { return lhs == rhs; }

// Number of IDs to allow per embedding.
constexpr size_t kMaxNumFeatureIds = 1;
}
// namespace
tensorflow::Status FixedEmbeddingManager::Reset(
    const ComponentSpec &component_spec, VariableStore *variable_store,
    NetworkStateManager *network_state_manager) {
  const int num_channels = component_spec.fixed_feature_size();
  std::vector<ChannelConfig> channel_configs(num_channels);
  size_t max_dimension = 0;  // maximum dimension across all channels
  size_t num_embeddings = 0;  // running total of embeddings across channels
  for (int channel_id = 0; channel_id < num_channels; ++channel_id) {
    const FixedFeatureChannel &channel_spec =
        component_spec.fixed_feature(channel_id);
    ChannelConfig &channel_config = channel_configs[channel_id];

    // Every channel must contain at least one embedding.
    if (channel_spec.size() < 1) {
      return tensorflow::errors::InvalidArgument(
          "Invalid channel size for channel ", channel_id, ": ",
          channel_spec.ShortDebugString());
    }

    const size_t channel_size = channel_spec.size();
    channel_config.channel_base = num_embeddings;
    num_embeddings += channel_size;
    channel_config.handles.resize(channel_size);

    // A negative embedding_dim marks a non-embedded channel, which produces
    // raw feature IDs instead of embedding sums.
    channel_config.is_embedded = channel_spec.embedding_dim() >= 0;

    // Configure non-embedded channels separately: each embedding slot gets a
    // local vector of feature IDs instead of an embedding sum.
    if (!channel_config.is_embedded) {
      for (size_t i = 0; i < channel_size; ++i) {
        TF_RETURN_IF_ERROR(network_state_manager->AddLocal(
            kMaxNumFeatureIds, &channel_config.handles[i].ids));
      }
      continue;
    }

    // The remainder of the loop configures embedded channels.
    const size_t dimension = channel_spec.embedding_dim();
    max_dimension = std::max(max_dimension, dimension);

    // Add a local sum vector for each embedding in the channel.
    for (size_t i = 0; i < channel_size; ++i) {
      TF_RETURN_IF_ERROR(network_state_manager->AddLocal(
          dimension, &channel_config.handles[i].sum));
    }

    // Look up the embedding matrix shared by all embeddings in this channel,
    // and check that its shape agrees with the ComponentSpec.
    Matrix<float> &embedding_matrix = channel_config.embedding_matrix;
    TF_RETURN_IF_ERROR(variable_store->Lookup(
        FixedEmbeddingMatrixVariableName(component_spec, channel_id),
        &embedding_matrix));
    if (embedding_matrix.num_rows() != channel_spec.vocabulary_size()) {
      return tensorflow::errors::InvalidArgument(
          "ComponentSpec (", channel_spec.vocabulary_size(),
          ") and VariableStore (", embedding_matrix.num_rows(),
          ") disagree on vocabulary size for channel ", channel_id, ": ",
          channel_spec.ShortDebugString());
    }
    if (embedding_matrix.num_columns() != dimension) {
      return tensorflow::errors::InvalidArgument(
          "ComponentSpec (", dimension, ") and VariableStore (",
          embedding_matrix.num_columns(),
          ") disagree on embedding dim for channel ", channel_id, ": ",
          channel_spec.ShortDebugString());
    }
  }

  // Success; make modifications.  Nothing above touched member state, so an
  // early error return leaves this unmodified.
  component_name_ = component_spec.name();
  num_embeddings_ = num_embeddings;
  channel_configs_ = std::move(channel_configs);

  // |zeros_| must be large enough to stand in for the widest embedding vector.
  zeros_.Resize(max_dimension * sizeof(float));
  memset(zeros_.view().data(), 0, zeros_.view().size());
  return tensorflow::Status::OK();
}
tensorflow::Status FixedEmbeddings::Reset(const FixedEmbeddingManager *manager,
                                          const NetworkStates &network_states,
                                          ComputeSession *compute_session) {
  // Shared all-zero vector used as the initial value of every embedding sum.
  const AlignedView zeros(manager->zeros_.view());
  const size_t num_channels = manager->num_channels();
  features_.clear();
  features_.reserve(manager->num_embeddings());
  for (size_t channel_id = 0; channel_id < num_channels; ++channel_id) {
    const FixedEmbeddingManager::ChannelConfig &channel_config =
        manager->channel_configs_[channel_id];
    const std::vector<FixedEmbeddingManager::Handle> &handles =
        channel_config.handles;
    const size_t channel_base = channel_config.channel_base;
    const size_t channel_size = handles.size();
    DCHECK_EQ(channel_base, features_.size());
    DCHECK_LE(channel_base + channel_size, manager->num_embeddings());

    // Extract the (index, ID, weight) triples for this channel into the
    // parallel arrays |indices_|, |ids_|, and |weights_|.
    const int num_features = compute_session->GetInputFeatures(
        manager->component_name(),
        [this](int size) { return Alloc(size, &indices_); },
        [this](int size) { return Alloc(size, &ids_); },
        [this](int size) { return Alloc(size, &weights_); }, channel_id);
    DCHECK_EQ(num_features, indices_.size());
    DCHECK_EQ(num_features, ids_.size());
    DCHECK_EQ(num_features, weights_.size());
    DCHECK(std::all_of(indices_.begin(), indices_.end(),
                       [channel_size](int32 index) {
                         return index >= 0 && index < channel_size;
                       }));

    // Handle non-embedded channels separately.  Each embedding slot must
    // receive exactly one feature ID with weight 1.0.
    if (!channel_config.is_embedded) {
      for (size_t index = 0; index < channel_size; ++index) {
        features_.emplace_back(/*is_embedded=*/false);
        features_.back().ids = network_states.GetLocal(handles[index].ids);
        features_.back().ids[0] = -1;  // so we can check that all IDs are set
      }
      for (int feature = 0; feature < num_features; ++feature) {
        const int32 index = indices_[feature];
        const int64 id = ids_[feature];

        // IDs are stored as int32, so reject IDs outside the int32 range.
        if (id < 0 || id > std::numeric_limits<int32>::max()) {
          return tensorflow::errors::Internal(
              "Component '", manager->component_name_, "' channel ",
              channel_id, " index ", index,
              ": Invalid non-embedded feature ID ", id);
        }
        const float weight = weights_[feature];
        if (weight != 1.0) {
          return tensorflow::errors::Internal(
              "Component '", manager->component_name_, "' channel ",
              channel_id, " index ", index,
              ": Invalid non-embedded feature weight ", weight,
              " (expected 1.0)");
        }

        // Each slot may be filled at most once; -1 means "still unset".
        int32 &output_id = features_[channel_base + index].ids[0];
        if (output_id != -1) {
          return tensorflow::errors::Internal(
              "Component '", manager->component_name_, "' channel ",
              channel_id, " index ", index,
              ": Duplicate non-embedded feature ID ", id);
        }
        output_id = id;
      }

      // Verify that every slot was filled.
      for (size_t index = 0; index < channel_size; ++index) {
        if (features_[channel_base + index].ids[0] == -1) {
          return tensorflow::errors::Internal(
              "Component '", manager->component_name_, "' channel ",
              channel_id, " index ", index,
              ": Missing non-embedded feature ID");
        }
      }
      continue;
    }

    // The remainder of the loop handles embedded channels.
    const Matrix<float> &embedding_matrix = channel_config.embedding_matrix;

    // Acquire the local sum operands and initialize embeddings to zero by
    // pointing each one at the shared |zeros| array.
    sums_.resize(channel_size);
    for (size_t i = 0; i < channel_size; ++i) {
      sums_[i] = network_states.GetLocal(handles[i].sum);
      features_.emplace_back(/*is_embedded=*/true);
      features_.back().embedding = Vector<float>(zeros, sums_[i].size());
    }

    // Add in a weighted embedding for each feature.  The extracted features do
    // not have any ordering guarantee (e.g., sorted by |indices|), which makes
    // applying special-case shortcuts difficult, but not impossible.  If the
    // features did have an ordering guarantee, we could use a less intricate
    // algorithm, but it's not clear if it would be much faster.
    for (int feature = 0; feature < num_features; ++feature) {
      const int32 index = indices_[feature];
      const int64 id = ids_[feature];
      const float weight = weights_[feature];
      const Vector<float> row = embedding_matrix.row(id);
      const MutableVector<float> sum = sums_[index];

      // Which array |embedding| points at encodes the state of the sum:
      // |zeros| = no additions yet; an embedding matrix row = one unscaled
      // addition; |sum| = general accumulation in progress.
      Vector<float> &embedding = features_[channel_base + index].embedding;
      if (SameAddress(embedding.data(), zeros.data())) {
        // If the |embedding| points at |zeros|, then this is the first addition
        // so we can use simplified arithmetic.
        if (weight == 1.0) {
          // Trivial scaling: Point at the |row|.
          embedding = row;
        } else {
          // Adding to zero: Scale into the |sum| and point at it.
          ScaleElements(weight, row, sum);
          embedding = sum;
        }
      } else {
        if (!SameAddress(embedding.data(), sum.data())) {
          // If the |embedding| does not point at |zeros| or |sum|, then this is
          // the second addition and we also used the "Trivial scaling" shortcut
          // in the first addition.  Therefore, the |embedding| currently points
          // at another row of the embedding matrix.  Copy that row to |sum| and
          // point at it, so we can add the current row to it.
          memcpy(sum.data(), embedding.data(), sum.size() * sizeof(float));
          embedding = sum;
        }

        // General case: Add to the |sum|, which is aliased by the |embedding|.
        AddScaledElements(weight, row, sum);
      }
      DCHECK_EQ(embedding.size(), embedding_matrix.num_columns());
    }
  }
  return tensorflow::Status::OK();
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/fixed_embeddings.h
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
// Utils for extracting and embedding fixed features.
//
// Fixed feature embeddings are organized into channels, where each channel
// contains of a fixed number of embedding vectors. Each embedding, in turn, is
// the feature-weighted sum of the rows of an embedding matrix. Note that a
// multi-embedding channel shares the same embedding matrix across all of its
// embedding vectors.
//
// Logically, a multi-embedding channel is the concatenation of its embedding
// vectors. For efficiency, however, the utils here do not actually perform
// this concatenation. The rationale is that almost all downstream use cases
// will concatenate the fixed and linked embeddings together, "wasting" any
// concatenation here.
//
// Instead, the utils here merge the embedding vectors of all channels into a
// single list, such that the concatenation of this list is equivalent to the
// concatenation of the channels. Individual channels can still be accessed,
// when needed, as sub-spans of the list of embedding vectors.
//
// If FixedFeatureChannel.embedding_dim=-1, then the associated fixed feature
// channel is non-embedded. Instead of producing sums of embedding vectors, a
// non-embedded channel produces feature IDs. The features in a non-embedded
// channel must extract exactly one feature ID with weight=1.0.
//
// TODO(googleuser): Support zero/multiple/weighted non-embedded features?
#ifndef DRAGNN_RUNTIME_FIXED_EMBEDDINGS_H_
#define DRAGNN_RUNTIME_FIXED_EMBEDDINGS_H_
#include <stddef.h>
#include <string>
#include <vector>
#include "dragnn/core/compute_session.h"
#include "dragnn/protos/spec.pb.h"
#include "dragnn/runtime/alignment.h"
#include "dragnn/runtime/math/types.h"
#include "dragnn/runtime/network_states.h"
#include "dragnn/runtime/variable_store.h"
#include "syntaxnet/base.h"
#include "tensorflow/core/lib/core/status.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// A class that manages a set of embedded fixed features for some component.
// Feature embeddings can be extracted using FixedEmbeddings, defined below.
class FixedEmbeddingManager {
 public:
  // Creates an empty manager.
  FixedEmbeddingManager() = default;

  // Resets this to manage the fixed features specified by the |component_spec|.
  // Retrieves embedding matrices from the |variable_store|, which must outlive
  // this.  Adds locals to the |network_state_manager|, which must be positioned
  // at the current component.  Channel ordering follows the |component_spec|.
  // On error, returns non-OK and does not modify this.
  tensorflow::Status Reset(const ComponentSpec &component_spec,
                           VariableStore *variable_store,
                           NetworkStateManager *network_state_manager);

  // Accessors.
  const string &component_name() const { return component_name_; }
  size_t num_channels() const { return channel_configs_.size(); }
  size_t embedding_dim(size_t channel_id) const;
  size_t num_embeddings() const { return num_embeddings_; }
  size_t channel_base(size_t channel_id) const;
  size_t channel_size(size_t channel_id) const;
  bool is_embedded(size_t channel_id) const;
  LocalVectorHandle<int32> id_handle(size_t channel_id, size_t index) const;

 private:
  friend class FixedEmbeddings;
  friend class SequenceFeatureManager;

  // Handles for the features in a channel.  Only one handle is used.
  struct Handle {
    // Embedding sum handle.  Only used if |ChannelConfig.is_embedded| is true.
    LocalVectorHandle<float> sum;

    // Feature ID handle.  Only used if |ChannelConfig.is_embedded| is false.
    LocalVectorHandle<int32> ids;
  };

  // Configuration for a single fixed embedding channel.
  struct ChannelConfig {
    // Index of the first embedding vector in this channel.
    size_t channel_base = 0;

    // Whether this channel is embedded.
    bool is_embedded = true;

    // Handles for each embedding in the channel.  The active member of each
    // handle is determined by |is_embedded|.
    std::vector<Handle> handles;

    // Embedding matrix of this channel.  Only used if |is_embedded| is true.
    Matrix<float> embedding_matrix;
  };

  // Name of the component for which features are extracted.
  string component_name_;

  // Total number of embedding vectors across all channels.
  size_t num_embeddings_ = 0;

  // Ordered list of configurations for each channel.
  std::vector<ChannelConfig> channel_configs_;

  // Array of zeros that can be substituted for any embedding vector, in the
  // case that no features are extracted.
  UniqueAlignedArray zeros_;
};
// A set of embedded fixed features, configured via the FixedEmbeddingManager.
class FixedEmbeddings {
 public:
  // Creates an empty set of embedded features.
  FixedEmbeddings() = default;

  // Resets this to the embedded features managed by the |manager|.  Retrieves
  // local operands from the |network_states| and extracts features from the
  // |compute_session|; both must be positioned at the relevant component.  The
  // |manager| must live until this is destroyed or Reset(), and should not be
  // modified during that time.  On error, returns non-OK.
  tensorflow::Status Reset(const FixedEmbeddingManager *manager,
                           const NetworkStates &network_states,
                           ComputeSession *compute_session);

  // Accessors.
  size_t num_embeddings() const { return features_.size(); }
  Vector<float> embedding(size_t index) const;
  Vector<int32> ids(size_t index) const;

 private:
  // Data for a feature in a channel.
  struct Feature {
    // Creates a possibly-embedded feature.
    explicit Feature(bool is_embedded) : is_embedded(is_embedded) {}

    // Whether this feature is embedded.
    const bool is_embedded;

    // Weighted embedding sum.  Only used if |is_embedded| is true.
    Vector<float> embedding;

    // Singleton vector of feature IDs.  Only used if |is_embedded| is false.
    // This is mutable to simplify construction.  Recall that a non-embedded
    // channel must extract exactly one feature ID with weight=1.0.
    MutableVector<int32> ids;
  };

  // The following three arrays are the same length, with exactly one element
  // per feature.  For the i'th extracted feature, |indices_[i]| is the index
  // of the embedding vector it should be added to, |ids_[i]| is its sparse ID,
  // and |weights_[i]| is its weight.  These are reused by each channel.
  std::vector<int32> indices_;
  std::vector<int64> ids_;
  std::vector<float> weights_;

  // List of fixed embedding sums, reused by each channel.
  std::vector<MutableVector<float>> sums_;

  // Ordered list of features, merged across all channels.
  std::vector<Feature> features_;
};
// Implementation details below.
inline size_t FixedEmbeddingManager::embedding_dim(size_t channel_id) const {
  // NB: A multi-embedding channel is logically a concatenation of its embedding
  // vectors, so its dimension must be scaled accordingly.  On the other hand, a
  // non-embedded feature is assumed to have dimension=1, as in TF-based DRAGNN;
  // see NetworkUnitInterface.__init__().
  const ChannelConfig &channel = channel_configs_[channel_id];
  size_t dim_per_embedding = 1;  // non-embedded features have dimension 1
  if (channel.is_embedded) {
    dim_per_embedding = channel.embedding_matrix.num_columns();
  }
  return dim_per_embedding * channel_size(channel_id);
}
// Returns the index of the first embedding of the |channel_id|'th channel.
inline size_t FixedEmbeddingManager::channel_base(size_t channel_id) const {
  const ChannelConfig &config = channel_configs_[channel_id];
  return config.channel_base;
}
// Returns the number of features in the |channel_id|'th channel; one handle
// is allocated per feature.
inline size_t FixedEmbeddingManager::channel_size(size_t channel_id) const {
  const ChannelConfig &config = channel_configs_[channel_id];
  return config.handles.size();
}
// Returns true if the |channel_id|'th channel sums embedding rows, and false
// if it only records raw feature IDs.
inline bool FixedEmbeddingManager::is_embedded(size_t channel_id) const {
  const ChannelConfig &config = channel_configs_[channel_id];
  return config.is_embedded;
}
// Returns the ID vector handle for the |index|'th feature of the
// |channel_id|'th channel.  Only valid for non-embedded channels.
inline LocalVectorHandle<int32> FixedEmbeddingManager::id_handle(
    size_t channel_id, size_t index) const {
  DCHECK(!is_embedded(channel_id));
  const ChannelConfig &config = channel_configs_[channel_id];
  return config.handles[index].ids;
}
// Returns the weighted embedding sum of the |index|'th feature, which must be
// an embedded feature.
inline Vector<float> FixedEmbeddings::embedding(size_t index) const {
  const Feature &feature = features_[index];
  DCHECK(feature.is_embedded);
  return feature.embedding;
}
// Returns the singleton ID vector of the |index|'th feature, which must be a
// non-embedded feature.  Converts the mutable internal vector to a read-only
// view.
inline Vector<int32> FixedEmbeddings::ids(size_t index) const {
  const Feature &feature = features_[index];
  DCHECK(!feature.is_embedded);
  return Vector<int32>(feature.ids);
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
#endif // DRAGNN_RUNTIME_FIXED_EMBEDDINGS_H_
research/syntaxnet/dragnn/runtime/fixed_embeddings_test.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/fixed_embeddings.h"
#include <string>
#include <utility>
#include <vector>
#include "dragnn/core/test/generic.h"
#include "dragnn/protos/spec.pb.h"
#include "dragnn/runtime/test/network_test_base.h"
#include "syntaxnet/base.h"
#include <gmock/gmock.h>
#include "tensorflow/core/lib/core/errors.h"
#include "tensorflow/core/lib/core/status.h"
#include "tensorflow/core/lib/core/status_test_util.h"
#include "tensorflow/core/lib/strings/strcat.h"
#include "tensorflow/core/platform/logging.h"
#include "tensorflow/core/platform/test.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
namespace
{
using ::testing::_;
using ::testing::Invoke;

// A working one-channel ComponentSpec.
const char kSingleSpec[] = R"(fixed_feature {
vocabulary_size: 11
embedding_dim: 35
size: 1
})";
// Dimensions of the embedding matrix matching |kSingleSpec|.
const size_t kSingleRows = 11;
const size_t kSingleColumns = 35;

// A working multi-channel ComponentSpec.
const char kMultiSpec[] = R"(fixed_feature {
vocabulary_size: 13
embedding_dim: 11
size: 1
}
fixed_feature {
vocabulary_size: 19
embedding_dim: 17
size: 3
}
fixed_feature {
vocabulary_size: 29
embedding_dim: 23
size: 2
})";
// Per-channel matrix dimensions matching |kMultiSpec|.
const size_t kMultiRows[] = {13, 19, 29};
const size_t kMultiColumns[] = {11, 17, 23};
// Expected channel bases (cumulative sums of |kMultiSizes|) and sizes.
const size_t kMultiBases[] = {0, 1, 4};
const size_t kMultiSizes[] = {1, 3, 2};
const int kMultiNumChannels = 3;
// Total number of embeddings: sum of |kMultiSizes|.
const int kMultiNumEmbeddings = 6;

// A working one-channel ComponentSpec with non-embedded features.
const char kNonEmbeddedSpec[] = R"(fixed_feature {
embedding_dim: -1
size: 3
})";
// Test fixture that provides a FixedEmbeddingManager plus the variable store
// and network-state manager needed to reset it.
class FixedEmbeddingManagerTest : public NetworkTestBase {
 protected:
  // Resets the |manager_| and returns the result of Reset()-ing it using the
  // |component_spec_text|, |variable_store_|, and |network_state_manager_|.
  tensorflow::Status ResetManager(const string &component_spec_text) {
    ComponentSpec component_spec;
    CHECK(TextFormat::ParseFromString(component_spec_text, &component_spec));
    component_spec.set_name(kTestComponentName);

    AddComponent(kTestComponentName);
    return manager_.Reset(component_spec, &variable_store_,
                          &network_state_manager_);
  }

  // The manager under test.
  FixedEmbeddingManager manager_;
};
// Tests that FixedEmbeddingManager is empty by default.
TEST_F(FixedEmbeddingManagerTest, EmptyByDefault) {
  EXPECT_EQ(manager_.num_channels(), 0);
  EXPECT_EQ(manager_.num_embeddings(), 0);
}

// Tests that FixedEmbeddingManager is empty when reset to an empty spec.
TEST_F(FixedEmbeddingManagerTest, EmptySpec) {
  TF_EXPECT_OK(ResetManager(""));

  EXPECT_EQ(manager_.component_name(), kTestComponentName);
  EXPECT_EQ(manager_.num_channels(), 0);
  EXPECT_EQ(manager_.num_embeddings(), 0);
}

// Tests that FixedEmbeddingManager produces the correct embedding dimension
// when configured with a single channel.
TEST_F(FixedEmbeddingManagerTest, OneChannel) {
  AddFixedEmbeddingMatrix(0, kSingleRows, kSingleColumns, 0.25);

  TF_EXPECT_OK(ResetManager(kSingleSpec));

  EXPECT_EQ(manager_.component_name(), kTestComponentName);
  EXPECT_EQ(manager_.num_channels(), 1);
  EXPECT_EQ(manager_.embedding_dim(0), kSingleColumns);
  EXPECT_EQ(manager_.num_embeddings(), 1);
  EXPECT_EQ(manager_.channel_base(0), 0);
  EXPECT_EQ(manager_.channel_size(0), 1);
  EXPECT_TRUE(manager_.is_embedded(0));
}

// Tests that FixedEmbeddingManager produces the correct embedding dimensions
// when configured with multiple channels.
TEST_F(FixedEmbeddingManagerTest, MultipleChannels) {
  for (int i = 0; i < kMultiNumChannels; ++i) {
    AddFixedEmbeddingMatrix(i, kMultiRows[i], kMultiColumns[i], -1.0);
  }

  TF_EXPECT_OK(ResetManager(kMultiSpec));

  EXPECT_EQ(manager_.component_name(), kTestComponentName);
  EXPECT_EQ(manager_.num_channels(), kMultiNumChannels);
  EXPECT_EQ(manager_.num_embeddings(), kMultiNumEmbeddings);
  for (int i = 0; i < kMultiNumChannels; ++i) {
    // NB: A multi-feature channel's dimension is scaled by its size.
    EXPECT_EQ(manager_.embedding_dim(i), kMultiColumns[i] * kMultiSizes[i]);
    EXPECT_EQ(manager_.channel_base(i), kMultiBases[i]);
    EXPECT_EQ(manager_.channel_size(i), kMultiSizes[i]);
    EXPECT_TRUE(manager_.is_embedded(i));
  }
}

// Tests that FixedEmbeddingManager works for non-embedded features.
TEST_F(FixedEmbeddingManagerTest, NonEmbeddedFeature) {
  TF_ASSERT_OK(ResetManager(kNonEmbeddedSpec));

  EXPECT_EQ(manager_.component_name(), kTestComponentName);
  EXPECT_EQ(manager_.num_channels(), 1);
  // Non-embedded features have dimension=1, so the channel dim equals size=3.
  EXPECT_EQ(manager_.embedding_dim(0), 3);
  EXPECT_EQ(manager_.num_embeddings(), 3);
  EXPECT_EQ(manager_.channel_base(0), 0);
  EXPECT_EQ(manager_.channel_size(0), 3);
  EXPECT_FALSE(manager_.is_embedded(0));
}

// Tests that FixedEmbeddingManager fails when there are no embedding matrices.
TEST_F(FixedEmbeddingManagerTest, NoEmbeddingMatrices) {
  EXPECT_THAT(ResetManager(kSingleSpec),
              test::IsErrorWithSubstr("Unknown variable"));
}

// Tests that FixedEmbeddingManager fails when there are embedding matrices, but
// not for the right channel.
TEST_F(FixedEmbeddingManagerTest, MissingEmbeddingMatrix) {
  AddFixedEmbeddingMatrix(/* bad */ 1, kSingleRows, kSingleColumns, 0.25);

  EXPECT_THAT(ResetManager(kSingleSpec),
              test::IsErrorWithSubstr("Unknown variable"));
}

// Tests that FixedEmbeddingManager fails when the channel size is 0.
TEST_F(FixedEmbeddingManagerTest, InvalidChannelSize) {
  const string kBadSpec = R"(fixed_feature {
vocabulary_size: 8
embedding_dim: 16
size: 0 # bad
})";
  AddFixedEmbeddingMatrix(0, 8, 16, 0.25);

  EXPECT_THAT(ResetManager(kBadSpec),
              test::IsErrorWithSubstr("Invalid channel size"));
}

// Tests that the FixedEmbeddingManager fails when the embedding dimension does
// not match the embedding matrix.
TEST_F(FixedEmbeddingManagerTest, MismatchedEmbeddingDim) {
  const string kBadSpec = R"(fixed_feature {
vocabulary_size: 8
embedding_dim: 17 # bad
size: 1
})";
  AddFixedEmbeddingMatrix(0, 8, 16, 0.25);

  EXPECT_THAT(ResetManager(kBadSpec),
              test::IsErrorWithSubstr("ComponentSpec (17) and VariableStore "
                                      "(16) disagree on embedding dim"));
}

// Tests that the FixedEmbeddingManager fails when the vocabulary size does not
// match the embedding matrix.
TEST_F(FixedEmbeddingManagerTest, MismatchedVocabularySize) {
  const string kBadSpec = R"(fixed_feature {
vocabulary_size: 7 # bad
embedding_dim: 16
size: 1
})";
  AddFixedEmbeddingMatrix(0, 8, 16, 0.25);

  EXPECT_THAT(ResetManager(kBadSpec),
              test::IsErrorWithSubstr("ComponentSpec (7) and VariableStore "
                                      "(8) disagree on vocabulary size"));
}
// Test fixture that layers a FixedEmbeddings instance on top of the manager
// fixture, plus helpers for building expected embedding sums.
class FixedEmbeddingsTest : public FixedEmbeddingManagerTest {
 protected:
  // Resets the |fixed_embeddings_| using the |manager_|, |network_states_|, and
  // |compute_session_|, and returns the resulting status.
  tensorflow::Status ResetFixedEmbeddings() {
    network_states_.Reset(&network_state_manager_);
    StartComponent(0);
    return fixed_embeddings_.Reset(&manager_, network_states_,
                                   &compute_session_);
  }

  // Returns a list of the expected size and value of each fixed embedding sum,
  // given that the channel-wise sums are the |channel_sums|.
  std::vector<std::pair<size_t, float>> ToEmbeddingSums(
      const std::vector<float> &channel_sums) {
    CHECK_EQ(channel_sums.size(), kMultiNumChannels);
    std::vector<std::pair<size_t, float>> expected_sums;
    // Each feature of a channel shares the channel's dimension and sum.
    for (int channel_id = 0; channel_id < kMultiNumChannels; ++channel_id) {
      for (int i = 0; i < kMultiSizes[channel_id]; ++i) {
        expected_sums.emplace_back(kMultiColumns[channel_id],
                                   channel_sums[channel_id]);
      }
    }
    return expected_sums;
  }

  // As above, but computes the channel sums as the product of |lhs| and |rhs|.
  std::vector<std::pair<size_t, float>> ToEmbeddingSums(
      const std::vector<float> &lhs, const std::vector<float> &rhs) {
    CHECK_EQ(lhs.size(), rhs.size());
    std::vector<float> channel_sums;
    for (int i = 0; i < lhs.size(); ++i) {
      channel_sums.push_back(lhs[i] * rhs[i]);
    }
    return ToEmbeddingSums(channel_sums);
  }

  // The embeddings under test.
  FixedEmbeddings fixed_embeddings_;
};
// Tests that FixedEmbeddings is empty by default.
TEST_F(FixedEmbeddingsTest, EmptyByDefault) {
  EXPECT_EQ(fixed_embeddings_.num_embeddings(), 0);
}

// Tests that FixedEmbeddings is empty when reset with an empty manager.
TEST_F(FixedEmbeddingsTest, EmptyManager) {
  TF_ASSERT_OK(ResetManager(""));
  TF_ASSERT_OK(ResetFixedEmbeddings());

  EXPECT_EQ(fixed_embeddings_.num_embeddings(), 0);
}

// Tests that FixedEmbeddings produces a zero vector when no features are
// extracted.
TEST_F(FixedEmbeddingsTest, OneChannelNoFeatures) {
  AddFixedEmbeddingMatrix(0, kSingleRows, kSingleColumns, 0.5);
  TF_ASSERT_OK(ResetManager(kSingleSpec));

  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {})));

  TF_ASSERT_OK(ResetFixedEmbeddings());
  ASSERT_EQ(fixed_embeddings_.num_embeddings(), 1);
  ExpectVector(fixed_embeddings_.embedding(0), kSingleColumns, 0.0);
}

// Tests that FixedEmbeddings produces a row of the embedding matrix when
// exactly one feature with weight=1 is extracted.
TEST_F(FixedEmbeddingsTest, OneChannelOneFeature) {
  AddFixedEmbeddingMatrix(0, kSingleRows, kSingleColumns, 0.125);
  TF_ASSERT_OK(ResetManager(kSingleSpec));

  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{kSingleRows - 1, 1.0}})));

  TF_ASSERT_OK(ResetFixedEmbeddings());
  ASSERT_EQ(fixed_embeddings_.num_embeddings(), 1);
  ExpectVector(fixed_embeddings_.embedding(0), kSingleColumns, 0.125);
}

// Tests that FixedEmbeddings produces a scaled row of the embedding matrix when
// exactly one feature with weight!=1 is extracted.
TEST_F(FixedEmbeddingsTest, OneChannelOneWeightedFeature) {
  AddFixedEmbeddingMatrix(0, kSingleRows, kSingleColumns, 0.5);
  TF_ASSERT_OK(ResetManager(kSingleSpec));

  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{0, -1.5}})));

  TF_ASSERT_OK(ResetFixedEmbeddings());
  ASSERT_EQ(fixed_embeddings_.num_embeddings(), 1);
  // -0.75 = 0.5 * -1.5.
  ExpectVector(fixed_embeddings_.embedding(0), kSingleColumns, -0.75);
}

// Tests that FixedEmbeddings produces a weighted embedding sum when multiple
// weighted features are extracted.
TEST_F(FixedEmbeddingsTest, OneChannelManyFeatures) {
  AddFixedEmbeddingMatrix(0, kSingleRows, kSingleColumns, 0.5);
  TF_ASSERT_OK(ResetManager(kSingleSpec));

  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{0, 1.0}, {1, -2.0}, {2, 4.0}})));

  const float kSum = 1.5;  // = 0.5 * (1.0 - 2.0 + 4.0)
  TF_ASSERT_OK(ResetFixedEmbeddings());
  ASSERT_EQ(fixed_embeddings_.num_embeddings(), 1);
  ExpectVector(fixed_embeddings_.embedding(0), kSingleColumns, kSum);
}
// Tests that FixedEmbeddings produces zero vectors for multiple channels that
// extract no features.
TEST_F(FixedEmbeddingsTest, ManyChannelsNoFeatures) {
  const std::vector<float> kValues = {0.0, 0.0, 0.0};
  for (int i = 0; i < kMultiNumChannels; ++i) {
    AddFixedEmbeddingMatrix(i, kMultiRows[i], kMultiColumns[i], 1.0);
  }
  TF_ASSERT_OK(ResetManager(kMultiSpec));

  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {})))
      .WillOnce(Invoke(ExtractFeatures(1, {})))
      .WillOnce(Invoke(ExtractFeatures(2, {})));

  TF_ASSERT_OK(ResetFixedEmbeddings());
  const auto kSums = ToEmbeddingSums(kValues);
  ASSERT_EQ(fixed_embeddings_.num_embeddings(), kSums.size());
  for (int i = 0; i < kSums.size(); ++i) {
    ExpectVector(fixed_embeddings_.embedding(i), kSums[i].first,
                 kSums[i].second);
  }
}

// Tests that FixedEmbeddings produces rows of the embedding matrix for multiple
// channels that extract exactly one feature with weight=1.
TEST_F(FixedEmbeddingsTest, ManyChannelsOneFeature) {
  const std::vector<float> kValues = {1.0, -0.5, 0.75};
  ASSERT_EQ(kValues.size(), kMultiNumChannels);
  for (int i = 0; i < kMultiNumChannels; ++i) {
    AddFixedEmbeddingMatrix(i, kMultiRows[i], kMultiColumns[i], kValues[i]);
  }
  TF_ASSERT_OK(ResetManager(kMultiSpec));

  // NB: Sometimes the feature indices are extracted out-of-order.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{0, 10, 1.0}})))
      .WillOnce(Invoke(ExtractFeatures(1, {{1, 11, 1.0},  //
                                           {0, 11, 1.0},  //
                                           {2, 11, 1.0}})))
      .WillOnce(Invoke(ExtractFeatures(2, {{0, 12, 1.0},  //
                                           {1, 12, 1.0}})));

  TF_ASSERT_OK(ResetFixedEmbeddings());
  const auto kSums = ToEmbeddingSums(kValues);
  ASSERT_EQ(fixed_embeddings_.num_embeddings(), kSums.size());
  for (int i = 0; i < kSums.size(); ++i) {
    ExpectVector(fixed_embeddings_.embedding(i), kSums[i].first,
                 kSums[i].second);
  }
}

// Tests that FixedEmbeddings produces scaled rows of the embedding matrix for
// multiple channels that extract exactly one feature with weight!=1.
TEST_F(FixedEmbeddingsTest, ManyChannelsOneWeightedFeature) {
  const std::vector<float> kValues = {1.0, -0.5, 0.75};
  const std::vector<float> kFeatures = {1.25, 0.75, -1.5};
  ASSERT_EQ(kValues.size(), kMultiNumChannels);
  ASSERT_EQ(kFeatures.size(), kMultiNumChannels);
  for (int i = 0; i < kMultiNumChannels; ++i) {
    AddFixedEmbeddingMatrix(i, kMultiRows[i], kMultiColumns[i], kValues[i]);
  }
  TF_ASSERT_OK(ResetManager(kMultiSpec));

  // NB: Sometimes the feature indices are extracted out-of-order.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{0, 10, kFeatures[0]}})))
      .WillOnce(Invoke(ExtractFeatures(1, {{0, 11, kFeatures[1]},  //
                                           {1, 11, kFeatures[1]},  //
                                           {2, 11, kFeatures[1]}})))
      .WillOnce(Invoke(ExtractFeatures(2, {{1, 12, kFeatures[2]},  //
                                           {0, 12, kFeatures[2]}})));

  TF_ASSERT_OK(ResetFixedEmbeddings());
  const auto kSums = ToEmbeddingSums(kValues, kFeatures);
  ASSERT_EQ(fixed_embeddings_.num_embeddings(), kSums.size());
  for (int i = 0; i < kSums.size(); ++i) {
    ExpectVector(fixed_embeddings_.embedding(i), kSums[i].first,
                 kSums[i].second);
  }
}
// Tests that FixedEmbeddings produces weighted embedding sums for multiple
// channels that extract multiple weighted features.
TEST_F(FixedEmbeddingsTest, ManyChannelsManyFeatures) {
  const std::vector<float> kValues = {1.0, -0.5, 0.75};
  ASSERT_EQ(kValues.size(), kMultiNumChannels);
  for (int i = 0; i < kMultiNumChannels; ++i) {
    AddFixedEmbeddingMatrix(i, kMultiRows[i], kMultiColumns[i], kValues[i]);
  }
  TF_ASSERT_OK(ResetManager(kMultiSpec));

  // NB: Sometimes the feature indices are extracted out-of-order.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{0, 0, 1.0},   //
                                           {0, 1, -2.0},  //
                                           {0, 2, 9.0}})))
      .WillOnce(Invoke(ExtractFeatures(1, {{0, 0, 2.0},   //
                                           {1, 1, -4.0},  //
                                           {2, 2, 8.0},   //
                                           {1, 0, 2.0},   //
                                           {2, 1, -4.0},  //
                                           {0, 2, 8.0},   //
                                           {2, 0, 2.0},   //
                                           {0, 1, -4.0},  //
                                           {1, 2, 8.0}})))
      .WillOnce(Invoke(ExtractFeatures(2, {{0, 0, 3.0},   //
                                           {0, 1, -6.0},  //
                                           {0, 2, 7.0},   //
                                           {1, 2, 7.0},   //
                                           {1, 1, -6.0},  //
                                           {1, 0, 3.0}})));

  // Per-channel weighted sums of the feature weights above.
  const std::vector<float> kFeatures = {1.0 - 2.0 + 9.0,  //
                                        2.0 - 4.0 + 8.0,  //
                                        3.0 - 6.0 + 7.0};
  ASSERT_EQ(kFeatures.size(), kMultiNumChannels);
  TF_ASSERT_OK(ResetFixedEmbeddings());
  const auto kSums = ToEmbeddingSums(kValues, kFeatures);
  ASSERT_EQ(fixed_embeddings_.num_embeddings(), kSums.size());
  for (int i = 0; i < kSums.size(); ++i) {
    ExpectVector(fixed_embeddings_.embedding(i), kSums[i].first,
                 kSums[i].second);
  }
}
// Tests that FixedEmbeddings produces feature IDs when configured with a
// non-embedded feature channel.
TEST_F(FixedEmbeddingsTest, NonEmbeddedFeature) {
  TF_ASSERT_OK(ResetManager(kNonEmbeddedSpec));

  // These feature values probe the boundaries of valid feature IDs.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{2, 2147483647, 1.0},  //
                                           {0, 0, 1.0},           //
                                           {1, 34, 1.0}})));

  TF_ASSERT_OK(ResetFixedEmbeddings());
  ASSERT_EQ(fixed_embeddings_.num_embeddings(), 3);
  // IDs are reported in feature-index order, regardless of extraction order.
  ASSERT_EQ(fixed_embeddings_.ids(0).size(), 1);
  EXPECT_EQ(fixed_embeddings_.ids(0)[0], 0);
  ASSERT_EQ(fixed_embeddings_.ids(1).size(), 1);
  EXPECT_EQ(fixed_embeddings_.ids(1)[0], 34);
  ASSERT_EQ(fixed_embeddings_.ids(2).size(), 1);
  EXPECT_EQ(fixed_embeddings_.ids(2)[0], 2147483647);

  // The same IDs are also visible through the manager's local handles.
  Vector<int32> ids;
  ids = network_states_.GetLocal(manager_.id_handle(0, 0));
  ASSERT_EQ(ids.size(), 1);
  EXPECT_EQ(ids[0], 0);
  ids = network_states_.GetLocal(manager_.id_handle(0, 1));
  ASSERT_EQ(ids.size(), 1);
  EXPECT_EQ(ids[0], 34);
  ids = network_states_.GetLocal(manager_.id_handle(0, 2));
  ASSERT_EQ(ids.size(), 1);
  EXPECT_EQ(ids[0], 2147483647);
}
// Tests that FixedEmbeddings fails if a feature ID has a negative ID.
TEST_F(FixedEmbeddingsTest, NonEmbeddedFeatureNegativeId) {
  TF_ASSERT_OK(ResetManager(kNonEmbeddedSpec));

  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{2, -1, 1.0},  //
                                           {0, 12, 1.0},  //
                                           {1, 34, 1.0}})));

  EXPECT_THAT(
      ResetFixedEmbeddings(),
      test::IsErrorWithSubstr(tensorflow::strings::StrCat(
          "Component '", kTestComponentName,
          "' channel 0 index 2: Invalid non-embedded feature ID -1")));
}

// Tests that FixedEmbeddings fails if a feature ID has an ID that is too large.
TEST_F(FixedEmbeddingsTest, NonEmbeddedFeatureIdTooLarge) {
  TF_ASSERT_OK(ResetManager(kNonEmbeddedSpec));

  // 2147483648 == int32 max + 1, so it cannot be stored as an int32 ID.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{2, 56, 1.0},          //
                                           {0, 2147483648, 1.0},  //
                                           {1, 34, 1.0}})));

  EXPECT_THAT(
      ResetFixedEmbeddings(),
      test::IsErrorWithSubstr(tensorflow::strings::StrCat(
          "Component '", kTestComponentName,
          "' channel 0 index 0: Invalid non-embedded feature ID "
          "2147483648")));
}

// Tests that FixedEmbeddings fails if a feature weight is not 1.0.
TEST_F(FixedEmbeddingsTest, NonEmbeddedFeatureNonIdentityWeight) {
  TF_ASSERT_OK(ResetManager(kNonEmbeddedSpec));

  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{2, 56, 1.0},  //
                                           {0, 12, 1.0},  //
                                           {1, 34, 1.5}})));

  EXPECT_THAT(
      ResetFixedEmbeddings(),
      test::IsErrorWithSubstr(tensorflow::strings::StrCat(
          "Component '", kTestComponentName,
          "' channel 0 index 1: Invalid non-embedded feature weight "
          "1.5 (expected 1.0)")));
}

// Tests that FixedEmbeddings fails if a feature ID is duplicated.
TEST_F(FixedEmbeddingsTest, NonEmbeddedFeatureDuplicateId) {
  TF_ASSERT_OK(ResetManager(kNonEmbeddedSpec));

  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{2, 56, 1.0},  //
                                           {2, 56, 1.0},  //
                                           {0, 12, 1.0},  //
                                           {1, 34, 1.0}})));

  EXPECT_THAT(
      ResetFixedEmbeddings(),
      test::IsErrorWithSubstr(tensorflow::strings::StrCat(
          "Component '", kTestComponentName,
          "' channel 0 index 2: Duplicate non-embedded feature ID 56")));
}

// Tests that FixedEmbeddings fails if a feature ID is missing.
TEST_F(FixedEmbeddingsTest, NonEmbeddedFeatureMissingId) {
  TF_ASSERT_OK(ResetManager(kNonEmbeddedSpec));

  // Index 0 of the channel never receives a feature.
  EXPECT_CALL(compute_session_, GetInputFeatures(_, _, _, _, _))
      .WillOnce(Invoke(ExtractFeatures(0, {{2, 56, 1.0},  //
                                           {1, 34, 1.0}})));

  EXPECT_THAT(
      ResetFixedEmbeddings(),
      test::IsErrorWithSubstr(tensorflow::strings::StrCat(
          "Component '", kTestComponentName,
          "' channel 0 index 0: Missing non-embedded feature ID")));
}
}
// namespace
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/flexible_matrix_kernel.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/flexible_matrix_kernel.h"
#include "dragnn/runtime/math/avx_vector_array.h"
#include "tensorflow/core/lib/strings/strcat.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
namespace
{
// Rounds a number, |rows|, up to a multiple of |multiple|. For example,
// PadRows(6, 4) will return 8, because 8 is the nearest number after 6 that is
// divisible by 4. This method requires that |multiple| be positive. It is used
// for pre-calculating the dimension of a blocked matrix, instead of having to
// read the entire matrix.
inline int PadRows(int rows, int multiple) {
  const int num_blocks = (rows + multiple - 1) / multiple;
  return num_blocks * multiple;
}
}
// namespace
// Out-of-line definition of the in-class constexpr array; required for
// ODR-use under pre-C++17 semantics.
constexpr char FlexibleMatrixKernel::kSuffix[];
// Looks up the weight variable named |weights_name| (plus kSuffix) in the
// |variable_store|, preferring the plain non-blocked format and falling back
// to the 32- or 48-row blocked SGEMV formats.  Sets |weights_type_| and the
// matching weights member accordingly.
tensorflow::Status FlexibleMatrixKernel::Initialize(
    const string &debug_name, const string &weights_name, int output_dimension,
    VariableStore *variable_store) {
  padded_output_dimension_ = PadRows(output_dimension, kAvxWidth);

  // Try retrieving the flexible matrix variable using all matrix formats. Only
  // one format will work (see FlexibleMatrixVariableStoreWrapper).
  const string variable_name =
      tensorflow::strings::StrCat(weights_name, kSuffix);

  // Handle the simpler non-blocked case first.
  tensorflow::Status status = variable_store->Lookup(variable_name, &weights_);
  if (status.ok()) {
    LOG(INFO) << "Matrix of size " << weights_.num_rows() << " x "
              << weights_.num_columns() << " for layer " << debug_name
              << " will be computed with non-blocked arithmetic";
    weights_type_ = WeightsType::kNormal;
    return status;
  }

  // Otherwise, we must have a blocked format.
  BlockedMatrix<float> blocked_transpose;
  TF_RETURN_IF_ERROR(
      variable_store->Lookup(variable_name, &blocked_transpose));
  const auto blocked = blocked_transpose.Transpose();

  // Blocked matrices must use a supported block size.
  switch (blocked.block_size()) {
    case 32:
      weights_type_ = WeightsType::kBlocked32;
      status = fast_weights_32_.Initialize(blocked);
      break;
    case 48:
      weights_type_ = WeightsType::kBlocked48;
      status = fast_weights_48_.Initialize(blocked);
      break;
    default:
      return tensorflow::errors::FailedPrecondition(
          "Unsupported block size: ", blocked.block_size(), " for weights ",
          weights_name, " of layer ", debug_name);
  }

  if (status.ok()) {
    LOG(INFO) << "Matrix of size " << blocked.num_rows() << " x "
              << blocked.num_columns() << " for layer " << debug_name
              << " will be computed with SGEMV<block_size="
              << blocked.block_size() << ">";
  } else {
    // This should (almost?) never happen, because SgemvMatrix::Initialize()
    // only fails on bad block sizes, and the switch above ensures that the
    // SgemvMatrix and variable agree on block size.
    LOG(ERROR) << "Error formatting SGEMV matrix: " << status
               << " - matrix size " << blocked.num_rows() << " x "
               << blocked.num_columns() << " for layer " << debug_name;
  }
  return status;
}
// Returns the number of rows of the active weights matrix, including any
// padding added by the blocked formats.
int FlexibleMatrixKernel::NumPaddedRows() const {
  switch (weights_type_) {
    case WeightsType::kNormal:
      return weights_.num_rows();
    case WeightsType::kBlocked32:
      return fast_weights_32_.matrix().num_rows();
    case WeightsType::kBlocked48:
      return fast_weights_48_.matrix().num_rows();
  }

  // All enumerators are handled above.  This fallback avoids undefined
  // behavior (and -Wreturn-type warnings) if |weights_type_| is ever given an
  // out-of-range value.
  return 0;
}
// Returns the number of columns of the active weights matrix; columns are
// never padded.
int FlexibleMatrixKernel::NumColumns() const {
  switch (weights_type_) {
    case WeightsType::kNormal:
      return weights_.num_columns();
    case WeightsType::kBlocked32:
      return fast_weights_32_.matrix().num_columns();
    case WeightsType::kBlocked48:
      return fast_weights_48_.matrix().num_columns();
  }

  // All enumerators are handled above.  This fallback avoids undefined
  // behavior (and -Wreturn-type warnings) if |weights_type_| is ever given an
  // out-of-range value.
  return 0;
}
bool
FlexibleMatrixKernel
::
MatchesOutputDimension
(
int
output_dimension
)
const
{
int
max_padding
=
0
;
if
(
weights_type_
==
WeightsType
::
kBlocked32
)
{
max_padding
=
32
;
}
else
if
(
weights_type_
==
WeightsType
::
kBlocked48
)
{
max_padding
=
48
;
}
return
(
NumPaddedRows
()
>=
output_dimension
&&
NumPaddedRows
()
<=
output_dimension
+
max_padding
);
}
// Returns the human-readable name of a WeightsType, for logging.
string FlexibleMatrixKernel::TypeName(WeightsType value) {
  switch (value) {
    case WeightsType::kNormal:
      return "normal (non-blocked)";
    case WeightsType::kBlocked32:
      return "32-row blocked";
    case WeightsType::kBlocked48:
      return "48-row blocked";
  }

  // All enumerators are handled above.  This fallback avoids undefined
  // behavior (and -Wreturn-type warnings) if |value| is out of range.
  return "unknown";
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/flexible_matrix_kernel.h
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#ifndef DRAGNN_RUNTIME_FLEXIBLE_MATRIX_KERNEL_H_
#define DRAGNN_RUNTIME_FLEXIBLE_MATRIX_KERNEL_H_
#include "dragnn/runtime/alignment.h"
#include "dragnn/runtime/math/arithmetic.h"
#include "dragnn/runtime/math/sgemvv.h"
#include "dragnn/runtime/math/types.h"
#include "dragnn/runtime/variable_store.h"
#include "tensorflow/core/lib/core/errors.h"
#include "tensorflow/core/lib/core/status.h"
#define DRAGNN_FMK_ATTRIBUTE_ALWAYS_INLINE __attribute__((always_inline)) inline
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// Matrix-vector multiplication helper, which will switch the type of the
// underlying matrix based on estimates of how well it will perform. For
// example, a 32x32 matrix-multiplication might get a specialized SGEMV routine,
// while a 2x128 matrix-multiplication might use a naive (non-SSE/AVX)
// algorithm.
//
// Call Initialize() before using, then call one of the MatrixVectorProduct()
// routines.
class FlexibleMatrixKernel {
 public:
  // Suffix appended to variable lookups issued by the kernel.
  static constexpr char kSuffix[] = "/FlexibleMatrixKernel";

  FlexibleMatrixKernel() = default;

  // Initializes the underlying matrices for this kernel; call this method
  // before using this class. Arguments: |debug_name| is the name of the matrix
  // being accessed, which usually should specify the component name and other
  // relevant aspects; |weights_name| is the name of the variable in the
  // TensorFlow graph to access; |output_dimension| is the real output
  // dimension, which is comparable to the number of rows in the matrix but does
  // not include padding; |variable_store| is the store which is queried for
  // variables.
  tensorflow::Status Initialize(const string &debug_name,
                                const string &weights_name,
                                int output_dimension,
                                VariableStore *variable_store);

  // Number of rows for the matrix. This may be padded, if a blocked format
  // is chosen.
  int NumPaddedRows() const;

  // Number of columns for the matrix. This should not be padded.
  int NumColumns() const;

  // Whether a layer's logical output dimension matches the shape of this class'
  // underlying matrix.
  bool MatchesOutputDimension(int output_dimension) const;

  // Computes the matrix-vector product of a single vector, with an initial
  // value. This runs different code based on what kind of blocked matrix was
  // chosen. There are generally no restrictions, i.e. it is fairly common to
  // have initial == output.
  DRAGNN_FMK_ATTRIBUTE_ALWAYS_INLINE
  void MatrixVectorProduct(Vector<float> input, Vector<float> initial,
                           MutableVector<float> output) const;

  // Computes the matrix-vector product of two vectors at once. This is the
  // entrypoint for SGEMVV, and is more efficient.
  DRAGNN_FMK_ATTRIBUTE_ALWAYS_INLINE
  void MatrixVectorVectorProduct(Vector<float> input0, Vector<float> input1,
                                 Vector<float> initial0,
                                 Vector<float> initial1,
                                 MutableVector<float> output0,
                                 MutableVector<float> output1) const;

  // Convenience function, calculating `output += M * input`.
  void AddMatrixVectorProduct(Vector<float> input,
                              MutableVector<float> output) const {
    MatrixVectorProduct(input, Vector<float>(output), output);
  }

  // Same as above, without initial bias.
  DRAGNN_FMK_ATTRIBUTE_ALWAYS_INLINE
  void MatrixVectorProduct(Vector<float> input,
                           MutableVector<float> output) const;

 private:
  // Which representation of the weights is active.
  enum class WeightsType { kNormal, kBlocked32, kBlocked48 };

  // Returns the human-readable name of a WeightsType.
  static string TypeName(WeightsType value);

  WeightsType weights_type_;

  // Actual matrix data. Which matrix is active is determined by
  // |weights_type_|.
  Matrix<float> weights_;
  SgemvMatrix<32> fast_weights_32_;
  SgemvMatrix<48> fast_weights_48_;

  // Output dimension padded to alignment.
  int padded_output_dimension_;
};
// Implementation details below.
// Computes `output = W * input + initial`, dispatching on the weight format
// chosen at Initialize() time.
DRAGNN_FMK_ATTRIBUTE_ALWAYS_INLINE
void FlexibleMatrixKernel::MatrixVectorProduct(
    Vector<float> input, Vector<float> initial,
    MutableVector<float> output) const {
  // Pack the operands into single-problem SGEMV batches.  Only the blocked
  // formats consume these; the non-blocked path uses the vectors directly.
  SgemvInputBatch<1> sgemv_in = {{input.data()}, {initial.data()}};
  SgemvOutputBatch<1> sgemv_out = {{output.data()}};
  switch (weights_type_) {
    case WeightsType::kNormal:
      MultiplyMatrixAndVectorWithBias(weights_, initial, input, output);
      return;
    case WeightsType::kBlocked32:
      fast_weights_32_.MaskedMatrixMultiVectorProduct(
          sgemv_in, padded_output_dimension_, &sgemv_out);
      return;
    case WeightsType::kBlocked48:
      fast_weights_48_.MaskedMatrixMultiVectorProduct(
          sgemv_in, padded_output_dimension_, &sgemv_out);
      return;
  }
}
// Computes two matrix-vector products at once (SGEMVV entrypoint); the
// blocked formats batch both problems, the non-blocked format falls back to
// two independent SGEMVs.
DRAGNN_FMK_ATTRIBUTE_ALWAYS_INLINE
void FlexibleMatrixKernel::MatrixVectorVectorProduct(
    Vector<float> input0, Vector<float> input1, Vector<float> initial0,
    Vector<float> initial1, MutableVector<float> output0,
    MutableVector<float> output1) const {
  // Pack both problems into one two-wide SGEMV batch for the blocked paths.
  SgemvInputBatch<2> sgemv_in = {{input0.data(), input1.data()},
                                 {initial0.data(), initial1.data()}};
  SgemvOutputBatch<2> sgemv_out = {{output0.data(), output1.data()}};
  switch (weights_type_) {
    case WeightsType::kNormal:
      MultiplyMatrixAndVectorWithBias(weights_, initial0, input0, output0);
      MultiplyMatrixAndVectorWithBias(weights_, initial1, input1, output1);
      return;
    case WeightsType::kBlocked32:
      fast_weights_32_.MaskedMatrixMultiVectorProduct(
          sgemv_in, padded_output_dimension_, &sgemv_out);
      return;
    case WeightsType::kBlocked48:
      fast_weights_48_.MaskedMatrixMultiVectorProduct(
          sgemv_in, padded_output_dimension_, &sgemv_out);
      return;
  }
}
// Computes `output = W * input` with no initial/bias vector: the blocked
// kernels receive a null initial pointer and the non-blocked path uses the
// bias-free multiply.
DRAGNN_FMK_ATTRIBUTE_ALWAYS_INLINE
void FlexibleMatrixKernel::MatrixVectorProduct(
    Vector<float> input, MutableVector<float> output) const {
  SgemvInputBatch<1> sgemv_in = {{input.data()}, {nullptr}};
  SgemvOutputBatch<1> sgemv_out = {{output.data()}};
  switch (weights_type_) {
    case WeightsType::kNormal:
      MultiplyMatrixAndVector(weights_, input, output);
      return;
    case WeightsType::kBlocked32:
      fast_weights_32_.MaskedMatrixMultiVectorProductNoInitial(
          sgemv_in, padded_output_dimension_, &sgemv_out);
      return;
    case WeightsType::kBlocked48:
      fast_weights_48_.MaskedMatrixMultiVectorProductNoInitial(
          sgemv_in, padded_output_dimension_, &sgemv_out);
      return;
  }
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
#undef DRAGNN_FMK_ATTRIBUTE_ALWAYS_INLINE
#endif // DRAGNN_RUNTIME_FLEXIBLE_MATRIX_KERNEL_H_
research/syntaxnet/dragnn/runtime/flexible_matrix_kernel_test.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include <vector>
#include "dragnn/runtime/flexible_matrix_kernel.h"
#include "dragnn/core/test/generic.h"
#include "dragnn/protos/runtime.pb.h"
#include "dragnn/runtime/math/transformations.h"
#include "dragnn/runtime/test/fake_variable_store.h"
#include "dragnn/runtime/test/helpers.h"
#include "tensorflow/core/lib/core/status_test_util.h"
#include "tensorflow/core/lib/strings/strcat.h"
#include "tensorflow/core/platform/test.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// Returns a 32-row test matrix in which every row contains |inner_dimension|
// copies of 0.1f.  Marked static: this is a file-local test helper and should
// have internal linkage.
static std::vector<std::vector<float>> TestValues(int inner_dimension) {
  std::vector<std::vector<float>> values;
  values.reserve(32);
  for (int block = 0; block < 32; ++block) {
    // Fill-construct each row instead of pushing elements one at a time.
    values.emplace_back(inner_dimension, 0.1f);
  }
  return values;
}
// Tests that the FlexibleMatrixKernel will use a blocked matrix if that is the
// only available format.
TEST(FlexibleMatrixKernelTest, UseBlockedMatrix) {
  std::vector<std::vector<float>> values = TestValues(32);
  // Try several logical output dimensions; all pad up to the 32-row block.
  for (int actual_rows : {24, 30, 32}) {
    // Add the variable using a blocked format.
    FakeVariableStore store;
    store.AddOrDie(
        tensorflow::strings::StrCat("weights", FlexibleMatrixKernel::kSuffix),
        values, VariableSpec::FORMAT_COLUMN_BLOCKED_ROW_MAJOR_MATRIX);
    FlexibleMatrixKernel kernel;
    TF_EXPECT_OK(
        kernel.Initialize("test_weights", "weights", actual_rows, &store));
    EXPECT_EQ(kernel.NumPaddedRows(), 32);
    UniqueVector<float> vector(values.back());
    UniqueVector<float> output(actual_rows);
    // Product without an initial vector.
    kernel.MatrixVectorProduct(Vector<float>(*vector), *output);
    // Every value in `output` should be 32 * 0.1 * 0.1 = 0.32.
    for (int i = 0; i < actual_rows; ++i) {
      EXPECT_NEAR((*output)[i], 0.32f, 1e-6f);
    }
    // Product with the previous result fed back as the initial vector.
    kernel.MatrixVectorProduct(Vector<float>(*vector), Vector<float>(*output),
                               *output);
    // Every value in `output` should be 2 * 32 * 0.1 * 0.1 = 0.64.
    for (int i = 0; i < actual_rows; ++i) {
      EXPECT_NEAR((*output)[i], 0.64f, 1e-6f);
    }
  }
}
// Tests that the FlexibleMatrixKernel will use a non-blocked matrix if that is
// the only available format.
TEST(FlexibleMatrixKernelTest, UseNonBlockedMatrix) {
  const int kOutputDim = 32;
  std::vector<std::vector<float>> values = TestValues(kOutputDim);
  // Add the variable using a non-blocked format.
  FakeVariableStore store;
  store.AddOrDie(
      tensorflow::strings::StrCat("weights", FlexibleMatrixKernel::kSuffix),
      values, VariableSpec::FORMAT_ROW_MAJOR_MATRIX);
  FlexibleMatrixKernel kernel;
  TF_EXPECT_OK(
      kernel.Initialize("test_weights", "weights", kOutputDim, &store));
  EXPECT_EQ(kernel.NumPaddedRows(), 32);
  EXPECT_EQ(kernel.NumColumns(), kOutputDim);
  UniqueVector<float> input(values.back());
  UniqueVector<float> result(kOutputDim);
  // First product: no initial vector.
  kernel.MatrixVectorProduct(Vector<float>(*input), *result);
  const float kExpectedFirstResult = kOutputDim * 0.1 * 0.1;
  for (int row = 0; row < kOutputDim; ++row) {
    EXPECT_NEAR((*result)[row], kExpectedFirstResult, 1e-6f);
  }
  // Second product: feed the first result back in as the initial vector,
  // which should double every output value.
  kernel.MatrixVectorProduct(Vector<float>(*input), Vector<float>(*result),
                             *result);
  const float kExpectedSecondResult = 2.0 * kExpectedFirstResult;
  for (int row = 0; row < kOutputDim; ++row) {
    EXPECT_NEAR((*result)[row], kExpectedSecondResult, 1e-6f);
  }
}
// Tests that initialization fails with a descriptive error when the requested
// weights variable is absent from the variable store.
TEST(FlexibleMatrixKernelTest, MissingVariableIsFailure) {
  FakeVariableStore store;
  FlexibleMatrixKernel kernel;
  EXPECT_THAT(kernel.Initialize("test_weights", "weights", 30, &store),
              test::IsErrorWithSubstr("Unknown variable: weights"));
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/fml_parsing.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/fml_parsing.h"
#include "syntaxnet/fml_parser.h"
#include "tensorflow/core/lib/core/errors.h"
#include "tensorflow/core/lib/strings/str_util.h"
#include "tensorflow/core/platform/protobuf.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// Converts the descriptor's parameters into a name=>value mapping and hands
// it to the base Attributes parser.  If a parameter name repeats, the last
// occurrence wins (map assignment semantics).
tensorflow::Status FeatureFunctionAttributes::Reset(
    const FeatureFunctionDescriptor &function) {
  Attributes::Mapping name_to_value;
  for (const Parameter &param : function.parameter()) {
    name_to_value[param.name()] = param.value();
  }
  return Attributes::Reset(name_to_value);
}
// Parses |fml| as a single chain of nested features whose types match |types|;
// copies the innermost feature's descriptor to |leaf| on success.
tensorflow::Status ParseFeatureChainFml(const string &fml,
                                        const std::vector<string> &types,
                                        FeatureFunctionDescriptor *leaf) {
  if (types.empty()) {
    return tensorflow::errors::InvalidArgument("Empty chain of feature types");
  }
  // Shared error, returned on any structural mismatch below.
  const tensorflow::Status error = tensorflow::errors::InvalidArgument(
      "Failed to parse feature chain [",
      tensorflow::str_util::Join(types, ", "), "] from FML: ", fml);
  FeatureExtractorDescriptor extractor;
  FMLParser().Parse(fml, &extractor);
  if (extractor.feature_size() != 1) return error;
  const FeatureFunctionDescriptor *node = &extractor.feature(0);
  // Walk down the chain: every non-leaf feature must be a bare single-child
  // wrapper (no argument, no parameters) of the expected type.
  for (size_t i = 0; i + 1 < types.size(); ++i) {
    if (node->type() != types[i] || node->argument() != 0 ||
        node->parameter_size() != 0 || node->feature_size() != 1) {
      return error;
    }
    node = &node->feature(0);
  }
  // The leaf must match the final type and have no nested features, but may
  // carry parameters.
  if (node->type() != types.back() || node->feature_size() != 0) return error;
  // Success; make modifications.
  *leaf = *node;
  return tensorflow::Status::OK();
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/fml_parsing.h
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
// Utils for extracting information from FML specifications.
#ifndef DRAGNN_RUNTIME_FML_PARSING_H_
#define DRAGNN_RUNTIME_FML_PARSING_H_
#include <string>
#include <vector>
#include "dragnn/runtime/attributes.h"
#include "syntaxnet/base.h"
#include "syntaxnet/feature_extractor.pb.h"
#include "tensorflow/core/lib/core/status.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// Attributes that can be parsed from a feature descriptor.
class FeatureFunctionAttributes : public Attributes {
 public:
  // Parses registered attributes from the parameters of the |function|.  On
  // error, returns non-OK.
  tensorflow::Status Reset(const FeatureFunctionDescriptor &function);
};
// Parses the |fml| as a chain of nested features matching the |types|.  All of
// the features must have no parameters, except the innermost, whose descriptor
// is set to |leaf|.  On error, returns non-OK and modifies nothing.
tensorflow::Status ParseFeatureChainFml(const string &fml,
                                        const std::vector<string> &types,
                                        FeatureFunctionDescriptor *leaf);
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
#endif // DRAGNN_RUNTIME_FML_PARSING_H_
research/syntaxnet/dragnn/runtime/fml_parsing_test.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/fml_parsing.h"
#include <string>
#include <vector>
#include "dragnn/core/test/generic.h"
#include "syntaxnet/base.h"
#include "syntaxnet/feature_extractor.pb.h"
#include "tensorflow/core/lib/core/status.h"
#include "tensorflow/core/lib/core/status_test_util.h"
#include "tensorflow/core/platform/test.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
namespace
{
// Attributes for the test.
struct TestAttributes : public FeatureFunctionAttributes {
  // Optional attribute with default -1 when "foo" is absent.
  Optional<int32> foo{"foo", -1, this};
  // Mandatory attribute; parsing fails if "bar" is absent.
  Mandatory<float> bar{"bar", this};
};
// Tests that attributes can be parsed from a valid feature descriptor.
TEST(FeatureFunctionAttributesTest, ValidDescriptor) {
  FeatureFunctionDescriptor descriptor;
  Parameter *param = descriptor.add_parameter();
  param->set_name("bar");
  param->set_value("1.75");
  TestAttributes attributes;
  TF_ASSERT_OK(attributes.Reset(descriptor));
  // "foo" was not specified, so it keeps its default; "bar" was parsed.
  EXPECT_EQ(attributes.foo(), -1);
  EXPECT_EQ(attributes.bar(), 1.75);
}
// Tests that a feature chain can be parsed from valid FML, and the feature
// options can then be extracted as attributes.
TEST(ParseFeatureChainFmlTest, ValidFml) {
  FeatureFunctionDescriptor descriptor;
  TF_ASSERT_OK(ParseFeatureChainFml("path.to.feature(foo=123,bar=-0.5)",
                                    {"path", "to", "feature"}, &descriptor));
  TestAttributes attributes;
  TF_ASSERT_OK(attributes.Reset(descriptor));
  EXPECT_EQ(attributes.foo(), 123);
  EXPECT_EQ(attributes.bar(), -0.5);
}
// Tests that an empty feature chain cannot be parsed.
TEST(ParseFeatureChainFmlTest, EmptyChain) {
  FeatureFunctionDescriptor descriptor;
  EXPECT_THAT(ParseFeatureChainFml("foo", {}, &descriptor),
              test::IsErrorWithSubstr("Empty chain of feature types"));
}
// Tests that empty FML cannot be parsed as a chain.
TEST(ParseFeatureChainFmlTest, EmptyFml) {
  FeatureFunctionDescriptor descriptor;
  EXPECT_THAT(ParseFeatureChainFml("", {"foo"}, &descriptor),
              test::IsErrorWithSubstr("Failed to parse feature chain"));
}
// Tests that feature chain parsing fails if the FML nests deeper than the
// requested chain of types.
TEST(ParseFeatureChainFmlTest, ChainTooShort) {
  FeatureFunctionDescriptor descriptor;
  EXPECT_THAT(
      ParseFeatureChainFml("path.to.feature", {"path", "to"}, &descriptor),
      test::IsErrorWithSubstr("Failed to parse feature chain"));
}
// Tests that feature chain parsing fails if the FML nests shallower than the
// requested chain of types.
TEST(ParseFeatureChainFmlTest, ChainTooLong) {
  FeatureFunctionDescriptor descriptor;
  EXPECT_THAT(
      ParseFeatureChainFml("path.to", {"path", "to", "feature"}, &descriptor),
      test::IsErrorWithSubstr("Failed to parse feature chain"));
}
// Tests that initial elements of the chain must match the specified types.
TEST(ParseFeatureChainFmlTest, WrongTypeInPrefix) {
  FeatureFunctionDescriptor descriptor;
  EXPECT_THAT(ParseFeatureChainFml("path.to.feature",
                                   {"bad", "to", "feature"}, &descriptor),
              test::IsErrorWithSubstr("Failed to parse feature chain"));
}
// Tests that the last feature in the chain must match the specified type.
TEST(ParseFeatureChainFmlTest, WrongTypeInLeaf) {
  FeatureFunctionDescriptor descriptor;
  EXPECT_THAT(ParseFeatureChainFml("path.to.feature",
                                   {"path", "to", "bad"}, &descriptor),
              test::IsErrorWithSubstr("Failed to parse feature chain"));
}
// Tests that initial elements of the chain cannot have an argument.
TEST(ParseFeatureChainFmlTest, ArgumentInPrefix) {
  FeatureFunctionDescriptor descriptor;
  EXPECT_THAT(ParseFeatureChainFml("ok.bad(1).leaf",
                                   {"ok", "bad", "leaf"}, &descriptor),
              test::IsErrorWithSubstr("Failed to parse feature chain"));
}
// Tests that initial elements of the chain cannot have options.
TEST(ParseFeatureChainFmlTest, OptionInPrefix) {
  FeatureFunctionDescriptor descriptor;
  EXPECT_THAT(ParseFeatureChainFml("ok.bad(foo=1).leaf",
                                   {"ok", "bad", "leaf"}, &descriptor),
              test::IsErrorWithSubstr("Failed to parse feature chain"));
}
}
// namespace
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/head_selection_component_base.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2018 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/head_selection_component_base.h"
#include <stddef.h>
#include <algorithm>
#include "tensorflow/core/lib/core/errors.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// Creates a component that supports the given |builder_name| and
// |backend_name|; see Supports().
HeadSelectionComponentBase::HeadSelectionComponentBase(
    const string &builder_name, const string &backend_name)
    : builder_name_(builder_name), backend_name_(backend_name) {}
bool
HeadSelectionComponentBase
::
Supports
(
const
ComponentSpec
&
component_spec
,
const
string
&
normalized_builder_name
)
const
{
return
(
normalized_builder_name
==
"BulkAnnotatorComponent"
||
normalized_builder_name
==
builder_name_
)
&&
(
component_spec
.
backend
().
registered_name
()
==
"StatelessComponent"
||
component_spec
.
backend
().
registered_name
()
==
backend_name_
)
&&
component_spec
.
transition_system
().
registered_name
()
==
"heads"
&&
component_spec
.
network_unit
().
registered_name
()
==
"IdentityNetwork"
&&
component_spec
.
fixed_feature_size
()
==
0
&&
component_spec
.
linked_feature_size
()
==
1
;
}
// Binds the single linked feature to the pairwise adjacency layer and
// allocates the shared heads extension.  Fails if the adjacency layer does
// not have dimension 1.
tensorflow::Status HeadSelectionComponentBase::Initialize(
    const ComponentSpec &component_spec, VariableStore *variable_store,
    NetworkStateManager *network_state_manager,
    ExtensionManager *extension_manager) {
  const LinkedFeatureChannel &adjacency_link =
      component_spec.linked_feature(0);
  size_t adjacency_dim = 0;
  TF_RETURN_IF_ERROR(network_state_manager->LookupLayer(
      adjacency_link.source_component(), adjacency_link.source_layer(),
      &adjacency_dim, &adjacency_handle_));
  if (adjacency_dim != 1) {
    return tensorflow::errors::InvalidArgument(
        "Adjacency matrix has dimension ", adjacency_dim,
        " but expected 1");
  }
  extension_manager->GetShared(&heads_handle_);
  return tensorflow::Status::OK();
}
// Selects, for each token, the source with the maximal adjacency score; a
// token whose best source is itself is reported as a root (-1).
const std::vector<int> &HeadSelectionComponentBase::ComputeHeads(
    SessionState *session_state) const {
  const Matrix<float> adjacency(
      session_state->network_states.GetLayer(adjacency_handle_));
  std::vector<int> &heads = session_state->extensions.Get(heads_handle_);
  heads.resize(adjacency.num_rows());
  for (size_t token = 0; token < adjacency.num_rows(); ++token) {
    const Vector<float> scores = adjacency.row(token);
    // Ties break toward the first maximal element, as with max_element.
    const int best =
        std::max_element(scores.begin(), scores.end()) - scores.begin();
    heads[token] = best == static_cast<int>(token) ? -1 : best;  // self-loops are roots
  }
  return heads;
}
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/head_selection_component_base.h
0 → 100644
View file @
a4bb31d0
// Copyright 2018 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#ifndef DRAGNN_RUNTIME_HEAD_SELECTION_COMPONENT_BASE_H_
#define DRAGNN_RUNTIME_HEAD_SELECTION_COMPONENT_BASE_H_
#include <vector>
#include "dragnn/core/compute_session.h"
#include "dragnn/protos/spec.pb.h"
#include "dragnn/protos/trace.pb.h"
#include "dragnn/runtime/alignment.h"
#include "dragnn/runtime/component.h"
#include "dragnn/runtime/extensions.h"
#include "dragnn/runtime/math/types.h"
#include "dragnn/runtime/network_states.h"
#include "dragnn/runtime/session_state.h"
#include "dragnn/runtime/variable_store.h"
#include "syntaxnet/base.h"
#include "tensorflow/core/lib/core/status.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
// Base class for head-selection components, which select heads independently
// per token.  Although this process is not guaranteed to produce a tree, for
// accurate parsers it often produces a tree.
//
// This base class only computes the selected heads, while subclasses apply
// those heads to the annotations in the ComputeSession.
class HeadSelectionComponentBase : public Component {
 public:
  // Partially implements Component.
  bool Supports(const ComponentSpec &component_spec,
                const string &normalized_builder_name) const override;
  tensorflow::Status Initialize(const ComponentSpec &component_spec,
                                VariableStore *variable_store,
                                NetworkStateManager *network_state_manager,
                                ExtensionManager *extension_manager) override;
  // Never preferred; any competing component wins.
  bool PreferredTo(const Component &other) const override { return false; }

 protected:
  // Creates a component that supports the |builder_name| and |backend_name|.
  HeadSelectionComponentBase(const string &builder_name,
                             const string &backend_name);

  // Returns the list of heads computed from the |session_state|, where -1
  // indicates a root.
  const std::vector<int> &ComputeHeads(SessionState *session_state) const;

 private:
  // Names of the supported component builder and backend.
  const string builder_name_;
  const string backend_name_;

  // Directed adjacency matrix input.
  PairwiseLayerHandle<float> adjacency_handle_;

  // List of selected head indices.
  SharedExtensionHandle<std::vector<int>> heads_handle_;
};
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
#endif // DRAGNN_RUNTIME_HEAD_SELECTION_COMPONENT_BASE_H_
research/syntaxnet/dragnn/runtime/head_selection_component_base_test.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2018 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include "dragnn/runtime/head_selection_component_base.h"
#include <stddef.h>
#include <string>
#include <vector>
#include "dragnn/core/compute_session.h"
#include "dragnn/core/input_batch_cache.h"
#include "dragnn/core/test/generic.h"
#include "dragnn/protos/spec.pb.h"
#include "dragnn/protos/trace.pb.h"
#include "dragnn/runtime/network_states.h"
#include "dragnn/runtime/session_state.h"
#include "dragnn/runtime/test/network_test_base.h"
#include "dragnn/runtime/variable_store.h"
#include "syntaxnet/base.h"
#include "tensorflow/core/lib/core/status.h"
#include "tensorflow/core/lib/core/status_test_util.h"
#include "tensorflow/core/platform/test.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
namespace
{
// Number of steps (tokens) in the test component.
constexpr size_t kNumSteps = 12;
constexpr size_t kRootIndex = 7;  // the root and head of all other tokens
// Builder and backend names accepted by the test subclass.
constexpr char kTestBuilder[] = "TestBuilder";
constexpr char kTestBackend[] = "TestBackend";
// Name of the component that produces the adjacency layer.
constexpr char kPreviousComponentName[] = "previous_component";
// Pairwise layers: a valid dimension-1 adjacency layer and a dimension-2
// layer used to exercise the dimension check.
constexpr char kAdjacencyLayerName[] = "adjacency_layer";
constexpr char kBadDimLayerName[] = "bad_layer";
// A subclass for tests.
class BasicHeadSelectionComponent : public HeadSelectionComponentBase {
 public:
  BasicHeadSelectionComponent()
      : HeadSelectionComponentBase(kTestBuilder, kTestBackend) {}

  // Implements Component.  These methods are never called, but must be defined
  // so the class is not abstract.
  tensorflow::Status Evaluate(SessionState *session_state,
                              ComputeSession *compute_session,
                              ComponentTrace *component_trace) const override {
    return tensorflow::Status::OK();
  }

  // Publicizes the base class's method.
  using HeadSelectionComponentBase::ComputeHeads;
};
// Returns a ComponentSpec that the head selection component supports: test
// builder/backend, "heads" transitions, IdentityNetwork, and one linked
// feature pointing at the adjacency layer.
ComponentSpec MakeGoodSpec() {
  ComponentSpec spec;
  spec.mutable_component_builder()->set_registered_name(kTestBuilder);
  spec.mutable_backend()->set_registered_name(kTestBackend);
  spec.mutable_transition_system()->set_registered_name("heads");
  spec.mutable_network_unit()->set_registered_name("IdentityNetwork");
  LinkedFeatureChannel *channel = spec.add_linked_feature();
  channel->set_source_component(kPreviousComponentName);
  channel->set_source_layer(kAdjacencyLayerName);
  return spec;
}
class HeadSelectionComponentBaseTest : public NetworkTestBase {
 protected:
  // Initializes a head selection component from the |component_spec| and sets
  // |heads| to the extracted head indices.  Returns non-OK on error.
  tensorflow::Status Run(const ComponentSpec &component_spec,
                         std::vector<int> *heads) {
    // Register the upstream component and both pairwise layers (the valid
    // dimension-1 adjacency layer and the invalid dimension-2 layer).
    AddComponent(kPreviousComponentName);
    AddPairwiseLayer(kAdjacencyLayerName, 1);
    AddPairwiseLayer(kBadDimLayerName, 2);
    BasicHeadSelectionComponent component;
    TF_RETURN_IF_ERROR(component.Initialize(component_spec, &variable_store_,
                                            &network_state_manager_,
                                            &extension_manager_));
    network_states_.Reset(&network_state_manager_);
    StartComponent(kNumSteps);
    // Fill the |kRootIndex|'th column of the adjacency matrix with higher
    // scores, so all tokens select it as head.  The |kRootIndex|'th token
    // itself is a self-loop, so it becomes a root.
    MutableMatrix<float> adjacency =
        GetPairwiseLayer(kPreviousComponentName, kAdjacencyLayerName);
    for (size_t target = 0; target < kNumSteps; ++target) {
      for (size_t source = 0; source < kNumSteps; ++source) {
        adjacency.row(target)[source] = source == kRootIndex ? 1.0 : 0.0;
      }
    }
    session_state_.extensions.Reset(&extension_manager_);
    *heads = component.ComputeHeads(&session_state_);
    return tensorflow::Status::OK();
  }
};
// Tests that the expected heads are produced for a good spec.
TEST_F(HeadSelectionComponentBaseTest, RunsGoodSpec) {
  std::vector<int> heads;
  TF_ASSERT_OK(Run(MakeGoodSpec(), &heads));
  // Every token selects the root token as head, except the root itself.
  std::vector<int> want(kNumSteps, kRootIndex);
  want[kRootIndex] = -1;
  EXPECT_EQ(heads, want);
}
// Tests that a layer with the wrong dimension is rejected.
TEST_F(HeadSelectionComponentBaseTest, WrongDimension) {
  ComponentSpec spec = MakeGoodSpec();
  spec.mutable_linked_feature(0)->set_source_layer(kBadDimLayerName);
  std::vector<int> heads;
  EXPECT_THAT(
      Run(spec, &heads),
      test::IsErrorWithSubstr("Adjacency matrix has dimension 2 but expected 1"));
}
// Tests that the component is always dis-preferred.
TEST_F(HeadSelectionComponentBaseTest, NotPreferred) {
  BasicHeadSelectionComponent head_selector;
  EXPECT_FALSE(head_selector.PreferredTo(head_selector));
}
// Tests that the good spec is supported.
TEST_F(HeadSelectionComponentBaseTest, SupportsGoodSpec) {
  BasicHeadSelectionComponent head_selector;
  EXPECT_TRUE(head_selector.Supports(MakeGoodSpec(), kTestBuilder));
}
// Tests that various bad specs are rejected.
TEST_F(HeadSelectionComponentBaseTest, RejectsBadSpecs) {
  ComponentSpec component_spec = MakeGoodSpec();
  BasicHeadSelectionComponent component;
  // Wrong builder name.
  EXPECT_FALSE(component.Supports(component_spec, "bad"));
  // Wrong backend.
  component_spec = MakeGoodSpec();
  component_spec.mutable_backend()->set_registered_name("bad");
  EXPECT_FALSE(component.Supports(component_spec, kTestBuilder));
  // Wrong transition system.
  component_spec = MakeGoodSpec();
  component_spec.mutable_transition_system()->set_registered_name("bad");
  EXPECT_FALSE(component.Supports(component_spec, kTestBuilder));
  // Wrong network unit.
  component_spec = MakeGoodSpec();
  component_spec.mutable_network_unit()->set_registered_name("bad");
  EXPECT_FALSE(component.Supports(component_spec, kTestBuilder));
  // Fixed features are not allowed.
  component_spec = MakeGoodSpec();
  component_spec.add_fixed_feature();
  EXPECT_FALSE(component.Supports(component_spec, kTestBuilder));
  // Exactly one linked feature is required: more than one...
  component_spec = MakeGoodSpec();
  component_spec.add_linked_feature();
  EXPECT_FALSE(component.Supports(component_spec, kTestBuilder));
  // ...or none at all is rejected.
  component_spec = MakeGoodSpec();
  component_spec.clear_linked_feature();
  EXPECT_FALSE(component.Supports(component_spec, kTestBuilder));
}
}
// namespace
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
research/syntaxnet/dragnn/runtime/identity_sequence_linker.cc
0 → 100644
View file @
a4bb31d0
// Copyright 2017 Google Inc. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
// =============================================================================
#include <stddef.h>
#include <vector>
#include "dragnn/core/input_batch_cache.h"
#include "dragnn/protos/spec.pb.h"
#include "dragnn/runtime/sequence_linker.h"
#include "dragnn/runtime/transition_system_traits.h"
#include "syntaxnet/base.h"
#include "tensorflow/core/lib/core/errors.h"
#include "tensorflow/core/lib/core/status.h"
namespace
syntaxnet
{
namespace
dragnn
{
namespace
runtime
{
namespace
{
// Applies an identity function: step i links to source step i.
class IdentitySequenceLinker : public SequenceLinker {
 public:
  // Implements SequenceLinker.
  bool Supports(const LinkedFeatureChannel &channel,
                const ComponentSpec &component_spec) const override;
  tensorflow::Status Initialize(const LinkedFeatureChannel &channel,
                                const ComponentSpec &component_spec) override;
  tensorflow::Status GetLinks(size_t source_num_steps, InputBatchCache *input,
                              std::vector<int32> *links) const override;
};
bool
IdentitySequenceLinker
::
Supports
(
const
LinkedFeatureChannel
&
channel
,
const
ComponentSpec
&
component_spec
)
const
{
TransitionSystemTraits
traits
(
component_spec
);
// Note: Add more "||" clauses as needed.
return
(
channel
.
fml
()
==
"input.focus"
||
channel
.
fml
()
==
"char-input.focus"
)
&&
channel
.
source_translator
()
==
"identity"
&&
traits
.
is_sequential
;
}
tensorflow::Status IdentitySequenceLinker::Initialize(
    const LinkedFeatureChannel &channel,
    const ComponentSpec &component_spec) {
  // The identity mapping needs no configuration.
  return tensorflow::Status::OK();
}
// Sets |links| to the identity mapping [0, 1, ..., source_num_steps - 1];
// |input| is unused.
tensorflow::Status IdentitySequenceLinker::GetLinks(
    size_t source_num_steps, InputBatchCache *input,
    std::vector<int32> *links) const {
  links->resize(source_num_steps);
  for (size_t i = 0; i < links->size(); ++i) {
    (*links)[i] = static_cast<int32>(i);
  }
  return tensorflow::Status::OK();
}
DRAGNN_RUNTIME_REGISTER_SEQUENCE_LINKER
(
IdentitySequenceLinker
);
}
// namespace
}
// namespace runtime
}
// namespace dragnn
}
// namespace syntaxnet
Prev
1
…
4
5
6
7
8
9
10
11
12
…
15
Next
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
.
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment