Save models and write inference results.

PiperOrigin-RevId: 701159583
google-research · Dec 3, 2024 · c548aa9 · c548aa9
1 parent caa1962
commit c548aa9
Show file tree

Hide file tree

Showing 2 changed files with 180 additions and 3 deletions.
diff --git a/hoplite/agile/classifier.py b/hoplite/agile/classifier.py
@@ -15,15 +15,64 @@
 
 """Functions for training and applying a linear classifier."""
 
-from typing import Any
+import base64
+import dataclasses
+import json
+from typing import Any, Sequence
 
 from hoplite.agile import classifier_data
 from hoplite.agile import metrics
+from hoplite.db import interface as db_interface
+from hoplite.taxonomy import namespace
+from ml_collections import config_dict
 import numpy as np
 import tensorflow as tf
 import tqdm
 
 
+@dataclasses.dataclass
+class LinearClassifier:
+  """Wrapper for linear classifier params and metadata.
+
+  Calling an instance computes `np.dot(embeddings, beta) + beta_bias`.
+  `save` and `load` round-trip the classifier through a JSON file in which
+  the weights are stored as base64-encoded float32 bytes.
+  """
+
+  # Weight matrix; `load` restores it with shape (-1, len(classes)).
+  beta: np.ndarray
+  # Bias added to the projected embeddings.
+  beta_bias: np.ndarray
+  # Class names; `load` uses len(classes) as the column count of `beta`.
+  classes: tuple[str, ...]
+  # Stored under the `model_config` key of the saved JSON.
+  embedding_model_config: Any
+
+  def __call__(self, embeddings: np.ndarray):
+    """Apply the linear map `np.dot(embeddings, beta) + beta_bias`."""
+    return np.dot(embeddings, self.beta) + self.beta_bias
+
+  def save(self, path: str):
+    """Save the classifier to a path.
+
+    Writes a JSON document with keys `model_config`, `classes`, `beta` and
+    `beta_bias`.
+
+    Args:
+      path: File path to write; opened in text mode and overwritten.
+    """
+    cfg = config_dict.ConfigDict()
+    cfg.model_config = self.embedding_model_config
+    cfg.classes = self.classes
+    # Convert numpy arrays to base64 encoded blobs.
+    # Weights are cast to float32 first, so any higher-precision values are
+    # not preserved exactly across a save/load round trip.
+    beta_bytes = base64.b64encode(np.float32(self.beta).tobytes()).decode(
+        'ascii'
+    )
+    beta_bias_bytes = base64.b64encode(
+        np.float32(self.beta_bias).tobytes()
+    ).decode('ascii')
+    cfg.beta = beta_bytes
+    cfg.beta_bias = beta_bias_bytes
+    with open(path, 'w') as f:
+      f.write(cfg.to_json())
+
+  @classmethod
+  def load(cls, path: str):
+    """Load a classifier from a path.
+
+    Args:
+      path: File path of a JSON document in the format written by `save`.
+
+    Returns:
+      A new instance built from the decoded weights, classes and model config.
+    """
+    with open(path, 'r') as f:
+      cfg_json = json.loads(f.read())
+      cfg = config_dict.ConfigDict(cfg_json)
+    classes = cfg.classes
+    # The raw bytes carry no shape information: `beta` is rebuilt from the
+    # number of classes, and `beta_bias` is left as a flat float32 vector.
+    # NOTE(review): arrays from `np.frombuffer` over bytes are read-only;
+    # copy them before mutating in place.
+    beta = np.frombuffer(base64.b64decode(cfg.beta), dtype=np.float32)
+    beta = np.reshape(beta, (-1, len(classes)))
+    beta_bias = np.frombuffer(base64.b64decode(cfg.beta_bias), dtype=np.float32)
+    embedding_model_config = cfg.model_config
+    return cls(beta, beta_bias, classes, embedding_model_config)
+
+
 def get_linear_model(embedding_dim: int, num_classes: int) -> tf.keras.Model:
   """Create a simple linear Keras model."""
   model = tf.keras.Sequential([
@@ -105,7 +154,7 @@ def train_linear_classifier(
     learning_rate: float,
     weak_neg_weight: float,
     num_train_steps: int,
-):
+) -> tuple[LinearClassifier, dict[str, float]]:
   """Train a linear classifier."""
   embedding_dim = data_manager.db.embedding_dimension()
   num_classes = len(data_manager.get_target_labels())
@@ -147,4 +196,58 @@ def train_step(y_true, embeddings, is_labeled_mask):
       'beta_bias': lin_model.get_weights()[1],
   }
   eval_scores = eval_classifier(params, data_manager, eval_idxes)
-  return params, eval_scores
+
+  model_config = data_manager.db.get_metadata('model_config')
+  linear_classifier = LinearClassifier(
+      beta=params['beta'],
+      beta_bias=params['beta_bias'],
+      classes=data_manager.get_target_labels(),
+      embedding_model_config=model_config,
+  )
+  return linear_classifier, eval_scores
+
+
+def write_inference_csv(
+    linear_classifier: LinearClassifier,
+    db: db_interface.HopliteDBInterface,
+    output_filepath: str,
+    threshold: float,
+    labels: Sequence[str] | None = None,
+):
+  """Write a CSV for all audio windows with logits above a threshold.
+
+  One row is written per (embedding, label) pair whose logit exceeds
+  `threshold`, with columns idx, dataset_name, source_id, offset, label and
+  logits.
+
+  Args:
+    linear_classifier: Classifier applied to each embedding; its `classes`
+      determine which logit belongs to which label.
+    db: HopliteDBInterface to read embeddings from.
+    output_filepath: Path to write the CSV to.
+    threshold: Logits must be above this value to be written.
+    labels: If provided, only write logits for these labels. If None, write
+      logits for all labels.
+
+  Returns:
+    None
+
+  Raises:
+    KeyError: If an entry of `labels` is not in `linear_classifier.classes`.
+  """
+  idxes = db.get_embedding_ids()
+  if labels is None:
+    labels = linear_classifier.classes
+  label_ids = {cl: i for i, cl in enumerate(linear_classifier.classes)}
+  # Explicit integer dtype keeps an empty `labels` usable as an index array.
+  target_label_ids = np.array([label_ids[l] for l in labels], dtype=np.int64)
+  with open(output_filepath, 'w') as f:
+    f.write('idx,dataset_name,source_id,offset,label,logits\n')
+    for idx in tqdm.tqdm(idxes):
+      source = db.get_embedding_source(idx)
+      emb = db.get_embedding(idx)
+      # Assumes `emb` is a single 1-D embedding, so there is one logit per
+      # requested label -- TODO confirm against the DB interface.
+      logits = linear_classifier(emb)[target_label_ids]
+      # `np.flatnonzero` yields scalar positions. Iterating `np.argwhere`
+      # yields shape-(1,) arrays, which cannot index a tuple/list of labels
+      # and would be written as '[0.5]' rather than '0.5'.
+      for i in np.flatnonzero(logits > threshold):
+        row = [
+            idx,
+            source.dataset_name,
+            source.source_id,
+            source.offsets[0],
+            labels[i],
+            logits[i],
+        ]
+        f.write(','.join(map(str, row)) + '\n')
diff --git a/hoplite/agile/tests/classifier_test.py b/hoplite/agile/tests/classifier_test.py
@@ -0,0 +1,74 @@
+# coding=utf-8
+# Copyright 2024 The Perch Authors.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+
+"""Tests for linear classifier implementation."""
+
+import os
+import tempfile
+
+from hoplite.agile import classifier
+from ml_collections import config_dict
+import numpy as np
+
+from absl.testing import absltest
+
+
+class ClassifierTest(absltest.TestCase):
+  """Tests calling and save/load round-tripping of `LinearClassifier`."""
+
+  def setUp(self):
+    super().setUp()
+    # `self.create_tempdir()` raises an UnparsedFlagAccessError, which is why
+    # we use `tempdir` directly.
+    # NOTE(review): nothing in this class removes the directory afterwards;
+    # consider registering a cleanup.
+    self.tempdir = tempfile.mkdtemp()
+
+  def _make_linear_classifier(self, embedding_dim, classes):
+    """Build a classifier with seeded random float32 weights.
+
+    Args:
+      embedding_dim: Number of rows of the generated `beta` matrix.
+      classes: Class names; their count sets the number of columns of `beta`
+        and the length of `beta_bias`.
+
+    Returns:
+      A `classifier.LinearClassifier` whose model config has
+      `model_name == 'nelson'`.
+    """
+    # Fixed seed so the generated weights are reproducible across runs.
+    np.random.seed(1234)
+    beta = np.float32(np.random.normal(size=(embedding_dim, len(classes))))
+    beta_bias = np.float32(np.random.normal(size=(len(classes),)))
+    embedding_model_config = config_dict.ConfigDict({
+        'model_name': 'nelson',
+    })
+    return classifier.LinearClassifier(
+        beta, beta_bias, classes, embedding_model_config
+    )
+
+  def test_call_linear_classifier(self):
+    """Checks output shapes for batched and single-embedding inputs."""
+    embedding_dim = 8
+    classes = ('a', 'b', 'c')
+    classy = self._make_linear_classifier(embedding_dim, classes)
+
+    batch_embeddings = np.random.normal(size=(10, embedding_dim))
+    predictions = classy(batch_embeddings)
+    self.assertEqual(predictions.shape, (10, len(classes)))
+
+    single_embedding = np.random.normal(size=(embedding_dim,))
+    predictions = classy(single_embedding)
+    self.assertEqual(predictions.shape, (len(classes),))
+
+  def test_save_load_linear_classifier(self):
+    """Checks that save followed by load preserves weights and metadata."""
+    embedding_dim = 8
+    classes = ('a', 'b', 'c')
+    classy = self._make_linear_classifier(embedding_dim, classes)
+    classy_path = os.path.join(self.tempdir, 'classifier.json')
+    classy.save(classy_path)
+    classy_loaded = classifier.LinearClassifier.load(classy_path)
+    np.testing.assert_allclose(classy_loaded.beta, classy.beta)
+    np.testing.assert_allclose(classy_loaded.beta_bias, classy.beta_bias)
+    self.assertSequenceEqual(classy_loaded.classes, classy.classes)
+    self.assertEqual(classy_loaded.embedding_model_config.model_name, 'nelson')
+
+
+if __name__ == '__main__':
+  absltest.main()