eth-easl · francescodeaglio · Sep 18, 2023 · Jun 22, 2023 · Jun 22, 2023 · Jun 24, 2023
diff --git a/integrationtests/selector/integrationtest_selector.py b/integrationtests/selector/integrationtest_selector.py
@@ -922,14 +922,15 @@ def test_get_available_labels(reset_after_trigger: bool):
         )
     )
 
-    selector.inform_data(
+    selector.inform_data_and_trigger(
         DataInformRequest(
             pipeline_id=pipeline_id,
             keys=[4, 5, 6],
             timestamps=[4, 5, 6],
             labels=[10, 7, 45],
         )
     )
+
     available_labels = selector.get_available_labels(
         GetAvailableLabelsRequest(pipeline_id=pipeline_id)
     ).available_labels

diff --git a/modyn/models/README.md b/modyn/models/README.md
@@ -5,4 +5,9 @@ The user can define models here. The model definition should take as a parameter
 # Wild Time models
 The code for the models used for WildTime is taken from the official [repository](https://github.com/huaxiuyao/Wild-Time). 
 The original version is linked in each class.
-You can find [here](https://raw.githubusercontent.com/huaxiuyao/Wild-Time/main/LICENSE) a copy of the MIT license
+You can find [here](https://raw.githubusercontent.com/huaxiuyao/Wild-Time/main/LICENSE) a copy of the MIT license
+
+# Embedding Recorder
+Many coreset methods are adapted from the [DeepCore](https://github.com/PatrickZH/DeepCore/) library. To use them, the models must keep track of the embeddings (activations of the penultimate layer). This is
+done using the `EmbeddingRecorder` class, which is adapted from the aforementioned project.
+You can find a copy of their MIT license [here](https://raw.githubusercontent.com/PatrickZH/DeepCore/main/LICENSE.md)
diff --git a/modyn/models/articlenet/articlenet.py b/modyn/models/articlenet/articlenet.py
@@ -1,6 +1,7 @@
 from typing import Any
 
 import torch
+from modyn.models.coreset_methods_support import CoresetMethodsSupport
 from torch import nn
 from transformers import DistilBertModel
 
@@ -43,12 +44,16 @@ def __call__(self, data: torch.Tensor) -> torch.Tensor:
         return pooled_output
 
 
-class ArticleNetwork(nn.Module):
+class ArticleNetwork(CoresetMethodsSupport):
     def __init__(self, num_classes: int) -> None:
         super().__init__()
         self.featurizer = DistilBertFeaturizer.from_pretrained("distilbert-base-uncased")
         self.classifier = nn.Linear(self.featurizer.d_out, num_classes)
 
     def forward(self, data: torch.Tensor) -> torch.Tensor:
         embedding = self.featurizer(data)
+        embedding = self.embedding_recorder(embedding)
         return self.classifier(embedding)
+
+    def get_last_layer(self) -> nn.Module:
+        return self.classifier
diff --git a/modyn/models/coreset_methods_support.py b/modyn/models/coreset_methods_support.py
@@ -0,0 +1,60 @@
+from abc import ABC, abstractmethod
+from typing import Optional
+
+import torch
+from torch import nn
+
+
+# acknowledgment: github.com/PatrickZH/DeepCore/
+class EmbeddingRecorder(nn.Module):
+    def __init__(self, record_embedding: bool = False):
+        super().__init__()
+        self.record_embedding = record_embedding
+        self.embedding: Optional[torch.Tensor] = None
+
+    def forward(self, tensor: torch.Tensor) -> torch.Tensor:
+        if self.record_embedding:
+            self.embedding = tensor
+        return tensor
+
+    def start_recording(self) -> None:
+        self.record_embedding = True
+
+    def end_recording(self) -> None:
+        self.record_embedding = False
+        self.embedding = None
+
+
+class CoresetMethodsSupport(nn.Module, ABC):
+    """
+    This class is used to support some Coreset Methods.
+    Embeddings, here defined as the activation before the last layer, are often used to estimate the importance of
+    a point. To implement this class correctly, it is necessary to
+        - implement the get_last_layer method
+        - modify the forward pass so that the last layer embedding is recorded. For example, in a simple network like
+            x = self.fc1(input)
+            x = self.fc2(x)
+            output = self.fc3(x)
+        it must be modified as follows
+            x = self.fc1(input)
+            x = self.fc2(x)
+            x = self.embedding_recorder(x)
+            output = self.fc3(x)
+    """
+
+    def __init__(self, record_embedding: bool = False) -> None:
+        super().__init__()
+        self.embedding_recorder = EmbeddingRecorder(record_embedding)
+
+    @property
+    def embedding(self) -> Optional[torch.Tensor]:
+        assert self.embedding_recorder is not None
+        return self.embedding_recorder.embedding
+
+    @abstractmethod
+    def get_last_layer(self) -> nn.Module:
+        """
+        Returns the last layer. Used for example to obtain the pre-layer and post-layer dimensions of tensors
+
+        """
+        raise NotImplementedError()
diff --git a/modyn/models/dlrm/dlrm.py b/modyn/models/dlrm/dlrm.py
@@ -1,7 +1,8 @@
-from typing import Any
+from typing import Any, Optional
 
 import numpy as np
 import torch
+from modyn.models.coreset_methods_support import CoresetMethodsSupport, EmbeddingRecorder
 from modyn.models.dlrm.nn.factories import create_interaction
 from modyn.models.dlrm.nn.parts import DlrmBottom, DlrmTop
 from modyn.models.dlrm.utils.install_lib import install_cuda_extensions_if_not_present
@@ -16,7 +17,7 @@ def __init__(self, model_configuration: dict[str, Any], device: str, amp: bool)
         self.model.to(device)
 
 
-class DlrmModel(nn.Module):
+class DlrmModel(CoresetMethodsSupport):
     # pylint: disable=too-many-instance-attributes
     def __init__(self, model_configuration: dict[str, Any], device: str, amp: bool) -> None:
         super().__init__()
@@ -124,3 +125,15 @@ def forward(self, data: torch.Tensor) -> torch.Tensor:
             numerical_input, self.reorder_categorical_input(categorical_input)
         )
         return self.top_model(from_bottom, bottom_mlp_output).squeeze()
+
+    # delegate the embedding handling to the top model
+    @property
+    def embedding(self) -> Optional[torch.Tensor]:
+        return self.top_model.embedding
+
+    @property
+    def embedding_recorder(self) -> EmbeddingRecorder:
+        return self.top_model.embedding_recorder
+
+    def get_last_layer(self) -> nn.Module:
+        return self.top_model.get_last_layer()
diff --git a/modyn/models/dlrm/nn/parts.py b/modyn/models/dlrm/nn/parts.py
@@ -19,6 +19,7 @@
 from typing import Optional, Sequence, Tuple
 
 import torch
+from modyn.models.coreset_methods_support import CoresetMethodsSupport
 from modyn.models.dlrm.nn.embeddings import Embeddings
 from modyn.models.dlrm.nn.factories import create_embeddings, create_mlp
 from modyn.models.dlrm.nn.interactions import Interaction
@@ -104,7 +105,7 @@ def forward(self, numerical_input, categorical_inputs) -> Tuple[torch.Tensor, Op
         return torch.cat(bottom_output, dim=1), bottom_mlp_output
 
 
-class DlrmTop(nn.Module):
+class DlrmTop(CoresetMethodsSupport):
     def __init__(self, top_mlp_sizes: Sequence[int], interaction: Interaction, device: str, use_cpp_mlp: bool = False):
         super().__init__()
 
@@ -127,4 +128,9 @@ def forward(self, bottom_output, bottom_mlp_output):
             bottom_mlp_output (Tensor): with shape [batch_size, embedding_dim]
         """
         interaction_output = self.interaction.interact(bottom_output, bottom_mlp_output)
-        return self.out(self.mlp(interaction_output))
+        mlp_output = self.mlp(interaction_output)
+        mlp_output = self.embedding_recorder(mlp_output)
+        return self.out(mlp_output)
+
+    def get_last_layer(self) -> nn.Module:
+        return self.out
diff --git a/modyn/models/fmownet/fmownet.py b/modyn/models/fmownet/fmownet.py
@@ -2,6 +2,7 @@
 
 import torch
 import torch.nn.functional as F
+from modyn.models.coreset_methods_support import CoresetMethodsSupport
 from torch import nn
 from torchvision.models import densenet121
 
@@ -19,7 +20,7 @@ def __init__(self, model_configuration: dict[str, Any], device: str, amp: bool)
         self.model.to(device)
 
 
-class FmowNetModel(nn.Module):
+class FmowNetModel(CoresetMethodsSupport):
     def __init__(self, num_classes: int) -> None:
         super().__init__()
         self.num_classes = num_classes
@@ -31,5 +32,8 @@ def forward(self, data: torch.Tensor) -> torch.Tensor:
         out = F.relu(features, inplace=True)
         out = F.adaptive_avg_pool2d(out, (1, 1))
         out = torch.flatten(out, 1)
-
+        out = self.embedding_recorder(out)
         return self.classifier(out)
+
+    def get_last_layer(self) -> nn.Module:
+        return self.classifier
diff --git a/modyn/models/resnet18/resnet18.py b/modyn/models/resnet18/resnet18.py
@@ -1,10 +1,44 @@
 from typing import Any
 
-from torchvision import models
+import torch
+from modyn.models.coreset_methods_support import CoresetMethodsSupport
+from torch import Tensor, nn
+from torchvision.models.resnet import BasicBlock, ResNet
 
 
 class ResNet18:
     # pylint: disable-next=unused-argument
     def __init__(self, model_configuration: dict[str, Any], device: str, amp: bool) -> None:
-        self.model = models.__dict__["resnet18"](**model_configuration)
+        self.model = ResNet18Modyn(model_configuration)
         self.model.to(device)
+
+
+# the following class is adapted from
+# torchvision https://github.com/pytorch/vision/blob/main/torchvision/models/resnet.py
+
+
+class ResNet18Modyn(ResNet, CoresetMethodsSupport):
+    def __init__(self, model_configuration: dict[str, Any]) -> None:
+        super().__init__(BasicBlock, [2, 2, 2, 2], **model_configuration)
+
+    def _forward_impl(self, x: Tensor) -> Tensor:
+        x = self.conv1(x)
+        x = self.bn1(x)
+        x = self.relu(x)
+        x = self.maxpool(x)
+
+        x = self.layer1(x)
+        x = self.layer2(x)
+        x = self.layer3(x)
+        x = self.layer4(x)
+
+        x = self.avgpool(x)
+        x = torch.flatten(x, 1)
+        # the following line is the only difference compared to the original implementation
+        x = self.embedding_recorder(x)
+        x = self.fc(x)
+
+        return x
+
+    def get_last_layer(self) -> nn.Module:
+        return self.fc
diff --git a/modyn/models/yearbooknet/yearbooknet.py b/modyn/models/yearbooknet/yearbooknet.py
@@ -1,6 +1,7 @@
 from typing import Any
 
 import torch
+from modyn.models.coreset_methods_support import CoresetMethodsSupport
 from torch import nn
 
 
@@ -17,7 +18,7 @@ def __init__(self, model_configuration: dict[str, Any], device: str, amp: bool)
         self.model.to(device)
 
 
-class YearbookNetModel(nn.Module):
+class YearbookNetModel(CoresetMethodsSupport):
     def __init__(self, num_input_channels: int, num_classes: int) -> None:
         super().__init__()
         self.enc = nn.Sequential(
@@ -37,5 +38,8 @@ def conv_block(self, in_channels: int, out_channels: int) -> nn.Module:
     def forward(self, data: torch.Tensor) -> torch.Tensor:
         data = self.enc(data)
         data = torch.mean(data, dim=(2, 3))
-
+        data = self.embedding_recorder(data)
         return self.classifier(data)
+
+    def get_last_layer(self) -> nn.Module:
+        return self.classifier
diff --git a/modyn/selector/internal/selector_strategies/abstract_selection_strategy.py b/modyn/selector/internal/selector_strategies/abstract_selection_strategy.py
@@ -404,7 +404,7 @@ def get_available_labels(self) -> list[int]:
                 database.session.query(SelectorStateMetadata.label)
                 .filter(
                     SelectorStateMetadata.pipeline_id == self._pipeline_id,
-                    SelectorStateMetadata.seen_in_trigger_id >= self._next_trigger_id - self.tail_triggers
+                    SelectorStateMetadata.seen_in_trigger_id >= self._next_trigger_id - self.tail_triggers - 1
                     if self.tail_triggers is not None
                     else True,
                 )

diff --git a/modyn/tests/models/test_dlrm.py b/modyn/tests/models/test_dlrm.py
@@ -67,3 +67,48 @@ def test_dlrm_reorder_categorical_input():
     assert reordered_test_data.shape == (64, 26)
     assert reordered_test_data.dtype == torch.long
     assert torch.equal(reordered_test_data, input_data)
+
+
+def test_get_last_layer():
+    net = DLRM(get_dlrm_configuration(), "cpu", False)
+    last_layer = net.model.get_last_layer()
+
+    assert isinstance(last_layer, torch.nn.Linear)
+    assert last_layer.in_features == 16
+    assert last_layer.out_features == 1
+    assert last_layer.bias.shape == (1,)
+    assert last_layer.weight.shape == (1, 16)
+
+
+def test_dlrm_no_side_effect():
+    model = DLRM(get_dlrm_configuration(), "cpu", False)
+
+    data = {
+        "numerical_input": torch.ones((64, 13), dtype=torch.float32),
+        "categorical_input": torch.ones((64, 26), dtype=torch.long),
+    }
+    out_off = model.model(data)
+    model.model.embedding_recorder.record_embedding = True
+    out_on = model.model(data)
+
+    assert torch.equal(out_on, out_off)
+
+
+def test_shape_embedding_recorder():
+    model = DLRM(get_dlrm_configuration(), "cpu", False)
+
+    data = {
+        "numerical_input": torch.ones((64, 13), dtype=torch.float32),
+        "categorical_input": torch.ones((64, 26), dtype=torch.long),
+    }
+    model.model(data)
+    assert model.model.embedding is None
+    model.model.embedding_recorder.record_embedding = True
+
+    last_layer = model.model.get_last_layer()
+    recorded_output = model.model(data)
+    recorded_embedding = model.model.embedding
+
+    assert recorded_embedding is not None
+    assert recorded_embedding.shape == (64, last_layer.in_features)
+    assert torch.equal(torch.squeeze(last_layer(recorded_embedding)), recorded_output)
diff --git a/modyn/tests/models/test_embedding_recorder.py b/modyn/tests/models/test_embedding_recorder.py
@@ -0,0 +1,33 @@
+import torch
+from modyn.models.coreset_methods_support import EmbeddingRecorder
+
+
+def test_embedding_recording():
+    recorder = EmbeddingRecorder()
+    recorder.start_recording()
+    input_tensor = torch.tensor([1, 2, 3])
+    output_tensor = recorder(input_tensor)
+    assert torch.equal(recorder.embedding, input_tensor)
+    assert torch.equal(output_tensor, input_tensor)
+
+
+def test_no_embedding_recording():
+    recorder = EmbeddingRecorder()
+    input_tensor = torch.tensor([4, 5, 6])
+    output_tensor = recorder(input_tensor)
+    assert recorder.embedding is None
+    assert torch.equal(output_tensor, input_tensor)
+
+
+def test_toggle_embedding_recording():
+    recorder = EmbeddingRecorder()
+    recorder.start_recording()
+    input_tensor = torch.tensor([7, 8, 9])
+    output_tensor = recorder(input_tensor)
+    assert torch.equal(recorder.embedding, input_tensor)
+    assert torch.equal(output_tensor, input_tensor)
+    recorder.end_recording()
+    input_tensor = torch.tensor([10, 11, 12])
+    output_tensor = recorder(input_tensor)
+    assert recorder.embedding is None
+    assert torch.equal(output_tensor, input_tensor)