MTSWebServices
diff --git a/‎benchmark/compare_sasrec_unisrec.py‎
Lines changed: 5 additions & 5 deletions b/‎benchmark/compare_sasrec_unisrec.py‎
Lines changed: 5 additions & 5 deletions
diff --git a/‎rectools/fast_transformers/__init__.py‎
Lines changed: 8 additions & 8 deletions b/‎rectools/fast_transformers/__init__.py‎
Lines changed: 8 additions & 8 deletions
diff --git a/‎rectools/fast_transformers/metrics.py‎
Lines changed: 149 additions & 0 deletions b/‎rectools/fast_transformers/metrics.py‎
Lines changed: 149 additions & 0 deletions
diff --git a/‎rectools/fast_transformers/preprocessing/__init__.py‎
Lines changed: 13 additions & 0 deletions b/‎rectools/fast_transformers/preprocessing/__init__.py‎
Lines changed: 13 additions & 0 deletions
diff --git a/‎…tools/fast_transformers/sequence_data.py‎ ‎…nsformers/preprocessing/sequence_data.py‎rectools/fast_transformers/sequence_data.py renamed to rectools/fast_transformers/preprocessing/sequence_data.py
Lines changed: 0 additions & 39 deletions b/‎…tools/fast_transformers/sequence_data.py‎ ‎…nsformers/preprocessing/sequence_data.py‎rectools/fast_transformers/sequence_data.py renamed to rectools/fast_transformers/preprocessing/sequence_data.py
Lines changed: 0 additions & 39 deletions
diff --git a/‎rectools/fast_transformers/unisrec/__init__.py‎
Lines changed: 12 additions & 0 deletions b/‎rectools/fast_transformers/unisrec/__init__.py‎
Lines changed: 12 additions & 0 deletions
diff --git a/‎…s/fast_transformers/demo_kion_unisrec.md‎ ‎…s/fast_transformers/unisrec/demo_kion.md‎rectools/fast_transformers/demo_kion_unisrec.md renamed to rectools/fast_transformers/unisrec/demo_kion.md
Lines changed: 1 addition & 1 deletion b/‎…s/fast_transformers/demo_kion_unisrec.md‎ ‎…s/fast_transformers/unisrec/demo_kion.md‎rectools/fast_transformers/demo_kion_unisrec.md renamed to rectools/fast_transformers/unisrec/demo_kion.md
Lines changed: 1 addition & 1 deletion
diff --git a/‎…s/fast_transformers/unisrec_lightning.py‎ ‎…s/fast_transformers/unisrec/lightning.py‎rectools/fast_transformers/unisrec_lightning.py renamed to rectools/fast_transformers/unisrec/lightning.py
Lines changed: 7 additions & 17 deletions b/‎…s/fast_transformers/unisrec_lightning.py‎ ‎…s/fast_transformers/unisrec/lightning.py‎rectools/fast_transformers/unisrec_lightning.py renamed to rectools/fast_transformers/unisrec/lightning.py
Lines changed: 7 additions & 17 deletions
@@ -18,7 +18,7 @@
 from rectools import Columns
 from rectools.dataset import Dataset
 from rectools.fast_transformers import UniSRecModel
-from rectools.fast_transformers.sequence_data import build_sequences
+from rectools.fast_transformers.preprocessing import build_sequences
 from rectools.models import SASRecModel
 
 DATA_DIR = Path("data/ml-20m")
@@ -78,13 +78,13 @@ def to_tensors(df):
 
 
 @torch.no_grad()
-def evaluate_unisrec(model, train_df, test_df, k=10, batch_size=256, use_id=False):
+def evaluate_unisrec(model, train_df, test_df, k=10, batch_size=256):
     net = model.net
     net.cuda().eval()
     device = torch.device("cuda")
     maxlen = net.session_max_len
 
-    item_embs = net.item_emb.weight if use_id else net.project_all()
+    item_embs = net.project_all()
     unique_items = model.item_id_mapping
     ext_to_int = {int(unique_items[i].item()): i + 1 for i in range(len(unique_items))}
 
@@ -107,7 +107,7 @@ def evaluate_unisrec(model, train_df, test_df, k=10, batch_size=256, use_id=Fals
         if not seqs:
             continue
         x = torch.tensor(seqs, dtype=torch.long, device=device)
-        h = net.encode_last(x, use_id=use_id)
+        h = net.encode_last(x)
         scores = h @ item_embs.T
         scores[:, 0] = float("-inf")
         for i, target_int in enumerate(targets):
@@ -430,7 +430,7 @@ def sasrec_val_mask(interactions_df, **kwargs):
     # Eval
     print("  Evaluating...")
     t0 = time.time()
-    unisrec_metrics = evaluate_unisrec(unisrec_id, train_with_val, test_ratings, use_id=True)
+    unisrec_metrics = evaluate_unisrec(unisrec_id, train_with_val, test_ratings)
     timings["unisrec_eval"] = time.time() - t0
     print(f"  Eval: {timings['unisrec_eval']:.1f}s")
     hr = unisrec_metrics["HR@10"]
 
@@ -1,27 +1,27 @@
 """Fast Transformers: flat sequential recommenders without ItemNet hierarchy."""
 
+from .metrics import compute_metrics, hitrate_at_k, mrr_at_k, ndcg_at_k
 from .net import FlatSASRec, SASRecBlock
-from .sequence_data import (
-    GPUBatchDataset,
+from .preprocessing import (
     SequenceBatchDataset,
     align_embeddings,
     build_sequences,
-    make_dataloader,
 )
-from .unisrec_lightning import UniSRecLightning
-from .unisrec_model import UniSRecModel
-from .unisrec_net import FeedForward, UniSRec
+from .unisrec import UniSRec, UniSRecLightning, UniSRecModel
+from .unisrec.net import FeedForward
 
 __all__ = [
     "build_sequences",
     "align_embeddings",
     "SequenceBatchDataset",
-    "GPUBatchDataset",
-    "make_dataloader",
     "FlatSASRec",
     "SASRecBlock",
     "UniSRec",
     "FeedForward",
     "UniSRecLightning",
     "UniSRecModel",
+    "hitrate_at_k",
+    "ndcg_at_k",
+    "mrr_at_k",
+    "compute_metrics",
 ]
@@ -0,0 +1,149 @@
+"""GPU-friendly ranking metrics for leave-one-out evaluation.
+
+All functions operate on PyTorch tensors and stay on the original device
+(CPU or CUDA), avoiding numpy/pandas roundtrips.  Results are numerically
+identical to the corresponding RecTools metrics with default settings:
+
+- :class:`rectools.metrics.HitRate` (k=K)
+- :class:`rectools.metrics.NDCG` (k=K, log_base=2, divide_by_achievable=False)
+- :class:`rectools.metrics.MRR` (k=K)
+
+These functions assume **leave-one-out** evaluation: each user has exactly
+one ground-truth target item.
+"""
+
+import typing as tp
+
+import torch
+
+
+@torch.no_grad()
+def hitrate_at_k(
+    topk_ids: torch.Tensor,
+    targets: torch.Tensor,
+) -> torch.Tensor:
+    """Compute leave-one-out Hit Rate @ K: share of users whose target is in their top-K.
+
+    Parameters
+    ----------
+    topk_ids : LongTensor (B, K)
+        Top-K predicted item IDs per user.
+    targets : LongTensor (B,)
+        Ground-truth item ID per user.
+
+    Returns
+    -------
+    Tensor (scalar)
+        Mean hit rate across users.
+    """
+    is_target = topk_ids.eq(targets[:, None])  # targets broadcast as (B, 1) against (B, K)
+    return is_target.any(dim=1).to(torch.float).mean()
+
+
+@torch.no_grad()
+def ndcg_at_k(
+    topk_ids: torch.Tensor,
+    targets: torch.Tensor,
+    log_base: int = 2,
+) -> torch.Tensor:
+    """NDCG @ K (leave-one-out, divide_by_achievable=False).
+
+    Matches :class:`rectools.metrics.NDCG` with default parameters: IDCG is the
+    DCG of K relevant positions (constant across users).  ``log_base`` rescales
+    every discount by the same factor, so it cancels in DCG / IDCG.
+
+    Parameters
+    ----------
+    topk_ids : LongTensor (B, K)
+        Top-K predicted item IDs per user.
+    targets : LongTensor (B,)
+        Ground-truth item ID per user.
+    log_base : int, default 2
+        Logarithm base for the discount factor.
+
+    Returns
+    -------
+    Tensor (scalar)
+        Mean NDCG across users.
+    """
+    k = topk_ids.shape[1]
+    hits = (topk_ids == targets.unsqueeze(1)).float()  # (B, K)
+    ranks = torch.arange(1, k + 1, device=topk_ids.device, dtype=torch.float)
+    discounts = _log(log_base) / torch.log(ranks + 1)  # 1 / log_b(rank + 1) = ln(b) / ln(rank + 1)
+    dcg = (hits * discounts.unsqueeze(0)).sum(dim=1)  # (B,)
+    idcg = discounts.sum()
+    return (dcg / idcg).mean()
+
+
+@torch.no_grad()
+def mrr_at_k(
+    topk_ids: torch.Tensor,
+    targets: torch.Tensor,
+) -> torch.Tensor:
+    """Compute leave-one-out MRR @ K (reciprocal rank is 0 when the target is missed).
+
+    Parameters
+    ----------
+    topk_ids : LongTensor (B, K)
+        Top-K predicted item IDs per user.
+    targets : LongTensor (B,)
+        Ground-truth item ID per user.
+
+    Returns
+    -------
+    Tensor (scalar)
+        Mean reciprocal rank across users.
+    """
+    is_target = topk_ids.eq(targets[:, None])  # (B, K)
+    # argmax over the 0/1 mask gives the index of the first hit; rows with no
+    # hit also give index 0, so they are zeroed out by the ``where`` below.
+    rank = is_target.to(torch.float).argmax(dim=1) + 1  # 1-based, (B,)
+    reciprocal = 1.0 / rank.to(torch.float)
+    found = is_target.any(dim=1)
+    rr = torch.where(found, reciprocal, torch.zeros_like(reciprocal))
+    return rr.mean()
+
+
+@torch.no_grad()
+def compute_metrics(
+    topk_ids: torch.Tensor,
+    targets: torch.Tensor,
+    ks: tp.Optional[tp.List[int]] = None,
+    log_base: int = 2,
+) -> tp.Dict[str, float]:
+    """Compute HR, NDCG, MRR at multiple K values.
+
+    Each cutoff ``k`` is evaluated on the first ``k`` columns of ``topk_ids``,
+    so column position is used as the rank of a prediction.
+
+    Parameters
+    ----------
+    topk_ids : LongTensor (B, K_max)
+        Top-K_max predicted item IDs per user.
+    targets : LongTensor (B,)
+        Ground-truth item ID per user.
+    ks : list of int, optional
+        K values to evaluate. Defaults to ``[K_max]``.
+    log_base : int, default 2
+        Logarithm base for NDCG discount.
+
+    Returns
+    -------
+    dict
+        Keys like ``"HR@10"``, ``"NDCG@10"``, ``"MRR@10"``.
+
+    Raises
+    ------
+    ValueError
+        If any ``k`` is smaller than 1 or larger than ``K_max``.
+    """
+    k_max = topk_ids.shape[1]
+    if ks is None:
+        ks = [k_max]
+    results: tp.Dict[str, float] = {}
+    for k in ks:
+        if k < 1:
+            # ``topk_ids[:, :k]`` with k <= 0 would not fail on its own: it
+            # drops columns from the right (k < 0) or yields an empty list
+            # (k == 0), so reject it explicitly instead of reporting garbage.
+            raise ValueError(f"k={k} must be a positive integer")
+        if k > k_max:
+            raise ValueError(f"k={k} exceeds topk_ids width {k_max}")
+        top = topk_ids[:, :k]
+        results[f"HR@{k}"] = hitrate_at_k(top, targets).item()
+        results[f"NDCG@{k}"] = ndcg_at_k(top, targets, log_base=log_base).item()
+        results[f"MRR@{k}"] = mrr_at_k(top, targets).item()
+    return results
+
+
+def _log(base: int) -> float:
+    """Return the natural logarithm of ``base`` (recomputed on every call)."""
+    from math import log
+    return log(base)
@@ -0,0 +1,13 @@
+"""Vectorized sequence preprocessing for transformer recommenders."""
+
+from .sequence_data import (
+    SequenceBatchDataset,
+    align_embeddings,
+    build_sequences,
+)
+
+__all__ = [
+    "build_sequences",
+    "align_embeddings",
+    "SequenceBatchDataset",
+]
@@ -7,7 +7,6 @@
 import typing as tp
 
 import torch
-from torch.utils.data import DataLoader
 from torch.utils.data import Dataset as TorchDataset
 
 
@@ -171,41 +170,3 @@ def __getitem__(self, idx: int) -> tp.Dict[str, torch.Tensor]:
         if self.transform:
             batch = self.transform(batch)
         return batch
-
-
-# Keep old name as alias for backwards compatibility
-GPUBatchDataset = SequenceBatchDataset
-
-
-def make_dataloader(
-    x: torch.Tensor,
-    y: torch.Tensor,
-    batch_size: int,
-    shuffle: bool = True,
-    transform: tp.Optional[tp.Callable] = None,
-    num_workers: int = 0,
-    **kwargs: tp.Any,
-) -> DataLoader:
-    """Create a DataLoader from prebuilt sequence tensors.
-
-    Parameters
-    ----------
-    x, y : Tensor
-        Input and target sequences from :func:`build_sequences`.
-    batch_size : int
-        Batch size.
-    shuffle : bool, default True
-        Whether to shuffle.
-    transform : callable, optional
-        Per-sample transform (e.g. negative sampling).
-    num_workers : int, default 0
-        Number of DataLoader workers.
-    **kwargs
-        Additional keyword arguments passed to :class:`~torch.utils.data.DataLoader`.
-
-    Returns
-    -------
-    DataLoader
-    """
-    ds = SequenceBatchDataset(x, y, transform=transform)
-    return DataLoader(ds, batch_size=batch_size, shuffle=shuffle, num_workers=num_workers, **kwargs)
@@ -0,0 +1,12 @@
+"""UniSRec: sequential recommender with pretrained text embeddings."""
+
+from .lightning import UniSRecLightning
+from .model import UniSRecModel
+from .net import FeedForward, UniSRec
+
+__all__ = [
+    "UniSRec",
+    "FeedForward",
+    "UniSRecLightning",
+    "UniSRecModel",
+]
@@ -206,7 +206,7 @@ with torch.no_grad():
         if not seqs:
             continue
         x = torch.tensor(seqs, dtype=torch.long, device=device)
-        h = net.encode_last(x, use_id=False)
+        h = net.encode_last(x)
         scores = h @ item_embs.T
         scores[:, 0] = float("-inf")
         for i, target_int in enumerate(targets):
 
@@ -8,7 +8,7 @@
 import torch.nn.functional as F
 from torch.optim.lr_scheduler import LambdaLR
 
-from .unisrec_net import UniSRec
+from .net import UniSRec
 
 SUPPORTED_LOSSES = ("softmax", "BCE", "gBCE", "sampled_softmax")
 SUPPORTED_OPTIMIZERS = ("adam", "adamw")
@@ -17,17 +17,16 @@
 
 class UniSRecLightning(pl.LightningModule):
     """
-    Thin Lightning wrapper reused across all training phases.
+    Thin Lightning wrapper for joint UniSRec training.
 
-    Each phase creates a fresh ``UniSRecLightning`` with appropriate
-    ``param_groups`` and ``use_id`` flag, sharing the same ``net`` instance.
+    Wraps a :class:`UniSRec` network with configurable loss, optimizer,
+    and learning-rate scheduler.
     """
 
     def __init__(
         self,
         net: UniSRec,
         param_groups: tp.List[tp.Dict[str, tp.Any]],
-        use_id: bool = False,
         loss: str = "softmax",
         n_negatives: tp.Optional[int] = None,
         gbce_t: float = 0.2,
@@ -40,7 +39,6 @@ def __init__(
         super().__init__()
         self.net = net
         self._param_groups = param_groups
-        self.use_id = use_id
         self.loss_name = loss
         self.n_negatives = n_negatives
         self.gbce_t = gbce_t
@@ -53,13 +51,9 @@ def __init__(
     # ── helpers ──
 
     def _get_item_embs(self, item_ids: torch.Tensor) -> torch.Tensor:
-        if self.use_id:
-            return self.net.item_emb(item_ids)
         return self.net._adapt_score(self.net._sample_frozen(item_ids))
 
     def _get_all_embs(self) -> torch.Tensor:
-        if self.use_id:
-            return self.net.item_emb.weight
         return self.net.project_all()
 
     def _get_pos_neg_logits(
@@ -90,11 +84,7 @@ def _calc_loss(
         labels = batch["y"]
         has_neg = "negatives" in batch
 
-        if self.loss_name == "softmax" and not has_neg:
-            return self._full_softmax_loss(hidden, labels)
-
-        if self.loss_name == "softmax" and has_neg:
-            # full softmax even if negatives are available
+        if self.loss_name == "softmax":
             return self._full_softmax_loss(hidden, labels)
 
         if not has_neg:
@@ -165,13 +155,13 @@ def _gbce_loss(self, logits: torch.Tensor, mask: torch.Tensor) -> torch.Tensor:
     # ── training / validation ──
 
     def training_step(self, batch: tp.Dict[str, torch.Tensor], batch_idx: int) -> torch.Tensor:
-        hidden = self.net(batch["x"], use_id=self.use_id)
+        hidden = self.net(batch["x"])
         loss = self._calc_loss(hidden, batch)
         self.log("train_loss", loss, prog_bar=True, on_step=False, on_epoch=True)
         return loss
 
     def validation_step(self, batch: tp.Dict[str, torch.Tensor], batch_idx: int) -> torch.Tensor:
-        hidden = self.net(batch["x"], use_id=self.use_id)
+        hidden = self.net(batch["x"])
         # Validation batch has y of shape (B, 1) -- take last hidden position only
         hidden = hidden[:, -1:, :]
         loss = self._calc_loss(hidden, batch)