feat(feature-retrieval): add single image feature extraction method

2026-07-12 20:15:31 +08:00 · 2026-02-05 21:08:49 +08:00
parent 7ce97c1965
commit a0df45ab05
3 changed files with 52 additions and 23 deletions
--- a/mini-nav/feature_retrieval.py
+++ b/mini-nav/feature_retrieval.py
@@ -1,8 +1,10 @@
-from typing import Any, Dict, List, Optional, cast
+from typing import Any, Dict, List, Optional, Union, cast
 import polars as pl
 import torch
 from database import db_manager
-from datasets import Dataset, load_dataset
+from datasets import load_dataset
 from PIL import Image
 from tqdm.auto import tqdm
 from transformers import AutoImageProcessor, AutoModel
@@ -101,10 +103,37 @@ class FeatureRetrieval:
                ]
            )
    @torch.no_grad()
    def extract_single_image_feature(self, image: Union[Image.Image, Any]) -> pl.Series:
        """Compute the feature vector of one image; nothing is written to the database.

        Args:
            image: The image to embed (a PIL image or any other input that
                ``self.processor`` accepts).

        Returns:
            pl.Series: A Polars Series named "feature" holding the CLS token
            feature vector.
        """
        target_device = self.model.device
        self.model.eval()

        # Preprocess the image into PyTorch tensors, then move them to the
        # model's device (the return value of ``to`` is not used).
        batch = self.processor(images=image, return_tensors="pt")
        batch.to(target_device, non_blocking=True)

        # Forward pass; position 0 along the token axis is taken as the CLS token.
        hidden_states = self.model(**batch).last_hidden_state  # [1, N, D]
        cls_vector = cast(torch.Tensor, hidden_states[:, 0])  # [1, D]

        # Drop the batch dimension and hand the values back as a Polars Series.
        values = cls_vector.cpu().squeeze(0).tolist()
        return pl.Series("feature", values)
 if __name__ == "__main__":
    train_dataset = load_dataset("uoft-cs/cifar10", split="train")
    train_dataset = cast(Dataset, train_dataset)
    label_map = [
        "airplane",
        "automobile",
--- a/mini-nav/visualizer/app.py
+++ b/mini-nav/visualizer/app.py
@@ -1,5 +1,5 @@
 import datetime
-from typing import Optional
+from typing import List, Optional, Union
 import dash_ag_grid as dag
 import dash_mantine_components as dmc
@@ -7,24 +7,6 @@ from dash import Dash, Input, Output, State, callback, dcc, html
 from database import db_manager
 def parse_contents(contents, filename, date):
    """Build the preview panel for one uploaded file.

    Args:
        contents: The uploaded content string; it is used directly as the
            image source and its first 200 characters are shown as raw text.
        filename: Name shown as the panel heading.
        date: Timestamp passed to ``datetime.datetime.fromtimestamp``.

    Returns:
        An ``html.Div`` with the heading, the timestamp, the image, a
        separator and a truncated raw-content preview.
    """
    heading = html.H5(filename)
    modified_at = html.H6(datetime.datetime.fromtimestamp(date))
    # HTML images accept base64 encoded strings in the same format
    # that is supplied by the upload, so the content is passed through as-is.
    picture = html.Img(src=contents)
    separator = html.Hr()
    raw_label = html.Div("Raw Content")
    # Show only the leading 200 characters of the raw content.
    raw_preview = html.Pre(
        contents[0:200] + "...",
        style={"whiteSpace": "pre-wrap", "wordBreak": "break-all"},
    )
    return html.Div(
        [heading, modified_at, picture, separator, raw_label, raw_preview]
    )
 class APP(Dash):
    """Singleton Dash Application"""
@@ -93,7 +75,22 @@ class APP(Dash):
        State("upload-image", "filename"),
        State("upload-image", "last_modified"),
    )
-    def update_output(list_of_contents, list_of_names, list_of_dates):
+    def update_output(
        list_of_contents: List[str],
        list_of_names: List[str],
        list_of_dates: List[int] | List[float],
    ):
        def parse_contents(contents: str, filename: str, date: Union[int, float]):
            return html.Div(
                [
                    html.H5(filename),
                    html.H6(datetime.datetime.fromtimestamp(date)),
                    # HTML images accept base64 encoded strings in the same format
                    # that is supplied by the upload
                    dmc.Image(src=contents),
                ]
            )
        if list_of_contents is not None:
            children = [
                parse_contents(c, n, d)
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -38,3 +38,6 @@ torch = [
 torchvision = [
    { index = "pytorch-cu130", marker = "sys_platform == 'linux' or sys_platform == 'win32'" },
 ]
 [tool.ty.environment]
 root = ["./mini-nav"]