Merge pull request #625 from plotly/add-dino

Xing Han Lu · web-flow · commit 069846d88c5e · 2021-05-03T23:46:08.000-04:00
Add dash dino app (#minor) Former-commit-id: ffb717b
diff --git a/apps/dash-dino/.gitignore b/apps/dash-dino/.gitignore
@@ -0,0 +1,141 @@
+flask_cache
+.vscode
+
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# C extensions
+*.so
+
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+share/python-wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+cover/
+
+# Translations
+*.mo
+*.pot
+
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+db.sqlite3-journal
+
+# Flask stuff:
+instance/
+.webassets-cache
+
+# Scrapy stuff:
+.scrapy
+
+# Sphinx documentation
+docs/_build/
+
+# PyBuilder
+.pybuilder/
+target/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# IPython
+profile_default/
+ipython_config.py
+
+# pyenv
+#   For a library or package, you might want to ignore these files since the code is
+#   intended to run in multiple environments; otherwise, check them in:
+# .python-version
+
+# pipenv
+#   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
+#   However, in case of collaboration, if having platform-specific dependencies or dependencies
+#   having no cross-platform support, pipenv may install dependencies that don't work, or not
+#   install all needed dependencies.
+#Pipfile.lock
+
+# PEP 582; used by e.g. github.com/David-OConnor/pyflow
+__pypackages__/
+
+# Celery stuff
+celerybeat-schedule
+celerybeat.pid
+
+# SageMath parsed files
+*.sage.py
+
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Spyder project settings
+.spyderproject
+.spyproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+# mypy
+.mypy_cache/
+.dmypy.json
+dmypy.json
+
+# Pyre type checker
+.pyre/
+
+# pytype static type analyzer
+.pytype/
+
+# Cython debug symbols
+cython_debug/
diff --git a/apps/dash-dino/Procfile b/apps/dash-dino/Procfile
@@ -0,0 +1 @@
+web: gunicorn app:server --workers 4
diff --git a/apps/dash-dino/README.md b/apps/dash-dino/README.md
@@ -0,0 +1,48 @@
+# Dash DINO
+
+This is a demo of [Facebook AI's DINO](https://github.com/facebookresearch/dino) model, built using [Dash Labs](https://github.com/plotly/dash-labs).
+
+![Demo of the Dash DINO app](./demo.gif)
+
+Using Dash Labs, you can build apps without specifying a layout. This app was built using this single function:
+
+```python
+@app.callback(
+    args=dict(
+        url=tpl.textbox_input(default_url, label="Image URL", kind=dl.State),
+        run=tpl.button_input("Run", label=""),
+        head=tpl.dropdown_input(list(range(6)), value="0", label="Attention Head"),
+        options=tpl.checklist_input(["use threshold", "overlay"], []),
+        threshold=tpl.slider_input(0, 1, 0.6, 0.01),
+    ),
+    output=tpl.graph_output(),
+    template=tpl,
+)
+def callback(url, run, threshold, head, options):
+    # `run` is the button input; its value is not read in the body.
+    try:
+        im = download_img(url)
+    except Exception:
+        # Any download/decoding failure is reported through the figure title.
+        return go.Figure().update_layout(title="Incorrect URL")
+
+    ix = int(head)
+    # Run model
+    img = transform(im).to(device)
+    attentions, w_featmap, h_featmap = predict(img)
+    th_attn, scalar_attn = apply_threshold(attentions, w_featmap, h_featmap, threshold)
+
+    # Show either the thresholded mask or the raw attention values.
+    attns = th_attn if "use threshold" in options else scalar_attn
+
+    if "overlay" in options:
+        # Draw the heatmap on top of the image.
+        fig = px.imshow(im)
+        fig.add_trace(go.Heatmap(z=attns[ix], opacity=0.55))
+    else:
+        # Image and heatmap side by side, with linked axes.
+        fig = make_subplots(1, 2)
+        fig.add_trace(go.Image(z=im), 1, 1)
+        fig.add_trace(go.Heatmap(z=attns[ix]), 1, 2)
+        fig.update_xaxes(matches="x")
+        fig.update_yaxes(matches="y")
+
+    return fig
+```
+
+The entire layout is generated from the `args` passed to `app.callback`, thanks to Dash Labs [templates](https://community.plotly.com/t/introducing-dash-labs-dash-2-0-preview/52087).
diff --git a/apps/dash-dino/app.py b/apps/dash-dino/app.py
@@ -0,0 +1,138 @@
+import dash
+import dash_bootstrap_components as dbc
+import dash_labs as dl
+import plotly.express as px
+import plotly.graph_objs as go
+from plotly.subplots import make_subplots
+import requests
+import torch
+import torch.nn as nn
+from torchvision import transforms as pth_transforms
+from PIL import Image
+from flask_caching import Cache
+
+
+def download_img(url, size=(600, 600)):
+    """Download the image at ``url`` and return it as a downsized RGB PIL image.
+
+    Args:
+        url: Address of the image to fetch.
+        size: Maximum ``(width, height)`` passed to ``Image.thumbnail``; the
+            image is shrunk in place to fit within it.
+
+    Returns:
+        The downloaded image, converted to "RGB" and thumbnailed to ``size``.
+
+    Raises:
+        requests.RequestException: If the request fails, times out, or the
+            server answers with an HTTP error status.
+        OSError: If Pillow cannot decode the response body as an image.
+    """
+    import io  # local import so this block does not depend on the file header
+
+    # NOTE(review): `url` comes straight from the user; consider restricting
+    # which hosts/schemes may be fetched.
+    # A timeout prevents a stalled server from blocking the worker forever.
+    response = requests.get(url, timeout=10)
+    # Fail early on 4xx/5xx instead of handing an error page to Pillow.
+    response.raise_for_status()
+    # `.content` is fully read and content-decoded, and reading it releases the
+    # connection; the streamed `.raw` object provides neither.
+    im = Image.open(io.BytesIO(response.content)).convert("RGB")
+    im.thumbnail(size)
+    return im
+
+
+# Source: https://github.com/facebookresearch/dino/blob/main/visualize_attention.py
+def compute_attentions(model, patch_size=16):
+    """Build a function that computes a model's self-attention for one image.
+
+    Args:
+        model: Object exposing ``forward_selfattention(batch)``.
+        patch_size: Patch edge length; the image is cropped so that both of
+            its trailing dimensions are multiples of this value.
+
+    Returns:
+        A function ``aux(img)``. ``img`` is a 3-D tensor whose last two
+        dimensions are cropped (presumably channels-first image data - confirm
+        against the caller). ``aux`` returns ``(attentions, w_featmap,
+        h_featmap)``: the model output and the number of patches along each
+        of the two cropped dimensions.
+    """
+
+    def aux(img):
+        # make the image divisible by the patch size
+        # (the names `w`/`h` follow the upstream DINO script; they refer to
+        # dimensions 1 and 2 of `img` respectively)
+        w, h = (
+            img.shape[1] - img.shape[1] % patch_size,
+            img.shape[2] - img.shape[2] % patch_size,
+        )
+        # Crop, then add a leading batch dimension of size 1.
+        img = img[:, :w, :h].unsqueeze(0)
+        w_featmap = img.shape[-2] // patch_size
+        h_featmap = img.shape[-1] // patch_size
+        # Inference only: skip autograd bookkeeping so no graph is built or
+        # kept alive by the returned tensor.
+        with torch.no_grad():
+            attentions = model.forward_selfattention(img)
+
+        return attentions, w_featmap, h_featmap
+
+    return aux
+
+
+# Source: https://github.com/facebookresearch/dino/blob/main/visualize_attention.py
+def apply_threshold(attentions, w_featmap, h_featmap, threshold, patch_size=16):
+    """Turn raw attention into per-head maps, both thresholded and scalar.
+
+    Args:
+        attentions: 4-D tensor indexed as ``attentions[0, :, 0, 1:]``; dimension
+            1 is the head dimension (presumably batch x heads x tokens x tokens
+            with a leading class token - confirm against the model).
+        w_featmap: Number of patches along the first map dimension.
+        h_featmap: Number of patches along the second map dimension.
+        threshold: Fraction of the attention mass to keep in the binary mask.
+        patch_size: Upsampling factor applied to both map dimensions.
+
+    Returns:
+        ``(th_attn, attentions)`` as NumPy arrays, one upsampled map per head:
+        the 0/1 mask of the patches kept by the threshold, and the raw values.
+    """
+    num_heads = attentions.shape[1]
+    # For each head keep row 0 of the attention matrix, dropping column 0.
+    head_attn = attentions[0, :, 0, 1:].reshape(num_heads, -1)
+
+    def upsample(maps):
+        # Nearest-neighbour upsampling by `patch_size`, returned as NumPy.
+        scaled = nn.functional.interpolate(
+            maps.unsqueeze(0), scale_factor=patch_size, mode="nearest"
+        )
+        return scaled[0].detach().cpu().numpy()
+
+    # Sort ascending, normalise each head to sum to 1, and keep the entries
+    # whose cumulative mass exceeds 1 - threshold (i.e. the largest ones).
+    sorted_vals, sort_order = torch.sort(head_attn)
+    sorted_vals = sorted_vals / torch.sum(sorted_vals, dim=1, keepdim=True)
+    keep_sorted = torch.cumsum(sorted_vals, dim=1) > (1 - threshold)
+
+    # Undo the sort so that the mask lines up with the original patch order.
+    inverse_order = torch.argsort(sort_order)
+    keep = torch.gather(keep_sorted, 1, inverse_order)
+
+    mask_maps = upsample(keep.reshape(num_heads, w_featmap, h_featmap).float())
+    scalar_maps = upsample(head_attn.reshape(num_heads, w_featmap, h_featmap))
+
+    return mask_maps, scalar_maps
+
+
+# VARS
+# Image URL pre-filled in the "Image URL" textbox of the app.
+default_url = "https://dl.fbaipublicfiles.com/dino/img.png"
+
+# Load model
+# Use the current directory as the Torch Hub directory.
+torch.hub.set_dir("./")
+# Prefer the GPU when CUDA is available, otherwise fall back to the CPU.
+device = torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu")
+print("Running on", device)
+# Fetch the "dino_deits16" entry point from the DINO repository via Torch Hub.
+model = torch.hub.load("facebookresearch/dino:main", "dino_deits16").to(device)
+# Preprocessing applied to each PIL image before it is given to the model:
+# convert to a tensor, then normalise each channel with the given means and
+# standard deviations (presumably the ImageNet statistics - confirm).
+transform = pth_transforms.Compose(
+    [
+        pth_transforms.ToTensor(),
+        pth_transforms.Normalize((0.485, 0.456, 0.406), (0.229, 0.224, 0.225)),
+    ]
+)
+
+# Initialize dash app and dash-labs template
+title = "Zero-shot segmentation with DINO and Dash Labs"
+app = dash.Dash(__name__, title=title, plugins=[dl.plugins.FlexibleCallbacks()])
+# Flask server object; this is the `app:server` target named in the Procfile.
+server = app.server
+tpl = dl.templates.DbcSidebar(title=title, theme=dbc.themes.DARKLY)
+# File-based cache stored in the "flask_cache" directory.
+cache = Cache(
+    app.server, config={"CACHE_TYPE": "filesystem", "CACHE_DIR": "flask_cache"},
+)
+
+# memoize functions
+# Wrap model inference and image download with the cache (timeout=300).
+# `download_img` is rebound, so later calls go through the memoized wrapper.
+# NOTE(review): `predict` is keyed on a tensor argument - confirm that the
+# cache derives stable keys for it.
+predict = cache.memoize(timeout=300)(compute_attentions(model))
+download_img = cache.memoize(timeout=300)(download_img)
+
+# Define callback function
+@app.callback(
+    args=dict(
+        url=tpl.textbox_input(default_url, label="Image URL", kind=dl.State),
+        run=tpl.button_input("Run", label=""),
+        head=tpl.dropdown_input(list(range(6)), value="0", label="Attention Head"),
+        options=tpl.checklist_input(["use threshold", "overlay"], []),
+        threshold=tpl.slider_input(0, 1, 0.6, 0.01),
+    ),
+    output=tpl.graph_output(),
+    template=tpl,
+)
+def callback(url, run, threshold, head, options):
+    """Build the attention figure for the image at ``url``.
+
+    Args:
+        url: Image address taken from the "Image URL" textbox.
+        run: Value of the "Run" button input; not read in the body.
+        threshold: Slider value forwarded to ``apply_threshold``.
+        head: Selected attention head; converted with ``int`` before indexing.
+        options: Checked option labels ("use threshold" and/or "overlay").
+
+    Returns:
+        A Plotly figure: the attention heatmap drawn over the image when
+        "overlay" is checked, otherwise the image and the heatmap side by
+        side. If the image cannot be downloaded, an empty figure titled
+        "Incorrect URL".
+    """
+    try:
+        im = download_img(url)
+    except Exception:
+        # Report any download/decoding failure to the user. `Exception` (not a
+        # bare `except`) lets KeyboardInterrupt and SystemExit propagate.
+        return go.Figure().update_layout(title="Incorrect URL")
+
+    ix = int(head)
+    # Run model
+    img = transform(im).to(device)
+    attentions, w_featmap, h_featmap = predict(img)
+    th_attn, scalar_attn = apply_threshold(attentions, w_featmap, h_featmap, threshold)
+
+    # Show either the thresholded mask or the raw attention values.
+    attns = th_attn if "use threshold" in options else scalar_attn
+
+    if "overlay" in options:
+        # Semi-transparent heatmap drawn on top of the image.
+        fig = px.imshow(im)
+        fig.add_trace(go.Heatmap(z=attns[ix], opacity=0.55))
+    else:
+        # Image on the left, heatmap on the right, with linked axes.
+        fig = make_subplots(1, 2)
+        fig.add_trace(go.Image(z=im), 1, 1)
+        fig.add_trace(go.Heatmap(z=attns[ix]), 1, 2)
+        fig.update_xaxes(matches="x")
+        fig.update_yaxes(matches="y")
+
+    return fig
+
+
+# Let the template build the page layout; this runs after the callback above
+# has been registered with `template=tpl`.
+app.layout = tpl.layout(app)
+
+
+# Run the development server (debug mode on) only when executed as a script.
+if __name__ == "__main__":
+    app.run_server(debug=True)
diff --git a/apps/dash-dino/demo.gif b/apps/dash-dino/demo.gif
diff --git a/apps/dash-dino/requirements.txt b/apps/dash-dino/requirements.txt
@@ -0,0 +1,12 @@
+torch
+dash-labs==0.1.0
+dash-bootstrap-components
+spectra
+colormath
+requests
+tinycss2
+pandas
+torchvision
+Pillow
+Flask-Caching
+gunicorn