From 9238339b99afea902fb2e4a5c614699fd97f6b02 Mon Sep 17 00:00:00 2001
From: Rene
Date: Tue, 14 Mar 2023 21:49:09 -0400
Subject: [PATCH] Add new Mitsuba Python example + update CPU rendering docs
 (#5991)

* Add new material estimation example

* Update docs for CPU rendering for Ubuntu 22.04

Co-authored-by: Sameer Sheorey
---
 docs/docker.in.rst                            |  60 ++++-
 docs/tutorial/visualization/cpu_rendering.rst |  30 ++-
 docs/versions.js                              |   4 +-
 .../mitsuba_material_estimation.py            | 236 ++++++++++++++++++
 4 files changed, 305 insertions(+), 25 deletions(-)
 create mode 100644 examples/python/visualization/mitsuba_material_estimation.py

diff --git a/docs/docker.in.rst b/docs/docker.in.rst
index f22c0a3b03d..25714d0f5d8 100644
--- a/docs/docker.in.rst
+++ b/docs/docker.in.rst
@@ -30,10 +30,11 @@ Python applications looks like this:
 .. code-block:: dockerfile
 
     # This could also be another Ubuntu or Debian based distribution
-    FROM ubuntu:latest
+    FROM ubuntu:22.04
 
     # Install Open3D system dependencies and pip
     RUN apt-get update && apt-get install --no-install-recommends -y \
+        libegl1 \
         libgl1 \
         libgomp1 \
         python3-pip \
@@ -52,11 +53,11 @@ To run GUI applications from the docker container, add these options to the
 
 1. GPU:
 
-   - Intel (Mesa drivers): ``--device=/dev/dri:/dev/dri``
+   - Intel (Mesa drivers): ``--device=/dev/dri:/dev/dri`` or ``--device=/dev/dri/card0:/dev/dri/card0 --device=/dev/dri/renderD128:/dev/dri/renderD128``, depending on your hardware.
    - NVIDIA: ``--gpus 'all,"capabilities=compute,utility,graphics"'``
-   - No GPU (CPU rendering): ``--env OPEN3D_CPU_RENDERING=true``
+   - No GPU (CPU rendering): ``--env OPEN3D_CPU_RENDERING=true`` on Ubuntu 18.04. Later versions automatically select CPU rendering if a GPU is not available.
 
 2. X server: ``-v /tmp/.X11-unix:/tmp/.X11-unix -e DISPLAY``
 
@@ -72,7 +73,7 @@ folder that contains data you wish to visualize.
 
     wget https://github.com/isl-org/Open3D/releases/download/v@OPEN3D_VERSION@/open3d-app-@OPEN3D_VERSION@-Ubuntu.deb
     # Build docker image in folder containing Open3D deb package.
    docker build -t open3d-viewer -f- . <`__ for more
-information.
+information. Note that differences in hardware, OS drivers and OS packages may
+require you to modify these instructions.
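+
+A quick way to confirm that the GUI setup works is to run a trivial
+visualization script from inside the container. A minimal sketch (any
+geometry will do; the script is purely illustrative):
+
+.. code-block:: python
+
+    # Minimal GUI smoke test: draws a lit sphere in the Open3D viewer.
+    import open3d as o3d
+
+    sphere = o3d.geometry.TriangleMesh.create_sphere(radius=1.0)
+    sphere.compute_vertex_normals()
+    sphere.paint_uniform_color([0.1, 0.6, 0.9])
+    o3d.visualization.draw(sphere)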
 
 Headless rendering
 ------------------
 
 If a GUI display server (X11 or Wayland) is not available (either in the docker
-container or the host OS), Open3D can still be used for headless rendering. This
-requires installing some additional dependencies. Here is an example Ubuntu /
-Debian based docker file that runs the ``render_to_image.py`` rendering example.
-Other Linux (e.g. RHEL) distributions will need different dependency packages.
+container or the host OS), Open3D can still be used for headless rendering. On
+Ubuntu 20.04+ (with Mesa version 20.2+) this requires configuring the Mesa
+driver with an environment variable (``EGL_PLATFORM=surfaceless``):
+
+.. code-block:: bash
+
+    mkdir open3d-headless-docker && cd open3d-headless-docker
+    wget https://raw.githubusercontent.com/isl-org/Open3D/v@OPEN3D_VERSION@/examples/python/visualization/render_to_image.py
+    # Build docker image
+    docker build -t open3d-headless -f- . <`__. This is automatically downloaded to `build/_deps/download_mesa_libgl-src/libGL.so.1.5.0` when you build Open3D
-  from source. If you want to use CPU rendering all the time, install this
-  library to ``/usr/local/lib`` or ``$HOME/.local/lib`` and *prepend* it to your
+  from source. The prebuilt version works on Ubuntu 18.04 and Ubuntu 20.04. If
+  you want to use CPU rendering all the time, install this library to
+  ``/usr/local/lib`` or ``$HOME/.local/lib`` and *prepend* it to your
   ``LD_LIBRARY_PATH``:
 
 .. code:: bash
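+
+CPU rendering can also be enabled for a single Python process. A minimal
+sketch of this workflow (the variable must be set before ``open3d`` is
+imported; as noted above, later Ubuntu versions fall back to CPU rendering
+automatically):
+
+.. code-block:: python
+
+    import os
+    # Request CPU rendering for this process only; this must happen
+    # before the open3d import.
+    os.environ['OPEN3D_CPU_RENDERING'] = 'true'
+    import open3d as o3d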
 
diff --git a/docs/versions.js b/docs/versions.js
index 40108d54b97..1522323da11 100644
--- a/docs/versions.js
+++ b/docs/versions.js
@@ -22,8 +22,8 @@ document.write('\
     0.17.0 C++ (release)\
 \
 \
-    0.16.1\
-    0.16.1 C++\
+    0.16.0\
+    0.16.0 C++\
 \
 \
     0.15.1\
diff --git a/examples/python/visualization/mitsuba_material_estimation.py b/examples/python/visualization/mitsuba_material_estimation.py
new file mode 100644
index 00000000000..79783edcf3f
--- /dev/null
+++ b/examples/python/visualization/mitsuba_material_estimation.py
@@ -0,0 +1,236 @@
+# ----------------------------------------------------------------------------
+# -                        Open3D: www.open3d.org                            -
+# ----------------------------------------------------------------------------
+# Copyright (c) 2018-2023 www.open3d.org
+# SPDX-License-Identifier: MIT
+# ----------------------------------------------------------------------------
+
+import sys
+import argparse
+from pathlib import Path
+import open3d as o3d
+import mitsuba as mi
+import drjit as dr
+import numpy as np
+import math
+
+
+def make_mitsuba_scene(mesh, cam_xform, fov, width, height, principal_pts,
+                       envmap):
+    # Camera transform
+    t_from_np = mi.ScalarTransform4f(cam_xform)
+    # Transform necessary to get from Open3D's environment map coordinate
+    # system to Mitsuba's
+    env_t = mi.ScalarTransform4f.rotate(axis=[0, 0, 1],
+                                        angle=90).rotate(axis=[1, 0, 0],
+                                                         angle=90)
+    scene_dict = {
+        "type": "scene",
+        "integrator": {
+            'type': 'path'
+        },
+        "light": {
+            "type": "envmap",
+            "to_world": env_t,
+            "bitmap": mi.Bitmap(envmap),
+        },
+        "sensor": {
+            "type": "perspective",
+            "fov": fov,
+            "to_world": t_from_np,
+            "principal_point_offset_x": principal_pts[0],
+            "principal_point_offset_y": principal_pts[1],
+            "thefilm": {
+                "type": "hdrfilm",
+                "width": width,
+                "height": height,
+            },
+            "thesampler": {
+                "type": "multijitter",
+                "sample_count": 64,
+            },
+        },
+        "themesh": mesh,
+    }
+
+    scene = mi.load_dict(scene_dict)
+    return scene
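+
+
+# Sanity-check sketch (not called anywhere in this example): a scene built by
+# make_mitsuba_scene() can be forward-rendered before any optimization to
+# verify the camera and environment map setup. The helper name and the
+# 'preview.png' output path are illustrative assumptions.
+def preview_scene(scene, path='preview.png', spp=32):
+    # Plain (non-differentiable) forward render of the scene.
+    img = mi.render(scene, spp=spp)
+    # Write the rendered image to disk.
+    mi.util.write_bitmap(path, img)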
+
+
+def run_estimation(mesh, cam_info, ref_image, env_width, iterations, tv_alpha):
+    # Make Mitsuba mesh from Open3D mesh -- conversion will attach a Mitsuba
+    # Principled BSDF to the mesh
+    mesh_opt = mesh.to_mitsuba('themesh')
+
+    # Prepare empty environment map
+    empty_envmap = np.ones((int(env_width / 2), env_width, 3))
+
+    # Create Mitsuba scene
+    scene = make_mitsuba_scene(mesh_opt, cam_info[0], cam_info[1], cam_info[2],
+                               cam_info[3], cam_info[4], empty_envmap)
+
+    def total_variation(image, alpha):
+        diff1 = image[1:, :, :] - image[:-1, :, :]
+        diff2 = image[:, 1:, :] - image[:, :-1, :]
+        return alpha * (dr.sum(dr.abs(diff1)) / len(diff1) +
+                        dr.sum(dr.abs(diff2)) / len(diff2))
+
+    def mse(image, ref_img):
+        return dr.mean(dr.sqr(image - ref_img))
+
+    params = mi.traverse(scene)
+    print(params)
+
+    # Create a Mitsuba Optimizer and configure it to optimize albedo and
+    # environment maps
+    opt = mi.ad.Adam(lr=0.05, mask_updates=True)
+    opt['themesh.bsdf.base_color.data'] = params['themesh.bsdf.base_color.data']
+    opt['light.data'] = params['light.data']
+    params.update(opt)
+
+    integrator = mi.load_dict({'type': 'prb'})
+    for i in range(iterations):
+        img = mi.render(scene, params, spp=8, seed=i, integrator=integrator)
+
+        # Compute loss
+        loss = mse(img, ref_image)
+        # Apply TV regularization if requested
+        if tv_alpha > 0.0:
+            loss = loss + total_variation(opt['themesh.bsdf.base_color.data'],
+                                          tv_alpha)
+
+        # Backpropagate and step. Note: if we were optimizing over a larger
+        # set of inputs, not just a single image, we might want to step only
+        # every N inputs
+        dr.backward(loss)
+        opt.step()
+
+        # Make sure albedo values stay in allowed range
+        opt['themesh.bsdf.base_color.data'] = dr.clamp(
+            opt['themesh.bsdf.base_color.data'], 0.0, 1.0)
+        params.update(opt)
+        print(f'Iteration {i} complete')
+
+    # Done! Return the estimated maps
+    albedo_img = params['themesh.bsdf.base_color.data'].numpy()
+    envmap_img = params['light.data'].numpy()
+    return (albedo_img, envmap_img)
+
+
+def load_input_mesh(model_path, tex_dim):
+    mesh = o3d.t.io.read_triangle_mesh(str(model_path))
+    mesh.material.set_default_properties()
+    # Note: material_name is ignored by Mitsuba; it is only used when
+    # visualizing in Open3D
+    mesh.material.material_name = 'defaultLit'
+    mesh.material.texture_maps['albedo'] = o3d.t.geometry.Image(0.5 + np.zeros(
+        (tex_dim, tex_dim, 3), dtype=np.float32))
+    return mesh
+
+
+def load_input_data(object_path, camera_pose, input_image, tex_dim):
+    print(f'Loading {object_path}...')
+    mesh = load_input_mesh(object_path, tex_dim)
+
+    print(f'Loading camera pose from {camera_pose}...')
+    cam_npz = np.load(camera_pose)
+    img_width = cam_npz['width'].item()
+    img_height = cam_npz['height'].item()
+    cam_xform = np.linalg.inv(cam_npz['T'])
+    cam_xform = np.matmul(
+        cam_xform,
+        np.array([[-1, 0, 0, 0], [0, -1, 0, 0], [0, 0, 1, 0], [0, 0, 0, 1]],
+                 dtype=np.float32))
+    fov = 2 * np.arctan(0.5 * img_width / cam_npz['K'][0, 0])
+    fov = (180.0 / math.pi) * fov.item()
+    camera = (cam_xform, fov, img_width, img_height, (0.0, 0.0))
+
+    print(f'Loading reference image from {input_image}...')
+    ref_img = o3d.t.io.read_image(str(input_image))
+    ref_img = ref_img.as_tensor()[:, :, 0:3].to(o3d.core.Dtype.Float32) / 255.0
+    bmp = mi.Bitmap(ref_img.numpy()).convert(srgb_gamma=False)
+    ref_img = mi.TensorXf(bmp)
+    return (mesh, camera, ref_img)
+
+
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser(
+        description=
+        "Script that estimates texture and environment map from an input image and geometry. You can find data to test this script here: https://github.com/isl-org/open3d_downloads/releases/download/mitsuba-demos/raven_mitsuba.zip.",
+        formatter_class=argparse.ArgumentDefaultsHelpFormatter)
+    parser.add_argument(
+        'object_path',
+        type=Path,
+        help=
+        "Path to the geometry for which to estimate the albedo. It is assumed that the same directory contains an object-name.npz with the camera pose information and an object-name.png with the input image"
+    )
+    parser.add_argument('--env-width',
+                        type=int,
+                        default=1024,
+                        help="The width of the estimated environment map")
+    parser.add_argument('--tex-width',
+                        type=int,
+                        default=2048,
+                        help="The dimensions of the texture")
+    parser.add_argument(
+        '--device',
+        default='cuda' if o3d.core.cuda.is_available() else 'cpu',
+        choices=('cpu', 'cuda'),
+        help="Run Mitsuba on 'cuda' or 'cpu'")
+    parser.add_argument('--iterations',
+                        type=int,
+                        default=40,
+                        help="Number of iterations")
+    parser.add_argument(
+        '--total-variation',
+        type=float,
+        default=0.01,
+        help="Factor to apply to total_variation loss. 0.0 disables TV")
+
+    if len(sys.argv) < 2:
+        parser.print_help(sys.stderr)
+        sys.exit(1)
+    args = parser.parse_args()
+    print("Arguments: ", vars(args))
+
+    # Initialize Mitsuba
+    if args.device == 'cpu':
+        mi.set_variant('llvm_ad_rgb')
+    else:
+        mi.set_variant('cuda_ad_rgb')
+
+    # Confirm that the 3 required inputs exist
+    object_path = args.object_path
+    object_name = object_path.stem
+    datadir = args.object_path.parent
+    camera_pose = datadir / (object_name + '.npz')
+    input_image = datadir / (object_name + '.png')
+    if not object_path.exists():
+        print(f'{object_path} does not exist!')
+        sys.exit(1)
+    if not camera_pose.exists():
+        print(f'{camera_pose} does not exist!')
+        sys.exit(1)
+    if not input_image.exists():
+        print(f'{input_image} does not exist!')
+        sys.exit(1)
+
+    # Load input data
+    mesh, cam_info, input_image = load_input_data(object_path, camera_pose,
+                                                  input_image, args.tex_width)
+
+    # Estimate albedo map
+    print('Running material estimation...')
+    albedo, envmap = run_estimation(mesh, cam_info, input_image,
+                                    args.env_width, args.iterations,
+                                    args.total_variation)
+
+    # Save maps
+    def save_image(img, name, output_dir):
+        # Scale to 0-255
+        texture = o3d.core.Tensor(img * 255.0).to(o3d.core.Dtype.UInt8)
+        texture = o3d.t.geometry.Image(texture)
+        o3d.t.io.write_image(str(output_dir / name), texture)
+
+    print('Saving final results...')
+    save_image(albedo, 'estimated_albedo.png', datadir)
+    mi.Bitmap(envmap).write(str(datadir / 'predicted_envmap.exr'))
+
+    # Visualize result with Open3D
+    mesh.material.texture_maps['albedo'] = o3d.t.io.read_image(
+        str(datadir / 'estimated_albedo.png'))
+    o3d.visualization.draw(mesh)
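+
+# Example usage (sketch; 'path/to/object-name.ply' is a placeholder for the
+# geometry from the demo data linked in the --help text, with the matching
+# object-name.npz and object-name.png alongside it):
+#
+#   python mitsuba_material_estimation.py path/to/object-name.ply
+#
+# estimated_albedo.png and predicted_envmap.exr are written next to the input
+# files, and an Open3D window then shows the mesh with the estimated albedo.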