{ "cells": [ { "cell_type": "code", "execution_count": 1, "source": [ "import sys\n", "import os\n", "import torch\n", "import torch.nn as nn\n", "import matplotlib.pyplot as plt\n", "\n", "rootdir = os.path.abspath(sys.path[0] + '/../')\n", "sys.path.append(rootdir)\n", "torch.cuda.set_device(0)\n", "print(\"Set CUDA:%d as current device.\" % torch.cuda.current_device())\n", "torch.autograd.set_grad_enabled(False)\n", "\n", "from configs.spherical_view_syn import SphericalViewSynConfig\n", "from utils import netio\n", "from utils import img\n", "from utils import device\n", "from utils.view import *\n", "from components.fnr import FoveatedNeuralRenderer\n", "\n", "\n", "def load_net(path):\n", " config = SphericalViewSynConfig()\n", " config.from_id(os.path.splitext(path)[0])\n", " config.sa['perturb_sample'] = False\n", " net = config.create_net().to(device.default())\n", " netio.load(path, net)\n", " return net\n", "\n", "\n", "def find_file(prefix):\n", " for path in os.listdir():\n", " if path.startswith(prefix):\n", " return path\n", " return None\n", "\n", "\n", "def plot_images(images):\n", " plt.figure(figsize=(12, 4))\n", " plt.subplot(131)\n", " img.plot(images['layers_img'][0])\n", " plt.subplot(132)\n", " img.plot(images['layers_img'][1])\n", " plt.subplot(133)\n", " img.plot(images['layers_img'][2])\n", " #plt.figure(figsize=(12, 12))\n", " #img.plot(images['overlaid'])\n", " #plt.figure(figsize=(12, 12))\n", " #img.plot(images['blended_raw'])\n", " plt.figure(figsize=(12, 12))\n", " img.plot(images['blended'])\n", "\n", "\n", "scenes = {\n", " 'classroom': 'classroom_all',\n", " 'stones': 'stones_all',\n", " 'barbershop': 'barbershop_all',\n", " 'lobby': 'lobby_all'\n", "}\n", "\n", "fov_list = [20, 45, 110]\n", "res_list = [(256, 256), (256, 256), (400, 360)]\n", "res_full = (1600, 1440)" ], "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Set CUDA:0 as current device.\n" ] } ], "metadata": {} }, { "cell_type": "code", "execution_count": 2, "source": [ "scene = 'barbershop'\n", "os.chdir(f'{rootdir}/data/__new/{scenes[scene]}')\n", "print('Change working directory to ', os.getcwd())\n", "\n", "fovea_net = load_net(find_file('fovea'))\n", "periph_net = load_net(find_file('periph'))\n", "renderer = FoveatedNeuralRenderer(fov_list, res_list, nn.ModuleList([fovea_net, periph_net, periph_net]),\n", " res_full, device=device.default())" ], "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Change working directory to /home/dengnc/dvs/data/__new/barbershop_all\n", "Load net from fovea200@snerffast4-rgb_e6_fc512x4_d1.20-6.00_s64_~p.pth ...\n", "Load net from periph200@snerffast2-rgb_e6_fc256x4_d1.20-6.00_s32_~p.pth ...\n" ] } ], "metadata": {} }, { "cell_type": "code", "execution_count": 3, "source": [ "params = {\n", " 'classroom': [\n", " #[0, 0, 0, -53, 0, 0, 0],\n", " \n", " #For Eval\n", " [0, 0, 0, 0, 0, 0, 0],\n", " [0, 0, 0, 20, -20, 0, 0],\n", " [-0.03, 0, 0, 0, 0, 0, -83],\n", " [0.03, 0, 0, 0, 0, 0, -83],\n", " [0.3, 0, 0.3, 0, 0], # For panorama (Trans)\n", " [-0.3, -0.3, -0.3, 0, 0], # For panorama (Trans)\n", " [0, -0.3, 0.3, 0, 10, 0, 0], # For panorama (V-D)\n", " [0, 0.3, 0.3, 0, 10, 0, 0], # For panorama (V-D)\n", " [0, 0.3, 0.3, 0, 10, 160, 350], # For panorama (New)\n", " \n", " # For fig latency-quality\n", " #[0, 0, 0, 10, -13, 0, 0], \n", " ],\n", " 'stones': [\n", " #[0, 0, 0, 0, 10, -300, -50],\n", " #[0, 0, 0, 0, 10, 200, -50],\n", " #For Eval\n", " [-0.5, -0.5, -0.5, -25, 0, 50, -230],\n", " [-0.5, -0.5, -0.5, 0, 0, 280, -220],\n", " [-0.5, 0, 0.0, -30, 5, 0, 0],\n", " ],\n", " 'barbershop': [\n", " #[0, 0, 0, 0, 0, 0, 0],\n", " #[0, 0, 0, 20, 0, -300, 50], #For fig rendering-system\n", " #[0, 0, 0, -140, -30, 150, -250],\n", " #[0, 0, 0, -60, -30, 75, -125],\n", " #For Teaser & Eval\n", " [0, 0, 0, 20, 10, 0, 0],\n", " [0, 0, 0, -20, -10, 0, 0],\n", " [0.15, 0, 0.15, -13, -5, 0, 0],\n", " [-0.15, -0.15, 0, 12, 12, 0, 0],\n", " [-0.15, 0, 0.15, -35, 2, 0, 0],\n", " [0, 0.15, 0.15, -13, 10, 0, 0],\n", " [0.15, 0.15, 0, 43, 2, 0, 0],\n", " [-0.15, 0.15, 0.15, -53, -21, 0, 0],\n", " [-0.15, 0.15, 0.15, -53, -21, 200, -200]\n", " ],\n", " 'lobby': [\n", " #[0, 0, 0, 0, 0, 75, 0],\n", " #[0, 0, 0, 0, 0, 5, 150],\n", " #[0.5, 0, 0.5, 29, -12, 0, 0],\n", " #For Eval\n", " [-0.5, -0.5, -0.5, -25, 0, -150, 0],\n", " [-0.5, -0.5, -0.5, 25, 25, -150, 200],\n", " [-0.03, 0, 0, 0, 0, 75, -20],\n", " [0.03, 0, 0, 0, 0, 71, -20]\n", " #[0, 0, 0, -120, 0, 75, 50],\n", " ]\n", "}\n", "\n", "for i, param in enumerate(params[scene]):\n", " view = Trans(torch.tensor(param[:3], device=device.default()),\n", " torch.tensor(euler_to_matrix([-param[4], param[3], 0]), device=device.default()).view(3, 3))\n", " images = renderer(view, param[-2:], using_mask=False, ret_raw=True)\n", " images['overlaid'] = renderer.foveation.synthesis(images['layers_raw'], param[-2:], do_blend=False)\n", " if True:\n", " outputdir = '../__demo/mono/'\n", " misc.create_dir(outputdir)\n", " img.save(images['layers_img'][0], f'{outputdir}{scene}_{i}_fovea.png')\n", " img.save(images['layers_img'][1], f'{outputdir}{scene}_{i}_mid.png')\n", " img.save(images['layers_img'][2], f'{outputdir}{scene}_{i}_periph.png')\n", " img.save(images['blended'], f'{outputdir}{scene}_{i}_blended.png')\n", " #img.save(images['overlaid'], f'{outputdir}{scene}_{i}_overlaid.png')\n", " #img.save(images['blended_raw'], f'{outputdir}{scene}_{i}.png')\n", " else:\n", " images = plot_images(images)\n" ], "outputs": [], "metadata": {} }, { "cell_type": "code", "execution_count": 9, "source": [ "def load_views(data_desc_file) -> Trans:\n", " with open(data_desc_file, 'r', encoding='utf-8') as file:\n", " data_desc = json.loads(file.read())\n", " view_centers = torch.tensor(\n", " data_desc['view_centers'], device=device.default()).view(-1, 3)\n", " view_rots = torch.tensor(\n", " data_desc['view_rots'], device=device.default()).view(-1, 3, 3)\n", " return Trans(view_centers, view_rots)\n", "\n", "\n", "views = load_views('for_panorama_cvt.json')\n", "print('Dataset loaded.')\n", "for view_idx in range(views.size()[0]):\n", " center = (0, 0)\n", " images = renderer(views.get(view_idx), center, using_mask=True)\n", " outputdir = 'panorama'\n", " misc.create_dir(outputdir)\n", " img.save(images['blended'], f'{outputdir}/{view_idx:04d}.png')" ], "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ "Dataset loaded.\n" ] } ], "metadata": {} } ], "metadata": { "kernelspec": { "name": "python3", "display_name": "Python 3.8.5 64-bit ('base': conda)" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.8.5" }, "metadata": { "interpreter": { "hash": "82066b63b621a9e3d15e3b7c11ca76da6238eff3834294910d715044bd0561e5" } }, "interpreter": { "hash": "82066b63b621a9e3d15e3b7c11ca76da6238eff3834294910d715044bd0561e5" } }, "nbformat": 4, "nbformat_minor": 4 }