Iainmon
diff --git a/‎bridge/.DS_Store‎
0 Bytes b/‎bridge/.DS_Store‎
0 Bytes
diff --git a/‎bridge/lib/bridge.cpp‎
Lines changed: 19 additions & 11 deletions b/‎bridge/lib/bridge.cpp‎
Lines changed: 19 additions & 11 deletions
diff --git a/‎demos/models/readme.md‎
Lines changed: 1 addition & 0 deletions b/‎demos/models/readme.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎demos/models/transformer_net.py‎
Lines changed: 103 additions & 0 deletions b/‎demos/models/transformer_net.py‎
Lines changed: 103 additions & 0 deletions
diff --git a/‎demos/video/chapel-webcam/model.ipynb‎
Lines changed: 84 additions & 4 deletions b/‎demos/video/chapel-webcam/model.ipynb‎
Lines changed: 84 additions & 4 deletions
diff --git a/‎demos/video/chapel-webcam/model2.ipynb‎
Lines changed: 117 additions & 0 deletions b/‎demos/video/chapel-webcam/model2.ipynb‎
Lines changed: 117 additions & 0 deletions
diff --git a/‎demos/video/chapel-webcam/sobel.pt‎
0 Bytes b/‎demos/video/chapel-webcam/sobel.pt‎
0 Bytes
@@ -1,6 +1,8 @@
 #include <bridge.h>
 
 #include <torch/torch.h>
+#include <ATen/ATen.h>
+
 #include <torch/script.h>
 
 // #include <torch/script.h>
@@ -27,6 +29,9 @@
 
 
 
+// File-scope guards intended to switch autograd off for inference. Both objects
+// are constructed during static initialization and live for the rest of the program.
+// NOTE(review): PyTorch documents grad mode as thread-local, so these guards
+// presumably only affect the thread that runs the static initializers — confirm
+// that every thread calling into the bridge also disables grad.
+// NOTE(review): `enable_grad` is constructed with `false`, i.e. it disables grad
+// despite its name, and looks redundant with `no_grad` — confirm and drop one.
+torch::NoGradGuard no_grad;
+torch::AutoGradMode enable_grad(false);
+
 int bridge_tensor_elements(bridge_tensor_t &bt) {
     int size = 1;
     for (int i = 0; i < bt.dim; ++i) {
@@ -39,14 +44,14 @@ size_t bridge_tensor_size(bridge_tensor_t &bt) {
     return sizeof(float32_t) * bridge_tensor_elements(bt);
 }
 
+// Copies the tensor's elements into the caller-provided buffer `dest`.
+// Exactly sizeof(float32_t) * input.numel() bytes are copied, starting at the
+// tensor's data pointer; `dest` must have room for that many bytes.
+// NOTE(review): data_ptr<float32_t>() plus a flat memcpy presumably requires a
+// contiguous float32 tensor in host memory — confirm that callers guarantee this.
-void store_tensor(torch::Tensor &input, float32_t* dest) {
+void store_tensor(at::Tensor &input, float32_t* dest) {
     float32_t * data = input.data_ptr<float32_t>();
     size_t bytes_size = sizeof(float32_t) * input.numel();
     // std::memmove(dest,data,bytes_size);
     std::memcpy(dest,data,bytes_size);
 }
 
-bridge_tensor_t torch_to_bridge(torch::Tensor &tensor) {
+bridge_tensor_t torch_to_bridge(at::Tensor &tensor) {
     bridge_tensor_t result;
     result.created_by_c = true;
     result.dim = tensor.dim();
@@ -59,13 +64,13 @@ bridge_tensor_t torch_to_bridge(torch::Tensor &tensor) {
     return result;
 }
 
+// Builds a float tensor over the bridge tensor's buffer.
+// The shape is taken from the first `bt.dim` entries of `bt.sizes`, and the
+// tensor is created with torch::from_blob on `bt.data`.
+// NOTE(review): from_blob presumably wraps the buffer without copying or taking
+// ownership, so the result is only valid while `bt.data` stays alive — confirm.
-torch::Tensor bridge_to_torch(bridge_tensor_t &bt) {
+at::Tensor bridge_to_torch(bridge_tensor_t &bt) {
     std::vector<int64_t> sizes_vec(bt.sizes, bt.sizes + bt.dim);
     auto shape = torch::IntArrayRef(sizes_vec);
     return torch::from_blob(bt.data, shape, torch::kFloat);
 }
 
-torch::Tensor bridge_to_torch(bridge_tensor_t &bt,torch::Device device, bool copy,torch::ScalarType dtype = torch::kFloat32) {
+at::Tensor bridge_to_torch(bridge_tensor_t &bt,torch::Device device, bool copy,torch::ScalarType dtype = torch::kFloat32) {
     std::vector<int64_t> sizes_vec(bt.sizes, bt.sizes + bt.dim);
     auto shape = torch::IntArrayRef(sizes_vec);
     auto t = torch::from_blob(bt.data, shape, torch::kFloat);
@@ -144,6 +149,10 @@ extern "C" bridge_tensor_t load_run_model(const uint8_t* model_path, bridge_tens
 }
 
 
+// Device and dtype that models are moved to and inputs are converted to before
+// inference. Typed constants instead of macros: same names, but scoped and
+// type-checked, so they cannot rewrite unrelated identifiers in included headers.
+constexpr auto DEVICE = torch::kMPS;
+constexpr auto DTYPE = torch::kFloat16;
+
+
 extern "C" bridge_pt_model_t load_model(const uint8_t* model_path) {
 
     std::cout << "Begin loading model from path: " << model_path << std::endl;
@@ -153,9 +162,8 @@ extern "C" bridge_pt_model_t load_model(const uint8_t* model_path) {
     std::cout.flush();
 
     try {
-
         auto* module = new torch::jit::Module(torch::jit::load(path));
-        module->to(torch::kMPS,torch::kFloat16,false);
+        module->to(DEVICE,DTYPE,false);
         module->eval();
         std::cout << "Model loaded successfully!" << std::endl;
         std::cout.flush();
@@ -204,23 +212,23 @@ extern "C" bridge_pt_model_t load_model(const uint8_t* model_path) {
 
 
 bridge_tensor_t model_forward(bridge_pt_model_t model, bridge_tensor_t input, bool is_vgg_based_model) {
-
-    auto tn_mps = bridge_to_torch(input,torch::kMPS,true,torch::kFloat16);
-    // auto tn_mps = tn.to(torch::kMPS,false,true);
+    auto tn_mps = bridge_to_torch(input,DEVICE,true,DTYPE);
     auto tn = tn_mps.permute({2, 0, 1}).unsqueeze(0).contiguous();
 
     std::vector<torch::jit::IValue> ins;
     ins.push_back(tn);
 
     auto* module = static_cast<torch::jit::Module*>(model.pt_module);
     auto o = module->forward(ins).toTensor();
-    auto tn_out = o.squeeze(0).contiguous().permute({1, 2, 0}).contiguous();
+    auto tn_out = o.squeeze(0).permute({1, 2, 0}).contiguous();
+    // auto tn_out = o.squeeze(0).contiguous().permute({1, 2, 0}).contiguous();
 
     if (is_vgg_based_model) {
-        tn_out = tn_out / 255.0;
+        tn_out.div_(255.0);
     }
 
     auto tn_out_cpu = tn_out.to(torch::kCPU,torch::kFloat32,false,true);
+    
     return torch_to_bridge(tn_out_cpu);
 
 }
 
@@ -0,0 +1 @@
+This folder contains the model architectures used in the demos.
@@ -0,0 +1,103 @@
+import torch
+
+
+class TransformerNet(torch.nn.Module):
+    """Convolutional image-to-image network.
+
+    Layout, as built in ``__init__``: three ConvLayer + InstanceNorm2d + ReLU
+    stages (3 -> 32 -> 64 -> 128 channels, the last two with stride 2), five
+    ResidualBlock(128) stages, two UpsampleConvLayer + InstanceNorm2d + ReLU
+    stages (128 -> 64 -> 32 channels), and a final 9x9 ConvLayer to 3 channels
+    with no normalization or activation after it.
+    """
+
+    def __init__(self):
+        super(TransformerNet, self).__init__()
+        # Initial convolution layers
+        self.conv1 = ConvLayer(3, 32, kernel_size=9, stride=1)
+        self.in1 = torch.nn.InstanceNorm2d(32, affine=True)
+        self.conv2 = ConvLayer(32, 64, kernel_size=3, stride=2)
+        self.in2 = torch.nn.InstanceNorm2d(64, affine=True)
+        self.conv3 = ConvLayer(64, 128, kernel_size=3, stride=2)
+        self.in3 = torch.nn.InstanceNorm2d(128, affine=True)
+        # Residual layers
+        self.res1 = ResidualBlock(128)
+        self.res2 = ResidualBlock(128)
+        self.res3 = ResidualBlock(128)
+        self.res4 = ResidualBlock(128)
+        self.res5 = ResidualBlock(128)
+        # Upsampling Layers
+        self.deconv1 = UpsampleConvLayer(128, 64, kernel_size=3, stride=1, upsample=2)
+        self.in4 = torch.nn.InstanceNorm2d(64, affine=True)
+        self.deconv2 = UpsampleConvLayer(64, 32, kernel_size=3, stride=1, upsample=2)
+        self.in5 = torch.nn.InstanceNorm2d(32, affine=True)
+        self.deconv3 = ConvLayer(32, 3, kernel_size=9, stride=1)
+        # Non-linearities
+        self.relu = torch.nn.ReLU()
+
+    def forward(self, X):
+        """Apply the network to ``X`` and return the final convolution's output.
+
+        ``X`` is fed straight into a 3-input-channel convolution
+        (presumably an (N, 3, H, W) image batch — confirm against callers).
+        """
+        # Encoder: conv -> instance norm -> ReLU, three times.
+        y = self.relu(self.in1(self.conv1(X)))
+        y = self.relu(self.in2(self.conv2(y)))
+        y = self.relu(self.in3(self.conv3(y)))
+        # Five residual blocks at 128 channels.
+        y = self.res1(y)
+        y = self.res2(y)
+        y = self.res3(y)
+        y = self.res4(y)
+        y = self.res5(y)
+        # Decoder: two upsample-conv stages, then a plain conv with no activation.
+        y = self.relu(self.in4(self.deconv1(y)))
+        y = self.relu(self.in5(self.deconv2(y)))
+        y = self.deconv3(y)
+        return y
+
+
+class ConvLayer(torch.nn.Module):
+    """Reflection padding followed by a 2-D convolution.
+
+    The padding width is ``kernel_size // 2``; the convolution itself is built
+    without any padding argument of its own.
+    """
+
+    def __init__(self, in_channels, out_channels, kernel_size, stride):
+        super(ConvLayer, self).__init__()
+        # Pad by half the kernel size before the (unpadded) convolution.
+        reflection_padding = kernel_size // 2
+        self.reflection_pad = torch.nn.ReflectionPad2d(reflection_padding)
+        self.conv2d = torch.nn.Conv2d(in_channels, out_channels, kernel_size, stride)
+
+    def forward(self, x):
+        """Return ``conv2d(reflection_pad(x))``."""
+        out = self.reflection_pad(x)
+        out = self.conv2d(out)
+        return out
+
+
+class ResidualBlock(torch.nn.Module):
+    """ResidualBlock
+    introduced in: https://arxiv.org/abs/1512.03385
+    recommended architecture: http://torch.ch/blog/2016/02/04/resnets.html
+
+    Two 3x3 ConvLayer + InstanceNorm2d stages with a ReLU after the first one;
+    the block's input is added to the result. The channel count is unchanged.
+    """
+
+    def __init__(self, channels):
+        super(ResidualBlock, self).__init__()
+        self.conv1 = ConvLayer(channels, channels, kernel_size=3, stride=1)
+        self.in1 = torch.nn.InstanceNorm2d(channels, affine=True)
+        self.conv2 = ConvLayer(channels, channels, kernel_size=3, stride=1)
+        self.in2 = torch.nn.InstanceNorm2d(channels, affine=True)
+        self.relu = torch.nn.ReLU()
+
+    def forward(self, x):
+        """Return ``x + in2(conv2(relu(in1(conv1(x)))))``."""
+        residual = x
+        out = self.relu(self.in1(self.conv1(x)))
+        # No activation after the second normalization or after the skip addition.
+        out = self.in2(self.conv2(out))
+        out = out + residual
+        return out
+
+
+class UpsampleConvLayer(torch.nn.Module):
+    """UpsampleConvLayer
+    Upsamples the input and then does a convolution. This method gives better results
+    compared to ConvTranspose2d.
+    ref: http://distill.pub/2016/deconv-checkerboard/
+    """
+
+    def __init__(self, in_channels, out_channels, kernel_size, stride, upsample):
+        """Build the upsample -> reflection pad -> conv pipeline.
+
+        Args:
+            in_channels: input channels of the convolution.
+            out_channels: output channels of the convolution.
+            kernel_size: convolution kernel size; the reflection padding is
+                ``kernel_size // 2``.
+            stride: convolution stride.
+            upsample: nearest-neighbour scale factor applied before padding.
+                A falsy value (``None`` or ``0``) disables upsampling.
+        """
+        super(UpsampleConvLayer, self).__init__()
+        # Honour the requested factor instead of a hard-coded 2. The step stays a
+        # submodule (Upsample or Identity) so forward() needs no Python branch.
+        if upsample:
+            self.upsample = torch.nn.Upsample(scale_factor=upsample, mode='nearest')
+        else:
+            self.upsample = torch.nn.Identity()
+        reflection_padding = kernel_size // 2
+        self.reflection_pad = torch.nn.ReflectionPad2d(reflection_padding)
+        self.conv2d = torch.nn.Conv2d(in_channels, out_channels, kernel_size, stride)
+
+    def forward(self, x):
+        """Return ``conv2d(reflection_pad(upsample(x)))``."""
+        out = self.upsample(x)
+        out = self.reflection_pad(out)
+        out = self.conv2d(out)
+        return out
@@ -0,0 +1,117 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "22e96cc8",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import torch\n",
+    "from torchvision.io import decode_image,read_image\n",
+    "from torchvision import transforms\n",
+    "from torchvision.transforms import functional as F\n",
+    "from PIL import Image\n",
+    "import matplotlib.pyplot as plt\n",
+    "def show_image(image):\n",
+    "    # plt.imshow(transforms.ToPILImage()(image), interpolation=\"bicubic\")\n",
+    "    # # pil_image = transforms.ToPILImage()(image)\n",
+    "    # # pil_image.show()\n",
+    "    plt.imshow(image.detach().permute(1, 2, 0).cpu())\n",
+    "    plt.axis('off')\n",
+    "    plt.show()\n",
+    "\n",
+    "# img = decode_image('coast.jpeg', mode='RGB')\n",
+    "# img = img.to(torch.float32) / 255.0\n",
+    "\n",
+    "pil_img = Image.open('coast.jpeg')\n",
+    "img = F.to_tensor(pil_img)\n",
+    "print(img.shape)\n",
+    "show_image(img)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "335855a9",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "device = torch.device('mps')\n",
+    "stm = torch.jit.load('../style-transfer/models/exports/mps/mosaic_float16.pt', map_location=device)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "9d32c34b",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "stm.to(device)\n",
+    "stm.eval()\n",
+    "print(\"Model loaded.\")\n",
+    "# help(stm)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "20e724b3",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "in_img = img.to(device).to(torch.float16).unsqueeze(0).contiguous()\n",
+    "in_img.shape\n",
+    "x = in_img.squeeze(0).to(torch.float32)\n",
+    "print(x.shape)\n",
+    "show_image(x)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "a6de87a4",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "output = stm(in_img).detach()\n",
+    "print(output.shape,output.dtype,output.device)\n",
+    "torch.mps.empty_cache()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "473c1852",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "out_img = (output.squeeze(0) / 255.0).to(torch.float32)\n",
+    "print(out_img.shape)\n",
+    "show_image(out_img)"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.9"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+This folder contains the model architectures used in the demos.`