Iainmon
diff --git a/‎demos/video/CMakeLists.txt‎
Lines changed: 53 additions & 8 deletions b/‎demos/video/CMakeLists.txt‎
Lines changed: 53 additions & 8 deletions
diff --git a/‎demos/video/cvtool.hpp‎ ‎demos/video/include/cvtool.hpp‎demos/video/cvtool.hpp renamed to demos/video/include/cvtool.hpp b/‎demos/video/cvtool.hpp‎ ‎demos/video/include/cvtool.hpp‎demos/video/cvtool.hpp renamed to demos/video/include/cvtool.hpp
diff --git a/‎demos/video/imageops.hpp‎ ‎demos/video/include/imageops.hpp‎demos/video/imageops.hpp renamed to demos/video/include/imageops.hpp b/‎demos/video/imageops.hpp‎ ‎demos/video/include/imageops.hpp‎demos/video/imageops.hpp renamed to demos/video/include/imageops.hpp
diff --git a/‎demos/video/style-transfer/model.ipynb‎
Lines changed: 170 additions & 0 deletions b/‎demos/video/style-transfer/model.ipynb‎
Lines changed: 170 additions & 0 deletions
diff --git a/‎demos/video/style-transfer/models/my_module.pt‎
4.43 KB b/‎demos/video/style-transfer/models/my_module.pt‎
4.43 KB
diff --git a/‎demos/video/style-transfer/style_transfer.cpp‎
Lines changed: 48 additions & 0 deletions b/‎demos/video/style-transfer/style_transfer.cpp‎
Lines changed: 48 additions & 0 deletions
diff --git a/‎demos/video/webcam_infer.cpp‎ ‎…os/video/webcam-capture/webcam_infer.cpp‎demos/video/webcam_infer.cpp renamed to demos/video/webcam-capture/webcam_infer.cpp b/‎demos/video/webcam_infer.cpp‎ ‎…os/video/webcam-capture/webcam_infer.cpp‎demos/video/webcam_infer.cpp renamed to demos/video/webcam-capture/webcam_infer.cpp
diff --git a/‎examples/.gitignore‎ b/‎examples/.gitignore‎
diff --git a/‎examples/pytorch-examples/fast_neural_style/.gitignore‎
Lines changed: 1 addition & 0 deletions b/‎examples/pytorch-examples/fast_neural_style/.gitignore‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎examples/pytorch-examples/fast_neural_style/README.md‎
Lines changed: 66 additions & 0 deletions b/‎examples/pytorch-examples/fast_neural_style/README.md‎
Lines changed: 66 additions & 0 deletions
@@ -9,22 +9,19 @@ find_library(METAL Metal REQUIRED)
 find_library(FOUNDATION Foundation REQUIRED)
 
 
+
 add_executable(VidStreamer
-    ${CMAKE_CURRENT_SOURCE_DIR}/webcam_infer.cpp
-    ${CMAKE_CURRENT_SOURCE_DIR}/cvtool.hpp
-    ${CMAKE_CURRENT_SOURCE_DIR}/imageops.hpp
+    ${CMAKE_CURRENT_SOURCE_DIR}/webcam-capture/webcam_infer.cpp
 )
 
 target_include_directories(VidStreamer
     PRIVATE
+        ${CMAKE_CURRENT_SOURCE_DIR}/include
         ${LIBTORCH_DIR}/include
         ${LIBTORCH_DIR}/include/torch/csrc/api/include
 )
 
-target_link_directories(VidStreamer
-    PRIVATE
-        ${LIBTORCH_DIR}/lib
-)
+target_link_directories(VidStreamer PRIVATE ${LIBTORCH_DIR}/lib)
 
 target_link_libraries(VidStreamer
     PRIVATE 
@@ -43,10 +40,58 @@ set_target_properties(VidStreamer PROPERTIES
     RUNTIME_OUTPUT_DIRECTORY ${CMAKE_BINARY_DIR}
 )
 
-
 if (CMAKE_CXX_COMPILER_ID MATCHES "Clang")
   target_compile_options(VidStreamer PRIVATE -Ofast -flto -ffast-math)
   target_link_options(VidStreamer PRIVATE -flto)
 endif()
 
 
+
+
+
+
+
+# StyleTransfer: demo executable built from style-transfer/style_transfer.cpp,
+# which loads a TorchScript module and runs a single forward pass through it.
+add_executable(StyleTransfer
+    "${CMAKE_CURRENT_SOURCE_DIR}/style-transfer/style_transfer.cpp"
+)
+
+# Headers: the shared demo headers under include/ plus the LibTorch headers
+# found under LIBTORCH_DIR. Paths are quoted so that a directory containing
+# spaces is still passed as a single argument.
+target_include_directories(StyleTransfer
+    PRIVATE
+        "${CMAKE_CURRENT_SOURCE_DIR}/include"
+        "${LIBTORCH_DIR}/include"
+        "${LIBTORCH_DIR}/include/torch/csrc/api/include"
+)
+
+# The -l flags below are resolved against this directory.
+target_link_directories(StyleTransfer PRIVATE "${LIBTORCH_DIR}/lib")
+
+# LibTorch is linked by raw -l flags, followed by OpenCV and the libraries held
+# in ACCELERATE / METAL / FOUNDATION.
+# NOTE(review): METAL and FOUNDATION come from find_library calls earlier in
+# this file; ACCELERATE is presumably set the same way -- confirm.
+target_link_libraries(StyleTransfer
+    PRIVATE
+        -ltorch
+        -ltorch_cpu
+        -lc10
+        -ltorch_global_deps
+        ${OpenCV_LIBS}
+        ${ACCELERATE}
+        ${METAL}
+        ${FOUNDATION}
+)
+
+# Place the executable at the top of the build tree.
+set_target_properties(StyleTransfer PROPERTIES
+    RUNTIME_OUTPUT_DIRECTORY "${CMAKE_BINARY_DIR}"
+)
+
+# MATCHES is a regex test, so this covers both "Clang" and "AppleClang".
+# -Ofast / -ffast-math relax strict floating-point semantics in exchange for
+# speed; -flto is passed to both the compile and the link step.
+if (CMAKE_CXX_COMPILER_ID MATCHES "Clang")
+  target_compile_options(StyleTransfer PRIVATE -Ofast -flto -ffast-math)
+  target_link_options(StyleTransfer PRIVATE -flto)
+endif()
+
+
+# Whenever StyleTransfer is (re)built, copy the style-transfer/models directory
+# next to the executable, under the same relative path
+# ("style-transfer/models") that style_transfer.cpp uses to open the model.
+add_custom_command(
+    TARGET StyleTransfer
+    POST_BUILD
+    COMMAND ${CMAKE_COMMAND} -E copy_directory
+            "${CMAKE_CURRENT_SOURCE_DIR}/style-transfer/models"
+            "$<TARGET_FILE_DIR:StyleTransfer>/style-transfer/models"
+    COMMENT "Copying style-transfer models next to the StyleTransfer executable"
+    VERBATIM
+)
@@ -0,0 +1,170 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "6e4d2e04",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import torch"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "id": "ec74c8a7",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "class MyModule(torch.nn.Module):\n",
+    "    def __init__(self, N, M):\n",
+    "        super(MyModule, self).__init__()\n",
+    "        self.linear = torch.nn.Linear(N, M)\n",
+    "\n",
+    "    def forward(self, input):\n",
+    "        return self.linear(input)\n"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "180e54ac",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "my_module = MyModule(10,20)\n",
+    "# sm = torch.jit.script(my_module)\n",
+    "sm = torch.jit.script(my_module)\n",
+    "sm.save(\"models/my_module.pt\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "d5e377e0",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "89e90304",
+   "metadata": {},
+   "outputs": [
+    {
+     "ename": "RuntimeError",
+     "evalue": "Parent directory models does not exist.",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[0;31mRuntimeError\u001b[0m                              Traceback (most recent call last)",
+      "Cell \u001b[0;32mIn[4], line 1\u001b[0m\n\u001b[0;32m----> 1\u001b[0m \u001b[43msm\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43msave\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43mmodels/my_module.pt\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m)\u001b[49m\n",
+      "File \u001b[0;32m~/.venv/lib/python3.12/site-packages/torch/jit/_script.py:754\u001b[0m, in \u001b[0;36mRecursiveScriptModule.save\u001b[0;34m(self, f, **kwargs)\u001b[0m\n\u001b[1;32m    745\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m\u001b[38;5;250m \u001b[39m\u001b[38;5;21msave\u001b[39m(\u001b[38;5;28mself\u001b[39m, f, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs):\n\u001b[1;32m    746\u001b[0m \u001b[38;5;250m    \u001b[39m\u001b[38;5;124mr\u001b[39m\u001b[38;5;124;03m\"\"\"Save with a file-like object.\u001b[39;00m\n\u001b[1;32m    747\u001b[0m \n\u001b[1;32m    748\u001b[0m \u001b[38;5;124;03m    save(f, _extra_files={})\u001b[39;00m\n\u001b[0;32m   (...)\u001b[0m\n\u001b[1;32m    752\u001b[0m \u001b[38;5;124;03m    DO NOT confuse these two functions when it comes to the 'f' parameter functionality.\u001b[39;00m\n\u001b[1;32m    753\u001b[0m \u001b[38;5;124;03m    \"\"\"\u001b[39;00m\n\u001b[0;32m--> 754\u001b[0m     \u001b[38;5;28;01mreturn\u001b[39;00m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_c\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43msave\u001b[49m\u001b[43m(\u001b[49m\u001b[38;5;28;43mstr\u001b[39;49m\u001b[43m(\u001b[49m\u001b[43mf\u001b[49m\u001b[43m)\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[38;5;241;43m*\u001b[39;49m\u001b[43mkwargs\u001b[49m\u001b[43m)\u001b[49m\n",
+      "\u001b[0;31mRuntimeError\u001b[0m: Parent directory models does not exist."
+     ]
+    }
+   ],
+   "source": [
+    "# sm.save(\"models/my_module.pt\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "d85b6e83",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "m = torch.jit.load(\"models/my_module.pt\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 17,
+   "id": "7d6255fd",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "RecursiveScriptModule(\n",
+       "  original_name=MyModule\n",
+       "  (linear): RecursiveScriptModule(original_name=Linear)\n",
+       ")"
+      ]
+     },
+     "execution_count": 17,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "m"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 20,
+   "id": "0d8ff397",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "x = torch.randn(10)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 21,
+   "id": "ffe62563",
+   "metadata": {},
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "tensor([-0.5386,  0.6545,  0.4650, -0.3320,  0.2735,  0.2796, -0.4549,  0.2646,\n",
+       "        -0.9322, -0.3031, -0.3441, -0.3761,  0.6457,  0.6456, -0.2478, -0.2270,\n",
+       "         0.8485,  0.9710, -0.0596,  0.6110], grad_fn=<ViewBackward0>)"
+      ]
+     },
+     "execution_count": 21,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "m(x)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "51739d61",
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.12.9"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
@@ -0,0 +1,48 @@
+#include <torch/torch.h>
+#include <torch/script.h>
+#include <iostream>
+#include <fstream>
+#include <string>
+#include <vector>
+
+/// Loads a TorchScript module from `model_path`.
+///
+/// Progress is logged to stdout. If deserialization fails, the error is
+/// reported on stderr and the c10::Error is rethrown, so a failed load is
+/// never followed by the success message and never hands the caller a
+/// default-constructed module.
+///
+/// @param model_path  Path of the serialized ScriptModule file.
+/// @return            The deserialized module.
+/// @throws c10::Error if torch::jit::load() fails.
+torch::jit::Module load_model(const std::string& model_path) {
+    std::cout << "Loading model from path: " << model_path << std::endl;
+    try {
+        // Deserialize the ScriptModule from a file using torch::jit::load().
+        torch::jit::Module module = torch::jit::load(model_path);
+        std::cout << "Model loaded successfully." << std::endl;
+        return module;
+    } catch (const c10::Error& e) {
+        std::cerr << "error loading the model\n" << e.msg() << std::endl;
+        throw;  // propagate: there is no usable module to return
+    }
+}
+
+/// Feeds `input` to `module`'s forward method and returns the result as a tensor.
+///
+/// The shapes of the input and of the output are printed to stdout.
+///
+/// @param module  Scripted module whose forward method is invoked.
+/// @param input   Tensor passed as the only forward argument.
+/// @return        The forward result converted with toTensor().
+torch::Tensor run_model(torch::jit::Module& module, const torch::Tensor& input) {
+    // forward() takes its arguments as a list of IValues; only one is passed here.
+    const std::vector<torch::jit::IValue> forward_args{input};
+
+    std::cout << "Input tensor: " << input.sizes() << std::endl;
+    torch::Tensor result = module.forward(forward_args).toTensor();
+    std::cout << "Model output: " << result.sizes() << std::endl;
+
+    return result;
+}
+
+
+/// Demo entry point: loads the scripted module, runs it once on a random
+/// input, and prints the shape of the result.
+///
+/// @return 0 on success, 1 if LibTorch reports an error while loading or
+///         running the model.
+int main() {
+    // Relative path: resolved against the current working directory.
+    const std::string model_path = "style-transfer/models/my_module.pt";
+
+    try {
+        // Load the model
+        torch::jit::Module module = load_model(model_path);
+
+        // Create a random input tensor; 10 elements matches the
+        // MyModule(10, 20) instance saved by model.ipynb.
+        torch::Tensor input = torch::randn({10});
+
+        // Run the model
+        torch::Tensor output = run_model(module, input);
+
+        // Print the output tensor
+        std::cout << "Output tensor: " << output.sizes() << std::endl;
+    } catch (const c10::Error& e) {
+        // Exit with a non-zero status instead of terminating on an
+        // uncaught exception.
+        std::cerr << "style transfer demo failed: " << e.msg() << std::endl;
+        return 1;
+    }
+
+    return 0;
+}
@@ -0,0 +1 @@
+saved_models/*
@@ -0,0 +1,66 @@
+# fast-neural-style :city_sunrise: :rocket:
+
+This repository contains a pytorch implementation of an algorithm for artistic style transfer. The algorithm can be used to mix the content of an image with the style of another image. For example, here is a photograph of a door arch rendered in the style of a stained glass painting.
+
+The model uses the method described in [Perceptual Losses for Real-Time Style Transfer and Super-Resolution](https://arxiv.org/abs/1603.08155) along with [Instance Normalization](https://arxiv.org/pdf/1607.08022.pdf). The saved-models for examples shown in the README can be downloaded from [here](https://www.dropbox.com/s/lrvwfehqdcxoza8/saved_models.zip?dl=0).
+
+<p align="center">
+    <img src="images/style-images/mosaic.jpg" height="200px">
+    <img src="images/content-images/amber.jpg" height="200px">
+    <img src="images/output-images/amber-mosaic.jpg" height="440px">
+</p>
+
+## Requirements
+
+The program is written in Python and uses [PyTorch](http://pytorch.org/) and [SciPy](https://www.scipy.org). A GPU is not necessary, but it can provide a significant speedup, especially when training a new model. Regular-sized images can be styled on a laptop or desktop using saved models.
+
+## Usage
+
+Stylize image
+
+```
+python neural_style/neural_style.py eval --content-image </path/to/content/image> --model </path/to/saved/model> --output-image </path/to/output/image> --accel
+```
+
+- `--content-image`: path to content image you want to stylize.
+- `--model`: saved model to be used for stylizing the image (e.g. `mosaic.pth`).
+- `--output-image`: path for saving the output image.
+- `--content-scale`: factor for scaling down the content image if memory is an issue (e.g. a value of 2 will halve the height and width of the content image).
+- `--accel`: use accelerator
+
+Train model
+
+```bash
+python neural_style/neural_style.py train --dataset </path/to/train-dataset> --style-image </path/to/style/image> --save-model-dir </path/to/save-model/folder> --epochs 2 --accel
+```
+
+There are several command line arguments; the important ones are listed below.
+
+- `--dataset`: path to training dataset, the path should point to a folder containing another folder with all the training images. I used COCO 2014 Training images dataset [80K/13GB] [(download)](https://cocodataset.org/#download).
+- `--style-image`: path to style-image.
+- `--save-model-dir`: path to folder where trained model will be saved.
+- `--accel`: use accelerator.
+
+If the `--accel` argument is given, PyTorch will search for an available hardware acceleration device and attempt to use it. This example is known to work on CUDA, MPS and XPU devices.
+
+Refer to `neural_style/neural_style.py` for other command line arguments. For training new models you might have to tune the values of `--content-weight` and `--style-weight`. The mosaic style model shown above was trained with `--content-weight 1e5` and `--style-weight 1e10`. The remaining 3 models were also trained with similar order of weight parameters with slight variation in the `--style-weight` (`5e10` or `1e11`).
+
+## Models
+
+Models for the examples shown below can be downloaded from [here](https://www.dropbox.com/s/lrvwfehqdcxoza8/saved_models.zip?dl=0) or by running the script `download_saved_models.py`.
+
+<div align='center'>
+  <img src='images/content-images/amber.jpg' height="174px">		
+</div>
+
+<div align='center'>
+  <img src='images/style-images/mosaic.jpg' height="174px">
+  <img src='images/output-images/amber-mosaic.jpg' height="174px">
+  <img src='images/output-images/amber-candy.jpg' height="174px">
+  <img src='images/style-images/candy.jpg' height="174px">
+  <br>
+  <img src='images/style-images/rain-princess-cropped.jpg' height="174px">
+  <img src='images/output-images/amber-rain-princess.jpg' height="174px">
+  <img src='images/output-images/amber-udnie.jpg' height="174px">
+  <img src='images/style-images/udnie.jpg' height="174px">
+</div>