Search code examples
Tags: unity-game-engine, onnx, mobilenet, barracuda

Unity Object Detection: Barracuda, MobileNET and Webcam


I am trying to run a pre-trained ONNX model in Unity using Barracuda. The model is MobileNet from https://github.com/onnx/models/tree/master/vision/classification/mobilenet, the input comes from my webcam, and I am using the following script to test the system:

using UnityEngine;
using UnityEngine.UI;
using Unity.Barracuda;
using System.IO;
using System.Linq;

/// <summary>
/// Shows a webcam feed in a <see cref="RawImage"/> and, on request, runs a single
/// Barracuda inference on a SIZE x SIZE crop of the current frame, logging the
/// label whose score is highest.
/// </summary>
public class Webcam : MonoBehaviour
{
    public NNModel mob_net;
    public Model model;
    private IWorker worker;

    int current_cam_index = 0;

    WebCamTexture tex;

    public RawImage display;

    // Set by brain(); consumed (and cleared) by the next Update().
    private bool brain_on = false;

    private const int SIZE = 224;
    private const int CHANNELS = 3;
    private const string OUTPUT_NAME = "MobilenetV2/Predictions/Reshape_1";

    // NOTE(review): absolute, machine-specific path kept from the original script;
    // consider moving the label file somewhere that ships with the build.
    private const string LABELS_PATH = @"D:\Unity\WebCam\Cam\Assets\Scenes\mobile_net.txt";

    /// <summary>
    /// Toggles the webcam: stops it when it is running, otherwise loads the model
    /// (once) and starts streaming the selected device into <see cref="display"/>.
    /// </summary>
    public void start_cam()
    {
        if (tex != null)
        {
            stop_cam();
            return;
        }

        ensure_worker();

        WebCamDevice[] devices = WebCamTexture.devices;
        if (current_cam_index < 0 || current_cam_index >= devices.Length)
        {
            Debug.LogWarning("No webcam available at index " + current_cam_index);
            return;
        }

        tex = new WebCamTexture(devices[current_cam_index].name);
        display.texture = tex;
        tex.Play();
    }

    /// <summary>
    /// Stops the webcam and detaches it from the display. Safe to call when the
    /// camera is not running.
    /// </summary>
    public void stop_cam()
    {
        if (display != null)
        {
            display.texture = null;
        }

        if (tex != null)
        {
            tex.Stop();
            tex = null;
        }
    }

    // Loads the model and creates the worker the first time it is needed, so that
    // repeated start/stop toggles do not allocate (and leak) a new worker each time.
    private void ensure_worker()
    {
        if (worker != null)
        {
            return;
        }

        if (mob_net == null)
        {
            Debug.LogError("No NNModel assigned to mob_net");
            return;
        }

        model = ModelLoader.Load(mob_net);
        worker = WorkerFactory.CreateWorker(WorkerFactory.Type.ComputePrecompiled, model);
    }

    /// <summary>
    /// Crops a SIZE x SIZE window from <paramref name="src"/>, normalises it to
    /// [-1, 1], runs the model on it and logs the best-scoring label.
    /// </summary>
    /// <param name="src">Webcam texture to sample the current frame from.</param>
    void crop__normalize_inference(WebCamTexture src)
    {
        if (src == null || worker == null)
        {
            return;
        }

        // The crop cannot be taken until the texture is at least SIZE x SIZE
        // (e.g. before the camera has delivered a real frame).
        if (src.width < SIZE || src.height < SIZE)
        {
            Debug.LogWarning("Webcam frame is smaller than " + SIZE + "x" + SIZE + "; skipping inference");
            return;
        }

        // The crop origin is still derived from the display position, as in the
        // original, but clamped so GetPixels never reads outside the frame.
        int x = Mathf.Clamp(Mathf.FloorToInt(display.transform.position.x), 0, src.width - SIZE);
        int y = Mathf.Clamp(Mathf.FloorToInt(display.transform.position.y), 0, src.height - SIZE);

        Color[] pix = src.GetPixels(x, y, SIZE, SIZE);

        float[] floats = new float[SIZE * SIZE * CHANNELS];

        for (int i = 0; i < pix.Length; ++i)
        {
            Color color = pix[i];
            int offset = i * CHANNELS;

            // Color channels are floats in [0, 1]; 2c - 1 maps them to [-1, 1],
            // the same range as (byte - 127.5) / 127.5 on 0..255 data.
            floats[offset + 0] = color.r * 2f - 1f;
            floats[offset + 1] = color.g * 2f - 1f;
            floats[offset + 2] = color.b * 2f - 1f;
        }

        int index;

        // The input tensor is ours to dispose; `using` releases it even if Execute throws.
        using (Tensor in_tensor = new Tensor(1, SIZE, SIZE, CHANNELS, floats))
        {
            worker.Execute(in_tensor);

            // PeekOutput returns a tensor that stays owned by the worker, so it is
            // deliberately not disposed here.
            Tensor out_tensor = worker.PeekOutput(OUTPUT_NAME);
            index = arg_max(out_tensor.ToReadOnlyArray());
        }

        if (index < 0)
        {
            Debug.LogWarning("Model produced no output values");
            return;
        }

        if (!File.Exists(LABELS_PATH))
        {
            Debug.LogWarning("Label file not found: " + LABELS_PATH + " (class index " + index + ")");
            return;
        }

        string line = File.ReadLines(LABELS_PATH).Skip(index).FirstOrDefault();

        Debug.Log(line ?? ("No label for class index " + index));
    }

    // Returns the index of the largest value, or -1 for a null/empty array.
    private static int arg_max(float[] values)
    {
        if (values == null || values.Length == 0)
        {
            return -1;
        }

        int best = 0;
        for (int i = 1; i < values.Length; ++i)
        {
            if (values[i] > values[best])
            {
                best = i;
            }
        }

        return best;
    }

    /// <summary>
    /// Toggles the request flag; when set, the next Update() runs one inference.
    /// </summary>
    public void brain()
    {
        brain_on = !brain_on;
    }

    private void Update()
    {
        if (!brain_on)
        {
            return;
        }

        // Clear the request first so a failing inference is not retried every frame.
        brain_on = false;

        if (tex == null)
        {
            Debug.LogWarning("Inference requested but the webcam is not running");
            return;
        }

        crop__normalize_inference(tex);
    }

    // Releases the camera and the worker's resources when the component is destroyed.
    private void OnDestroy()
    {
        stop_cam();

        if (worker != null)
        {
            worker.Dispose();
            worker = null;
        }
    }
}

But when I run it I get an error which says:

ArgumentException: Can only specify one unknown dimension

My guess is that either Unity doesn't support the model, or that for some reason my input tensor form is incorrect . . .

Any help would be massively appreciated,

K


Solution

  • Set the Barracuda package version to 1.3.0.