David Scripps
committed on
Commit
·
a706d11
1
Parent(s):
2546a51
adding files
Browse files- .gitattributes +3 -0
- Border Texture.png +3 -0
- README.md +42 -0
- RunLaboroTomato.cs +275 -0
- classes.txt +6 -0
- info.js +5 -0
- info.json +5 -0
- laboro_tomato_yolov8.onnx +3 -0
- laboro_tomato_yolov8.sentis +3 -0
- preview.png +3 -0
- tomatoes.mp4 +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,6 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
*.sentis filter=lfs diff=lfs merge=lfs -text
|
37 |
+
*.png filter=lfs diff=lfs merge=lfs -text
|
38 |
+
*.mp4 filter=lfs diff=lfs merge=lfs -text
|
Border Texture.png
ADDED
![]() |
Git LFS Details
|
README.md
ADDED
@@ -0,0 +1,42 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
library_name: unity-sentis
|
3 |
+
pipeline_tag: object-detection
|
4 |
+
---
|
5 |
+
# LaboroTomato for Unity Sentis (Version 1.4.0-pre.3*)
|
6 |
+
|
7 |
+
[LaboroTomato](https://github.com/laboroai/LaboroTomato) is an image dataset of growing tomatoes at different stages of ripening.
|
8 |
+
|
9 |
+
This model was trained on the LaboroTomato image dataset using the Ultralytics [YOLOv8n](https://docs.ultralytics.com/models/yolov8/) object detection framework. The sentis example implementation was copied from [sentis-YOLOv8n](https://huggingface.co/unity/sentis-YOLOv8n).
|
10 |
+
|
11 |
+
## How to Use
|
12 |
+
First get the package `com.unity.sentis` from the package manager.
|
13 |
+
You will also need the Unity UI package.
|
14 |
+
|
15 |
+
* Create a new scene in Unity 6.
|
16 |
+
* Install `com.unity.sentis` version `1.4.0-pre.3` from the package manager
|
17 |
+
* Add the c# script to the Main Camera.
|
18 |
+
* Create a Raw Image in the scene and link it as the `displayImage`
|
19 |
+
* Drag the yolov8n.sentis file into the model asset field
|
20 |
+
* Drag the classes.txt on to the labelAssets field
|
21 |
+
* Put a video file in the Assets/StreamingAssets folder and set the name of videoName to the filename in the script ("tomatoes.mp4")
|
22 |
+
* Set the fields for the bounding box texture sprite (you can [create your own one](https://docs.unity3d.com/Manual/9SliceSprites.html) using a transparent texture or use an inbuilt one) and the font
|
23 |
+
|
24 |
+
|
25 |
+
## Preview
|
26 |
+
If working correctly you should see something like this:
|
27 |
+
|
28 |
+

|
29 |
+
|
30 |
+
## Information
|
31 |
+
The onnx model was designed with the same inputs as [sentis-YOLOv8n](https://huggingface.co/unity/sentis-YOLOv8n). If you are using that implementation, you can simply swap out the model and labels with the ones in this project and it should work.
|
32 |
+
|
33 |
+
## References
|
34 |
+
For information on how the model was trained and exported to onnx, see the [project github page](https://github.com/DavidAtRedpine/LaboroTomatoYoloV8).
|
35 |
+
|
36 |
+
## Unity Sentis
|
37 |
+
Unity Sentis is the inference engine that runs in Unity 3D. More information can be found at [here](https://unity.com/products/sentis)
|
38 |
+
|
39 |
+
## License
|
40 |
+
Ultralytics YOLOv8 uses the GPLv3 license. Details [here](https://github.com/autogyro/yolo-V8?tab=readme-ov-file#license).
|
41 |
+
|
42 |
+
The LaboroTomato dataset uses the Creative Commons Attribution-NonCommercial-ShareAlike 4.0 International License. Details [here](https://github.com/laboroai/LaboroTomato/blob/master/README.md#license).
|
RunLaboroTomato.cs
ADDED
@@ -0,0 +1,275 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
using System.Collections.Generic;
using Unity.Sentis;
using UnityEngine;
using UnityEngine.UI;
using UnityEngine.Video;
using Lays = Unity.Sentis.Layers;
using System.IO;
using FF = Unity.Sentis.Functional;

/*
 * LaboroTomato (made with YoloV8) Inference Script
 * ================================================
 *
 * Place this script on the Main Camera.
 *
 * Place the laboro_tomato_yolov8.sentis file in the asset folder and drag onto the asset field
 * Place a *.mp4 video file in the Assets/StreamingAssets folder
 * Create a RawImage in your scene and set it as the displayImage field
 * Drag the classes.txt into the labelsAsset field
 * Add a reference to a sprite image for the bounding box and a font for the text
 */

public class RunLaboroTomato : MonoBehaviour
{
    // Drag the laboro_tomato_yolov8.sentis file here
    public ModelAsset asset;
    const string modelName = "laboro_tomato_yolov8.sentis";
    // Change this to the name of the video you put in the StreamingAssets folder:
    const string videoName = "tomatoes.mp4";
    // Link the classes.txt here:
    public TextAsset labelsAsset;
    // Create a Raw Image in the scene and link it here:
    public RawImage displayImage;
    // Link to a bounding box sprite or texture here:
    public Sprite borderSprite;
    public Texture2D borderTexture;
    // Link to the font for the labels:
    public Font font;

    const BackendType backend = BackendType.GPUCompute;

    private Transform displayLocation;
    private IWorker engine;
    private string[] labels;
    private RenderTexture targetRT;

    // Image size expected by the model
    private const int imageWidth = 640;
    private const int imageHeight = 640;

    // The number of classes in the model.
    // FIX: was 80 (the COCO default), but this model is trained on the
    // LaboroTomato dataset whose classes.txt lists exactly 6 classes.
    private const int numClasses = 6;

    private VideoPlayer video;

    List<GameObject> boxPool = new();

    [SerializeField, Range(0, 1)] float iouThreshold = 0.5f;
    [SerializeField, Range(0, 1)] float scoreThreshold = 0.5f;
    // NOTE(review): declared but not currently used — the draw loop in
    // ExecuteML caps at 200 boxes instead. Kept for interface compatibility.
    int maxOutputBoxes = 64;

    // 4x4 matrix that maps (centerX, centerY, width, height) box encoding
    // to (x1, y1, x2, y2) corners, applied via MatMul before NMS.
    TensorFloat centersToCorners;

    // Bounding box data
    public struct BoundingBox
    {
        public float centerX;
        public float centerY;
        public float width;
        public float height;
        public string label;
    }

    void Start()
    {
        Application.targetFrameRate = 60;
        Screen.orientation = ScreenOrientation.LandscapeLeft;

        // Parse neural net labels.
        // FIX: trim each entry so Windows-style "\r\n" line endings in
        // classes.txt do not leave a stray '\r' on every label.
        labels = labelsAsset.text.Split('\n');
        for (int i = 0; i < labels.Length; i++)
        {
            labels[i] = labels[i].Trim();
        }

        LoadModel();

        targetRT = new RenderTexture(imageWidth, imageHeight, 0);

        // Create image to display video
        displayLocation = displayImage.transform;

        SetupInput();

        // Fall back to building a sliced sprite from the raw texture when no
        // sprite was assigned in the inspector.
        if (borderSprite == null)
        {
            // FIX: use float division for the pivot so odd-sized textures
            // are centered correctly (integer division truncated before).
            borderSprite = Sprite.Create(borderTexture,
                new Rect(0, 0, borderTexture.width, borderTexture.height),
                new Vector2(borderTexture.width / 2f, borderTexture.height / 2f));
        }
    }

    // Loads the YOLOv8 model and compiles a second model that appends
    // score thresholding + Non-Max-Suppression to its raw output.
    void LoadModel()
    {
        //Load model
        //var model1 = ModelLoader.Load(Path.Join(Application.streamingAssetsPath, modelName));
        var model1 = ModelLoader.Load(asset);

        centersToCorners = new TensorFloat(new TensorShape(4, 4),
        new float[]
        {
            1, 0, 1, 0,
            0, 1, 0, 1,
            -0.5f, 0, 0.5f, 0,
            0, -0.5f, 0, 0.5f
        });

        //Here we transform the output of the model1 by feeding it through a Non-Max-Suppression layer.
        var model2 = Functional.Compile(
            input =>
            {
                var modelOutput = model1.Forward(input)[0];
                var boxCoords = modelOutput[0, 0..4, ..].Transpose(0, 1);         //shape=(8400,4)
                var allScores = modelOutput[0, 4.., ..];                          //shape=(numClasses,8400)
                // Subtracting the threshold lets NMS's default score cutoff of 0
                // discard boxes whose best class score is below scoreThreshold.
                var scores = FF.ReduceMax(allScores, 0) - scoreThreshold;         //shape=(8400)
                var classIDs = FF.ArgMax(allScores, 0);                           //shape=(8400)
                var boxCorners = FF.MatMul(boxCoords, FunctionalTensor.FromTensor(centersToCorners));
                var indices = FF.NMS(boxCorners, scores, iouThreshold);           //shape=(N)
                var indices2 = indices.Unsqueeze(-1).BroadcastTo(new int[] { 4 });//shape=(N,4)
                var coords = FF.Gather(boxCoords, 0, indices2);                   //shape=(N,4)
                var labelIDs = FF.Gather(classIDs, 0, indices);                   //shape=(N)
                return (coords, labelIDs);
            },
            InputDef.FromModel(model1)[0]
        );

        //Create engine to run model
        engine = WorkerFactory.CreateWorker(backend, model2);
    }

    // Creates a looping VideoPlayer that decodes the StreamingAssets video
    // into an API-only texture we can blit from each frame.
    void SetupInput()
    {
        video = gameObject.AddComponent<VideoPlayer>();
        video.renderMode = VideoRenderMode.APIOnly;
        video.source = VideoSource.Url;
        video.url = Path.Join(Application.streamingAssetsPath, videoName);
        video.isLooping = true;
        video.Play();
    }

    private void Update()
    {
        ExecuteML();

        if (Input.GetKeyDown(KeyCode.Escape))
        {
            Application.Quit();
        }
    }

    // Runs one inference pass on the current video frame and draws the
    // resulting bounding boxes over the display image.
    public void ExecuteML()
    {
        ClearAnnotations();

        if (video && video.texture)
        {
            // Letterbox the video into the square model input, preserving aspect.
            float aspect = video.width * 1f / video.height;
            Graphics.Blit(video.texture, targetRT, new Vector2(1f / aspect, 1), new Vector2(0, 0));
            displayImage.texture = targetRT;
        }
        else return; // no frame decoded yet

        using var input = TextureConverter.ToTensor(targetRT, imageWidth, imageHeight, 3);
        engine.Execute(input);

        var output = engine.PeekOutput("output_0") as TensorFloat;   // box coords (N,4)
        var labelIDs = engine.PeekOutput("output_1") as TensorInt;   // class ids (N)

        output.CompleteOperationsAndDownload();
        labelIDs.CompleteOperationsAndDownload();

        float displayWidth = displayImage.rectTransform.rect.width;
        float displayHeight = displayImage.rectTransform.rect.height;

        // Scale from model pixel space (640x640) to UI space.
        float scaleX = displayWidth / imageWidth;
        float scaleY = displayHeight / imageHeight;

        int boxesFound = output.shape[0];
        //Draw the bounding boxes
        for (int n = 0; n < Mathf.Min(boxesFound, 200); n++)
        {
            var box = new BoundingBox
            {
                // Shift so (0,0) is the center of the RawImage.
                centerX = output[n, 0] * scaleX - displayWidth / 2,
                centerY = output[n, 1] * scaleY - displayHeight / 2,
                width = output[n, 2] * scaleX,
                height = output[n, 3] * scaleY,
                label = labels[labelIDs[n]],
            };
            DrawBox(box, n, displayHeight * 0.05f);
        }
    }

    // Positions and labels the id-th pooled box graphic for the given detection.
    public void DrawBox(BoundingBox box, int id, float fontSize)
    {
        //Create the bounding box graphic or get from pool
        GameObject panel;
        if (id < boxPool.Count)
        {
            panel = boxPool[id];
            panel.SetActive(true);
        }
        else
        {
            panel = CreateNewBox(Color.yellow);
        }
        //Set box position (UI y-axis points up, image y-axis points down)
        panel.transform.localPosition = new Vector3(box.centerX, -box.centerY);

        //Set box size
        RectTransform rt = panel.GetComponent<RectTransform>();
        rt.sizeDelta = new Vector2(box.width, box.height);

        //Set label text
        var label = panel.GetComponentInChildren<Text>();
        label.text = box.label;
        label.fontSize = (int)fontSize;
    }

    // Builds a new pooled bounding-box UI object: a sliced-sprite frame with
    // a text label anchored along its top edge. Returns the frame object.
    public GameObject CreateNewBox(Color color)
    {
        //Create the box and set image
        var panel = new GameObject("ObjectBox");
        panel.AddComponent<CanvasRenderer>();
        Image img = panel.AddComponent<Image>();
        img.color = color;
        img.sprite = borderSprite;
        img.type = Image.Type.Sliced; // 9-slice so the border doesn't stretch
        panel.transform.SetParent(displayLocation, false);

        //Create the label
        var text = new GameObject("ObjectLabel");
        text.AddComponent<CanvasRenderer>();
        text.transform.SetParent(panel.transform, false);
        Text txt = text.AddComponent<Text>();
        txt.font = font;
        txt.color = color;
        txt.fontSize = 40;
        txt.horizontalOverflow = HorizontalWrapMode.Overflow;

        // Stretch the label across the box, 30 units tall, inset 20 from the left.
        RectTransform rt2 = text.GetComponent<RectTransform>();
        rt2.offsetMin = new Vector2(20, rt2.offsetMin.y);
        rt2.offsetMax = new Vector2(0, rt2.offsetMax.y);
        rt2.offsetMin = new Vector2(rt2.offsetMin.x, 0);
        rt2.offsetMax = new Vector2(rt2.offsetMax.x, 30);
        rt2.anchorMin = new Vector2(0, 0);
        rt2.anchorMax = new Vector2(1, 1);

        boxPool.Add(panel);
        return panel;
    }

    // Hides every pooled box so the next frame starts with a clean overlay.
    public void ClearAnnotations()
    {
        foreach (var box in boxPool)
        {
            box.SetActive(false);
        }
    }

    private void OnDestroy()
    {
        centersToCorners?.Dispose();
        engine?.Dispose();
        // FIX: release the render texture allocated in Start to avoid
        // leaking the underlying GPU resource.
        if (targetRT != null)
        {
            targetRT.Release();
        }
    }
}
|
classes.txt
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
b_fully_ripened
|
2 |
+
b_half_ripened
|
3 |
+
b_green
|
4 |
+
l_fully_ripened
|
5 |
+
l_half_ripened
|
6 |
+
l_green
|
info.js
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version" : [
|
3 |
+
"1.4.0-pre.2"
|
4 |
+
]
|
5 |
+
}
|
info.json
ADDED
@@ -0,0 +1,5 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"code": [ "RunLaboroTomato.cs"],
|
3 |
+
"models": [ "laboro_tomato_yolov8.sentis"],
|
4 |
+
"data": [ "classes.txt" ]
|
5 |
+
}
|
laboro_tomato_yolov8.onnx
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0de233be5f31b89ab1482268ff7e72aca0ebb5917bf92afb500de79c0476a86a
|
3 |
+
size 44739449
|
laboro_tomato_yolov8.sentis
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b24b5e411a644600616be29245edc37876df080c86398fb5368a83fe759217cc
|
3 |
+
size 44738340
|
preview.png
ADDED
![]() |
Git LFS Details
|
tomatoes.mp4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:217ecb66a7235e4d3a6eb2557f62b15e69b5c6141ccae8e6ca076680efe0bc7f
|
3 |
+
size 3199970
|