Paul Bird
committed on
Commit 5f14f33
1 Parent(s): ab1e40d
Upload 4 files
- .gitattributes +1 -0
- MiniLMv6.cs +158 -0
- MiniLMv6.onnx +3 -0
- MiniLMv6.sentis +3 -0
- vocab.txt +0 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+MiniLMv6.sentis filter=lfs diff=lfs merge=lfs -text
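(The new rule keeps the ~91 MB MiniLMv6.sentis binary in Git LFS, matching the repo's existing *.zip, *.zst, and *tfevents* patterns; the LFS pointer it produces appears further down.)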
MiniLMv6.cs
ADDED
@@ -0,0 +1,158 @@
using System.Collections.Generic;
using UnityEngine;
using Unity.Sentis;
using System.IO;
using System.Text;

/*
 * MiniLM Sentence Similarity Inference Code
 * =========================================
 *
 * Put this script on the Main Camera.
 *
 * In Assets/StreamingAssets put:
 *
 *   MiniLMv6.sentis
 *   vocab.txt
 *
 * Install package com.unity.sentis
 *
 */


public class MiniLM : MonoBehaviour
{
    const BackendType backend = BackendType.GPUCompute;

    string string1 = "That is a happy person"; // similarity = 1

    //Choose a string to compare string1 to:
    string string2 = "That is a happy dog";            // similarity = 0.695
    //string string2 = "That is a very happy person";  // similarity = 0.943
    //string string2 = "Today is a sunny day";         // similarity = 0.257

    //Special tokens (BERT WordPiece [CLS] and [SEP])
    const int START_TOKEN = 101;
    const int END_TOKEN = 102;

    Ops ops;
    ITensorAllocator allocator;

    //Store the vocabulary, one token per line of vocab.txt
    string[] tokens;

    IWorker engine;

    void Start()
    {
        allocator = new TensorCachingAllocator();
        ops = WorkerFactory.CreateOps(backend, allocator);

        tokens = File.ReadAllLines(Application.streamingAssetsPath + "/vocab.txt");

        Model model = ModelLoader.Load(Application.streamingAssetsPath + "/MiniLMv6.sentis");

        engine = WorkerFactory.CreateWorker(backend, model);

        var tokens1 = GetTokens(string1);
        var tokens2 = GetTokens(string2);

        TensorFloat embedding1 = GetEmbedding(tokens1);
        TensorFloat embedding2 = GetEmbedding(tokens2);

        Debug.Log("Similarity Score: " + DotScore(embedding1, embedding2));
    }

    //Both embeddings are unit length (see MeanPooling), so the dot product is the cosine similarity
    float DotScore(TensorFloat embedding1, TensorFloat embedding2)
    {
        using var prod = ops.Mul(embedding1, embedding2);
        using var dot = ops.ReduceSum(prod, new int[] { 1 }, false);
        dot.MakeReadable();
        return dot[0];
    }

    TensorFloat GetEmbedding(List<int> tokenIds)
    {
        int N = tokenIds.Count;
        using var input_ids = new TensorInt(new TensorShape(1, N), tokenIds.ToArray());
        using var token_type_ids = new TensorInt(new TensorShape(1, N), new int[N]);
        int[] mask = new int[N];
        for (int i = 0; i < mask.Length; i++)
        {
            mask[i] = 1;
        }
        using var attention_mask = new TensorInt(new TensorShape(1, N), mask);

        var inputs = new Dictionary<string, Tensor>
        {
            {"input_ids", input_ids},
            {"token_type_ids", token_type_ids},
            {"attention_mask", attention_mask}
        };

        engine.Execute(inputs);

        var tokenEmbeddings = engine.PeekOutput("output") as TensorFloat;

        return MeanPooling(tokenEmbeddings, attention_mask);
    }

    //Get the average of the token embeddings, taking the attention mask into account, then L2-normalize
    TensorFloat MeanPooling(TensorFloat tokenEmbeddings, TensorInt attentionMask)
    {
        using var mask0 = attentionMask.ShallowReshape(attentionMask.shape.Unsqueeze(-1)) as TensorInt;
        using var maskExpanded = ops.Expand(mask0, tokenEmbeddings.shape);
        using var maskExpandedF = ops.Cast(maskExpanded, DataType.Float) as TensorFloat;
        using var maskedEmbeddings = ops.Mul(tokenEmbeddings, maskExpandedF);
        using var summed = ops.ReduceSum(maskedEmbeddings, new[] { 1 }, false);
        using var counts = ops.ReduceSum(maskExpandedF, new[] { 1 }, false);
        using var countsClipped = ops.Clip(counts, 1e-9f, float.MaxValue); //guard against division by zero
        using var mean = ops.Div(summed, countsClipped);
        using var norm = ops.ReduceL2(mean, new[] { 1 }, true);
        return ops.Div(mean, norm);
    }

    //Greedy longest-match-first WordPiece tokenization against vocab.txt
    List<int> GetTokens(string text)
    {
        //split over whitespace
        string[] words = text.ToLower().Split(null);

        var ids = new List<int>
        {
            START_TOKEN
        };

        string s = "";

        foreach (var word in words)
        {
            int start = 0;
            //try the longest remaining substring first; stop before i == start to avoid empty subwords
            for (int i = word.Length; i > start; i--)
            {
                string subword = start == 0 ? word.Substring(start, i) : "##" + word.Substring(start, i - start);
                int index = System.Array.IndexOf(tokens, subword);
                if (index >= 0)
                {
                    ids.Add(index);
                    s += subword + " ";
                    if (i == word.Length) break;
                    start = i;
                    i = word.Length + 1;
                }
            }
        }

        ids.Add(END_TOKEN);

        Debug.Log("Tokenized sentence = " + s);

        return ids;
    }

    private void OnDestroy()
    {
        engine?.Dispose();
        ops?.Dispose();
        allocator?.Dispose();
    }
}
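For reference, MeanPooling implements the usual sentence-transformers pooling: a mask-weighted mean of the token embeddings followed by L2 normalisation. With token embeddings t_i and attention mask m_i over N tokens:

\[
e = \frac{\sum_{i=1}^{N} m_i \, t_i}{\max\!\left(\sum_{i=1}^{N} m_i,\ 10^{-9}\right)},
\qquad
\hat{e} = \frac{e}{\lVert e \rVert_2}
\]

Since GetEmbedding returns unit-length vectors, the dot product computed by DotScore is exactly the cosine similarity quoted in the comments at the top of the script.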
MiniLMv6.onnx
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ef2a4bb91d5aff608459c2df78ba333404358b7809af564167e740a1e415e724
+size 90984173
MiniLMv6.sentis
ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:cd3cc73a83d426dd085c1839e587b6a7155ce91d6698f7ae2596a3f3cd02d1cf
+size 90952597
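MiniLMv6.onnx is the ONNX export of the model, and MiniLMv6.sentis is the serialized Sentis copy that MiniLM.cs actually loads. If you need to regenerate the .sentis file yourself, here is a minimal one-shot sketch, assuming the same Sentis 1.x API generation the script above uses (the ConvertToSentis class and onnxAsset field are hypothetical names, not part of this repo):

using UnityEngine;
using Unity.Sentis;

// Hypothetical converter: add MiniLMv6.onnx to the project so Unity imports it
// as a ModelAsset, assign it in the Inspector, then run the scene once.
public class ConvertToSentis : MonoBehaviour
{
    public ModelAsset onnxAsset; // the imported MiniLMv6.onnx

    void Start()
    {
        // Deserialize the imported ONNX model...
        Model model = ModelLoader.Load(onnxAsset);

        // ...and write it back out in the .sentis runtime format (assumed Sentis 1.x ModelWriter API)
        ModelWriter.Save(Application.streamingAssetsPath + "/MiniLMv6.sentis", model);

        Debug.Log("Wrote MiniLMv6.sentis");
    }
}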
vocab.txt
ADDED
The diff for this file is too large to render.