Upload 5 files

Browse files

Files changed (5) hide show

AudioResample.cs +21 -17
README.md +1 -3
audio_resample_22050_16000.sentis +0 -0
audio_resample_44100_16000.sentis +0 -0
info.json +2 -2

AudioResample.cs CHANGED Viewed

@@ -21,17 +21,13 @@ public class AudioResample : MonoBehaviour
     public bool playFinalAudio = true;
     IWorker engine;
-    BackendType backend = BackendType.GPUCompute;
-    Ops ops;
-    ITensorAllocator allocator;
     void Start()
     {
-        allocator = new TensorCachingAllocator();
-        ops = WorkerFactory.CreateOps(backend, allocator);
         ConvertAudio();
     }
@@ -62,7 +58,7 @@ public class AudioResample : MonoBehaviour
             return;
         }
-        engine = WorkerFactory.CreateWorker(backend, model);
         int channels = inputAudio.channels;
         int size = inputAudio.samples * channels;
@@ -76,15 +72,23 @@ public class AudioResample : MonoBehaviour
         var output = engine.PeekOutput() as TensorFloat;
         if (inputAudio.frequency == 44100)
-        {
-            using var A = output.ShallowReshape(new TensorShape( output.shape[1] / 2 , 2)) as TensorFloat;
-            using var B = ops.Slice(A, new[] { 0 }, new[] { 1 }, new[] { 1 }, new[] { 1 });
-            B.MakeReadable();
-            outData = B.ToReadOnlyArray();
         }
         else
         {
-            output.MakeReadable();
             outData = output.ToReadOnlyArray();
         }
@@ -103,7 +107,7 @@ public class AudioResample : MonoBehaviour
     private void OnDestroy()
     {
-        ops?.Dispose();
-        allocator?.Dispose();
     }
-}

     public bool playFinalAudio = true;
     IWorker engine;
+    IBackend backend;
+    BackendType backendType = BackendType.GPUCompute;
     void Start()
     {
+        backend = WorkerFactory.CreateBackend(backendType);
         ConvertAudio();
     }
             return;
         }
+        engine = WorkerFactory.CreateWorker(backendType, model);
         int channels = inputAudio.channels;
         int size = inputAudio.samples * channels;
         var output = engine.PeekOutput() as TensorFloat;
         if (inputAudio.frequency == 44100)
+        {
+            // The model outputs twice as many samples as we need, so we keep only every second sample.
+            // If the sample count is odd, first pad with one zero sample so it can be reshaped into pairs.
+            int n = output.shape[1] % 2;
+            using var output2 = TensorFloat.AllocNoData(new TensorShape(1, output.shape[1] + n));
+            backend.Pad(output, output2, new int[] { 0, n }, Unity.Sentis.Layers.PadMode.Constant, 0);
+            //Now we take every second sample:
+            output2.Reshape(new TensorShape(output2.shape[1] / 2, 2));
+            using var output3 = TensorFloat.AllocNoData(new TensorShape(output2.shape[0], 1));
+            backend.Slice(output2, output3, new[] { 0 }, new[] { 1 }, new[] { 1 });
+            output3.CompleteOperationsAndDownload();
+            outData = output3.ToReadOnlyArray();
         }
         else
         {
+            output.CompleteOperationsAndDownload();
             outData = output.ToReadOnlyArray();
         }
     private void OnDestroy()
     {
+        engine?.Dispose();
+        backend?.Dispose();
     }
+}

README.md CHANGED Viewed

@@ -4,9 +4,7 @@ library_name: unity-sentis
 pipeline_tag: audio-to-audio
 ---
-# Model to turn 44kHz and 22kHz audio to 16kHz for Sentis (Version 1.3.0-pre.3*)
-*Version 1.3.0 Sentis files are not compatible with Sentis version 1.4.0 and need to be recreated/downloaded
 This contains models in Sentis format to convert 44kHz and 22kHz audioclips to 16kHz. Useful for models such as [Whisper-Tiny](https://huggingface.co/unity/sentis-whisper-tiny)
 ## How to Use

 pipeline_tag: audio-to-audio
 ---
+# Model to turn 44kHz and 22kHz audio to 16kHz (Sentis version 1.4.0)
 This contains models in Sentis format to convert 44kHz and 22kHz audioclips to 16kHz. Useful for models such as [Whisper-Tiny](https://huggingface.co/unity/sentis-whisper-tiny)
 ## How to Use

audio_resample_22050_16000.sentis CHANGED Viewed

Binary files a/audio_resample_22050_16000.sentis and b/audio_resample_22050_16000.sentis differ

audio_resample_44100_16000.sentis CHANGED Viewed

Binary files a/audio_resample_44100_16000.sentis and b/audio_resample_44100_16000.sentis differ

info.json CHANGED Viewed

@@ -6,7 +6,7 @@
         "audio_resample_22050_16000.sentis",
         "audio_resample_44100_16000.sentis"
     ],
-    "version": [
-        "1.3.0-pre.3"
     ]
 }

         "audio_resample_22050_16000.sentis",
         "audio_resample_44100_16000.sentis"
     ],
+    "version":[
+        "1.4.0"
     ]
 }