Paul Bird committed on
Commit
3a9be66
·
verified ·
1 Parent(s): 0cb2349

Upload RunWhisper.cs

Browse files
Files changed (1) hide show
  1. RunWhisper.cs +9 -7
RunWhisper.cs CHANGED
@@ -100,9 +100,17 @@ public class RunWhisper : MonoBehaviour
100
  if(audioClip.frequency != 16000)
101
  {
102
  Debug.Log($"The audio clip should have frequency 16kHz. It has frequency {audioClip.frequency / 1000f}kHz");
 
103
  }
104
 
105
  numSamples = audioClip.samples;
 
 
 
 
 
 
 
106
  data = new float[numSamples];
107
  audioClip.GetData(data, 0);
108
  }
@@ -122,11 +130,6 @@ public class RunWhisper : MonoBehaviour
122
  void EncodeAudio()
123
  {
124
  using var input = new TensorFloat(new TensorShape(1, numSamples), data);
125
- if (numSamples > maxSamples)
126
- {
127
- Debug.Log("The AudioClip is too long.");
128
- return;
129
- }
130
 
131
  // Pad out to 30 seconds at 16khz if necessary
132
  using var input30seconds = ops.Pad(input, new int[] { 0, 0, 0, maxSamples - numSamples });
@@ -160,8 +163,7 @@ public class RunWhisper : MonoBehaviour
160
 
161
  int ID = tokensPredictions[currentToken];
162
 
163
- currentToken++;
164
- outputTokens[currentToken] = ID;
165
 
166
  if (ID == END_OF_TEXT)
167
  {
 
100
  if(audioClip.frequency != 16000)
101
  {
102
  Debug.Log($"The audio clip should have frequency 16kHz. It has frequency {audioClip.frequency / 1000f}kHz");
103
+ return;
104
  }
105
 
106
  numSamples = audioClip.samples;
107
+
108
+ if (numSamples > maxSamples)
109
+ {
110
+ Debug.Log($"The AudioClip is too long. It must be less than 30 seconds. This clip is {numSamples/ audioClip.frequency} seconds.");
111
+ return;
112
+ }
113
+
114
  data = new float[numSamples];
115
  audioClip.GetData(data, 0);
116
  }
 
130
  void EncodeAudio()
131
  {
132
  using var input = new TensorFloat(new TensorShape(1, numSamples), data);
 
 
 
 
 
133
 
134
  // Pad out to 30 seconds at 16khz if necessary
135
  using var input30seconds = ops.Pad(input, new int[] { 0, 0, 0, maxSamples - numSamples });
 
163
 
164
  int ID = tokensPredictions[currentToken];
165
 
166
+ outputTokens[++currentToken] = ID;
 
167
 
168
  if (ID == END_OF_TEXT)
169
  {