Commit 5d47fc0 · update examples
1 parent: 1b2ab2d

Files changed:
- app.py +1 -1
- data/heart.wav +0 -0
- src/__pycache__/__init__.cpython-39.pyc +0 -0
- src/__pycache__/modeling_outputs.cpython-39.pyc +0 -0
- src/__pycache__/models.cpython-39.pyc +0 -0
- src/collator.py +0 -58
- src/trainer.py +0 -62
app.py
CHANGED
@@ -33,7 +33,7 @@ inputs = gr.inputs.Audio(label="Input Audio", type="filepath", source="upload")
 outputs = gr.outputs.Label(type="confidences", label = "Output Scores")
 title = "Wav2Vec2 Speech Emotion Recognition"
 description = "This is a demo of the Wav2Vec2 Speech Emotion Recognition model. Upload a .wav file (preferably small) and the top emotions predicted will be displayed."
-examples = ['data/
+examples = ['data/heart.wav', 'data/happy26.wav', 'data/jm24.wav', 'data/newton.wav', 'data/speeding.wav']
 article = "<a href = 'https://github.com/m3hrdadfi/soxan'> Wav2Vec2 Speech Classification Github Repository"


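For context, a minimal sketch of how these variables are normally passed to a Gradio Interface in the same (older) gr.inputs/gr.outputs API style that app.py uses. The Space's real prediction function is not shown in this diff, so the predict stub below is purely illustrative.

import gradio as gr

def predict(filepath):
    # placeholder for the Space's real inference function, which runs the
    # Wav2Vec2 emotion model on the uploaded file and returns a score dict
    return {"happiness": 0.7, "sadness": 0.3}

inputs = gr.inputs.Audio(label="Input Audio", type="filepath", source="upload")
outputs = gr.outputs.Label(type="confidences", label="Output Scores")

gr.Interface(
    fn=predict,
    inputs=inputs,
    outputs=outputs,
    title=title,            # title, description, article and examples are the
    description=description,  # variables defined in app.py as shown in the diff above
    article=article,
    examples=examples,      # the list updated by this commit
).launch()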
data/heart.wav
ADDED
Binary file (12.1 kB)

src/__pycache__/__init__.cpython-39.pyc
CHANGED
Binary files a/src/__pycache__/__init__.cpython-39.pyc and b/src/__pycache__/__init__.cpython-39.pyc differ

src/__pycache__/modeling_outputs.cpython-39.pyc
CHANGED
Binary files a/src/__pycache__/modeling_outputs.cpython-39.pyc and b/src/__pycache__/modeling_outputs.cpython-39.pyc differ

src/__pycache__/models.cpython-39.pyc
CHANGED
Binary files a/src/__pycache__/models.cpython-39.pyc and b/src/__pycache__/models.cpython-39.pyc differ
src/collator.py
DELETED
@@ -1,58 +0,0 @@
-from dataclasses import dataclass
-from typing import Dict, List, Optional, Union
-import torch
-
-import transformers
-from transformers import Wav2Vec2Processor, Wav2Vec2FeatureExtractor
-
-
-@dataclass
-class DataCollatorCTCWithPadding:
-    """
-    Data collator that will dynamically pad the inputs received.
-    Args:
-        feature_extractor (:class:`~transformers.Wav2Vec2FeatureExtractor`)
-            The feature_extractor used for proccessing the data.
-        padding (:obj:`bool`, :obj:`str` or :class:`~transformers.tokenization_utils_base.PaddingStrategy`, `optional`, defaults to :obj:`True`):
-            Select a strategy to pad the returned sequences (according to the model's padding side and padding index)
-            among:
-            * :obj:`True` or :obj:`'longest'`: Pad to the longest sequence in the batch (or no padding if only a single
-              sequence if provided).
-            * :obj:`'max_length'`: Pad to a maximum length specified with the argument :obj:`max_length` or to the
-              maximum acceptable input length for the model if that argument is not provided.
-            * :obj:`False` or :obj:`'do_not_pad'` (default): No padding (i.e., can output a batch with sequences of
-              different lengths).
-        max_length (:obj:`int`, `optional`):
-            Maximum length of the ``input_values`` of the returned list and optionally padding length (see above).
-        max_length_labels (:obj:`int`, `optional`):
-            Maximum length of the ``labels`` returned list and optionally padding length (see above).
-        pad_to_multiple_of (:obj:`int`, `optional`):
-            If set will pad the sequence to a multiple of the provided value.
-            This is especially useful to enable the use of Tensor Cores on NVIDIA hardware with compute capability >=
-            7.5 (Volta).
-    """
-
-    feature_extractor: Wav2Vec2FeatureExtractor
-    padding: Union[bool, str] = True
-    max_length: Optional[int] = None
-    max_length_labels: Optional[int] = None
-    pad_to_multiple_of: Optional[int] = None
-    pad_to_multiple_of_labels: Optional[int] = None
-
-    def __call__(self, features: List[Dict[str, Union[List[int], torch.Tensor]]]) -> Dict[str, torch.Tensor]:
-        input_features = [{"input_values": feature["input_values"]} for feature in features]
-        label_features = [feature["labels"] for feature in features]
-
-        d_type = torch.long if isinstance(label_features[0], int) else torch.float
-
-        batch = self.feature_extractor.pad(
-            input_features,
-            padding=self.padding,
-            max_length=self.max_length,
-            pad_to_multiple_of=self.pad_to_multiple_of,
-            return_tensors="pt",
-        )
-
-        batch["labels"] = torch.tensor(label_features, dtype=d_type)
-
-        return batch
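A minimal sketch of how a collator like the one deleted above is exercised. The checkpoint name and the fake two-example batch are assumptions for illustration only, not part of this repository.

import torch
from transformers import Wav2Vec2FeatureExtractor

# assumed checkpoint, chosen only to make the sketch runnable
feature_extractor = Wav2Vec2FeatureExtractor.from_pretrained("facebook/wav2vec2-base")
collator = DataCollatorCTCWithPadding(feature_extractor=feature_extractor, padding=True)

# two fake utterances of different lengths; the collator pads them to a common length
features = [
    {"input_values": torch.randn(16000).tolist(), "labels": 0},
    {"input_values": torch.randn(12000).tolist(), "labels": 3},
]
batch = collator(features)
print(batch["input_values"].shape)  # torch.Size([2, 16000]) after padding
print(batch["labels"])              # tensor([0, 3]), long dtype since the labels are ints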
src/trainer.py
DELETED
@@ -1,62 +0,0 @@
-from typing import Any, Dict, Union
-
-import torch
-from packaging import version
-from torch import nn
-
-from transformers import (
-    Trainer,
-    is_apex_available,
-)
-
-if is_apex_available():
-    from apex import amp
-
-if version.parse(torch.__version__) >= version.parse("1.6"):
-    _is_native_amp_available = True
-    from torch.cuda.amp import autocast
-
-
-class CTCTrainer(Trainer):
-    def training_step(self, model: nn.Module, inputs: Dict[str, Union[torch.Tensor, Any]]) -> torch.Tensor:
-        """
-        Perform a training step on a batch of inputs.
-
-        Subclass and override to inject custom behavior.
-
-        Args:
-            model (:obj:`nn.Module`):
-                The model to train.
-            inputs (:obj:`Dict[str, Union[torch.Tensor, Any]]`):
-                The inputs and targets of the model.
-
-                The dictionary will be unpacked before being fed to the model. Most models expect the targets under the
-                argument :obj:`labels`. Check your model's documentation for all accepted arguments.
-
-        Return:
-            :obj:`torch.Tensor`: The tensor with training loss on this batch.
-        """
-
-        model.train()
-        inputs = self._prepare_inputs(inputs)
-
-        if self.use_amp:
-            with autocast():
-                loss = self.compute_loss(model, inputs)
-        else:
-            loss = self.compute_loss(model, inputs)
-
-        if self.args.gradient_accumulation_steps > 1:
-            loss = loss / self.args.gradient_accumulation_steps
-
-        if self.use_amp:
-            self.scaler.scale(loss).backward()
-        elif self.use_apex:
-            with amp.scale_loss(loss, self.optimizer) as scaled_loss:
-                scaled_loss.backward()
-        elif self.deepspeed:
-            self.deepspeed.backward(loss)
-        else:
-            loss.backward()
-
-        return loss.detach()
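For context, a rough sketch of how a trainer like the deleted CTCTrainer is typically invoked during fine-tuning. This is not part of the Space's runtime code; the model and dataset variables below are placeholders, and the use_amp / use_apex / scaler attributes touched in training_step exist only in the older transformers Trainer releases this file appears to target.

from transformers import TrainingArguments

training_args = TrainingArguments(
    output_dir="wav2vec2-ser",           # assumed output directory
    per_device_train_batch_size=4,
    gradient_accumulation_steps=2,       # divided out explicitly in training_step above
    fp16=True,                           # enables the native-AMP (autocast) branch
    num_train_epochs=5,
)

trainer = CTCTrainer(
    model=model,                         # assumed: a Wav2Vec2 sequence-classification model
    args=training_args,
    data_collator=data_collator,         # e.g. the DataCollatorCTCWithPadding shown earlier
    train_dataset=train_dataset,         # assumed: dataset yielding input_values / labels
    eval_dataset=eval_dataset,           # assumed
)
trainer.train()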