Spaces:
Running
Running
README.md
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
---
|
| 2 |
title: Speech analysis
|
| 3 |
-
emoji:
|
| 4 |
colorFrom: gray
|
| 5 |
colorTo: gray
|
| 6 |
sdk: gradio
|
|
|
|
| 1 |
---
|
| 2 |
title: Speech analysis
|
| 3 |
+
emoji: 💤
|
| 4 |
colorFrom: gray
|
| 5 |
colorTo: gray
|
| 6 |
sdk: gradio
|
app.py
CHANGED
|
@@ -69,9 +69,8 @@ class AgeGenderModel(Wav2Vec2PreTrainedModel):
|
|
| 69 |
|
| 70 |
return hidden_states, logits_age, logits_gender
|
| 71 |
|
| 72 |
-
|
| 73 |
-
|
| 74 |
-
# Fusion = AgeWav2Vec2Model forward() will accept already computed CNN7 features from ExpressioNmodel forward()
|
| 75 |
def _forward(
|
| 76 |
self,
|
| 77 |
frozen_cnn7=None, # CNN7 features of wav2vec2, computed once by the CNN7 feature extractor
|
|
@@ -94,10 +93,6 @@ def _forward(
|
|
| 94 |
return_dict=None,
|
| 95 |
)[0]
|
| 96 |
|
| 97 |
-
if self.wav2vec2.adapter is not None:
|
| 98 |
-
raise ValueError
|
| 99 |
-
hidden_states = self.adapter(hidden_states)
|
| 100 |
-
|
| 101 |
return hidden_states
|
| 102 |
|
| 103 |
|
|
@@ -125,13 +120,7 @@ def _forward_and_cnn7(
|
|
| 125 |
return_dict=None,
|
| 126 |
)[0]
|
| 127 |
|
| 128 |
-
|
| 129 |
-
raise ValueError
|
| 130 |
-
hidden_states = self.adapter(hidden_states)
|
| 131 |
-
|
| 132 |
-
return hidden_states, frozen_cnn7 # feature_proj is trainable thus we have to access the frozen_cnn7 before projection layer
|
| 133 |
-
|
| 134 |
-
# Fusion ============================= End
|
| 135 |
|
| 136 |
|
| 137 |
class ExpressionHead(nn.Module):
|
|
|
|
| 69 |
|
| 70 |
return hidden_states, logits_age, logits_gender
|
| 71 |
|
| 72 |
+
# AgeGenderModel.forward() is switched to accept the precomputed frozen CNN7 features from the expression model
|
| 73 |
+
|
|
|
|
| 74 |
def _forward(
|
| 75 |
self,
|
| 76 |
frozen_cnn7=None, # CNN7 features of wav2vec2, computed once by the CNN7 feature extractor
|
|
|
|
| 93 |
return_dict=None,
|
| 94 |
)[0]
|
| 95 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 96 |
return hidden_states
|
| 97 |
|
| 98 |
|
|
|
|
| 120 |
return_dict=None,
|
| 121 |
)[0]
|
| 122 |
|
| 123 |
+
return hidden_states, frozen_cnn7 # feature_proj is trainable, so frozen_cnn7 has to be captured before the projection layer
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 124 |
|
| 125 |
|
| 126 |
class ExpressionHead(nn.Module):
|