Spaces:

akhil2808
/

ASR-Opensource

Sleeping

App Files Files Community

akhil2808 committed on Oct 3, 2024

Commit

1e116aa

verified ·

1 Parent(s): 1f9ba8e

Update app (7).py

Browse files

Files changed (1) hide show

app (7).py +8 -33

app (7).py CHANGED Viewed

@@ -1,18 +1,3 @@
-# Copyright (c) 2022 Horizon Robotics. (authors: Binbin Zhang)
-#               2022 Chengdong Liang (liangchengdong@mail.nwpu.edu.cn)
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#   http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
 import gradio as gr
 import torch
 from wenet.cli.model import load_model
@@ -43,7 +28,7 @@ model = download_rev_models()
 def recognition(audio, style=0):
     if audio is None:
         return "Input Error! Please enter one audio!"
-    # NOTE: model supports 16k sample_rate
     cat_embs = ','.join([str(s) for s in (style, 1-style)])
     cat_embs = process_cat_embs(cat_embs)
@@ -62,29 +47,21 @@ inputs = [
     gr.Slider(0, 1, value=0, label="Verbatimicity - from non-verbatim (0) to verbatim (1)", info="Choose a transcription style between non-verbatim and verbatim"),
 ]
-examples = [
-    ['examples/POD1000000012_S0000335.wav'],
-    ['examples/POD1000000013_S0000062.wav'],
-    ['examples/POD1000000032_S0000020.wav'],
-    ['examples/POD1000000032_S0000038.wav'],
-    ['examples/POD1000000032_S0000050.wav'],
-    ['examples/POD1000000032_S0000058.wav'],
-]
 output = gr.outputs.Textbox(label="Output Text")
-text = "Reverb ASR Transcription Styles Demo"
 # description
 description = (
-    "Reverb ASR supports verbatim and non-verbatim transcription. Try recording an audio with disfluencies (ex: \'uh\', \'um\') and testing both transcription styles. Or, choose an example audio below."  # noqa
 )
-article = (
-    "<p style='text-align: center'>"
-    "<a href='https://rev.com' target='_blank'>Learn more about Rev</a>"  # noqa
-    "</p>")
 interface = gr.Interface(
     fn=recognition,
@@ -92,8 +69,6 @@ interface = gr.Interface(
     outputs=output,
     title=text,
     description=description,
-    article=article,
-    examples=examples,
     theme='huggingface',
 )

 import gradio as gr
 import torch
 from wenet.cli.model import load_model
 def recognition(audio, style=0):
     if audio is None:
         return "Input Error! Please enter one audio!"
     cat_embs = ','.join([str(s) for s in (style, 1-style)])
     cat_embs = process_cat_embs(cat_embs)
     gr.Slider(0, 1, value=0, label="Verbatimicity - from non-verbatim (0) to verbatim (1)", info="Choose a transcription style between non-verbatim and verbatim"),
 ]
 output = gr.outputs.Textbox(label="Output Text")
+text = "ASR Transcription Opensource Demo"
 # description
 # Descriptive text handed to gr.Interface through its ``description=`` argument.
 # The committed version spread one ordinary "..." literal over several
 # physical lines, which Python rejects as an unterminated string literal.
 # Adjacent single-line literals inside the parentheses are concatenated at
 # compile time, so the value is one string with explicit "\n" separators.
 # NOTE(review): "word to word-to-word" reads like a typo for "word-to-word";
 # the wording is kept as committed - confirm with the author before changing.
 description = (
     "Opensource Automatic Speech Recognition in English\n"
     "Verbatim Transcript style(1) refers to word to word-to-word transcription of an audio\n"
     "Non Verbatim Transcript style(0) refers to just conserving the message of the original audio"
 )
 interface = gr.Interface(
     fn=recognition,
     outputs=output,
     title=text,
     description=description,
     theme='huggingface',
 )