add documentation and remove unnecessary comments

Epic-Eric · Epic-Eric · commit 7d771b503beb · 2024-09-04T13:12:25.000-04:00
diff --git a/examples/speech_to_text/readme.md b/examples/speech_to_text/readme.md
@@ -62,3 +62,17 @@ WER     LAAL    AL      AP      DAL     ATD
 ```
 
 This agent can also perform S2T task, by adding `--task translate`.
+
+### Streaming Speech-to-Text Demo
+
+A streaming speech-to-text demo that takes input from the user's microphone, sends it to the Whisper wait-k model, and displays the predicted text in the terminal.
+
+1. Kick off a remote agent. For more information, see [Remote agent](../../docs/tutorials/remote_evaluation.rst).
+2. Enter demo mode by providing a desired segment size (usually 500ms):
+
+```bash
+simuleval --remote-eval --demo --source-segment-size 500 --remote-port 8888
+```
+
+3. Speak into the microphone and watch the live transcription!
+4. Press ^C (Ctrl+C) in the terminal to exit the program.
diff --git a/examples/speech_to_text/whisper_waitk.py b/examples/speech_to_text/whisper_waitk.py
@@ -48,7 +48,6 @@ def add_args(parser):
         )
 
     def policy(self, states: Optional[AgentStates] = None):
-        print(states)
         if states is None:
             states = self.states
 
diff --git a/simuleval/evaluator/remote.py b/simuleval/evaluator/remote.py
@@ -148,7 +148,7 @@ def remote_eval(self):
             else:
                 segment = SpeechSegment(
                     index=self.source_segment_size,
-                    content=[0.0, 0.0],
+                    content=[0.0 for _ in range(8192)],
                     sample_rate=self.sample_rate,
                     finished=True,
                 )

Original file line number	Diff line number	Diff line change
`@@ -48,7 +48,6 @@ def add_args(parser):`
`48`	`48`	`)`
`49`	`49`
`50`	`50`	`def policy(self, states: Optional[AgentStates] = None):`
`51`		`- print(states)`
`52`	`51`	`if states is None:`
`53`	`52`	`states = self.states`
`54`	`53`
Original file line number	Diff line number	Diff line change
`@@ -148,7 +148,7 @@ def remote_eval(self):`
`148`	`148`	`else:`
`149`	`149`	`segment = SpeechSegment(`
`150`	`150`	`index=self.source_segment_size,`
`151`		`- content=[0.0, 0.0],`
	`151`	`+ content=[0.0 for _ in range(8192)],`
`152`	`152`	`sample_rate=self.sample_rate,`
`153`	`153`	`finished=True,`
`154`	`154`	`)`