
Commit 39137a6

fix tabs and sample audio files

1 parent e2e49de commit 39137a6

5 files changed (+13, -13 lines)


articles/ai-services/speech-service/audio-processing-speech-sdk.md

Lines changed: 3 additions & 3 deletions
@@ -123,7 +123,7 @@ MicrophoneCoordinates[] microphoneCoordinates = new MicrophoneCoordinates[7]
 };
 var microphoneArrayGeometry = new MicrophoneArrayGeometry(MicrophoneArrayType.Planar, microphoneCoordinates);
 var audioProcessingOptions = AudioProcessingOptions.Create(AudioProcessingConstants.AUDIO_INPUT_PROCESSING_ENABLE_DEFAULT, microphoneArrayGeometry, SpeakerReferenceChannel.LastChannel);
-var audioInput = AudioConfig.FromWavFileInput("katiesteve_mono.wav", audioProcessingOptions);
+var audioInput = AudioConfig.FromWavFileInput("katiesteve.wav", audioProcessingOptions);
 
 var recognizer = new SpeechRecognizer(speechConfig, audioInput);
 ```

@@ -139,7 +139,7 @@ MicrophoneArrayGeometry microphoneArrayGeometry
 { { 0, 0, 0 }, { 40, 0, 0 }, { 20, -35, 0 }, { -20, -35, 0 }, { -40, 0, 0 }, { -20, 35, 0 }, { 20, 35, 0 } }
 };
 auto audioProcessingOptions = AudioProcessingOptions::Create(AUDIO_INPUT_PROCESSING_ENABLE_DEFAULT, microphoneArrayGeometry, SpeakerReferenceChannel::LastChannel);
-auto audioInput = AudioConfig::FromWavFileInput("katiesteve_mono.wav", audioProcessingOptions);
+auto audioInput = AudioConfig::FromWavFileInput("katiesteve.wav", audioProcessingOptions);
 
 auto recognizer = SpeechRecognizer::FromConfig(speechConfig, audioInput);
 ```

@@ -159,7 +159,7 @@ microphoneCoordinates[5] = new MicrophoneCoordinates(-20, 35, 0);
 microphoneCoordinates[6] = new MicrophoneCoordinates(20, 35, 0);
 MicrophoneArrayGeometry microphoneArrayGeometry = new MicrophoneArrayGeometry(MicrophoneArrayType.Planar, microphoneCoordinates);
 AudioProcessingOptions audioProcessingOptions = AudioProcessingOptions.create(AudioProcessingConstants.AUDIO_INPUT_PROCESSING_ENABLE_DEFAULT, microphoneArrayGeometry, SpeakerReferenceChannel.LastChannel);
-AudioConfig audioInput = AudioConfig.fromWavFileInput("katiesteve_mono.wav", audioProcessingOptions);
+AudioConfig audioInput = AudioConfig.fromWavFileInput("katiesteve.wav", audioProcessingOptions);
 
 SpeechRecognizer recognizer = new SpeechRecognizer(speechConfig, audioInput);
 ```
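All three snippets now point at the renamed multichannel sample. As a convenience (not part of this commit), a minimal Python sketch for fetching it into the working directory; the raw URL below is an assumption derived from the blob link used elsewhere in this commit:

```python
# Sketch: download the multi-speaker sample used by these quickstarts.
# Assumption: the raw URL mirrors the repository blob URL in this commit.
import urllib.request

RAW_URL = ("https://raw.githubusercontent.com/Azure-Samples/"
           "cognitive-services-speech-sdk/master/sampledata/audiofiles/katiesteve.wav")

# Save next to the quickstart program so AudioConfig can open it by filename.
urllib.request.urlretrieve(RAW_URL, "katiesteve.wav")
```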

articles/ai-services/speech-service/includes/quickstarts/stt-diarization/cpp.md

Lines changed: 2 additions & 2 deletions
@@ -59,7 +59,7 @@ Follow these steps to create a new console application and install the Speech SDK.
 
 speechConfig->SetSpeechRecognitionLanguage("en-US");
 
-auto audioConfig = AudioConfig::FromWavFileInput("katiesteve_mono.wav");
+auto audioConfig = AudioConfig::FromWavFileInput("katiesteve.wav");
 auto conversationTranscriber = ConversationTranscriber::FromConfig(speechConfig, audioConfig);
 
 // promise for synchronization of recognition end.

@@ -134,7 +134,7 @@ Follow these steps to create a new console application and install the Speech SDK.
 }
 ```
 
-1. Replace `katiesteve_mono.wav` with the filepath and filename of your `.wav` file. The intent of this quickstart is to recognize speech from multiple participants in the conversation. Your audio file should contain multiple speakers. For example, you can use the [sample audio file](https://github.com/Azure-Samples/cognitive-services-speech-sdk/blob/master/quickstart/csharp/dotnet/conversation-transcription/helloworld/katiesteve_mono.wav) provided in the Speech SDK samples repository on GitHub.
+1. Replace `katiesteve.wav` with the filepath and filename of your `.wav` file. The intent of this quickstart is to recognize speech from multiple participants in the conversation. Your audio file should contain multiple speakers. For example, you can use the [sample audio file](https://github.com/Azure-Samples/cognitive-services-speech-sdk/blob/master/sampledata/audiofiles/katiesteve.wav) provided in the Speech SDK samples repository on GitHub.
 > [!NOTE]
 > The service performs best with at least 7 seconds of continuous audio from a single speaker. This allows the system to differentiate the speakers properly. Otherwise the Speaker ID is returned as `Unknown`.
 1. To change the speech recognition language, replace `en-US` with another [supported language](~/articles/cognitive-services/speech-service/supported-languages.md). For example, `es-ES` for Spanish (Spain). The default language is `en-US` if you don't specify a language. For details about how to identify one of multiple languages that might be spoken, see [language identification](~/articles/cognitive-services/speech-service/language-identification.md).

articles/ai-services/speech-service/includes/quickstarts/stt-diarization/csharp.md

Lines changed: 2 additions & 2 deletions
@@ -48,7 +48,7 @@ Follow these steps to create a new console application and install the Speech SDK.
 
 async static Task Main(string[] args)
 {
-    var filepath = "katiesteve_mono.wav";
+    var filepath = "katiesteve.wav";
     var speechConfig = SpeechConfig.FromSubscription(speechKey, speechRegion);
     speechConfig.SpeechRecognitionLanguage = "en-US";
 

@@ -110,7 +110,7 @@ Follow these steps to create a new console application and install the Speech SDK.
 }
 ```
 
-1. Replace `katiesteve_mono.wav` with the filepath and filename of your `.wav` file. The intent of this quickstart is to recognize speech from multiple participants in the conversation. Your audio file should contain multiple speakers. For example, you can use the [sample audio file](https://github.com/Azure-Samples/cognitive-services-speech-sdk/blob/master/quickstart/csharp/dotnet/conversation-transcription/helloworld/katiesteve_mono.wav) provided in the Speech SDK samples repository on GitHub.
+1. Replace `katiesteve.wav` with the filepath and filename of your `.wav` file. The intent of this quickstart is to recognize speech from multiple participants in the conversation. Your audio file should contain multiple speakers. For example, you can use the [sample audio file](https://github.com/Azure-Samples/cognitive-services-speech-sdk/blob/master/sampledata/audiofiles/katiesteve.wav) provided in the Speech SDK samples repository on GitHub.
 > [!NOTE]
 > The service performs best with at least 7 seconds of continuous audio from a single speaker. This allows the system to differentiate the speakers properly. Otherwise the Speaker ID is returned as `Unknown`.
 1. To change the speech recognition language, replace `en-US` with another [supported language](~/articles/cognitive-services/speech-service/supported-languages.md). For example, `es-ES` for Spanish (Spain). The default language is `en-US` if you don't specify a language. For details about how to identify one of multiple languages that might be spoken, see [language identification](~/articles/cognitive-services/speech-service/language-identification.md).
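The note repeated in these quickstarts says diarization works best with at least 7 seconds of continuous audio from a single speaker. A standard-library Python sketch (illustrative only, not part of this commit) for sanity-checking a replacement `.wav` before transcribing:

```python
# Sketch: inspect a candidate .wav file before running transcription.
# The 7-second threshold follows the quickstart note above.
import wave

with wave.open("katiesteve.wav", "rb") as wav:
    duration_s = wav.getnframes() / wav.getframerate()
    print(f"channels={wav.getnchannels()} rate={wav.getframerate()} "
          f"duration={duration_s:.1f}s")
    if duration_s < 7:
        print("warning: clip may be too short for reliable speaker IDs")
```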

articles/ai-services/speech-service/includes/quickstarts/stt-diarization/java.md

Lines changed: 2 additions & 2 deletions
@@ -82,7 +82,7 @@ Follow these steps to create a new console application for conversation transcription.
 
 SpeechConfig speechConfig = SpeechConfig.fromSubscription(speechKey, speechRegion);
 speechConfig.setSpeechRecognitionLanguage("en-US");
-AudioConfig audioInput = AudioConfig.fromWavFileInput("katiesteve_mono.wav");
+AudioConfig audioInput = AudioConfig.fromWavFileInput("katiesteve.wav");
 
 Semaphore stopRecognitionSemaphore = new Semaphore(0);
 

@@ -139,7 +139,7 @@ Follow these steps to create a new console application for conversation transcription.
 }
 ```
 
-1. Replace `katiesteve_mono.wav` with the filepath and filename of your `.wav` file. The intent of this quickstart is to recognize speech from multiple participants in the conversation. Your audio file should contain multiple speakers. For example, you can use the [sample audio file](https://github.com/Azure-Samples/cognitive-services-speech-sdk/blob/master/quickstart/csharp/dotnet/conversation-transcription/helloworld/katiesteve_mono.wav) provided in the Speech SDK samples repository on GitHub.
+1. Replace `katiesteve.wav` with the filepath and filename of your `.wav` file. The intent of this quickstart is to recognize speech from multiple participants in the conversation. Your audio file should contain multiple speakers. For example, you can use the [sample audio file](https://github.com/Azure-Samples/cognitive-services-speech-sdk/blob/master/sampledata/audiofiles/katiesteve.wav) provided in the Speech SDK samples repository on GitHub.
 > [!NOTE]
 > The service performs best with at least 7 seconds of continuous audio from a single speaker. This allows the system to differentiate the speakers properly. Otherwise the Speaker ID is returned as `Unknown`.
 1. To change the speech recognition language, replace `en-US` with another [supported language](~/articles/cognitive-services/speech-service/supported-languages.md). For example, `es-ES` for Spanish (Spain). The default language is `en-US` if you don't specify a language. For details about how to identify one of multiple languages that might be spoken, see [language identification](~/articles/cognitive-services/speech-service/language-identification.md).
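The final step in each quickstart points to language identification. As a rough illustration of that feature (not part of this commit), a hedged Python sketch of automatic language detection; it uses the plain `SpeechRecognizer` API, since whether `ConversationTranscriber` accepts the same `auto_detect_source_language_config` option depends on the SDK version:

```python
# Sketch: automatic language detection with the Speech SDK for Python.
# Assumption: SPEECH_KEY/SPEECH_REGION are set as in the quickstarts.
import os
import azure.cognitiveservices.speech as speechsdk

speech_config = speechsdk.SpeechConfig(
    subscription=os.environ.get('SPEECH_KEY'), region=os.environ.get('SPEECH_REGION'))
audio_config = speechsdk.audio.AudioConfig(filename="katiesteve.wav")

# Let the service pick between candidate languages instead of fixing en-US.
auto_detect = speechsdk.languageconfig.AutoDetectSourceLanguageConfig(
    languages=["en-US", "es-ES"])
recognizer = speechsdk.SpeechRecognizer(
    speech_config=speech_config,
    auto_detect_source_language_config=auto_detect,
    audio_config=audio_config)

result = recognizer.recognize_once()
detected = speechsdk.AutoDetectSourceLanguageResult(result).language
print(detected, result.text)
```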

articles/ai-services/speech-service/includes/quickstarts/stt-diarization/python.md

Lines changed: 4 additions & 4 deletions
@@ -64,7 +64,7 @@ Follow these steps to create a new console application.
 speech_config = speechsdk.SpeechConfig(subscription=os.environ.get('SPEECH_KEY'), region=os.environ.get('SPEECH_REGION'))
 speech_config.speech_recognition_language="en-US"
 
-audio_config = speechsdk.audio.AudioConfig(filename="katiesteve_mono.wav")
+audio_config = speechsdk.audio.AudioConfig(filename="katiesteve.wav")
 conversation_transcriber = speechsdk.transcription.ConversationTranscriber(speech_config=speech_config, audio_config=audio_config)
 
 transcribing_stop = False

@@ -100,7 +100,7 @@ Follow these steps to create a new console application.
 print("Encountered exception. {}".format(err))
 ```
 
-1. Replace `katiesteve_mono.wav` with the filepath and filename of your `.wav` file. The intent of this quickstart is to recognize speech from multiple participants in the conversation. Your audio file should contain multiple speakers. For example, you can use the [sample audio file](https://github.com/Azure-Samples/cognitive-services-speech-sdk/blob/master/quickstart/csharp/dotnet/conversation-transcription/helloworld/katiesteve_mono.wav) provided in the Speech SDK samples repository on GitHub.
+1. Replace `katiesteve.wav` with the filepath and filename of your `.wav` file. The intent of this quickstart is to recognize speech from multiple participants in the conversation. Your audio file should contain multiple speakers. For example, you can use the [sample audio file](https://github.com/Azure-Samples/cognitive-services-speech-sdk/blob/master/sampledata/audiofiles/katiesteve.wav) provided in the Speech SDK samples repository on GitHub.
 > [!NOTE]
 > The service performs best with at least 7 seconds of continuous audio from a single speaker. This allows the system to differentiate the speakers properly. Otherwise the Speaker ID is returned as `Unknown`.
 1. To change the speech recognition language, replace `en-US` with another [supported language](~/articles/cognitive-services/speech-service/supported-languages.md). For example, `es-ES` for Spanish (Spain). The default language is `en-US` if you don't specify a language. For details about how to identify one of multiple languages that might be spoken, see [language identification](~/articles/cognitive-services/speech-service/language-identification.md).

@@ -140,9 +140,9 @@ TRANSCRIBED:
 Text=That's exciting. Let me try it right now.
 Speaker ID=Guest-2
 Canceled event
-CLOSING on ConversationTranscriptionCanceledEventArgs(session_id=606e8b5e65b94419b824d224127d9f92, result=ConversationTranscriptionResult(result_id=21d17c5738b442f8a7d428d0d5363fa8, speaker_id=, text=, reason=ResultReason.Canceled))
+CLOSING on ConversationTranscriptionCanceledEventArgs(session_id=92a0abb68636471dac07041b335d9be3, result=ConversationTranscriptionResult(result_id=ad1b1d83b5c742fcacca0692baa8df74, speaker_id=, text=, reason=ResultReason.Canceled))
 SessionStopped event
-CLOSING on SessionEventArgs(session_id=606e8b5e65b94419b824d224127d9f92)
+CLOSING on SessionEventArgs(session_id=92a0abb68636471dac07041b335d9be3)
 ```
 
 Speakers are identified as Guest-1, Guest-2, and so on, depending on the number of speakers in the conversation.
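For context, a condensed sketch of the Python quickstart these hunks modify, wired to the renamed sample. It follows the same environment-variable setup as the docs (`SPEECH_KEY`, `SPEECH_REGION`) but is a sketch, not a verbatim copy of the published article:

```python
# Sketch: conversation transcription with diarization, per the python.md quickstart.
import os
import time
import azure.cognitiveservices.speech as speechsdk

speech_config = speechsdk.SpeechConfig(
    subscription=os.environ.get('SPEECH_KEY'), region=os.environ.get('SPEECH_REGION'))
speech_config.speech_recognition_language = "en-US"

audio_config = speechsdk.audio.AudioConfig(filename="katiesteve.wav")
transcriber = speechsdk.transcription.ConversationTranscriber(
    speech_config=speech_config, audio_config=audio_config)

done = False

def stop_cb(evt):
    # Fires on session stop or cancellation; ends the polling loop below.
    global done
    done = True

def transcribed_cb(evt):
    # Each result carries the recognized text plus a diarized speaker ID.
    print(f"Speaker {evt.result.speaker_id}: {evt.result.text}")

transcriber.transcribed.connect(transcribed_cb)
transcriber.session_stopped.connect(stop_cb)
transcriber.canceled.connect(stop_cb)

transcriber.start_transcribing_async().get()
while not done:
    time.sleep(0.5)
transcriber.stop_transcribing_async().get()
```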
