Skip to content

Commit 32b13ad

Browse files
authored
Merge pull request #217800 from valindrae/media-streaming-updates
Media streaming updates
2 parents e1cb5fd + 231da86 commit 32b13ad

File tree

3 files changed

+60
-86
lines changed

3 files changed

+60
-86
lines changed

articles/communication-services/concepts/voice-video-calling/media-streaming.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,7 @@ Audio streams can be used in many ways, below are some examples of how developer
4040
## Supported formats
4141

4242
### Mixed format
43-
Contains mixed audio of all participants on the call.
43+
Contains mixed audio of all participants on the call. As this is mixed audio, the participantRawID will be null.
4444

4545
### Unmixed
4646
Contains audio per participant per channel, with support for up to four channels for the four most dominant speakers. You will also get a participantRawID that you can use to determine the speaker.

articles/communication-services/quickstarts/voice-video-calling/includes/call-automation-media/media-streaming-quickstart-csharp.md

Lines changed: 42 additions & 57 deletions
Original file line numberDiff line numberDiff line change
@@ -66,68 +66,53 @@ The sample below demonstrates how to listen to media stream using your websocket
6666
HttpListener httpListener = new HttpListener();
6767
httpListener.Prefixes.Add("http://localhost:80/");
6868
httpListener.Start();
69-
while (true) {
70-
HttpListenerContext httpListenerContext = await httpListener.GetContextAsync();
71-
if (httpListenerContext.Request.IsWebSocketRequest) {
72-
WebSocketContext websocketContext;
73-
try {
69+
while (true)
70+
{
71+
HttpListenerContext httpListenerContext = await httpListener.GetContextAsync();
72+
if (httpListenerContext.Request.IsWebSocketRequest)
73+
{
74+
WebSocketContext websocketContext;
75+
try
76+
{
7477
websocketContext = await httpListenerContext.AcceptWebSocketAsync(subProtocol: null);
75-
string ipAddress = httpListenerContext.Request.RemoteEndPoint.Address.ToString();
76-
} catch (Exception ex) {
77-
httpListenerContext.Response.StatusCode = 500;
78-
httpListenerContext.Response.Close();
79-
return;
80-
}
78+
}
79+
catch (Exception ex)
80+
{
81+
return;
82+
}
8183
WebSocket webSocket = websocketContext.WebSocket;
82-
try {
83-
while (webSocket.State == WebSocketState.Open || webSocket.State == WebSocketState.CloseSent) {
84+
try
85+
{
86+
while (webSocket.State == WebSocketState.Open || webSocket.State == WebSocketState.CloseSent)
87+
{
8488
byte[] receiveBuffer = new byte[2048];
8589
var cancellationToken = new CancellationTokenSource(TimeSpan.FromSeconds(60)).Token;
86-
WebSocketReceiveResult receiveResult = await webSocket.ReceiveAsync(new ArraySegment < byte >. (receiveBuffer), cancellationToken);
87-
if (receiveResult.MessageType != WebSocketMessageType.Close) {
88-
var data = Encoding.UTF8.GetString(receiveBuffer).TrimEnd('\0');
89-
try {
90-
var json = JsonConvert.DeserializeObject < Audio > (data);
91-
if (json != null) {
92-
var byteArray = json.AudioData;
93-
//Processing mixed audio data
94-
if (string.IsNullOrEmpty(json?.ParticipantId)) {
95-
if (string.IsNullOrEmpty(WebSocketData.FirstReceivedMixedAudioBufferTimeStamp)) {
96-
WebSocketData.FirstReceivedMixedAudioBufferTimeStamp = json.Timestamp;
97-
}
98-
//Process byteArray ( audioData ) however you want
99-
}
100-
}
101-
102-
//Processing unmixed audio data
103-
else if (!string.IsNullOrEmpty(json?.ParticipantId) && !json.IsSilence) {
104-
if (json.ParticipantId != null) {
105-
switch (json.ParticipantId) {
106-
case {
107-
participantRawId1
108-
}:
109-
//Process audio data
110-
break;
111-
case {
112-
participantRawId2
113-
}::
114-
//Process audio data
115-
break;
116-
default:
117-
break;
118-
}
119-
}
120-
if (string.IsNullOrEmpty(WebSocketData.FirstReceivedUnmixedAudioBufferTimeStamp)) {
121-
WebSocketData.FirstReceivedUnmixedAudioBufferTimeStamp = json.Timestamp;
90+
WebSocketReceiveResult receiveResult = await webSocket.ReceiveAsync(new ArraySegment<byte>(receiveBuffer), cancellationToken);
91+
if (receiveResult.MessageType != WebSocketMessageType.Close)
92+
{
93+
var data = Encoding.UTF8.GetString(receiveBuffer).TrimEnd('\0');
94+
try
95+
{
96+
var eventData = JsonConvert.DeserializeObject<AudioBaseClass>(data);
97+
if (eventData != null)
98+
{
99+
if(eventData.kind == "AudioMetadata")
100+
{
101+
//Process audio metadata
102+
}
103+
else if(eventData.kind == "AudioData")
104+
{
105+
//Process audio data
106+
var byteArray = eventData.audioData.data;
107+
//use audio byteArray as you want
108+
}
122109
}
123110
}
124-
} catch {}
125-
}
126-
}
127-
} catch (Exception ex) {}
128-
} else {
129-
httpListenerContext.Response.StatusCode = 400;
130-
httpListenerContext.Response.Close();
131-
}
111+
catch { }
112+
}
113+
}
114+
}
115+
catch (Exception ex) { }
116+
}
132117
}
133118
```

articles/communication-services/quickstarts/voice-video-calling/media-streaming.md

Lines changed: 17 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -33,42 +33,31 @@ Get started with using audio streams through Azure Communication Services Media
3333
When ACS has received the URL for your WebSocket server, it will create a connection to it. Once ACS has successfully connected to your WebSocket server, it will send through the first data packet, which contains metadata regarding the incoming media packets.
3434

3535
``` code
36-
/**
37-
* The first message upon WebSocket connection will be the metadata packet
38-
* which contains the subscriptionId and audio format
39-
*/
40-
public class AudioMetadataSample {
41-
public string kind; // What kind of data this is, e.g. AudioMetadata, AudioData.
42-
public AudioMetadata audioMetadata;
43-
}
44-
45-
public class AudioMetadata {
46-
public string subscriptionId // unique identifier for a subscription request
47-
public string encoding; // PCM only supported
48-
public int sampleRate; // 16000 default
49-
public int channels; // 1 default
50-
public int length; // 640 default
36+
{
37+
"kind": <string> // What kind of data this is, e.g. AudioMetadata, AudioData.
38+
"audioMetadata": {
39+
"subscriptionId": <string>, // unique identifier for a subscription request
40+
"encoding":<string>, // PCM only supported
41+
"sampleRate": <int>, // 16000 default
42+
"channels": <int>, // 1 default
43+
"length": <int> // 640 default
44+
}
5145
}
5246
```
5347

5448
## Audio streaming schema
5549
After sending through the metadata packet, ACS will start streaming audio media to your WebSocket server. Below is an example of what the media object your server will receive looks like.
5650

5751
``` code
58-
/**
59-
* The audio buffer object which is then serialized to JSON format
60-
*/
61-
public class AudioDataSample {
62-
public string kind; // What kind of data this is, e.g. AudioMetadata, AudioData.
63-
public AudioData audioData;
52+
{
53+
"kind": <string>, // What kind of data this is, e.g. AudioMetadata, AudioData.
54+
"audioData":{
55+
"data": <string>, // Base64 Encoded audio buffer data
56+
"timestamp": <string>, // In ISO 8601 format (yyyy-mm-ddThh:mm:ssZ)
57+
"participantRawID": <string>,
58+
"silent": <boolean> // Indicates if the received audio buffer contains only silence.
59+
}
6460
}
65-
66-
public class AudioData {
67-
public string data; // Base64 Encoded audio buffer data
68-
public string timestamp; // In ISO 8601 format (yyyy-mm-ddThh:mm:ssZ)
69-
public string participantRawID;
70-
public boolean silent; // Indicates if the received audio buffer contains only silence.
71-
}
7261
```
7362

7463
Example of audio data being streamed

0 commit comments

Comments
 (0)