Skip to content

Commit d9b811e

Browse files
authored
Merge branch 'main' into aws_resource_support
2 parents d8bffd5 + 27c0f80 commit d9b811e

File tree

6 files changed

+461
-29
lines changed

6 files changed

+461
-29
lines changed

aws-distro-opentelemetry-node-autoinstrumentation/src/patches/aws/services/bedrock.ts

Lines changed: 28 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -251,6 +251,22 @@ export class BedrockRuntimeServiceExtension implements ServiceExtension {
251251
if (requestBody.top_p !== undefined) {
252252
spanAttributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_TOP_P] = requestBody.top_p;
253253
}
254+
} else if (modelId.includes('cohere.command-r')) {
255+
if (requestBody.max_tokens !== undefined) {
256+
spanAttributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_MAX_TOKENS] = requestBody.max_tokens;
257+
}
258+
if (requestBody.temperature !== undefined) {
259+
spanAttributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_TEMPERATURE] = requestBody.temperature;
260+
}
261+
if (requestBody.p !== undefined) {
262+
spanAttributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_TOP_P] = requestBody.p;
263+
}
264+
if (requestBody.message !== undefined) {
265+
// NOTE: We approximate the token count since this value is not directly available in the body
266+
// According to Bedrock docs they use (total_chars / 6) to approximate token count for pricing.
267+
// https://docs.aws.amazon.com/bedrock/latest/userguide/model-customization-prepare.html
268+
spanAttributes[AwsSpanProcessingUtil.GEN_AI_USAGE_INPUT_TOKENS] = Math.ceil(requestBody.message.length / 6);
269+
}
254270
} else if (modelId.includes('cohere.command')) {
255271
if (requestBody.max_tokens !== undefined) {
256272
spanAttributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_MAX_TOKENS] = requestBody.max_tokens;
@@ -261,6 +277,9 @@ export class BedrockRuntimeServiceExtension implements ServiceExtension {
261277
if (requestBody.p !== undefined) {
262278
spanAttributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_TOP_P] = requestBody.p;
263279
}
280+
if (requestBody.prompt !== undefined) {
281+
spanAttributes[AwsSpanProcessingUtil.GEN_AI_USAGE_INPUT_TOKENS] = Math.ceil(requestBody.prompt.length / 6);
282+
}
264283
} else if (modelId.includes('ai21.jamba')) {
265284
if (requestBody.max_tokens !== undefined) {
266285
spanAttributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_MAX_TOKENS] = requestBody.max_tokens;
@@ -271,7 +290,7 @@ export class BedrockRuntimeServiceExtension implements ServiceExtension {
271290
if (requestBody.top_p !== undefined) {
272291
spanAttributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_TOP_P] = requestBody.top_p;
273292
}
274-
} else if (modelId.includes('mistral.mistral')) {
293+
} else if (modelId.includes('mistral')) {
275294
if (requestBody.prompt !== undefined) {
276295
// NOTE: We approximate the token count since this value is not directly available in the body
277296
// According to Bedrock docs they use (total_chars / 6) to approximate token count for pricing.
@@ -335,13 +354,17 @@ export class BedrockRuntimeServiceExtension implements ServiceExtension {
335354
if (responseBody.stop_reason !== undefined) {
336355
span.setAttribute(AwsSpanProcessingUtil.GEN_AI_RESPONSE_FINISH_REASONS, [responseBody.stop_reason]);
337356
}
338-
} else if (currentModelId.includes('cohere.command')) {
339-
if (responseBody.prompt !== undefined) {
357+
} else if (currentModelId.includes('cohere.command-r')) {
358+
if (responseBody.text !== undefined) {
340359
// NOTE: We approximate the token count since this value is not directly available in the body
341360
// According to Bedrock docs they use (total_chars / 6) to approximate token count for pricing.
342361
// https://docs.aws.amazon.com/bedrock/latest/userguide/model-customization-prepare.html
343-
span.setAttribute(AwsSpanProcessingUtil.GEN_AI_USAGE_INPUT_TOKENS, Math.ceil(responseBody.prompt.length / 6));
362+
span.setAttribute(AwsSpanProcessingUtil.GEN_AI_USAGE_OUTPUT_TOKENS, Math.ceil(responseBody.text.length / 6));
344363
}
364+
if (responseBody.finish_reason !== undefined) {
365+
span.setAttribute(AwsSpanProcessingUtil.GEN_AI_RESPONSE_FINISH_REASONS, [responseBody.finish_reason]);
366+
}
367+
} else if (currentModelId.includes('cohere.command')) {
345368
if (responseBody.generations?.[0]?.text !== undefined) {
346369
span.setAttribute(
347370
AwsSpanProcessingUtil.GEN_AI_USAGE_OUTPUT_TOKENS,
@@ -368,7 +391,7 @@ export class BedrockRuntimeServiceExtension implements ServiceExtension {
368391
responseBody.choices[0].finish_reason,
369392
]);
370393
}
371-
} else if (currentModelId.includes('mistral.mistral')) {
394+
} else if (currentModelId.includes('mistral')) {
372395
if (responseBody.outputs?.[0]?.text !== undefined) {
373396
span.setAttribute(
374397
AwsSpanProcessingUtil.GEN_AI_USAGE_OUTPUT_TOKENS,

aws-distro-opentelemetry-node-autoinstrumentation/test/patches/aws/services/bedrock.test.ts

Lines changed: 54 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -520,6 +520,60 @@ describe('BedrockRuntime', () => {
520520
expect(invokeModelSpan.kind).toBe(SpanKind.CLIENT);
521521
});
522522

523+
it('Add Cohere Command R model attributes to span', async () => {
524+
const modelId: string = 'cohere.command-r-v1:0';
525+
const prompt: string = "Describe the purpose of a 'hello world' program in one line";
526+
const nativeRequest: any = {
527+
message: prompt,
528+
max_tokens: 512,
529+
temperature: 0.5,
530+
p: 0.65,
531+
};
532+
const mockRequestBody: string = JSON.stringify(nativeRequest);
533+
const mockResponseBody: any = {
534+
finish_reason: 'COMPLETE',
535+
text: 'test-generation-text',
536+
prompt: prompt,
537+
request: {
538+
commandInput: {
539+
modelId: modelId,
540+
},
541+
},
542+
};
543+
544+
nock(`https://bedrock-runtime.${region}.amazonaws.com`)
545+
.post(`/model/${encodeURIComponent(modelId)}/invoke`)
546+
.reply(200, mockResponseBody);
547+
548+
await bedrock
549+
.invokeModel({
550+
modelId: modelId,
551+
body: mockRequestBody,
552+
})
553+
.catch((err: any) => {
554+
console.log('error', err);
555+
});
556+
557+
const testSpans: ReadableSpan[] = getTestSpans();
558+
const invokeModelSpans: ReadableSpan[] = testSpans.filter((s: ReadableSpan) => {
559+
return s.name === 'BedrockRuntime.InvokeModel';
560+
});
561+
expect(invokeModelSpans.length).toBe(1);
562+
const invokeModelSpan = invokeModelSpans[0];
563+
expect(invokeModelSpan.attributes[AWS_ATTRIBUTE_KEYS.AWS_BEDROCK_AGENT_ID]).toBeUndefined();
564+
expect(invokeModelSpan.attributes[AWS_ATTRIBUTE_KEYS.AWS_BEDROCK_KNOWLEDGE_BASE_ID]).toBeUndefined();
565+
expect(invokeModelSpan.attributes[AWS_ATTRIBUTE_KEYS.AWS_BEDROCK_DATA_SOURCE_ID]).toBeUndefined();
566+
expect(invokeModelSpan.attributes[AwsSpanProcessingUtil.GEN_AI_SYSTEM]).toBe('aws_bedrock');
567+
expect(invokeModelSpan.attributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_MODEL]).toBe(modelId);
568+
expect(invokeModelSpan.attributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_MAX_TOKENS]).toBe(512);
569+
expect(invokeModelSpan.attributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_TEMPERATURE]).toBe(0.5);
570+
expect(invokeModelSpan.attributes[AwsSpanProcessingUtil.GEN_AI_REQUEST_TOP_P]).toBe(0.65);
571+
expect(invokeModelSpan.attributes[AwsSpanProcessingUtil.GEN_AI_USAGE_INPUT_TOKENS]).toBe(10);
572+
expect(invokeModelSpan.attributes[AwsSpanProcessingUtil.GEN_AI_USAGE_OUTPUT_TOKENS]).toBe(4);
573+
expect(invokeModelSpan.attributes[AwsSpanProcessingUtil.GEN_AI_RESPONSE_FINISH_REASONS]).toEqual(['COMPLETE']);
574+
expect(invokeModelSpan.kind).toBe(SpanKind.CLIENT);
575+
});
576+
523577
it('Add Meta Llama model attributes to span', async () => {
524578
const modelId: string = 'meta.llama2-13b-chat-v1';
525579
const prompt: string = 'Describe the purpose of an interpreter program in one line.';

contract-tests/images/applications/aws-sdk/server.js

Lines changed: 176 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -10,7 +10,6 @@ const { S3Client, CreateBucketCommand, PutObjectCommand, GetObjectCommand } = re
1010
const { DynamoDBClient, CreateTableCommand, PutItemCommand } = require('@aws-sdk/client-dynamodb');
1111
const { SQSClient, CreateQueueCommand, SendMessageCommand, ReceiveMessageCommand } = require('@aws-sdk/client-sqs');
1212
const { KinesisClient, CreateStreamCommand, PutRecordCommand } = require('@aws-sdk/client-kinesis');
13-
const fetch = require('node-fetch');
1413
const { BedrockClient, GetGuardrailCommand } = require('@aws-sdk/client-bedrock');
1514
const { BedrockAgentClient, GetKnowledgeBaseCommand, GetDataSourceCommand, GetAgentCommand } = require('@aws-sdk/client-bedrock-agent');
1615
const { BedrockRuntimeClient, InvokeModelCommand } = require('@aws-sdk/client-bedrock-runtime');
@@ -553,30 +552,190 @@ async function handleBedrockRequest(req, res, path) {
553552
});
554553
res.statusCode = 200;
555554
} else if (path.includes('invokemodel/invoke-model')) {
556-
await withInjected200Success(bedrockRuntimeClient, ['InvokeModelCommand'], {}, async () => {
557-
const modelId = 'amazon.titan-text-premier-v1:0';
558-
const userMessage = "Describe the purpose of a 'hello world' program in one line.";
559-
const prompt = `<s>[INST] ${userMessage} [/INST]`;
560-
561-
const body = JSON.stringify({
562-
inputText: prompt,
563-
textGenerationConfig: {
564-
maxTokenCount: 3072,
565-
stopSequences: [],
566-
temperature: 0.7,
567-
topP: 0.9,
568-
},
569-
});
555+
const get_model_request_response = function () {
556+
const prompt = "Describe the purpose of a 'hello world' program in one line.";
557+
let modelId = ''
558+
let request_body = {}
559+
let response_body = {}
560+
561+
if (path.includes('amazon.titan')) {
562+
563+
modelId = 'amazon.titan-text-premier-v1:0';
564+
565+
request_body = {
566+
inputText: prompt,
567+
textGenerationConfig: {
568+
maxTokenCount: 3072,
569+
stopSequences: [],
570+
temperature: 0.7,
571+
topP: 0.9,
572+
},
573+
};
574+
575+
response_body = {
576+
inputTextTokenCount: 15,
577+
results: [
578+
{
579+
tokenCount: 13,
580+
outputText: 'text-test-response',
581+
completionReason: 'CONTENT_FILTERED',
582+
},
583+
],
584+
}
585+
586+
}
587+
588+
if (path.includes('anthropic.claude')) {
589+
590+
modelId = 'anthropic.claude-v2:1';
591+
592+
request_body = {
593+
anthropic_version: 'bedrock-2023-05-31',
594+
max_tokens: 1000,
595+
temperature: 0.99,
596+
top_p: 1,
597+
messages: [
598+
{
599+
role: 'user',
600+
content: [{ type: 'text', text: prompt }],
601+
},
602+
],
603+
};
604+
605+
response_body = {
606+
stop_reason: 'end_turn',
607+
usage: {
608+
input_tokens: 15,
609+
output_tokens: 13,
610+
},
611+
}
612+
}
613+
614+
if (path.includes('meta.llama')) {
615+
modelId = 'meta.llama2-13b-chat-v1';
616+
617+
request_body = {
618+
prompt,
619+
max_gen_len: 512,
620+
temperature: 0.5,
621+
top_p: 0.9
622+
};
623+
624+
response_body = {
625+
prompt_token_count: 31,
626+
generation_token_count: 49,
627+
stop_reason: 'stop'
628+
}
629+
}
630+
631+
if (path.includes('cohere.command')) {
632+
modelId = 'cohere.command-light-text-v14';
633+
634+
request_body = {
635+
prompt,
636+
max_tokens: 512,
637+
temperature: 0.5,
638+
p: 0.65,
639+
};
640+
641+
response_body = {
642+
generations: [
643+
{
644+
finish_reason: 'COMPLETE',
645+
text: 'test-generation-text',
646+
},
647+
],
648+
prompt: prompt,
649+
};
650+
}
651+
652+
if (path.includes('cohere.command-r')) {
653+
modelId = 'cohere.command-r-v1:0';
654+
655+
request_body = {
656+
message: prompt,
657+
max_tokens: 512,
658+
temperature: 0.5,
659+
p: 0.65,
660+
};
661+
662+
response_body = {
663+
finish_reason: 'COMPLETE',
664+
text: 'test-generation-text',
665+
prompt: prompt,
666+
request: {
667+
commandInput: {
668+
modelId: modelId,
669+
},
670+
},
671+
}
672+
}
673+
674+
if (path.includes('ai21.jamba')) {
675+
modelId = 'ai21.jamba-1-5-large-v1:0';
676+
677+
request_body = {
678+
messages: [
679+
{
680+
role: 'user',
681+
content: prompt,
682+
},
683+
],
684+
top_p: 0.8,
685+
temperature: 0.6,
686+
max_tokens: 512,
687+
};
688+
689+
response_body = {
690+
stop_reason: 'end_turn',
691+
usage: {
692+
prompt_tokens: 21,
693+
completion_tokens: 24,
694+
},
695+
choices: [
696+
{
697+
finish_reason: 'stop',
698+
},
699+
],
700+
}
701+
}
702+
703+
if (path.includes('mistral')) {
704+
modelId = 'mistral.mistral-7b-instruct-v0:2';
705+
706+
request_body = {
707+
prompt,
708+
max_tokens: 4096,
709+
temperature: 0.75,
710+
top_p: 0.99,
711+
};
712+
713+
response_body = {
714+
outputs: [
715+
{
716+
text: 'test-output-text',
717+
stop_reason: 'stop',
718+
},
719+
]
720+
}
721+
}
722+
723+
return [modelId, JSON.stringify(request_body), new TextEncoder().encode(JSON.stringify(response_body))]
724+
}
725+
726+
const [modelId, request_body, response_body] = get_model_request_response();
570727

728+
await withInjected200Success(bedrockRuntimeClient, ['InvokeModelCommand'], { body: response_body }, async () => {
571729
await bedrockRuntimeClient.send(
572730
new InvokeModelCommand({
573-
body: body,
731+
body: request_body,
574732
modelId: modelId,
575733
accept: 'application/json',
576734
contentType: 'application/json',
577735
})
578736
);
579737
});
738+
580739
res.statusCode = 200;
581740
} else {
582741
res.statusCode = 404;
@@ -624,3 +783,4 @@ prepareAwsServer().then(() => {
624783
console.log('Ready');
625784
});
626785
});
786+

0 commit comments

Comments
 (0)