@@ -15,6 +15,14 @@ const RE_TAB = /\t/g
 // TODO: In the future we should refactor config.js to make it requirable
 let MAX_TEXT_LEN = 128
 
+let encodingForModel
+try {
+  // eslint-disable-next-line import/no-extraneous-dependencies
+  encodingForModel = require('tiktoken').encoding_for_model
+} catch {
+  // we will use token count estimations in this case
+}
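+// if tiktoken is unavailable, countTokens() (added below) falls back to the
+// rough character/word heuristic in estimateTokens()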
+
 class OpenApiPlugin extends TracingPlugin {
   static get id () { return 'openai' }
   static get operation () { return 'request' }
@@ -232,27 +240,47 @@ class OpenApiPlugin extends TracingPlugin {
     super.finish()
     this.sendLog(methodName, span, tags, store, error)
-    this.sendMetrics(headers, body, endpoint, span._duration, error)
+    this.sendMetrics(headers, body, endpoint, span._duration, error, tags)
   }
 
-  sendMetrics (headers, body, endpoint, duration, error) {
+  sendMetrics (headers, body, endpoint, duration, error, spanTags) {
     const tags = [`error:${Number(!!error)}`]
     if (error) {
      this.metrics.increment('openai.request.error', 1, tags)
     } else {
       tags.push(`org:${headers['openai-organization']}`)
       tags.push(`endpoint:${endpoint}`) // just "/v1/models", no method
-      tags.push(`model:${headers['openai-model']}`)
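+      // fall back to the model echoed in the response body when the
+      // openai-model response header is absent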
+      tags.push(`model:${headers['openai-model'] || body.model}`)
     }
 
     this.metrics.distribution('openai.request.duration', duration * 1000, tags)
 
-    if (body && body.usage) {
-      const promptTokens = body.usage.prompt_tokens
-      const completionTokens = body.usage.completion_tokens
-      this.metrics.distribution('openai.tokens.prompt', promptTokens, tags)
-      this.metrics.distribution('openai.tokens.completion', completionTokens, tags)
-      this.metrics.distribution('openai.tokens.total', promptTokens + completionTokens, tags)
+    const promptTokens = spanTags['openai.response.usage.prompt_tokens']
+    const promptTokensEstimated = spanTags['openai.response.usage.prompt_tokens_estimated']
+
+    const completionTokens = spanTags['openai.response.usage.completion_tokens']
+    const completionTokensEstimated = spanTags['openai.response.usage.completion_tokens_estimated']
+
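+    // token metrics derived from our own counting (rather than the API's usage
+    // object) carry an extra `openai.estimated:true` tag so they can be told
+    // apart downstream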
+    if (!error) {
+      if (promptTokensEstimated) {
+        this.metrics.distribution(
+          'openai.tokens.prompt', promptTokens, [...tags, 'openai.estimated:true'])
+      } else {
+        this.metrics.distribution('openai.tokens.prompt', promptTokens, tags)
+      }
+      if (completionTokensEstimated) {
+        this.metrics.distribution(
+          'openai.tokens.completion', completionTokens, [...tags, 'openai.estimated:true'])
+      } else {
+        this.metrics.distribution('openai.tokens.completion', completionTokens, tags)
+      }
+
+      if (promptTokensEstimated || completionTokensEstimated) {
+        this.metrics.distribution(
+          'openai.tokens.total', promptTokens + completionTokens, [...tags, 'openai.estimated:true'])
+      } else {
+        this.metrics.distribution('openai.tokens.total', promptTokens + completionTokens, tags)
+      }
     }
 
     if (headers) {
@@ -290,6 +318,89 @@ class OpenApiPlugin extends TracingPlugin {
   }
 }
 
+function countPromptTokens (methodName, payload, model) {
+  let promptTokens = 0
+  let promptEstimated = false
+  if (methodName === 'chat.completions.create') {
+    const messages = payload.messages
+    for (const message of messages) {
+      const content = message.content
+      const { tokens, estimated } = countTokens(content, model)
+      promptTokens += tokens
+      promptEstimated = estimated
+    }
+  } else if (methodName === 'completions.create') {
+    let prompt = payload.prompt
+    if (!Array.isArray(prompt)) prompt = [prompt]
+
+    for (const p of prompt) {
+      const { tokens, estimated } = countTokens(p, model)
+      promptTokens += tokens
+      promptEstimated = estimated
+    }
+  }
+
+  return { promptTokens, promptEstimated }
+}
+
+function countCompletionTokens (body, model) {
+  let completionTokens = 0
+  let completionEstimated = false
+  if (body?.choices) {
+    for (const choice of body.choices) {
+      const message = choice.message || choice.delta // delta for streamed responses
+      const text = choice.text
+      const content = text || message?.content
+
+      const { tokens, estimated } = countTokens(content, model)
+      completionTokens += tokens
+      completionEstimated = estimated
+    }
+  }
+
+  return { completionTokens, completionEstimated }
+}
+
+function countTokens (content, model) {
+  if (encodingForModel) {
+    try {
+      // try using tiktoken if it was available
+      const encoder = encodingForModel(model)
+      const tokens = encoder.encode(content).length
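+      // tiktoken encoders are WASM-backed, so the explicit free() here releases their memory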
+      encoder.free()
+      return { tokens, estimated: false }
+    } catch {
+      // possible errors from tiktoken:
+      // * model not available for token counts
+      // * issue encoding content
+    }
+  }
+
+  return {
+    tokens: estimateTokens(content),
+    estimated: true
+  }
+}
+
+// If model is unavailable or tiktoken is not imported, then provide a very rough estimate of the number of tokens
+// Approximate using the following assumptions:
+//   * English text
+//   * 1 token ~= 4 chars
+//   * 1 token ~= ¾ words
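+// e.g. for "hello world" (11 chars, 2 words): chars give 11 / 4 = 2.75, words give
+// 2 * 0.75 = 1.5, and round((1.5 * 2.75 + 0.5 * 1.5) / 2) = 2 estimated tokens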
+function estimateTokens (content) {
+  let estimatedTokens = 0
+  if (typeof content === 'string') {
+    const estimation1 = content.length / 4
+
+    const matches = content.match(/[\w']+|[.,!?;~@#$%^&*()+/-]/g)
+    const estimation2 = matches ? matches.length * 0.75 : 0 // in the case of an empty string
+    estimatedTokens = Math.round((1.5 * estimation1 + 0.5 * estimation2) / 2)
+  } else if (Array.isArray(content) && typeof content[0] === 'number') {
+    estimatedTokens = content.length
+  }
+  return estimatedTokens
+}
+
 function createEditRequestExtraction (tags, payload, store) {
   const instruction = payload.instruction
   tags['openai.request.instruction'] = instruction
@@ -348,7 +459,7 @@ function responseDataExtractionByMethod (methodName, tags, body, store) {
     case 'chat.completions.create':
     case 'createEdit':
     case 'edits.create':
-      commonCreateResponseExtraction(tags, body, store)
+      commonCreateResponseExtraction(tags, body, store, methodName)
       break
 
     case 'listFiles':
@@ -584,8 +695,8 @@ function createModerationResponseExtraction (tags, body) {
 }
 
 // createCompletion, createChatCompletion, createEdit
-function commonCreateResponseExtraction (tags, body, store) {
-  usageExtraction(tags, body)
+function commonCreateResponseExtraction (tags, body, store, methodName) {
+  usageExtraction(tags, body, methodName)
 
   if (!body.choices) return
 
@@ -625,11 +736,40 @@ function commonCreateResponseExtraction (tags, body, store) {
 }
 
 // createCompletion, createChatCompletion, createEdit, createEmbedding
-function usageExtraction (tags, body) {
-  if (typeof body.usage !== 'object' || !body.usage) return
-  tags['openai.response.usage.prompt_tokens'] = body.usage.prompt_tokens
-  tags['openai.response.usage.completion_tokens'] = body.usage.completion_tokens
-  tags['openai.response.usage.total_tokens'] = body.usage.total_tokens
+function usageExtraction (tags, body, methodName) {
+  let promptTokens = 0
+  let completionTokens = 0
+  let totalTokens = 0
+  if (body && body.usage) {
+    promptTokens = body.usage.prompt_tokens
+    completionTokens = body.usage.completion_tokens
+    totalTokens = body.usage.total_tokens
+  } else if (['chat.completions.create', 'completions.create'].includes(methodName)) {
+    // estimate tokens based on method name for completions and chat completions
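+    // (streamed responses, for example, typically omit the usage object entirely)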
+    const { model } = body
+    let promptEstimated = false
+    let completionEstimated = false
+
+    // prompt tokens
+    const payload = storage.getStore().openai
+    const promptTokensCount = countPromptTokens(methodName, payload, model)
+    promptTokens = promptTokensCount.promptTokens
+    promptEstimated = promptTokensCount.promptEstimated
+
+    // completion tokens
+    const completionTokensCount = countCompletionTokens(body, model)
+    completionTokens = completionTokensCount.completionTokens
+    completionEstimated = completionTokensCount.completionEstimated
+
+    // total tokens
+    totalTokens = promptTokens + completionTokens
+    if (promptEstimated) tags['openai.response.usage.prompt_tokens_estimated'] = true
+    if (completionEstimated) tags['openai.response.usage.completion_tokens_estimated'] = true
+  }
+
+  if (promptTokens) tags['openai.response.usage.prompt_tokens'] = promptTokens
+  if (completionTokens) tags['openai.response.usage.completion_tokens'] = completionTokens
+  if (totalTokens) tags['openai.response.usage.total_tokens'] = totalTokens
 }
 
 function truncateApiKey (apiKey) {