feat(js): llama-index-ts initial retrieval span support (#643)
cjunkin authored and Parker-Stafford committed Dec 6, 2024
1 parent 542501a commit 8632b29
Showing 4 changed files with 352 additions and 87 deletions.
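For context, a minimal registration sketch (not part of this commit): it assumes the package is published as @arizeai/openinference-instrumentation-llama-index, as suggested by the file paths below, and wires the exported LlamaIndexInstrumentation class into the standard OpenTelemetry Node setup.

import { NodeTracerProvider } from "@opentelemetry/sdk-trace-node";
import { registerInstrumentations } from "@opentelemetry/instrumentation";
import { LlamaIndexInstrumentation } from "@arizeai/openinference-instrumentation-llama-index";

// Set up a tracer provider so spans created by the instrumentation are recorded.
const provider = new NodeTracerProvider();
provider.register();

// Register the LlamaIndex instrumentation; it patches RetrieverQueryEngine.query
// and VectorIndexRetriever.retrieve as shown in the diff below.
registerInstrumentations({
  instrumentations: [new LlamaIndexInstrumentation()],
});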
@@ -1,23 +1,14 @@
/* eslint-disable @typescript-eslint/no-explicit-any */
import type * as llamaindex from "llamaindex";

import {
InstrumentationBase,
InstrumentationConfig,
InstrumentationModuleDefinition,
InstrumentationNodeModuleDefinition,
safeExecuteInTheMiddle,
} from "@opentelemetry/instrumentation";
import { diag } from "@opentelemetry/api";
import { patchQueryMethod, patchRetrieveMethod } from "./utils";
import { VERSION } from "./version";
import {
Span,
SpanKind,
SpanStatusCode,
context,
diag,
trace,
} from "@opentelemetry/api";
import { isTracingSuppressed } from "@opentelemetry/core";

const MODULE_NAME = "llamaindex";

@@ -34,28 +25,6 @@ export function isPatched() {
return _isOpenInferencePatched;
}

import {
OpenInferenceSpanKind,
SemanticConventions,
} from "@arizeai/openinference-semantic-conventions";

/**
* Resolves the execution context for the current span
* If tracing is suppressed, the span is dropped and the current context is returned
* @param span
*/
function getExecContext(span: Span) {
const activeContext = context.active();
const suppressTracing = isTracingSuppressed(activeContext);
const execContext = suppressTracing
? trace.setSpan(context.active(), span)
: activeContext;
// Drop the span from the context
if (suppressTracing) {
trace.deleteSpan(activeContext);
}
return execContext;
}
export class LlamaIndexInstrumentation extends InstrumentationBase<
typeof llamaindex
> {
@@ -66,7 +35,8 @@ export class LlamaIndexInstrumentation extends InstrumentationBase<
Object.assign({}, config),
);
}
manuallyInstrument(module: typeof llamaindex) {

public manuallyInstrument(module: typeof llamaindex) {
diag.debug(`Manually instrumenting ${MODULE_NAME}`);
this.patch(module);
}
@@ -87,71 +57,32 @@ export class LlamaIndexInstrumentation extends InstrumentationBase<
return moduleExports;
}

// eslint-disable-next-line @typescript-eslint/no-this-alias
const instrumentation: LlamaIndexInstrumentation = this;

type RetrieverQueryEngineQueryType =
typeof moduleExports.RetrieverQueryEngine.prototype.query;

// TODO: Support streaming
this._wrap(
moduleExports.RetrieverQueryEngine.prototype,
"query",
(original: RetrieverQueryEngineQueryType): any => {
return function patchedQuery(
this: unknown,
...args: Parameters<RetrieverQueryEngineQueryType>
) {
const span = instrumentation.tracer.startSpan(`Query`, {
kind: SpanKind.INTERNAL,
attributes: {
[SemanticConventions.OPENINFERENCE_SPAN_KIND]:
OpenInferenceSpanKind.CHAIN,
[SemanticConventions.INPUT_VALUE]: args[0].query,
},
});

const execContext = getExecContext(span);
// eslint-disable-next-line @typescript-eslint/no-explicit-any
(original): any => {
return patchQueryMethod(original, moduleExports, this.tracer);
},
);

const execPromise = safeExecuteInTheMiddle<
ReturnType<RetrieverQueryEngineQueryType>
>(
() => {
return context.with(execContext, () => {
return original.apply(this, args);
});
},
(error) => {
// Push the error to the span
if (error) {
span.recordException(error);
span.setStatus({
code: SpanStatusCode.ERROR,
message: error.message,
});
span.end();
}
},
);
const wrappedPromise = execPromise.then((result) => {
span.setAttributes({
[SemanticConventions.OUTPUT_VALUE]: result.response,
});
span.end();
return result;
});
return context.bind(execContext, wrappedPromise);
};
this._wrap(
moduleExports.VectorIndexRetriever.prototype,
"retrieve",
(original) => {
return patchRetrieveMethod(original, moduleExports, this.tracer);
},
);

_isOpenInferencePatched = true;

return moduleExports;
}

private unpatch(moduleExports: typeof llamaindex, moduleVersion?: string) {
this._diag.debug(`Un-patching ${MODULE_NAME}@${moduleVersion}`);
this._unwrap(moduleExports.RetrieverQueryEngine.prototype, "query");
this._unwrap(moduleExports.VectorIndexRetriever.prototype, "retrieve");

_isOpenInferencePatched = false;
}
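
A hedged sketch of the manuallyInstrument path exposed above, useful when automatic module patching cannot hook the import (for example in ESM builds); the package name is assumed from the file paths in this commit.

import * as llamaindex from "llamaindex";
import { LlamaIndexInstrumentation } from "@arizeai/openinference-instrumentation-llama-index";

// Pass the imported module exports directly so query and retrieve get patched in place.
const instrumentation = new LlamaIndexInstrumentation();
instrumentation.manuallyInstrument(llamaindex);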
63 changes: 63 additions & 0 deletions js/packages/openinference-instrumentation-llama-index/src/types.ts
@@ -0,0 +1,63 @@
import { SemanticConventions } from "@arizeai/openinference-semantic-conventions";

export type RetrievalDocument = {
[SemanticConventions.DOCUMENT_ID]?: string;
[SemanticConventions.DOCUMENT_CONTENT]?: string;
[SemanticConventions.DOCUMENT_SCORE]?: number | undefined;
[SemanticConventions.DOCUMENT_METADATA]?: string;
};

type LLMMessageToolCall = {
[SemanticConventions.TOOL_CALL_FUNCTION_NAME]?: string;
[SemanticConventions.TOOL_CALL_FUNCTION_ARGUMENTS_JSON]?: string;
};

export type LLMMessageToolCalls = {
[SemanticConventions.MESSAGE_TOOL_CALLS]?: LLMMessageToolCall[];
};

export type LLMMessageFunctionCall = {
[SemanticConventions.MESSAGE_FUNCTION_CALL_NAME]?: string;
[SemanticConventions.MESSAGE_FUNCTION_CALL_ARGUMENTS_JSON]?: string;
};

export type LLMMessage = LLMMessageToolCalls &
LLMMessageFunctionCall & {
[SemanticConventions.MESSAGE_ROLE]?: string;
[SemanticConventions.MESSAGE_CONTENT]?: string;
};

export type LLMMessagesAttributes =
| {
[SemanticConventions.LLM_INPUT_MESSAGES]: LLMMessage[];
}
| {
[SemanticConventions.LLM_OUTPUT_MESSAGES]: LLMMessage[];
};

// eslint-disable-next-line @typescript-eslint/no-explicit-any
export type GenericFunction = (...args: any[]) => any;

export type SafeFunction<T extends GenericFunction> = (
...args: Parameters<T>
) => ReturnType<T> | null;

export type LLMParameterAttributes = {
[SemanticConventions.LLM_MODEL_NAME]?: string;
[SemanticConventions.LLM_INVOCATION_PARAMETERS]?: string;
};

export type PromptTemplateAttributes = {
[SemanticConventions.PROMPT_TEMPLATE_TEMPLATE]?: string;
[SemanticConventions.PROMPT_TEMPLATE_VARIABLES]?: string;
};
export type TokenCountAttributes = {
[SemanticConventions.LLM_TOKEN_COUNT_COMPLETION]?: number;
[SemanticConventions.LLM_TOKEN_COUNT_PROMPT]?: number;
[SemanticConventions.LLM_TOKEN_COUNT_TOTAL]?: number;
};

export type ToolAttributes = {
[SemanticConventions.TOOL_NAME]?: string;
[SemanticConventions.TOOL_DESCRIPTION]?: string;
};
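
As an illustration of how these computed-key types are meant to be used (example values are made up, not part of the commit):

import { SemanticConventions } from "@arizeai/openinference-semantic-conventions";
import { RetrievalDocument } from "./types";

// Each field is keyed by a semantic-convention constant rather than a literal string.
const exampleDocument: RetrievalDocument = {
  [SemanticConventions.DOCUMENT_ID]: "node-123",
  [SemanticConventions.DOCUMENT_SCORE]: 0.87,
  [SemanticConventions.DOCUMENT_CONTENT]: "LlamaIndex is a data framework for LLM applications.",
  [SemanticConventions.DOCUMENT_METADATA]: JSON.stringify({ source: "docs/index.md" }),
};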
185 changes: 185 additions & 0 deletions js/packages/openinference-instrumentation-llama-index/src/utils.ts
@@ -0,0 +1,185 @@
import type * as llamaindex from "llamaindex";

import { TextNode } from "llamaindex";
import { safeExecuteInTheMiddle } from "@opentelemetry/instrumentation";
import {
Attributes,
Span,
SpanKind,
SpanStatusCode,
context,
trace,
Tracer,
diag,
} from "@opentelemetry/api";
import { isTracingSuppressed } from "@opentelemetry/core";
import {
MimeType,
OpenInferenceSpanKind,
SemanticConventions,
} from "@arizeai/openinference-semantic-conventions";
import { GenericFunction, SafeFunction } from "./types";

/**
* Wraps a function with a try-catch block to catch and log any errors.
* @param fn - A function to wrap with a try-catch block.
* @returns A function that returns null if an error is thrown.
*/
export function withSafety<T extends GenericFunction>(fn: T): SafeFunction<T> {
return (...args) => {
try {
return fn(...args);
} catch (error) {
diag.error(`Failed to get attributes for span: ${error}`);
return null;
}
};
}

const safelyJSONStringify = withSafety(JSON.stringify);

/**
* Resolves the execution context for the current span
* If tracing is suppressed, the span is dropped and the current context is returned
* @param span
*/
function getExecContext(span: Span) {
const activeContext = context.active();
const suppressTracing = isTracingSuppressed(activeContext);
const execContext = suppressTracing
? trace.setSpan(context.active(), span)
: activeContext;
// Drop the span from the context
if (suppressTracing) {
trace.deleteSpan(activeContext);
}
return execContext;
}

export function patchQueryMethod(
original: typeof module.RetrieverQueryEngine.prototype.query,
module: typeof llamaindex,
tracer: Tracer,
) {
return function patchedQuery(
this: unknown,
...args: Parameters<typeof module.RetrieverQueryEngine.prototype.query>
) {
const span = tracer.startSpan(`query`, {
kind: SpanKind.INTERNAL,
attributes: {
[SemanticConventions.OPENINFERENCE_SPAN_KIND]:
OpenInferenceSpanKind.CHAIN,
[SemanticConventions.INPUT_VALUE]: args[0].query,
[SemanticConventions.INPUT_MIME_TYPE]: MimeType.TEXT,
},
});

const execContext = getExecContext(span);

const execPromise = safeExecuteInTheMiddle<
ReturnType<typeof module.RetrieverQueryEngine.prototype.query>
>(
() => {
return context.with(execContext, () => {
return original.apply(this, args);
});
},
(error) => {
// Push the error to the span
if (error) {
span.recordException(error);
span.setStatus({
code: SpanStatusCode.ERROR,
message: error.message,
});
span.end();
}
},
);

const wrappedPromise = execPromise.then((result) => {
span.setAttributes({
[SemanticConventions.OUTPUT_VALUE]: result.response,
[SemanticConventions.OUTPUT_MIME_TYPE]: MimeType.TEXT,
});
span.end();
return result;
});
return context.bind(execContext, wrappedPromise);
};
}

export function patchRetrieveMethod(
original: typeof module.VectorIndexRetriever.prototype.retrieve,
module: typeof llamaindex,
tracer: Tracer,
) {
return function patchedRetrieve(
this: unknown,
...args: Parameters<typeof module.VectorIndexRetriever.prototype.retrieve>
) {
const span = tracer.startSpan(`retrieve`, {
kind: SpanKind.INTERNAL,
attributes: {
[SemanticConventions.OPENINFERENCE_SPAN_KIND]:
OpenInferenceSpanKind.RETRIEVER,
[SemanticConventions.INPUT_VALUE]: args[0].query,
[SemanticConventions.INPUT_MIME_TYPE]: MimeType.TEXT,
},
});

const execContext = getExecContext(span);

const execPromise = safeExecuteInTheMiddle<
ReturnType<typeof module.VectorIndexRetriever.prototype.retrieve>
>(
() => {
return context.with(execContext, () => {
return original.apply(this, args);
});
},
(error) => {
// Push the error to the span
if (error) {
span.recordException(error);
span.setStatus({
code: SpanStatusCode.ERROR,
message: error.message,
});
span.end();
}
},
);

const wrappedPromise = execPromise.then((result) => {
span.setAttributes(documentAttributes(result));
span.end();
return result;
});
return context.bind(execContext, wrappedPromise);
};
}

function documentAttributes(
output: llamaindex.NodeWithScore<llamaindex.Metadata>[],
) {
const docs: Attributes = {};
output.forEach((document, index) => {
const { node, score } = document;

if (node instanceof TextNode) {
const nodeId = node.id_;
const nodeText = node.getContent();
const nodeMetadata = node.metadata;

const prefix = `${SemanticConventions.RETRIEVAL_DOCUMENTS}.${index}`;
docs[`${prefix}.${SemanticConventions.DOCUMENT_ID}`] = nodeId;
docs[`${prefix}.${SemanticConventions.DOCUMENT_SCORE}`] = score;
docs[`${prefix}.${SemanticConventions.DOCUMENT_CONTENT}`] = nodeText;
docs[`${prefix}.${SemanticConventions.DOCUMENT_METADATA}`] =
safelyJSONStringify(nodeMetadata) ?? undefined;
}
});
return docs;
}
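
For reference, documentAttributes flattens each retrieved node into prefix-indexed span attributes. The shape below is a sketch that assumes the usual OpenInference key strings ("retrieval.documents", "document.id", and so on) and made-up values.

// Approximate output of documentAttributes for two retrieved TextNodes.
const exampleRetrieverAttributes = {
  "retrieval.documents.0.document.id": "node-a",
  "retrieval.documents.0.document.score": 0.91,
  "retrieval.documents.0.document.content": "First matching chunk of text.",
  "retrieval.documents.0.document.metadata": '{"source":"a.md"}',
  "retrieval.documents.1.document.id": "node-b",
  "retrieval.documents.1.document.score": 0.77,
  "retrieval.documents.1.document.content": "Second matching chunk of text.",
  "retrieval.documents.1.document.metadata": '{"source":"b.md"}',
};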