From 1363997621b440f0d9c1388063665fae6c9c2a69 Mon Sep 17 00:00:00 2001 From: Griffin Tarpenning Date: Wed, 27 Nov 2024 09:08:42 -0800 Subject: [PATCH 001/237] chore(ui): hide feedbackSidebar url param if false (#3091) --- .../Home/Browse3/pages/CallPage/CallPage.tsx | 4 ++-- .../Home/Browse3/pages/CallPage/PaginationControls.tsx | 2 +- 2 files changed, 3 insertions(+), 3 deletions(-) diff --git a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/CallPage.tsx b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/CallPage.tsx index 9b29fcc2e692..3a14c5dcfd91 100644 --- a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/CallPage.tsx +++ b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/CallPage.tsx @@ -222,7 +222,7 @@ const CallPageInnerVertical: FC<{ call.callId, path, !showTraceTree, - showFeedbackExpand + showFeedbackExpand ? true : undefined ) ); }, [ @@ -245,7 +245,7 @@ const CallPageInnerVertical: FC<{ call.callId, path, showTraceTree, - !showFeedbackExpand + !showFeedbackExpand ? true : undefined ) ); }, [currentRouter, history, path, showTraceTree, call, showFeedbackExpand]); diff --git a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/PaginationControls.tsx b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/PaginationControls.tsx index 03af4838d77c..9a2222e7e0a7 100644 --- a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/PaginationControls.tsx +++ b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/PaginationControls.tsx @@ -28,7 +28,7 @@ export const PaginationControls: FC<{ const showFeedbackExpand = FEEDBACK_EXPAND_PARAM in query ? query[FEEDBACK_EXPAND_PARAM] === '1' - : false; + : undefined; const onNextCall = useCallback(() => { const nextCallId = getNextRowId?.(call.callId); From 8531633c74779028a6812461defe0f55234827fb Mon Sep 17 00:00:00 2001 From: Andrew Truong Date: Wed, 27 Nov 2024 14:04:28 -0500 Subject: [PATCH 002/237] chore(weave): Pin instructor for python3.9 #3105 --- pyproject.toml | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/pyproject.toml b/pyproject.toml index 99c534303b61..27da86da7587 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -54,7 +54,10 @@ cohere = ["cohere>=5.9.1,<5.9.3"] dspy = ["dspy>=0.1.5", "litellm<=1.49.1"] google_ai_studio = ["google-generativeai>=0.8.3"] groq = ["groq>=0.9.0"] -instructor = ["instructor>=1.4.3"] +instructor = [ + "instructor>=1.4.3,<1.7.0; python_version <= '3.9'", + "instructor>=1.4.3; python_version > '3.9'", +] langchain = [ "langchain-core>=0.2.1", "langchain-openai>=0.1.7", From fd21fe6264ed337daa9c9c76f5490850d58f09fe Mon Sep 17 00:00:00 2001 From: Mollie Anderson <142847762+molliean@users.noreply.github.com> Date: Wed, 27 Nov 2024 11:27:22 -0800 Subject: [PATCH 003/237] fix(ui): Prevent Switch component from shrinking in flex containers (#3101) * fix(ui): Prevent Switch component from shrinking in flex containers * use `min-width` instead of `flex-shrink` --- weave-js/src/components/Switch/index.tsx | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/weave-js/src/components/Switch/index.tsx b/weave-js/src/components/Switch/index.tsx index 98251dff0ca7..8c1e2799df64 100644 --- a/weave-js/src/components/Switch/index.tsx +++ b/weave-js/src/components/Switch/index.tsx @@ -13,7 +13,9 @@ export const Root = ({ 'flex items-center rounded-[12px] p-[1px] transition-colors duration-100 ease-out', 'focus-visible:outline focus-visible:outline-[2px] focus-visible:outline-teal-500', props.checked ? ' bg-teal-500' : 'bg-moon-350', - size === 'small' ? 'h-[16px] w-[28px]' : 'h-[24px] w-[44px]', + size === 'small' + ? 'min-w[28px] h-[16px] w-[28px]' + : 'h-[24px] w-[44px] min-w-[44px]', className )} {...props} From 5b08ca381f35c596869336fdf84be48382405028 Mon Sep 17 00:00:00 2001 From: Griffin Tarpenning Date: Wed, 27 Nov 2024 11:27:43 -0800 Subject: [PATCH 004/237] fix(ui): better defaults for trace/eval trace tree (#3106) --- .../Browse3/pages/CallsPage/callsTableColumns.tsx | 3 +++ .../Home/Browse3/pages/common/Links.tsx | 11 +++++++++-- 2 files changed, 12 insertions(+), 2 deletions(-) diff --git a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallsPage/callsTableColumns.tsx b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallsPage/callsTableColumns.tsx index 0fc4e8298a5b..93bd2ee030b1 100644 --- a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallsPage/callsTableColumns.tsx +++ b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallsPage/callsTableColumns.tsx @@ -29,6 +29,7 @@ import { getCostsFromCellParams, getTokensFromCellParams, } from '../CallPage/cost'; +import {isEvaluateOp} from '../common/heuristics'; import {CallLink} from '../common/Links'; import {StatusChip} from '../common/StatusChip'; import {buildDynamicColumns} from '../common/tabularListViews/columnBuilder'; @@ -228,6 +229,7 @@ function buildCallsTableColumns( rowParams.row.display_name ?? opVersionRefOpName(rowParams.row.op_name) ?? rowParams.row.op_name; + const isEval = isEvaluateOp(opVersionRefOpName(rowParams.row.op_name)); return ( ); }, diff --git a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/common/Links.tsx b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/common/Links.tsx index 915eaeb6935c..8a11252bc33c 100644 --- a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/common/Links.tsx +++ b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/common/Links.tsx @@ -282,6 +282,7 @@ export const CallLink: React.FC<{ tracetree?: boolean; icon?: React.ReactNode; color?: string; + isEval?: boolean; }> = props => { const history = useHistory(); const {peekingRouter} = useWeaveflowRouteContext(); @@ -297,8 +298,14 @@ export const CallLink: React.FC<{ const existingPath = peekParams.get(PATH_PARAM) ?? ''; // Preserve the path only when showing trace tree const path = props.preservePath ? existingPath : null; - // default to true if not specified - const showTraceTree = !(peekParams.get(TRACETREE_PARAM) === '0'); + // default to true if not specified and not an eval + const traceTreeParam = peekParams.get(TRACETREE_PARAM); + const showTraceTree = + traceTreeParam === '1' + ? true + : traceTreeParam === '0' + ? false + : !props.isEval; // default to false if not specified const showFeedbackExpand = peekParams.get(FEEDBACK_EXPAND_PARAM) === '1'; const to = peekingRouter.callUIUrl( From 6165c0faf0712f071707aab90250de560c24e1f6 Mon Sep 17 00:00:00 2001 From: Josiah Lee Date: Wed, 27 Nov 2024 11:45:08 -0800 Subject: [PATCH 005/237] style(weave): style try in playground, hide button in peek view in playground (#3075) * style try in plyground, hide in peek view in playground * follow slightly better pattern --- .../Home/Browse3/pages/CallPage/CallPage.tsx | 27 ++++++++++++++----- 1 file changed, 20 insertions(+), 7 deletions(-) diff --git a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/CallPage.tsx b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/CallPage.tsx index 3a14c5dcfd91..94bc220d1fec 100644 --- a/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/CallPage.tsx +++ b/weave-js/src/components/PagePanelComponents/Home/Browse3/pages/CallPage/CallPage.tsx @@ -81,6 +81,10 @@ const useCallTabs = (call: CallSchema) => { const {entity, project, callId} = call; const weaveRef = makeRefCall(entity, project, callId); + const {isPeeking} = useContext(WeaveflowPeekContext); + const showTryInPlayground = + !isPeeking || !window.location.toString().includes('/weave/playground'); + const handleOpenInPlayground = () => { window.open( urlPrefixed(`/${entity}/${project}/weave/playground/${callId}`), @@ -115,13 +119,22 @@ const useCallTabs = (call: CallSchema) => { label: 'Chat', content: ( <> - + {showTryInPlayground && ( + + + + )} From b95e46d0c4722d03f3f3853a5d05cc601a235b86 Mon Sep 17 00:00:00 2001 From: KyleGoyette Date: Wed, 27 Nov 2024 12:02:40 -0800 Subject: [PATCH 006/237] add data-test element (#3031) --- weave-js/src/components/Panel2/PanelComp.tsx | 1 + 1 file changed, 1 insertion(+) diff --git a/weave-js/src/components/Panel2/PanelComp.tsx b/weave-js/src/components/Panel2/PanelComp.tsx index 2991fdcec439..df8bbfd4e943 100644 --- a/weave-js/src/components/Panel2/PanelComp.tsx +++ b/weave-js/src/components/Panel2/PanelComp.tsx @@ -573,6 +573,7 @@ const ControlWrapper: React.FC = ({ return showControls || fullscreen ? ( { // onExpressionHover(); From 41ca390a19360d4b738c42d8446c139615d6dac0 Mon Sep 17 00:00:00 2001 From: J2-D2-3PO <188380414+J2-D2-3PO@users.noreply.github.com> Date: Wed, 27 Nov 2024 13:13:26 -0700 Subject: [PATCH 007/237] docs(weave): Update new feedback docs (#3093) Co-authored-by: Griffin Tarpenning --- docs/docs/guides/tracking/feedback.md | 176 ++++++++++++------ .../Browse3/pages/common/EmptyContent.tsx | 2 +- 2 files changed, 124 insertions(+), 54 deletions(-) diff --git a/docs/docs/guides/tracking/feedback.md b/docs/docs/guides/tracking/feedback.md index 81022d31bc92..68e27776d444 100644 --- a/docs/docs/guides/tracking/feedback.md +++ b/docs/docs/guides/tracking/feedback.md @@ -3,33 +3,77 @@ import TabItem from '@theme/TabItem'; # Feedback -Evaluating LLM applications automatically is challenging. Teams often rely on direct user feedback, particularly from domain experts, who assess the content quality using simple indicators such as thumbs up or down. Developers also actively identify and resolve content issues. +Efficiently evaluating LLM applications requires robust tooling to collect and analyze feedback. Weave provides an integrated feedback system, allowing users to provide call feedback directly through the UI or programmatically via the SDK. Various feedback types are supported, including emoji reactions, textual comments, and structured data, enabling teams to: -Weave's feedback feature enables users to provide feedback directly within the Weave UI or through the API. You can add emoji reactions, textual notes, and structured data to calls. This feedback helps compile evaluation datasets, monitor application performance, and collect examples for advanced tasks like fine-tuning. +- Build evaluation datasets for performance monitoring. +- Identify and resolve LLM content issues effectively. +- Gather examples for advanced tasks like fine-tuning. -## View and Add Feedback within UI +This guide covers how to use Weave’s feedback functionality in both the UI and SDK, query and manage feedback, and use human annotations for detailed evaluations. -Reactions and notes are displayed in a column in the calls grid. Hovering over these indicators provides more detail. Use these buttons to add reactions or notes. +- [Provide feedback in the UI](#provide-feedback-in-the-ui) +- [Provide feedback via the SDK](#provide-feedback-via-the-sdk) +- [Add human annotations](#add-human-annotations) -![Screenshot of calls grid with feedback column](imgs/feedback_calls.png) +## Provide feedback in the UI -View and edit feedback in the header of the call details page. +In the Weave UI, you can add and view feedback [from the call details page](#from-the-call-details-page) or [using the icons](#use-the-icons). -![Screenshot of feedback controls in call details header](imgs/feedback_call_header.png) +### From the call details page -View the feedback for a call on the "Feedback" tab of the call details page. +1. In the sidebar, navigate to **Traces**. +2. Find the row for the call that you want to add feedback to. +3. Open the call details page. +4. Select the **Feedback** column for the call. +5. Add, view, or delete feedback: + - *[Add and view feedback using the icons](#use-the-icons)* located in the upper right corner of the call details feedback view. + - *View and delete feedback from the call details feedback table.* Delete feedback by clicking the trashcan icon in the rightmost column of the appropriate feedback row. ![Screenshot of Feedback tab in call details](imgs/feedback_tab.png) -Access copy-and-paste examples on the "Use" tab of the call details page to manipulate the feedback for that call using the SDK. +### Use the icons + +You can add or remove a reaction, and add a note using the icons that are located in both the call table and individual call details pages. + +- *Call table*: Located in **Feedback** column in the appropriate row in the call table. +- *Call details page*: Located in the upper right corner of each call details page. + +To add a reaction: + 1. Click the emoji icon. + 2. Add a thumbs up, thumbs down, or click the **+** icon for more emojis. + +To remove a reaction: + 1. Hover over the emoji reaction you want to remove. + 2. Click the reaction to remove it. + +> You can also delete feedback from the [**Feedback** column on the call details page.](#from-the-call-details-page). + +To add a comment: + 1. Click the comment bubble icon. + 2. In the text box, add your note. + 3. To save the note, press the **Enter** key. You can add additional notes. + +![Screenshot of calls grid with feedback column](imgs/feedback_calls.png) + +## Provide feedback via the SDK + +> You can find SDK usage examples for feedback in the UI under the **Use** tab in the call details page. -![Screenshot of Use tab in call details](imgs/feedback_use.png) +You can use the Weave SDK to programmatically add, remove, and query feedback on calls. -## SDK +### Query a project's feedback -Use the Weave SDK to programmatically add, remove, and query feedback on calls. +You can query the feedback for your Weave project using the SDK. The SDK supports the following feedback query operations: -### Querying a project's feedback +- `client.get_feedback()`: Returns all feedback in a project. +- `client.get_feedback("")`: Return a specific feedback object specified by `` as a collection. +- `client.get_feedback(reaction="")`: Returns all feedback objects for a specific reaction type. + +You can also get additional information for each feedback object in `client.get_feedback()`: +- `id`: The feedback object ID. +- `created_at`: The creation time information for the feedback object. +- `feedback_type`: The type of feedback (reaction, note, custom). +- `payload`: The feedback payload @@ -41,14 +85,13 @@ Use the Weave SDK to programmatically add, remove, and query feedback on calls. all_feedback = client.get_feedback() # Fetch a specific feedback object by id. - # Note that the API still returns a collection, which is expected - # to contain zero or one item(s). + # The API returns a collection, which is expected to contain at most one item. one_feedback = client.get_feedback("")[0] # Find all feedback objects with a specific reaction. You can specify offset and limit. thumbs_up = client.get_feedback(reaction="👍", limit=10) - # After retrieval you can view the details of individual feedback objects. + # After retrieval, view the details of individual feedback objects. for f in client.get_feedback(): print(f.id) print(f.created_at) @@ -64,7 +107,13 @@ Use the Weave SDK to programmatically add, remove, and query feedback on calls. -### Adding feedback to a call +### Add feedback to a call + +You can add feedback to a call using the call's UUID. To use the UUID to get a particular call, [retrieve it during or after call execution](#retrieve-the-call-uuid). The SDK supports the following operations for adding feedback to a call: + +- `call.feedback.add_reaction("")`: Add one of the supported `` (emojis), such as 👍. +- `call.feedback.add_note("")`: Add a note. +- `call.feedback.add("