From 80479e905ebc629bf5ffadbd45e1518b3033bacd Mon Sep 17 00:00:00 2001 From: Lou Kratz <219901029+loukratz-bv@users.noreply.github.com> Date: Wed, 11 Feb 2026 09:31:07 -0500 Subject: [PATCH 1/4] feat: Add Feedback Option for Flows --- .../category_feedback_example.qtype.yaml | 62 ++++++ .../explode_feedback_example.qtype.yaml | 72 +++++++ .../rating_feedback_example.qtype.yaml | 56 ++++++ .../thumbs_feedback_example.qtype.yaml | 42 ++++ pyproject.toml | 2 +- qtype/dsl/model.py | 55 ++++++ qtype/interpreter/api.py | 7 + qtype/interpreter/base/base_step_executor.py | 115 ++++++----- qtype/interpreter/base/stream_emitter.py | 84 +++++++- qtype/interpreter/feedback_api.py | 185 ++++++++++++++++++ qtype/interpreter/metadata_api.py | 21 ++ qtype/interpreter/stream/chat/converter.py | 22 ++- qtype/interpreter/types.py | 46 +++-- qtype/interpreter/typing.py | 17 +- qtype/semantic/checker.py | 18 +- qtype/semantic/model.py | 40 ++++ schema/qtype.schema.json | 115 +++++++++++ tests/interpreter/test_step_executor.py | 48 +++++ ...alid_feedback_without_telemetry.qtype.yaml | 27 +++ tests/semantic/test_checker_validation.py | 4 + tests/semantic/test_feedback_validation.py | 101 ++++++++++ ui/components/FlowResponseCard.tsx | 49 ++++- ui/components/FlowResponseTable.tsx | 58 +++++- ui/components/chat/MessageBubble.tsx | 34 +++- ui/components/feedback/CategoryFeedback.tsx | 78 ++++++++ ui/components/feedback/FeedbackButton.tsx | 173 ++++++++++++++++ .../feedback/FeedbackExplanationModal.tsx | 72 +++++++ ui/components/feedback/RatingFeedback.tsx | 51 +++++ ui/components/feedback/ThumbsFeedback.tsx | 40 ++++ ui/components/feedback/index.ts | 5 + ui/components/flows/Chat.tsx | 2 + ui/components/flows/Rest.tsx | 4 + ui/lib/apiClient.ts | 19 +- ui/types/Feedback.ts | 37 ++++ ui/types/FlowMetadata.ts | 22 +++ uv.lock | 72 +++++-- 36 files changed, 1750 insertions(+), 105 deletions(-) create mode 100644 examples/feedback/category_feedback_example.qtype.yaml create mode 100644 examples/feedback/explode_feedback_example.qtype.yaml create mode 100644 examples/feedback/rating_feedback_example.qtype.yaml create mode 100644 examples/feedback/thumbs_feedback_example.qtype.yaml create mode 100644 qtype/interpreter/feedback_api.py create mode 100644 tests/semantic/checker-error-specs/invalid_feedback_without_telemetry.qtype.yaml create mode 100644 tests/semantic/test_feedback_validation.py create mode 100644 ui/components/feedback/CategoryFeedback.tsx create mode 100644 ui/components/feedback/FeedbackButton.tsx create mode 100644 ui/components/feedback/FeedbackExplanationModal.tsx create mode 100644 ui/components/feedback/RatingFeedback.tsx create mode 100644 ui/components/feedback/ThumbsFeedback.tsx create mode 100644 ui/components/feedback/index.ts create mode 100644 ui/types/Feedback.ts diff --git a/examples/feedback/category_feedback_example.qtype.yaml b/examples/feedback/category_feedback_example.qtype.yaml new file mode 100644 index 00000000..ea252fd8 --- /dev/null +++ b/examples/feedback/category_feedback_example.qtype.yaml @@ -0,0 +1,62 @@ +id: category_feedback_example +description: Example flow with categorical feedback collection + +flows: + - id: code_generator + description: Code generation with multi-category feedback + variables: + - id: requirement + type: text + - id: formatted_prompt + type: text + - id: generated_code + type: text + feedback: + type: category + categories: + - correct + - well_documented + - follows_best_practices + - efficient + - needs_improvement + allow_multiple: true + 
explanation: true + steps: + - type: PromptTemplate + id: prompt + template: | + Generate Python code for the following requirement: + + {requirement} + + Provide clean, well-documented code following Python best practices. + inputs: + - requirement + outputs: + - formatted_prompt + + - type: LLMInference + id: llm + model: nova + inputs: + - formatted_prompt + outputs: + - generated_code + inputs: + - requirement + outputs: + - generated_code + +models: + - id: nova + type: Model + provider: aws-bedrock + model_id: amazon.nova-pro-v1:0 + inference_params: + temperature: 0.2 + max_tokens: 1000 + +telemetry: + id: category_feedback_telemetry + provider: Phoenix + endpoint: http://localhost:6006/v1/traces diff --git a/examples/feedback/explode_feedback_example.qtype.yaml b/examples/feedback/explode_feedback_example.qtype.yaml new file mode 100644 index 00000000..34d21c36 --- /dev/null +++ b/examples/feedback/explode_feedback_example.qtype.yaml @@ -0,0 +1,72 @@ +id: explode_feedback_example +description: Example flow with Explode fan-out and feedback collection + +flows: + - id: topic_facts_generator + description: Generate interesting facts for multiple topics with feedback + variables: + - id: topics_json + type: text + - id: topics + type: list[text] + - id: topic + type: text + - id: formatted_prompt + type: text + - id: fact + type: text + feedback: + type: thumbs + explanation: true + steps: + - type: Decoder + id: decode + format: json + inputs: + - topics_json + outputs: + - topics + + - type: Explode + id: fan_out + inputs: + - topics + outputs: + - topic + + - type: PromptTemplate + id: prompt + template: | + Generate one interesting, concise fact about: {topic} + + Keep it to 1-2 sentences and make it engaging. + inputs: + - topic + outputs: + - formatted_prompt + + - type: LLMInference + id: llm + model: nova + inputs: + - formatted_prompt + outputs: + - fact + inputs: + - topics_json + outputs: + - fact + +models: + - id: nova + type: Model + provider: aws-bedrock + model_id: us.amazon.nova-lite-v1:0 + inference_params: + temperature: 0.7 + max_tokens: 200 + +telemetry: + id: explode_feedback_telemetry + provider: Phoenix + endpoint: http://localhost:6006/v1/traces diff --git a/examples/feedback/rating_feedback_example.qtype.yaml b/examples/feedback/rating_feedback_example.qtype.yaml new file mode 100644 index 00000000..ccf5c078 --- /dev/null +++ b/examples/feedback/rating_feedback_example.qtype.yaml @@ -0,0 +1,56 @@ +id: rating_feedback_example +description: Example flow with 1-10 rating scale feedback collection + +flows: + - id: document_summarizer + description: Document summarization with quality rating + variables: + - id: document_text + type: text + - id: formatted_prompt + type: text + - id: summary + type: text + feedback: + type: rating + scale: 10 + explanation: true + steps: + - type: PromptTemplate + id: prompt + template: | + Summarize the following document in 2-3 sentences: + + {document_text} + + Summary: + inputs: + - document_text + outputs: + - formatted_prompt + + - type: LLMInference + id: llm + model: nova + inputs: + - formatted_prompt + outputs: + - summary + inputs: + - document_text + outputs: + - summary + +models: + - id: nova + type: Model + provider: aws-bedrock + model_id: amazon.nova-pro-v1:0 + inference_params: + temperature: 0.2 + max_tokens: 1000 + +telemetry: + id: rating_feedback_telemetry + provider: Phoenix + endpoint: http://localhost:6006/v1/traces diff --git a/examples/feedback/thumbs_feedback_example.qtype.yaml
b/examples/feedback/thumbs_feedback_example.qtype.yaml new file mode 100644 index 00000000..d4b1f736 --- /dev/null +++ b/examples/feedback/thumbs_feedback_example.qtype.yaml @@ -0,0 +1,42 @@ +id: simple_thumbs_chatbot +description: A minimal chatbot example with thumbs up/down feedback + +flows: + - id: simple_chat + description: Simple conversational chatbot with feedback collection + variables: + - id: user_message + type: ChatMessage + - id: assistant_response + type: ChatMessage + interface: + type: Conversational + feedback: + type: thumbs + explanation: false + steps: + - type: LLMInference + id: chat_llm + model: nova + inputs: + - user_message + outputs: + - assistant_response + inputs: + - user_message + outputs: + - assistant_response + +models: + - id: nova + type: Model + provider: aws-bedrock + model_id: us.amazon.nova-lite-v1:0 + inference_params: + temperature: 0.9 + max_tokens: 300 + +telemetry: + id: chatbot_telemetry + provider: Phoenix + endpoint: http://localhost:6006/v1/traces \ No newline at end of file diff --git a/pyproject.toml b/pyproject.toml index 93a0cc66..fbe32fdb 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -71,7 +71,7 @@ mcp = [ [dependency-groups] dev = [ - "arize-phoenix>=11.2.2", + "arize-phoenix>=12.35.0", "boto3>=1.34.0", "coverage>=7.0.0", "ipython>=8.37.0", diff --git a/qtype/dsl/model.py b/qtype/dsl/model.py index 27fe15ca..4fdefd94 100644 --- a/qtype/dsl/model.py +++ b/qtype/dsl/model.py @@ -600,6 +600,57 @@ class Agent(LLMInference): ) +class Feedback(StrictBaseModel): + """Base class for user feedback configurations on flow outputs.""" + + type: str = Field(..., description="Type of feedback widget to display.") + explanation: bool = Field( + default=False, + description="Whether to enable optional text explanation field.", + ) + + +class ThumbsFeedback(Feedback): + """Binary thumbs up/down feedback.""" + + type: Literal["thumbs"] = "thumbs" + + +class RatingFeedback(Feedback): + """Numerical rating feedback (1-5 or 1-10 scale).""" + + type: Literal["rating"] = "rating" + scale: int = Field( + default=5, description="Maximum value for rating scale." + ) + + +class CategoryFeedback(Feedback): + """Categorical feedback with predefined tags.""" + + type: Literal["category"] = "category" + categories: list[str] = Field( + ..., + description="List of category labels users can select from.", + min_length=1, + ) + allow_multiple: bool = Field( + default=True, + description="Whether users can select multiple categories.", + ) + + +# Create a union type for all feedback types (defined here before Flow) +FeedbackType = Annotated[ + Union[ + ThumbsFeedback, + RatingFeedback, + CategoryFeedback, + ], + Field(discriminator="type"), +] + + class Flow(StrictBaseModel): """Defines a flow of steps that can be executed in sequence or parallel. 
If input or output variables are not specified, they are inferred from @@ -616,6 +667,10 @@ class Flow(StrictBaseModel): ) interface: FlowInterface | None = Field(default=None) + feedback: FeedbackType | None = Field( + default=None, + description="Optional feedback configuration for collecting user ratings on flow outputs.", + ) variables: list[Variable] = Field( default_factory=list, description="List of variables available at the application scope.", diff --git a/qtype/interpreter/api.py b/qtype/interpreter/api.py index 5fe3091c..b1fa6a33 100644 --- a/qtype/interpreter/api.py +++ b/qtype/interpreter/api.py @@ -17,6 +17,7 @@ create_rest_endpoint, create_streaming_endpoint, ) +from qtype.interpreter.feedback_api import create_feedback_endpoint from qtype.interpreter.metadata_api import create_metadata_endpoints from qtype.semantic.model import Application @@ -110,6 +111,12 @@ async def shutdown_telemetry(): # Create metadata endpoints for flow discovery create_metadata_endpoints(app, self.definition) + # Create feedback submission endpoint + if self.definition.telemetry: + create_feedback_endpoint( + app, self.definition.telemetry, secret_manager + ) + # Create executor context context = ExecutorContext( secret_manager=secret_manager, diff --git a/qtype/interpreter/base/base_step_executor.py b/qtype/interpreter/base/base_step_executor.py index 01dea695..7440d427 100644 --- a/qtype/interpreter/base/base_step_executor.py +++ b/qtype/interpreter/base/base_step_executor.py @@ -176,7 +176,10 @@ async def execute( Processed messages, with failed messages emitted first """ # Start a span for tracking - # Note: We manually manage the span lifecycle to allow yielding + # Note: We do NOT attach this span to context here to avoid + # making upstream steps children of this step when we consume + # the input stream. Instead, _process_message_with_telemetry + # will attach it when calling process_message(). span = self._tracer.start_span( f"step.{self.step.id}", attributes={ @@ -186,10 +189,8 @@ async def execute( }, ) - # Make this span the active context so child spans will nest under it - # Only attach if span is recording (i.e., real tracer is configured) - ctx = trace.set_span_in_context(span) - token = context.attach(ctx) if span.is_recording() else None + # Store span in self so _process_message_with_telemetry can access it + self._current_step_span = span # Initialize the cache # this is done once per execution so re-runs are fast @@ -287,10 +288,8 @@ async def process_item( span.set_status(Status(StatusCode.ERROR, f"Step failed: {e}")) raise finally: - # Detach the context and end the span - # Only detach if we successfully attached (span was recording) - if token is not None: - context.detach(token) + # Clean up step span reference and end the span + self._current_step_span = None span.end() @abstractmethod @@ -368,51 +367,77 @@ async def _process_message_with_telemetry( This method creates a child span for each message processing operation, automatically recording errors and success metrics. - The child span will automatically be nested under the current - active span in the context. + The child span will be nested under the step span. + + The step span context is attached here (not in execute()) to + ensure step spans are siblings under the flow span, not nested. 
""" - # Get current context and create child span within it - span = self._tracer.start_span( - f"step.{self.step.id}.process_message", - attributes={ - "session.id": message.session.session_id, - }, - ) + # Attach step span context so process_message span becomes its child + step_span = getattr(self, "_current_step_span", None) + if step_span and step_span.is_recording(): + ctx = trace.set_span_in_context(step_span) + token = context.attach(ctx) + else: + token = None try: - output_count = 0 - error_occurred = False - - async for output_msg in self.process_message(message): - output_count += 1 - if output_msg.is_failed(): - error_occurred = True - span.add_event( - "message_failed", - { - "error": str(output_msg.error), - }, + # Create child span for this specific message processing + span = self._tracer.start_span( + f"step.{self.step.id}.process_message", + attributes={ + "session.id": message.session.session_id, + }, + ) + + try: + output_count = 0 + error_occurred = False + + async for output_msg in self.process_message(message): + output_count += 1 + if output_msg.is_failed(): + error_occurred = True + span.add_event( + "message_failed", + { + "error": str(output_msg.error), + }, + ) + # Enrich with process_message span for feedback tracking + span_context = span.get_span_context() + updated_metadata = { + **output_msg.metadata, + "span_id": format(span_context.span_id, "016x"), + "trace_id": format(span_context.trace_id, "032x"), + } + yield output_msg.model_copy( + update={"metadata": updated_metadata} ) - yield output_msg - # Record processing metrics - span.set_attribute("message.outputs", output_count) + # Record processing metrics + span.set_attribute("message.outputs", output_count) + + if error_occurred: + span.set_status( + Status( + StatusCode.ERROR, "Message processing had errors" + ) + ) + else: + span.set_status(Status(StatusCode.OK)) - if error_occurred: + except Exception as e: + span.record_exception(e) span.set_status( - Status(StatusCode.ERROR, "Message processing had errors") + Status(StatusCode.ERROR, f"Processing failed: {e}") ) - else: - span.set_status(Status(StatusCode.OK)) - - except Exception as e: - span.record_exception(e) - span.set_status( - Status(StatusCode.ERROR, f"Processing failed: {e}") - ) - raise + raise + finally: + span.end() finally: - span.end() + # Detach step span context + if token is not None: + context.detach(token) async def finalize(self) -> AsyncIterator[FlowMessage]: """ diff --git a/qtype/interpreter/base/stream_emitter.py b/qtype/interpreter/base/stream_emitter.py index 6d8b5ebc..84fb86e4 100644 --- a/qtype/interpreter/base/stream_emitter.py +++ b/qtype/interpreter/base/stream_emitter.py @@ -35,6 +35,8 @@ async def process_message(self, message: FlowMessage): from typing import Any +from opentelemetry import trace + from qtype.interpreter.types import ( ErrorEvent, ReasoningStreamDeltaEvent, @@ -54,6 +56,24 @@ async def process_message(self, message: FlowMessage): from qtype.semantic.model import Step +def get_current_telemetry_metadata() -> dict[str, Any]: + """ + Get current OpenTelemetry span context as metadata dict. + + Returns: + Dictionary with span_id and trace_id if span is recording, + empty dict otherwise + """ + span = trace.get_current_span() + if span and span.is_recording(): + ctx = span.get_span_context() + return { + "span_id": format(ctx.span_id, "016x"), + "trace_id": format(ctx.trace_id, "032x"), + } + return {} + + class TextStreamContext: """ Async context manager for text streaming. 
@@ -83,7 +103,11 @@ async def __aenter__(self) -> TextStreamContext: """Emit TextStreamStartEvent when entering context.""" if self.on_stream_event: await self.on_stream_event( - TextStreamStartEvent(step=self.step, stream_id=self.stream_id) + TextStreamStartEvent( + step=self.step, + stream_id=self.stream_id, + metadata=get_current_telemetry_metadata(), + ) ) return self @@ -96,7 +120,11 @@ async def __aexit__( """Emit TextStreamEndEvent when exiting context.""" if self.on_stream_event: await self.on_stream_event( - TextStreamEndEvent(step=self.step, stream_id=self.stream_id) + TextStreamEndEvent( + step=self.step, + stream_id=self.stream_id, + metadata=get_current_telemetry_metadata(), + ) ) return False @@ -113,6 +141,7 @@ async def delta(self, text: str) -> None: step=self.step, stream_id=self.stream_id, delta=text, + metadata=get_current_telemetry_metadata(), ) ) @@ -158,7 +187,9 @@ async def __aexit__( if self._started and self.on_stream_event: await self.on_stream_event( ReasoningStreamEndEvent( - step=self.step, stream_id=self.stream_id + step=self.step, + stream_id=self.stream_id, + metadata=get_current_telemetry_metadata(), ) ) return False @@ -173,11 +204,15 @@ async def delta(self, text: str) -> None: text: The incremental reasoning content to append to the stream """ if self.on_stream_event: + metadata = get_current_telemetry_metadata() + # Emit start event on first delta if not self._started: await self.on_stream_event( ReasoningStreamStartEvent( - step=self.step, stream_id=self.stream_id + step=self.step, + stream_id=self.stream_id, + metadata=metadata, ) ) self._started = True @@ -187,6 +222,7 @@ async def delta(self, text: str) -> None: step=self.step, stream_id=self.stream_id, delta=text, + metadata=metadata, ) ) @@ -218,7 +254,11 @@ def __init__( async def __aenter__(self) -> StepBoundaryContext: """Emit StepStartEvent when entering context.""" if self.on_stream_event: - await self.on_stream_event(StepStartEvent(step=self.step)) + await self.on_stream_event( + StepStartEvent( + step=self.step, metadata=get_current_telemetry_metadata() + ) + ) return self async def __aexit__( @@ -229,7 +269,11 @@ async def __aexit__( ) -> bool: """Emit StepEndEvent when exiting context.""" if self.on_stream_event: - await self.on_stream_event(StepEndEvent(step=self.step)) + await self.on_stream_event( + StepEndEvent( + step=self.step, metadata=get_current_telemetry_metadata() + ) + ) return False @@ -277,6 +321,7 @@ async def __aenter__(self) -> ToolExecutionContext: tool_call_id=self.tool_call_id, tool_name=self.tool_name, tool_input=self.tool_input, + metadata=get_current_telemetry_metadata(), ) ) return self @@ -299,6 +344,7 @@ async def __aexit__( step=self.step, tool_call_id=self.tool_call_id, error_message=str(exc_val), + metadata=get_current_telemetry_metadata(), ) ) self._completed = True @@ -319,6 +365,7 @@ async def complete(self, output: Any) -> None: step=self.step, tool_call_id=self.tool_call_id, tool_output=output, + metadata=get_current_telemetry_metadata(), ) ) self._completed = True @@ -338,6 +385,7 @@ async def error(self, error_message: str) -> None: step=self.step, tool_call_id=self.tool_call_id, error_message=error_message, + metadata=get_current_telemetry_metadata(), ) ) self._completed = True @@ -387,6 +435,18 @@ def __init__( self.step = step self.on_stream_event = on_stream_event + def _get_span_context(self) -> tuple[str | None, str | None]: + """ + Get current OpenTelemetry span context. 
+ + Returns: + Tuple of (span_id, trace_id) as hex strings, or (None, None) + + Deprecated: Use get_current_telemetry_metadata() instead. + """ + metadata = get_current_telemetry_metadata() + return metadata.get("span_id"), metadata.get("trace_id") + def text_stream(self, stream_id: str) -> TextStreamContext: """ Create a context manager for text streaming. @@ -459,7 +519,11 @@ async def status(self, message: str) -> None: """ if self.on_stream_event: await self.on_stream_event( - StatusEvent(step=self.step, message=message) + StatusEvent( + step=self.step, + message=message, + metadata=get_current_telemetry_metadata(), + ) ) async def error(self, error_message: str) -> None: @@ -471,5 +535,9 @@ async def error(self, error_message: str) -> None: """ if self.on_stream_event: await self.on_stream_event( - ErrorEvent(step=self.step, error_message=error_message) + ErrorEvent( + step=self.step, + error_message=error_message, + metadata=get_current_telemetry_metadata(), + ) ) diff --git a/qtype/interpreter/feedback_api.py b/qtype/interpreter/feedback_api.py new file mode 100644 index 00000000..85b496dd --- /dev/null +++ b/qtype/interpreter/feedback_api.py @@ -0,0 +1,185 @@ +from __future__ import annotations + +import logging +from typing import Annotated, Any, Literal, Union +from urllib.parse import urlparse + +from fastapi import FastAPI, HTTPException, status +from pydantic import BaseModel, Field + +from qtype.semantic.model import TelemetrySink + +logger = logging.getLogger(__name__) + + +def _format_feedback_label(feedback: FeedbackData) -> str: + """Format feedback data into a human-readable label.""" + if isinstance(feedback, ThumbsFeedbackData): + return "👍" if feedback.value else "👎" + elif isinstance(feedback, RatingFeedbackData): + return str(feedback.score) + elif isinstance(feedback, CategoryFeedbackData): + return ", ".join(feedback.categories) + return "unknown" + + +class ThumbsFeedbackData(BaseModel): + """Thumbs up/down feedback data.""" + + type: Literal["thumbs"] = "thumbs" + value: bool = Field( + ..., description="True for thumbs up, False for thumbs down." + ) + explanation: str | None = Field( + default=None, description="Optional text explanation for the feedback." + ) + + +class RatingFeedbackData(BaseModel): + """Numeric rating feedback data.""" + + type: Literal["rating"] = "rating" + score: int = Field(..., description="Numeric rating score (e.g., 1-5).") + explanation: str | None = Field( + default=None, description="Optional text explanation for the feedback." + ) + + +class CategoryFeedbackData(BaseModel): + """Category selection feedback data.""" + + type: Literal["category"] = "category" + categories: list[str] = Field( + ..., description="List of selected category labels." + ) + explanation: str | None = Field( + default=None, description="Optional text explanation for the feedback." + ) + + +FeedbackData = Annotated[ + Union[ThumbsFeedbackData, RatingFeedbackData, CategoryFeedbackData], + Field(discriminator="type"), +] + + +class FeedbackRequest(BaseModel): + """Request model for submitting user feedback on a flow output.""" + + span_id: str = Field(..., description="Span ID of the output being rated.") + trace_id: str = Field(..., description="Trace ID of the flow execution.") + feedback: FeedbackData = Field( + ..., description="Feedback data (type determined by discriminator)." 
+ ) + + +class FeedbackResponse(BaseModel): + """Response model for feedback submission.""" + + status: Literal["success"] = "success" + message: str = "Feedback submitted successfully" + + +def create_feedback_endpoint( + app: FastAPI, telemetry: TelemetrySink, secret_manager: Any +) -> None: + """ + Register the feedback submission endpoint with the FastAPI application. + + This creates a POST /feedback endpoint that accepts feedback submissions + and forwards them to the configured telemetry backend. + + Args: + app: FastAPI application instance. + telemetry: Telemetry sink configuration. + secret_manager: Secret manager for resolving secret references. + """ + # Create client based on provider + client = None + + if telemetry.provider == "Phoenix": + from phoenix.client import Client + + # Resolve endpoint in case it's a secret reference + args = {"base_url": telemetry.endpoint} + args = secret_manager.resolve_secrets_in_dict( + args, f"telemetry sink '{telemetry.id}' endpoint" + ) + + # Phoenix Client expects just the base URL (e.g., http://localhost:6006) + # Parse the URL and reconstruct with just scheme and netloc (host:port) + parsed = urlparse(args["base_url"]) + base_url = f"{parsed.scheme}://{parsed.netloc}" + + client = Client(base_url=base_url) + elif telemetry.provider == "Langfuse": + logger.warning( + "Langfuse feedback not yet implemented. " + "Feedback endpoint will not be created." + ) + return + else: + logger.warning( + f"Feedback endpoint not created: unsupported telemetry " + f"provider '{telemetry.provider}'." + ) + return + + @app.post( + "/feedback", + response_model=FeedbackResponse, + tags=["feedback"], + summary="Submit user feedback on flow outputs", + description=( + "Submit user feedback (thumbs, rating, or category) on a " + "specific flow output. Feedback is sent to the telemetry " + "backend as span annotations." + ), + ) + async def submit_feedback(request: FeedbackRequest) -> FeedbackResponse: + """ + Submit user feedback on a flow output. + + The feedback is recorded as a span annotation in the telemetry backend. 
+ """ + try: + if telemetry.provider == "Phoenix": + # Submit to Phoenix using span annotations API + label = _format_feedback_label(request.feedback) + explanation = getattr(request.feedback, "explanation", None) + + # Calculate score based on feedback type + score = None + if isinstance(request.feedback, ThumbsFeedbackData): + score = 1.0 if request.feedback.value else 0.0 + elif isinstance(request.feedback, RatingFeedbackData): + score = float(request.feedback.score) + + client.spans.add_span_annotation( + span_id=request.span_id, + annotation_name="user_feedback", + label=label, + score=score, + explanation=explanation, + annotator_kind="HUMAN", + ) + + logger.info( + f"Feedback submitted to Phoenix for span {request.span_id}: " + f"{request.feedback.type} = {label}" + ) + + elif telemetry.provider == "Langfuse": + # TODO: Implement Langfuse feedback submission + raise NotImplementedError( + "Langfuse feedback not yet implemented" + ) + + return FeedbackResponse() + + except Exception as e: + logger.error(f"Failed to submit feedback: {e}", exc_info=True) + raise HTTPException( + status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, + detail="Failed to submit feedback.", + ) from e diff --git a/qtype/interpreter/metadata_api.py b/qtype/interpreter/metadata_api.py index 3a52893a..e1f3c44a 100644 --- a/qtype/interpreter/metadata_api.py +++ b/qtype/interpreter/metadata_api.py @@ -5,6 +5,8 @@ from typing import Any from fastapi import FastAPI +from opentelemetry import trace +from opentelemetry.trace import NoOpTracerProvider from pydantic import BaseModel, Field from qtype.interpreter.typing import create_input_shape, create_output_shape @@ -43,6 +45,14 @@ class FlowMetadata(BaseModel): output_schema: dict[str, Any] = Field( ..., description="JSON schema for output" ) + feedback: dict[str, Any] | None = Field( + default=None, + description="Feedback configuration if enabled for this flow", + ) + telemetry_enabled: bool = Field( + default=False, + description="Whether telemetry is currently configured and recording", + ) def create_metadata_endpoints(app: FastAPI, application: Application) -> None: @@ -101,6 +111,15 @@ def _create_flow_metadata(flow: Flow) -> FlowMetadata: f"/flows/{flow.id}/stream" if flow.interface is not None else None ) + # Check if telemetry is enabled + provider = trace.get_tracer_provider() + telemetry_enabled = not isinstance(provider, NoOpTracerProvider) + + # Serialize feedback configuration if present + feedback_config = None + if flow.feedback: + feedback_config = flow.feedback.model_dump() + return FlowMetadata( id=flow.id, description=flow.description, @@ -112,4 +131,6 @@ def _create_flow_metadata(flow: Flow) -> FlowMetadata: ), input_schema=input_model.model_json_schema(), output_schema=output_model.model_json_schema(), + feedback=feedback_config, + telemetry_enabled=telemetry_enabled, ) diff --git a/qtype/interpreter/stream/chat/converter.py b/qtype/interpreter/stream/chat/converter.py index fced692e..a2d97beb 100644 --- a/qtype/interpreter/stream/chat/converter.py +++ b/qtype/interpreter/stream/chat/converter.py @@ -377,11 +377,22 @@ async def stream_events(): # Create converter for stateful event-to-chunk conversion converter = StreamEventConverter() + # Track telemetry metadata from events + telemetry_metadata: dict[str, str] = {} + # Process events and convert to chunks async for event in event_stream: if event is None: break # End of stream + # Extract telemetry metadata from first event that has it + if not telemetry_metadata and event.metadata: + if 
"span_id" in event.metadata and "trace_id" in event.metadata: + telemetry_metadata = { + "span_id": event.metadata["span_id"], + "trace_id": event.metadata["trace_id"], + } + # Convert event to chunks and yield as SSE for chunk in converter.convert(event): yield ( @@ -390,8 +401,15 @@ async def stream_events(): f"\n\n" ) - # End message stream with optional metadata - finish_chunk = FinishChunk(messageMetadata=output_metadata) # type: ignore[arg-type] + # Merge telemetry metadata with output_metadata for FinishChunk + final_metadata = {**telemetry_metadata} + if output_metadata: + final_metadata.update(output_metadata) + + # End message stream with metadata (includes telemetry) + finish_chunk = FinishChunk( + messageMetadata=final_metadata if final_metadata else None + ) yield ( f"data: " f"{finish_chunk.model_dump_json(by_alias=True, exclude_none=True)}" diff --git a/qtype/interpreter/types.py b/qtype/interpreter/types.py index d5790863..631e5e8a 100644 --- a/qtype/interpreter/types.py +++ b/qtype/interpreter/types.py @@ -38,7 +38,23 @@ def __bool__(self) -> bool: # and can be converted to Vercel UI chunks for frontend display -class TextStreamStartEvent(BaseModel): +class BaseStreamEvent(BaseModel): + """ + Base class for all stream events. + + Provides common metadata field for telemetry and other contextual data. + The metadata dict typically contains: + - span_id: OpenTelemetry span ID (16 hex chars) + - trace_id: OpenTelemetry trace ID (32 hex chars) + """ + + metadata: dict[str, Any] = Field( + default_factory=dict, + description="Metadata for telemetry and context tracking", + ) + + +class TextStreamStartEvent(BaseStreamEvent): """Signals the start of incremental text streaming. Use this when beginning to stream LLM-generated content or other @@ -55,7 +71,7 @@ class TextStreamStartEvent(BaseModel): ) -class TextStreamDeltaEvent(BaseModel): +class TextStreamDeltaEvent(BaseStreamEvent): """Carries an incremental chunk of text content. Use this for streaming LLM responses or other incremental text. @@ -72,7 +88,7 @@ class TextStreamDeltaEvent(BaseModel): delta: str = Field(description="Incremental text content to append") -class TextStreamEndEvent(BaseModel): +class TextStreamEndEvent(BaseStreamEvent): """Signals the completion of incremental text streaming. Use this to mark the end of a text stream. After this event, @@ -88,7 +104,7 @@ class TextStreamEndEvent(BaseModel): ) -class ReasoningStreamStartEvent(BaseModel): +class ReasoningStreamStartEvent(BaseStreamEvent): """Signals the start of incremental reasoning streaming. Use this when an agent begins outputting reasoning/thinking steps. @@ -105,7 +121,7 @@ class ReasoningStreamStartEvent(BaseModel): ) -class ReasoningStreamDeltaEvent(BaseModel): +class ReasoningStreamDeltaEvent(BaseStreamEvent): """Carries an incremental chunk of reasoning content. Use this for streaming agent reasoning/thinking steps. @@ -122,7 +138,7 @@ class ReasoningStreamDeltaEvent(BaseModel): delta: str = Field(description="Incremental reasoning content to append") -class ReasoningStreamEndEvent(BaseModel): +class ReasoningStreamEndEvent(BaseStreamEvent): """Signals the completion of incremental reasoning streaming. Use this to mark the end of a reasoning stream. After this event, @@ -138,7 +154,7 @@ class ReasoningStreamEndEvent(BaseModel): ) -class StatusEvent(BaseModel): +class StatusEvent(BaseStreamEvent): """Reports a complete status message from a step. 
Use this for non-streaming status updates like: @@ -155,7 +171,7 @@ class StatusEvent(BaseModel): message: str = Field(description="Complete status message to display") -class StepStartEvent(BaseModel): +class StepStartEvent(BaseStreamEvent): """Marks the beginning of a logical step boundary. Use this to group related events together visually in the UI. @@ -168,7 +184,7 @@ class StepStartEvent(BaseModel): step: Step -class StepEndEvent(BaseModel): +class StepEndEvent(BaseStreamEvent): """Marks the end of a logical step boundary. Use this to close a step boundary opened by StepStartEvent. @@ -180,7 +196,7 @@ class StepEndEvent(BaseModel): step: Step -class ToolExecutionStartEvent(BaseModel): +class ToolExecutionStartEvent(BaseStreamEvent): """Signals the start of tool execution. Use this when a tool is about to be invoked, either by an LLM @@ -198,7 +214,7 @@ class ToolExecutionStartEvent(BaseModel): ) -class ToolExecutionEndEvent(BaseModel): +class ToolExecutionEndEvent(BaseStreamEvent): """Signals the completion of tool execution. Use this when a tool has finished executing successfully. @@ -214,7 +230,7 @@ class ToolExecutionEndEvent(BaseModel): tool_output: Any = Field(description="Output returned by the tool") -class ToolExecutionErrorEvent(BaseModel): +class ToolExecutionErrorEvent(BaseStreamEvent): """Signals that tool execution failed. Use this when a tool encounters an error during execution. @@ -230,7 +246,7 @@ class ToolExecutionErrorEvent(BaseModel): error_message: str = Field(description="Description of the error") -class ErrorEvent(BaseModel): +class ErrorEvent(BaseStreamEvent): """Signals a general error occurred during step execution. Use this for errors that aren't specific to tool execution. @@ -330,6 +346,10 @@ class FlowMessage(BaseModel): description="Mapping of variable IDs to their values.", ) error: Optional[StepError] = None + metadata: Dict[str, Any] = Field( + default_factory=dict, + description="Metadata for telemetry, span IDs, and other system-level data.", + ) def is_failed(self) -> bool: """Checks if this state has encountered an error.""" diff --git a/qtype/interpreter/typing.py b/qtype/interpreter/typing.py index 61d95deb..37cb70fc 100644 --- a/qtype/interpreter/typing.py +++ b/qtype/interpreter/typing.py @@ -60,10 +60,19 @@ def _fields_from_variables(variables: list[Variable]) -> dict: def create_output_shape(flow: Flow) -> Type[BaseModel]: + fields = _fields_from_variables(flow.outputs) + # Add metadata field for telemetry (span_id, trace_id) + fields["metadata"] = ( + dict[str, Any] | None, + Field( + default=None, + description="Telemetry metadata including span_id and trace_id", + ), + ) return create_model( f"{flow.id}Result", __base__=BaseModel, - **_fields_from_variables(flow.outputs), + **fields, ) # type: ignore @@ -133,7 +142,11 @@ def flow_results_to_output_container( errors.append(m.error.model_dump()) else: output_instance = output_shape(**m.variables) - outputs.append(output_instance.model_dump()) + output_dict = output_instance.model_dump() + # Include metadata (span_id, trace_id) if present + if m.metadata: + output_dict["metadata"] = m.metadata + outputs.append(output_dict) return output_container(outputs=outputs, errors=errors) diff --git a/qtype/semantic/checker.py b/qtype/semantic/checker.py index e0a51d58..51604bf1 100644 --- a/qtype/semantic/checker.py +++ b/qtype/semantic/checker.py @@ -624,8 +624,24 @@ def _validate_application(application: Application) -> None: Raises: QTypeSemanticError: If SecretReference is used but 
secret_manager is not configured, or if secret_manager - configuration is invalid + configuration is invalid, or if feedback is configured + without telemetry """ + # Check if feedback is configured without telemetry + if application.telemetry is None: + flows_with_feedback = [ + flow.id for flow in application.flows if flow.feedback is not None + ] + if flows_with_feedback: + raise QTypeSemanticError( + ( + f"Application '{application.id}' has flows with feedback " + f"configured but no telemetry sink defined. " + f"Flows with feedback: {', '.join(flows_with_feedback)}. " + "Please add a telemetry configuration to the application." + ) + ) + if application.secret_manager is None: # Check if any SecretReference is used in the application if _has_secret_reference(application): diff --git a/qtype/semantic/model.py b/qtype/semantic/model.py index 4b79cdd6..476ce5b8 100644 --- a/qtype/semantic/model.py +++ b/qtype/semantic/model.py @@ -158,6 +158,15 @@ class AuthorizationProviderList(BaseModel): root: list[AuthorizationProvider] = Field(...) +class Feedback(BaseModel): + """Base class for user feedback configurations on flow outputs.""" + + type: str = Field(..., description="Type of feedback widget to display.") + explanation: bool = Field( + False, description="Whether to enable optional text explanation field." + ) + + class ConstantPath(BaseModel): """Semantic version of ConstantPath.""" @@ -216,6 +225,12 @@ class Flow(BaseModel): description="List of steps or references to steps", ) interface: FlowInterface | None = Field(None) + feedback: ThumbsFeedback | RatingFeedback | CategoryFeedback | None = ( + Field( + None, + description="Optional feedback configuration for collecting user ratings on flow outputs.", + ) + ) variables: list[Variable] = Field( default_factory=list, description="List of variables available at the application scope.", @@ -669,6 +684,31 @@ class Writer(Step, BatchableStepMixin): id: str = Field(..., description="Unique ID of the data writer.") +class CategoryFeedback(Feedback): + """Categorical feedback with predefined tags.""" + + type: Literal["category"] = Field("category") + categories: list[str] = Field( + ..., description="List of category labels users can select from." + ) + allow_multiple: bool = Field( + True, description="Whether users can select multiple categories." 
+ ) + + +class RatingFeedback(Feedback): + """Numerical rating feedback (1-5 or 1-10 scale).""" + + type: Literal["rating"] = Field("rating") + scale: int = Field(5, description="Maximum value for rating scale.") + + +class ThumbsFeedback(Feedback): + """Binary thumbs up/down feedback.""" + + type: Literal["thumbs"] = Field("thumbs") + + class DocumentIndex(Index): """Document search index for text-based search (e.g., Elasticsearch, OpenSearch).""" diff --git a/schema/qtype.schema.json b/schema/qtype.schema.json index c59cd85f..798570d8 100644 --- a/schema/qtype.schema.json +++ b/schema/qtype.schema.json @@ -930,6 +930,44 @@ "title": "CacheConfig", "type": "object" }, + "CategoryFeedback": { + "additionalProperties": false, + "description": "Categorical feedback with predefined tags.", + "properties": { + "type": { + "const": "category", + "default": "category", + "title": "Type", + "type": "string" + }, + "explanation": { + "default": false, + "description": "Whether to enable optional text explanation field.", + "title": "Explanation", + "type": "boolean" + }, + "categories": { + "description": "List of category labels users can select from.", + "items": { + "type": "string" + }, + "minItems": 1, + "title": "Categories", + "type": "array" + }, + "allow_multiple": { + "default": true, + "description": "Whether users can select multiple categories.", + "title": "Allow Multiple", + "type": "boolean" + } + }, + "required": [ + "categories" + ], + "title": "CategoryFeedback", + "type": "object" + }, "Collect": { "additionalProperties": false, "description": "A step that collects all inputs and creates a single list to return.", @@ -2370,6 +2408,37 @@ ], "default": null }, + "feedback": { + "anyOf": [ + { + "discriminator": { + "mapping": { + "category": "#/$defs/CategoryFeedback", + "rating": "#/$defs/RatingFeedback", + "thumbs": "#/$defs/ThumbsFeedback" + }, + "propertyName": "type" + }, + "oneOf": [ + { + "$ref": "#/$defs/ThumbsFeedback" + }, + { + "$ref": "#/$defs/RatingFeedback" + }, + { + "$ref": "#/$defs/CategoryFeedback" + } + ] + }, + { + "type": "null" + } + ], + "default": null, + "description": "Optional feedback configuration for collecting user ratings on flow outputs.", + "title": "Feedback" + }, "variables": { "description": "List of variables available at the application scope.", "items": { @@ -3295,6 +3364,32 @@ "title": "PythonFunctionTool", "type": "object" }, + "RatingFeedback": { + "additionalProperties": false, + "description": "Numerical rating feedback (1-5 or 1-10 scale).", + "properties": { + "type": { + "const": "rating", + "default": "rating", + "title": "Type", + "type": "string" + }, + "explanation": { + "default": false, + "description": "Whether to enable optional text explanation field.", + "title": "Explanation", + "type": "boolean" + }, + "scale": { + "default": 5, + "description": "Maximum value for rating scale.", + "title": "Scale", + "type": "integer" + } + }, + "title": "RatingFeedback", + "type": "object" + }, "Reference_AWSAuthProvider_": { "properties": { "$ref": { @@ -3659,6 +3754,26 @@ "title": "TextWidget", "type": "string" }, + "ThumbsFeedback": { + "additionalProperties": false, + "description": "Binary thumbs up/down feedback.", + "properties": { + "type": { + "const": "thumbs", + "default": "thumbs", + "title": "Type", + "type": "string" + }, + "explanation": { + "default": false, + "description": "Whether to enable optional text explanation field.", + "title": "Explanation", + "type": "boolean" + } + }, + "title": "ThumbsFeedback", + "type": 
"object" + }, "ToolList": { "description": "Schema for a standalone list of tools.", "items": { diff --git a/tests/interpreter/test_step_executor.py b/tests/interpreter/test_step_executor.py index 13190203..10b56718 100644 --- a/tests/interpreter/test_step_executor.py +++ b/tests/interpreter/test_step_executor.py @@ -7,6 +7,7 @@ import pytest from opentelemetry import trace +from opentelemetry.sdk.trace import TracerProvider from qtype.base.types import ConcurrencyConfig from qtype.interpreter.base.base_step_executor import StepExecutor @@ -388,6 +389,53 @@ async def test_finalize_hook(self, simple_step, session, executor_context): assert results[-1].variables.get("finalized") == "true" # Note: Progress count timing depends on stream implementation details + async def test_span_metadata_enrichment(self, simple_step, session): + """Test that span_id and trace_id are added to message metadata.""" + # Set up a real TracerProvider that records spans + tracer_provider = TracerProvider() + tracer = tracer_provider.get_tracer(__name__) + + # Create context with recording tracer + context = ExecutorContext( + secret_manager=NoOpSecretManager(), + tracer=tracer, + ) + + executor = MockExecutor( + simple_step, + context, + suffix="_processed", + ) + results = await collect_stream(executor, ["msg1", "msg2"], session) + + assert len(results) == 2 + + # Each message should have span_id and trace_id in metadata + for result in results: + assert "span_id" in result.metadata + assert "trace_id" in result.metadata + + # Verify they are valid hex strings + span_id = result.metadata["span_id"] + trace_id = result.metadata["trace_id"] + + # span_id should be 16 hex chars (64-bit) + assert len(span_id) == 16 + assert all(c in "0123456789abcdef" for c in span_id) + + # trace_id should be 32 hex chars (128-bit) + assert len(trace_id) == 32 + assert all(c in "0123456789abcdef" for c in trace_id) + + # Each message should have a unique process_message span_id + # (this allows per-message feedback instead of per-step) + span_ids = [r.metadata["span_id"] for r in results] + assert len(set(span_ids)) == len(results) + + # Trace ID should be the same for all messages in the same execution + trace_ids = [r.metadata["trace_id"] for r in results] + assert len(set(trace_ids)) == 1 + async def test_dependencies_injection(self, simple_step, executor_context): """Test that dependencies are injected and accessible.""" test_dep = {"key": "value"} diff --git a/tests/semantic/checker-error-specs/invalid_feedback_without_telemetry.qtype.yaml b/tests/semantic/checker-error-specs/invalid_feedback_without_telemetry.qtype.yaml new file mode 100644 index 00000000..d1dd5a60 --- /dev/null +++ b/tests/semantic/checker-error-specs/invalid_feedback_without_telemetry.qtype.yaml @@ -0,0 +1,27 @@ +id: test_feedback_without_telemetry +description: Test that feedback requires telemetry to be configured + +flows: + - id: chat + description: Flow with feedback but no telemetry (should fail validation) + interface: + type: Conversational + feedback: + type: thumbs + explanation: false + variables: + - id: msg + type: ChatMessage + steps: + - type: Echo + id: echo + inputs: + - msg + outputs: + - msg + inputs: + - msg + outputs: + - msg + +# Note: No telemetry configured - this should cause validation error diff --git a/tests/semantic/test_checker_validation.py b/tests/semantic/test_checker_validation.py index de3dace6..026d417e 100644 --- a/tests/semantic/test_checker_validation.py +++ b/tests/semantic/test_checker_validation.py @@ -105,6 +105,10 
@@ "invalid_secret_manager_wrong_auth_type.qtype.yaml", "AWSSecretManager 'my_secret_manager' requires an AWSAuthProvider", ), + ( + "invalid_feedback_without_telemetry.qtype.yaml", + "has flows with feedback configured but no telemetry sink defined", + ), ( "invalid_complete_flow_no_text_output.qtype.yaml", "final step 'echo_step' is of type 'Echo' which does not support streaming", diff --git a/tests/semantic/test_feedback_validation.py b/tests/semantic/test_feedback_validation.py new file mode 100644 index 00000000..ce1f0eae --- /dev/null +++ b/tests/semantic/test_feedback_validation.py @@ -0,0 +1,101 @@ +"""Tests for semantic validation of feedback configurations.""" + +from __future__ import annotations + +from qtype.semantic import loader + + +class TestFeedbackSemanticValidation: + """Test semantic validation rules for feedback.""" + + def test_thumbs_feedback_loads_correctly(self, tmp_path): + """Test that thumbs feedback configuration loads and validates.""" + yaml_content = """ +id: test_app +flows: + - id: test_flow + feedback: + type: thumbs + explanation: true + steps: + - type: Echo + id: echo1 +""" + yaml_file = tmp_path / "test.yaml" + yaml_file.write_text(yaml_content) + + app, _ = loader.load(str(yaml_file)) + flow = app.flows[0] + assert flow.feedback is not None + assert flow.feedback.type == "thumbs" + assert flow.feedback.explanation is True + + def test_rating_feedback_loads_correctly(self, tmp_path): + """Test that rating feedback configuration loads and validates.""" + yaml_content = """ +id: test_app +flows: + - id: test_flow + feedback: + type: rating + scale: 10 + explanation: false + steps: + - type: Echo + id: echo1 +""" + yaml_file = tmp_path / "test.yaml" + yaml_file.write_text(yaml_content) + + app, _ = loader.load(str(yaml_file)) + flow = app.flows[0] + assert flow.feedback is not None + assert flow.feedback.type == "rating" + assert flow.feedback.scale == 10 + assert flow.feedback.explanation is False + + def test_category_feedback_loads_correctly(self, tmp_path): + """Test that category feedback configuration loads and validates.""" + yaml_content = """ +id: test_app +flows: + - id: test_flow + feedback: + type: category + categories: + - accurate + - helpful + - creative + allow_multiple: true + explanation: true + steps: + - type: Echo + id: echo1 +""" + yaml_file = tmp_path / "test.yaml" + yaml_file.write_text(yaml_content) + + app, _ = loader.load(str(yaml_file)) + flow = app.flows[0] + assert flow.feedback is not None + assert flow.feedback.type == "category" + assert flow.feedback.categories == ["accurate", "helpful", "creative"] + assert flow.feedback.allow_multiple is True + assert flow.feedback.explanation is True + + def test_flow_without_feedback(self, tmp_path): + """Test that flows work without feedback configuration.""" + yaml_content = """ +id: test_app +flows: + - id: test_flow + steps: + - type: Echo + id: echo1 +""" + yaml_file = tmp_path / "test.yaml" + yaml_file.write_text(yaml_content) + + app, _ = loader.load(str(yaml_file)) + flow = app.flows[0] + assert flow.feedback is None diff --git a/ui/components/FlowResponseCard.tsx b/ui/components/FlowResponseCard.tsx index a469e136..8f8e4121 100644 --- a/ui/components/FlowResponseCard.tsx +++ b/ui/components/FlowResponseCard.tsx @@ -6,6 +6,7 @@ "use client"; +import { FeedbackButton } from "@/components/feedback"; import { Alert, AlertDescription } from "@/components/ui/Alert"; import { MarkdownContainer } from "./MarkdownContainer"; @@ -21,6 +22,7 @@ import { } from "./outputs"; import 
type { SchemaProperty, ResponseData } from "@/types"; +import type { FeedbackConfig } from "@/types/FlowMetadata"; interface ResponsePropertyProps { name: string; @@ -129,11 +131,15 @@ function ResponseProperty({ name, property, value }: ResponsePropertyProps) { interface FlowResponseCardProps { responseSchema?: SchemaProperty | null; responseData?: ResponseData; + feedbackConfig?: FeedbackConfig | null; + telemetryEnabled?: boolean; } export default function FlowResponseCard({ responseSchema, responseData, + feedbackConfig, + telemetryEnabled = false, }: FlowResponseCardProps) { if (!responseData) { return ( @@ -158,11 +164,36 @@ export default function FlowResponseCard({ ? (responseData as Record).outputs || responseData : responseData || {}; + // Extract metadata (span_id, trace_id) from response + const metadata = + responseData && typeof responseData === "object" + ? (responseData as Record).metadata + : null; + + const spanId = + metadata && typeof metadata === "object" + ? (metadata as Record).span_id + : null; + + const traceId = + metadata && typeof metadata === "object" + ? (metadata as Record).trace_id + : null; + + const showFeedback = + feedbackConfig && + telemetryEnabled && + spanId && + traceId && + typeof spanId === "string" && + typeof traceId === "string"; + return (
{responseSchema.properties && - Object.entries(responseSchema.properties).map( - ([propertyName, propertySchema]) => { + Object.entries(responseSchema.properties) + .filter(([propertyName]) => propertyName !== "metadata") + .map(([propertyName, propertySchema]) => { const value = (outputsData as Record)[ propertyName ]; @@ -179,8 +210,18 @@ export default function FlowResponseCard({ value={value} /> ); - }, - )} + })} + + {showFeedback && ( +
+ +
+ )}
); } diff --git a/ui/components/FlowResponseTable.tsx b/ui/components/FlowResponseTable.tsx index e9df5b0a..089924cb 100644 --- a/ui/components/FlowResponseTable.tsx +++ b/ui/components/FlowResponseTable.tsx @@ -19,14 +19,18 @@ import { Download } from "lucide-react"; import Papa from "papaparse"; import { useMemo, useState } from "react"; +import { FeedbackButton } from "@/components/feedback"; import { Button } from "@/components/ui/Button"; import { Input } from "@/components/ui/Input"; import type { SchemaProperty, ResponseData } from "@/types"; +import type { FeedbackConfig } from "@/types/FlowMetadata"; interface FlowResponseTableProps { responseSchema?: SchemaProperty | null; outputs: ResponseData[]; + feedbackConfig?: FeedbackConfig | null; + telemetryEnabled?: boolean; } function formatCellValue(value: ResponseData, qtypeType?: string): string { @@ -61,6 +65,8 @@ function formatCellValue(value: ResponseData, qtypeType?: string): string { export default function FlowResponseTable({ responseSchema, outputs, + feedbackConfig, + telemetryEnabled = false, }: FlowResponseTableProps) { const [searchText, setSearchText] = useState(""); const [sorting, setSorting] = useState([]); @@ -78,18 +84,50 @@ export default function FlowResponseTable({ const columns = useMemo>[]>(() => { if (!responseSchema?.properties) return []; - return Object.entries(responseSchema.properties).map(([key, schema]) => { - const prop = schema as SchemaProperty; - return { - accessorKey: key, - header: prop.title || key, + const dataColumns = Object.entries(responseSchema.properties) + .filter(([key]) => key !== "metadata") + .map(([key, schema]) => { + const prop = schema as SchemaProperty; + return { + accessorKey: key, + header: prop.title || key, + cell: ({ row }) => { + const value = row.original[key]; + return formatCellValue(value, prop.qtype_type); + }, + }; + }); + + // Add feedback column if enabled + if (feedbackConfig && telemetryEnabled) { + dataColumns.push({ + id: "feedback", + header: "Feedback", cell: ({ row }) => { - const value = row.original[key]; - return formatCellValue(value, prop.qtype_type); + const metadata = row.original.metadata as + | Record + | undefined; + const spanId = metadata?.span_id as string | undefined; + const traceId = metadata?.trace_id as string | undefined; + + if (!spanId || !traceId) { + return null; + } + + return ( + + ); }, - }; - }); - }, [responseSchema]); + }); + } + + return dataColumns; + }, [responseSchema, feedbackConfig, telemetryEnabled]); const table = useReactTable({ data, diff --git a/ui/components/chat/MessageBubble.tsx b/ui/components/chat/MessageBubble.tsx index f1fbe8db..501a4a84 100644 --- a/ui/components/chat/MessageBubble.tsx +++ b/ui/components/chat/MessageBubble.tsx @@ -1,5 +1,6 @@ import { Bot, User } from "lucide-react"; +import { FeedbackButton } from "@/components/feedback"; import { Avatar, AvatarFallback } from "@/components/ui/Avatar"; import { MarkdownContainer } from "../MarkdownContainer"; @@ -13,10 +14,13 @@ import { FileDisplay } from "."; import type { Message } from "./types"; import type { MessagePartWithText } from "./types/MessagePart"; import type { FileAttachment } from "@/types"; +import type { FeedbackConfig } from "@/types/FlowMetadata"; interface MessageBubbleProps { message: Message; isStreaming?: boolean; + feedbackConfig?: FeedbackConfig | null; + telemetryEnabled?: boolean; } interface StreamingPart { @@ -24,7 +28,12 @@ interface StreamingPart { [key: string]: unknown; } -function MessageBubble({ message, isStreaming = 
false }: MessageBubbleProps) { +function MessageBubble({ + message, + isStreaming = false, + feedbackConfig, + telemetryEnabled = false, +}: MessageBubbleProps) { const isUser = message.role === "user"; const reasoningContent = getPartContent( @@ -50,6 +59,18 @@ function MessageBubble({ message, isStreaming = false }: MessageBubbleProps) { isStreaming, ); + // Extract span_id and trace_id from metadata for feedback + const spanId = message.metadata?.span_id as string | undefined; + const traceId = message.metadata?.trace_id as string | undefined; + + const showFeedback = + !isUser && + !isStreaming && + feedbackConfig && + telemetryEnabled && + spanId && + traceId; + return (
))} + + {showFeedback && ( +
+ +
+ )}
{isUser && ( diff --git a/ui/components/feedback/CategoryFeedback.tsx b/ui/components/feedback/CategoryFeedback.tsx new file mode 100644 index 00000000..554890b0 --- /dev/null +++ b/ui/components/feedback/CategoryFeedback.tsx @@ -0,0 +1,78 @@ +/** + * CategoryFeedback Component + * + * Categorical feedback with predefined tags (single or multi-select) + */ + +"use client"; + +import { Check } from "lucide-react"; +import { useState } from "react"; + +import { Button } from "@/components/ui/Button"; + +interface CategoryFeedbackProps { + categories: string[]; + allowMultiple: boolean; + onFeedback: (feedback: { type: "category"; categories: string[] }) => void; +} + +export function CategoryFeedback({ + categories, + allowMultiple, + onFeedback, +}: CategoryFeedbackProps) { + const [selectedCategories, setSelectedCategories] = useState>( + new Set(), + ); + + const handleCategoryClick = (category: string) => { + if (allowMultiple) { + // Multi-select mode + const newSelected = new Set(selectedCategories); + if (newSelected.has(category)) { + newSelected.delete(category); + } else { + newSelected.add(category); + } + setSelectedCategories(newSelected); + } else { + // Single-select mode - submit immediately + onFeedback({ type: "category", categories: [category] }); + } + }; + + const handleSubmit = () => { + if (selectedCategories.size > 0) { + onFeedback({ + type: "category", + categories: Array.from(selectedCategories), + }); + } + }; + + return ( +
+ {categories.map((category) => { + const isSelected = selectedCategories.has(category); + return ( + + ); + })} + {allowMultiple && selectedCategories.size > 0 && ( + + )} +
+ ); +} diff --git a/ui/components/feedback/FeedbackButton.tsx b/ui/components/feedback/FeedbackButton.tsx new file mode 100644 index 00000000..91d0e0ca --- /dev/null +++ b/ui/components/feedback/FeedbackButton.tsx @@ -0,0 +1,173 @@ +/** + * FeedbackButton Component + * + * Displays feedback UI based on flow configuration and handles submission to Phoenix + */ + +"use client"; + +import { Check, Loader2 } from "lucide-react"; +import { useState } from "react"; + +import { apiClient } from "@/lib/apiClient"; + +import { CategoryFeedback } from "./CategoryFeedback"; +import { FeedbackExplanationModal } from "./FeedbackExplanationModal"; +import { RatingFeedback } from "./RatingFeedback"; +import { ThumbsFeedback } from "./ThumbsFeedback"; + +import type { FeedbackConfig } from "@/types/FlowMetadata"; + +interface FeedbackButtonProps { + feedbackConfig: FeedbackConfig; + spanId: string; + traceId: string; + telemetryEnabled: boolean; +} + +export function FeedbackButton({ + feedbackConfig, + spanId, + traceId, + telemetryEnabled, +}: FeedbackButtonProps) { + const [submitted, setSubmitted] = useState(false); + const [isSubmitting, setIsSubmitting] = useState(false); + const [error, setError] = useState(null); + const [showExplanation, setShowExplanation] = useState(false); + const [pendingFeedback, setPendingFeedback] = useState<{ + type: "thumbs" | "rating" | "category"; + value?: boolean; + score?: number; + categories?: string[]; + } | null>(null); + + if (!telemetryEnabled) { + return null; // Don't show feedback if telemetry is not enabled + } + + if (submitted) { + return ( +
+ + Feedback submitted +
+ ); + } + + if (isSubmitting) { + return ( +
+ + Submitting... +
+ ); + } + + const handleFeedbackSubmit = async ( + feedback: { + type: "thumbs" | "rating" | "category"; + value?: boolean; + score?: number; + categories?: string[]; + }, + explanation?: string, + ) => { + setIsSubmitting(true); + setError(null); + + try { + // Construct feedback data based on type + let feedbackData: + | { type: "thumbs"; value: boolean; explanation?: string } + | { type: "rating"; score: number; explanation?: string } + | { type: "category"; categories: string[]; explanation?: string }; + + if (feedback.type === "thumbs" && feedback.value !== undefined) { + feedbackData = { type: "thumbs", value: feedback.value, explanation }; + } else if (feedback.type === "rating" && feedback.score !== undefined) { + feedbackData = { type: "rating", score: feedback.score, explanation }; + } else if (feedback.type === "category" && feedback.categories) { + feedbackData = { + type: "category", + categories: feedback.categories, + explanation, + }; + } else { + throw new Error("Invalid feedback data"); + } + + await apiClient.submitFeedback({ + span_id: spanId, + trace_id: traceId, + feedback: feedbackData, + }); + + setSubmitted(true); + setPendingFeedback(null); + setShowExplanation(false); + } catch (err) { + setError( + err instanceof Error ? err.message : "Failed to submit feedback", + ); + setPendingFeedback(null); + setShowExplanation(false); + } finally { + setIsSubmitting(false); + } + }; + + const handleFeedbackClick = (feedback: { + type: "thumbs" | "rating" | "category"; + value?: boolean; + score?: number; + categories?: string[]; + }) => { + // If explanation is enabled, show modal first + if (feedbackConfig.explanation) { + setPendingFeedback(feedback); + setShowExplanation(true); + } else { + // Submit directly without explanation + handleFeedbackSubmit(feedback); + } + }; + + return ( +
+
+ {feedbackConfig.type === "thumbs" && ( + + )} + {feedbackConfig.type === "rating" && ( + + )} + {feedbackConfig.type === "category" && ( + + )} +
+ + {error &&
{error}
} + + {showExplanation && pendingFeedback && ( + { + setShowExplanation(false); + setPendingFeedback(null); + }} + onSubmit={(explanation) => { + handleFeedbackSubmit(pendingFeedback, explanation); + }} + /> + )} +
+ ); +} diff --git a/ui/components/feedback/FeedbackExplanationModal.tsx b/ui/components/feedback/FeedbackExplanationModal.tsx new file mode 100644 index 00000000..69fffa91 --- /dev/null +++ b/ui/components/feedback/FeedbackExplanationModal.tsx @@ -0,0 +1,72 @@ +/** + * FeedbackExplanationModal Component + * + * Optional modal for adding text explanation to feedback + */ + +"use client"; + +import { X } from "lucide-react"; +import { useState } from "react"; + +import { Button } from "@/components/ui/Button"; +import { Card } from "@/components/ui/Card"; + +interface FeedbackExplanationModalProps { + isOpen: boolean; + onClose: () => void; + onSubmit: (explanation?: string) => void; +} + +export function FeedbackExplanationModal({ + isOpen, + onClose, + onSubmit, +}: FeedbackExplanationModalProps) { + const [explanation, setExplanation] = useState(""); + + if (!isOpen) return null; + + const handleSubmit = () => { + onSubmit(explanation.trim() || undefined); + }; + + const handleSkip = () => { + onSubmit(undefined); + }; + + return ( +
+ +
+

Add Explanation (Optional)

+ +
+ +
+
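
Reviewer note: a quick way to sanity-check the new feedback flow end to end is to POST directly to the /feedback endpoint once a server with telemetry is running. The sketch below is illustrative only, not part of the patch: the payload shape follows FeedbackRequest and ThumbsFeedbackData from qtype/interpreter/feedback_api.py, but the base URL/port and the span/trace IDs are assumptions (real IDs come from the "metadata" block attached to a flow response).

    # Hedged sketch: exercise POST /feedback against a locally running server.
    # Assumes the API is served at http://localhost:8000; adjust as needed.
    import requests

    response = requests.post(
        "http://localhost:8000/feedback",
        json={
            # span_id (16 hex chars) and trace_id (32 hex chars) are taken from
            # the metadata of a flow output; these values are placeholders.
            "span_id": "0123456789abcdef",
            "trace_id": "0123456789abcdef0123456789abcdef",
            "feedback": {
                "type": "thumbs",
                "value": True,
                "explanation": "Helpful answer.",
            },
        },
        timeout=10,
    )
    response.raise_for_status()
    # Expected: {"status": "success", "message": "Feedback submitted successfully"}
    print(response.json())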