From a34fd6646bb99d22bf54e953aa8d134fc2bbe707 Mon Sep 17 00:00:00 2001
From: ananya roy <ananya.roy@example.com>
Date: Fri, 1 May 2026 08:36:50 +1000
Subject: [PATCH] Add SEO-optimized Responsible AI page

Adds a new /responsible-ai landing page covering AI safety evaluation,
guardrails, governance, and bias detection with MLflow. Includes 12 FAQs,
3 code examples, Schema.org structured data, and cross-links to related
SEO pages.

Co-authored-by: Isaac
---
 website/src/pages/responsible-ai.tsx | 1180 ++++++++++++++++++++++++++
 1 file changed, 1180 insertions(+)
 create mode 100644 website/src/pages/responsible-ai.tsx
diff --git a/website/src/pages/responsible-ai.tsx b/website/src/pages/responsible-ai.tsx
new file mode 100644
index 0000000000..b84fbd8b9b
--- /dev/null
+++ b/website/src/pages/responsible-ai.tsx
@@ -0,0 +1,1180 @@
+import { useState } from "react";
+import Head from "@docusaurus/Head";
+import Link from "@docusaurus/Link";
+import { Highlight } from "prism-react-renderer";
+import { Header } from "../components/Header/Header";
+import { SocialLinksFooter } from "../components/SocialLinksFooter/SocialLinksFooter";
+import { ArticleSidebar } from "../components/ArticleSidebar/ArticleSidebar";
+import { MLFLOW_GENAI_DOCS_URL } from "@site/src/constants";
+import { CopyButton } from "../components/CodeSnippet/CopyButton";
+import { customNightOwl, CODE_BG } from "../components/CodeSnippet/codeTheme";
+
+const SEO_TITLE =
+  "Responsible AI: Safety, Guardrails & Governance | MLflow AI Platform";
+const SEO_DESCRIPTION =
+  "Responsible AI ensures AI systems are safe, fair, transparent, and accountable. Evaluate safety, enforce guardrails, and govern AI agents with MLflow's open-source platform.";
+
+const faqs: {
+  question: string;
+  answer: React.ReactNode;
+  answerText?: string;
+}[] = [
+  {
+    question: "What is responsible AI?",
+    answer:
+      "Responsible AI is a set of principles and practices for building AI systems that are safe, fair, transparent, accountable, and privacy-preserving. For production agents and LLM applications, responsible AI means systematically evaluating safety, enforcing guardrails on inputs and outputs, maintaining complete audit trails through tracing, and enabling human oversight throughout the AI lifecycle. It's not a single tool but a comprehensive approach spanning development, deployment, and production operations.",
+  },
+  {
+    question: "Why does responsible AI matter for LLM applications and agents?",
+    answer:
+      "LLMs and autonomous agents introduce risks that traditional software testing cannot catch: hallucinations that present false information as fact, harmful or toxic content generation, PII exposure in inputs and outputs, prompt injection attacks that bypass safety controls, and uncontrolled agent behavior like infinite loops or unauthorized tool use. These failures have real consequences — legal liability, regulatory penalties, user harm, and brand damage. Responsible AI practices provide systematic safeguards through evaluation, guardrails, monitoring, and governance.",
+  },
+  {
+    question: "What are the key pillars of a responsible AI framework?",
+    answer: (
+      <>
+        A comprehensive responsible AI framework rests on five pillars: (1){" "}
+        <strong>Safety</strong> — preventing harmful, toxic, or dangerous
+        outputs through{" "}
+        <Link href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/scorers/"}>
+          evaluation
+        </Link>{" "}
+        and runtime guardrails. (2) <strong>Fairness</strong> — detecting and
+        mitigating bias across demographic groups. (3){" "}
+        <strong>Transparency</strong> — making AI decision-making explainable
+        through <Link href={MLFLOW_GENAI_DOCS_URL + "tracing/"}>tracing</Link>{" "}
+        and observability. (4) <strong>Accountability</strong> — maintaining
+        audit trails and governance controls. (5) <strong>Privacy</strong> —
+        protecting personally identifiable information and controlling data
+        access. MLflow addresses all five through its integrated platform.
+      </>
+    ),
+    answerText:
+      "A comprehensive responsible AI framework rests on five pillars: (1) Safety — preventing harmful, toxic, or dangerous outputs through evaluation and runtime guardrails. (2) Fairness — detecting and mitigating bias across demographic groups. (3) Transparency — making AI decision-making explainable through tracing and observability. (4) Accountability — maintaining audit trails and governance controls. (5) Privacy — protecting personally identifiable information and controlling data access. MLflow addresses all five through its integrated platform.",
+  },
+  {
+    question: "What is AI safety evaluation?",
+    answer: (
+      <>
+        AI safety evaluation systematically tests AI outputs for harmful
+        content, policy violations, and unsafe behavior. Unlike traditional
+        testing that checks for deterministic outputs, safety evaluation uses
+        LLM judges to assess whether responses contain toxicity, violence,
+        misinformation, or other harmful content.{" "}
+        <Link href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/scorers/"}>
+          MLflow provides built-in Safety and ConversationalSafety scorers
+        </Link>{" "}
+        for detecting harmful content in single-turn and multi-turn
+        interactions, plus APIs to create custom judges for domain-specific
+        safety policies.
+      </>
+    ),
+    answerText:
+      "AI safety evaluation systematically tests AI outputs for harmful content, policy violations, and unsafe behavior. Unlike traditional testing that checks for deterministic outputs, safety evaluation uses LLM judges to assess whether responses contain toxicity, violence, misinformation, or other harmful content. MLflow provides built-in Safety and ConversationalSafety scorers for detecting harmful content in single-turn and multi-turn interactions, plus APIs to create custom judges for domain-specific safety policies.",
+  },
+  {
+    question: "What are AI guardrails?",
+    answer: (
+      <>
+        AI guardrails are runtime controls that filter or modify AI inputs and
+        outputs in real time, acting as a safety net between your AI system and
+        end users. <Link href="/ai-gateway">MLflow's AI Gateway</Link> provides
+        input guardrails (blocking prompt injection attempts, filtering harmful
+        requests) and output guardrails (PII redaction, toxicity detection,
+        content policy enforcement). Guardrails complement evaluation:
+        evaluation catches issues during development and testing, while
+        guardrails prevent harmful content from reaching users in production.
+      </>
+    ),
+    answerText:
+      "AI guardrails are runtime controls that filter or modify AI inputs and outputs in real time, acting as a safety net between your AI system and end users. MLflow's AI Gateway provides input guardrails (blocking prompt injection attempts, filtering harmful requests) and output guardrails (PII redaction, toxicity detection, content policy enforcement). Guardrails complement evaluation: evaluation catches issues during development and testing, while guardrails prevent harmful content from reaching users in production.",
+  },
+  {
+    question: "How do I evaluate AI safety with MLflow?",
+    answer: (
+      <>
+        Use{" "}
+        <Link href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/"}>
+          <code>mlflow.genai.evaluate()</code>
+        </Link>{" "}
+        with built-in scorers: <code>Safety()</code> checks single-turn
+        responses for harmful content, and <code>ConversationalSafety()</code>{" "}
+        assesses multi-turn conversations for escalating risks. For
+        organization-specific policies, create custom judges with{" "}
+        <code>make_judge()</code> that evaluate responses against your specific
+        compliance requirements. Results are tracked in the MLflow UI, where you
+        can view pass rates, drill into failures, and compare safety metrics
+        across versions.
+      </>
+    ),
+    answerText:
+      "Use mlflow.genai.evaluate() with built-in scorers: Safety() checks single-turn responses for harmful content, and ConversationalSafety() assesses multi-turn conversations for escalating risks. For organization-specific policies, create custom judges with make_judge() that evaluate responses against your specific compliance requirements. Results are tracked in the MLflow UI, where you can view pass rates, drill into failures, and compare safety metrics across versions.",
+  },
+  {
+    question: "What is guideline adherence evaluation?",
+    answer: (
+      <>
+        Guideline adherence evaluation uses custom LLM judges to verify that AI
+        outputs comply with specific business rules, ethical guidelines, or
+        regulatory requirements. Instead of generic safety checks, you define
+        natural-language rules (e.g., "never provide medical diagnoses," "always
+        include financial disclaimers") and{" "}
+        <Link
+          href={
+            MLFLOW_GENAI_DOCS_URL +
+            "eval-monitor/scorers/llm-judge/custom-judges/"
+          }
+        >
+          MLflow's custom judges
+        </Link>{" "}
+        automatically score every response against those rules. This enables
+        organizations to enforce compliance at scale without manual review of
+        every output.
+      </>
+    ),
+    answerText:
+      "Guideline adherence evaluation uses custom LLM judges to verify that AI outputs comply with specific business rules, ethical guidelines, or regulatory requirements. Instead of generic safety checks, you define natural-language rules (e.g., 'never provide medical diagnoses,' 'always include financial disclaimers') and MLflow's custom judges automatically score every response against those rules. This enables organizations to enforce compliance at scale without manual review of every output.",
+  },
+  {
+    question: "How does AI observability support responsible AI?",
+    answer: (
+      <>
+        <Link href="/ai-observability">AI observability</Link> is the foundation
+        of responsible AI transparency.{" "}
+        <Link href={MLFLOW_GENAI_DOCS_URL + "tracing/"}>MLflow tracing</Link>{" "}
+        captures the complete execution context of every AI interaction: which
+        LLM was called, what prompts were sent, which tools were used, and how
+        agents reasoned through decisions. This creates an auditable record that
+        supports incident investigation, compliance reporting, bias auditing,
+        and root cause analysis when issues are detected.
+      </>
+    ),
+    answerText:
+      "AI observability is the foundation of responsible AI transparency. MLflow tracing captures the complete execution context of every AI interaction: which LLM was called, what prompts were sent, which tools were used, and how agents reasoned through decisions. This creates an auditable record that supports incident investigation, compliance reporting, bias auditing, and root cause analysis when issues are detected.",
+  },
+  {
+    question: "How do I implement AI governance with MLflow?",
+    answer: (
+      <>
+        <Link href="/ai-gateway">MLflow's AI Gateway</Link> centralizes AI
+        governance: credential management prevents LLM API key sprawl, rate
+        limiting controls costs and prevents abuse, content guardrails enforce
+        safety policies at the gateway level, and access controls determine who
+        can use which models. Combined with{" "}
+        <Link href={MLFLOW_GENAI_DOCS_URL + "tracing/"}>tracing</Link> for
+        auditability and{" "}
+        <Link href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/"}>evaluation</Link>{" "}
+        for quality assurance, organizations get end-to-end governance across
+        their entire AI stack.
+      </>
+    ),
+    answerText:
+      "MLflow's AI Gateway centralizes AI governance: credential management prevents LLM API key sprawl, rate limiting controls costs and prevents abuse, content guardrails enforce safety policies at the gateway level, and access controls determine who can use which models. Combined with tracing for auditability and evaluation for quality assurance, organizations get end-to-end governance across their entire AI stack.",
+  },
+  {
+    question: "What is red-teaming for AI systems?",
+    answer:
+      "Red-teaming tests AI systems against adversarial inputs to discover safety vulnerabilities before deployment. Teams create adversarial evaluation datasets containing edge cases, harmful prompts, prompt injection attempts, and boundary-pushing scenarios. These are run through MLflow evaluations with safety scorers to measure how well the system resists adversarial attacks. Results identify where additional guardrails, prompt improvements, or model fine-tuning are needed to harden the system before production exposure.",
+  },
+  {
+    question: "How do I monitor responsible AI metrics in production?",
+    answer: (
+      <>
+        <Link href="/ai-monitoring">MLflow's monitoring capabilities</Link>{" "}
+        continuously score production traces with safety judges, detecting
+        quality degradation and policy violations in real time. Configure
+        sampling to evaluate a representative subset of production traffic, set
+        alert thresholds for safety pass rates, and route flagged interactions
+        to human reviewers. This creates a continuous feedback loop: production
+        failures become evaluation test cases, which drive improvements that are
+        validated before redeployment.
+      </>
+    ),
+    answerText:
+      "MLflow's monitoring capabilities continuously score production traces with safety judges, detecting quality degradation and policy violations in real time. Configure sampling to evaluate a representative subset of production traffic, set alert thresholds for safety pass rates, and route flagged interactions to human reviewers. This creates a continuous feedback loop: production failures become evaluation test cases, which drive improvements that are validated before redeployment.",
+  },
+  {
+    question: "Is MLflow free for responsible AI evaluation and governance?",
+    answer:
+      "Yes. MLflow is completely free and open source under the Apache 2.0 license, backed by the Linux Foundation. All responsible AI features — safety evaluation, custom compliance judges, tracing for auditability, AI Gateway guardrails, and production monitoring — are included at no cost, including for commercial use. The only costs are your own infrastructure and any LLM API calls for running judges. Managed MLflow is also available on Databricks and other platforms if you prefer hosted solutions.",
+  },
+];
+
+const faqJsonLd = {
+  "@context": "https://schema.org",
+  "@type": "FAQPage",
+  mainEntity: faqs.map((faq) => ({
+    "@type": "Question",
+    name: faq.question,
+    acceptedAnswer: {
+      "@type": "Answer",
+      text: faq.answerText || faq.answer,
+    },
+  })),
+};
+
+const softwareJsonLd = {
+  "@context": "https://schema.org",
+  "@type": "SoftwareApplication",
+  name: "MLflow",
+  applicationCategory: "DeveloperApplication",
+  operatingSystem: "Cross-platform",
+  offers: {
+    "@type": "Offer",
+    price: "0",
+    priceCurrency: "USD",
+  },
+  description:
+    "Open-source AI platform with responsible AI evaluation, safety guardrails, and governance for agents and LLM applications.",
+  url: "https://mlflow.org",
+  license: "https://www.apache.org/licenses/LICENSE-2.0",
+};
+
+const SAFETY_EVAL_CODE = `import mlflow
+from mlflow.genai.scorers import Safety, ConversationalSafety
+
+# Evaluate single-turn and multi-turn safety
+results = mlflow.genai.evaluate(
+    data="safety_eval_dataset",      # Your evaluation dataset
+    predict_fn=my_agent,              # Your agent or LLM app
+    scorers=[
+        Safety(),                     # Harmful content detection
+        ConversationalSafety(),       # Multi-turn safety assessment
+    ],
+)
+
+# Check safety pass rates
+print(f"Safety pass rate: {results.metrics['safety/pass_rate']}")
+print(f"Conversational safety: {results.metrics['conversational_safety/pass_rate']}")`;
+
+const POLICY_JUDGE_CODE = `import mlflow
+from mlflow.genai.judges import make_judge
+from typing import Literal
+
+# Define a custom judge for regulatory compliance
+compliance_judge = make_judge(
+    name="regulatory_compliance",
+    instructions=(
+        "Evaluate whether the {{ outputs }} complies with these policies:\\n"
+        "1. Never provide specific medical diagnoses or dosage recommendations\\n"
+        "2. Always include disclaimers for financial advice\\n"
+        "3. Never share or request personally identifiable information\\n"
+        "4. Refuse requests to generate harmful or deceptive content\\n"
+        "Assess the response against the user's {{ inputs }}."
+    ),
+    feedback_value_type=Literal["compliant", "non_compliant"],
+)
+
+# Run compliance evaluation across your dataset
+results = mlflow.genai.evaluate(
+    data=eval_data,
+    scorers=[compliance_judge],
+)
+
+# View results in the MLflow UI
+print(f"Compliance rate: {results.metrics['regulatory_compliance/pass_rate']}")`;
+
+const BIAS_EVAL_CODE = `import mlflow
+from mlflow.genai.scorers import Safety
+from mlflow.genai.judges import make_judge
+from typing import Literal
+
+# Create a custom judge for bias detection
+bias_judge = make_judge(
+    name="bias_detection",
+    instructions=(
+        "Analyze the {{ outputs }} for any signs of bias, "
+        "stereotyping, or unfair treatment based on race, "
+        "gender, age, religion, or other protected attributes. "
+        "Consider the context of the {{ inputs }}."
+    ),
+    feedback_value_type=Literal["unbiased", "biased"],
+)
+
+# Run a comprehensive responsible AI evaluation
+results = mlflow.genai.evaluate(
+    data="responsible_ai_dataset",
+    predict_fn=my_agent,
+    scorers=[
+        Safety(),          # Harmful content detection
+        bias_judge,        # Bias and fairness assessment
+    ],
+)
+
+# Review results
+print(f"Safety: {results.metrics['safety/pass_rate']}")
+print(f"Bias-free: {results.metrics['bias_detection/pass_rate']}")`;
+
+export default function ResponsibleAI() {
+  const [openFaqIndex, setOpenFaqIndex] = useState<number | null>(0);
+
+  return (
+    <>
+      <Head>
+        <title>{SEO_TITLE}</title>
+        <meta name="description" content={SEO_DESCRIPTION} />
+        <meta property="og:title" content={SEO_TITLE} />
+        <meta property="og:description" content={SEO_DESCRIPTION} />
+        <meta property="og:type" content="website" />
+        <meta property="og:url" content="https://mlflow.org/responsible-ai" />
+        <link rel="canonical" href="https://mlflow.org/responsible-ai" />
+        <script type="application/ld+json">{JSON.stringify(faqJsonLd)}</script>
+        <script type="application/ld+json">
+          {JSON.stringify(softwareJsonLd)}
+        </script>
+        <style>{`
+          @import url('https://fonts.googleapis.com/css2?family=DM+Mono:ital,wght@0,300;0,400;0,500;1,300;1,400;1,500&family=DM+Sans:ital,opsz,wght@0,9..40,100..1000;1,9..40,100..1000&display=swap');
+
+          header, nav {
+            background: #000000 !important;
+          }
+
+          body {
+            background: #ffffff;
+            margin: 0;
+            padding: 0;
+            font-family: 'DM Sans', system-ui, -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif;
+          }
+          .article-page {
+            background: #ffffff;
+            min-height: 100vh;
+          }
+          .article-container {
+            max-width: 900px;
+            margin: 0 auto;
+            padding: 60px 24px 100px;
+          }
+          .article-container h1 {
+            font-family: 'DM Sans', sans-serif;
+            font-size: 3rem !important;
+            font-weight: 700 !important;
+            color: #1a1a1a !important;
+            margin: 48px 0 32px 0 !important;
+            line-height: 1.0 !important;
+            letter-spacing: -0.03em !important;
+          }
+          .article-container h2 {
+            font-family: 'DM Sans', sans-serif;
+            font-size: 2rem;
+            font-weight: 700;
+            color: #1a1a1a;
+            margin: 64px 0 32px 0;
+            line-height: 1.2;
+            letter-spacing: -0.01em;
+          }
+          .article-container h3 {
+            font-family: 'DM Sans', sans-serif;
+            font-size: 1.5rem;
+            font-weight: 600;
+            color: #1a1a1a;
+            margin: 32px 0 16px 0;
+            line-height: 1.2;
+          }
+          .article-container p {
+            font-family: 'DM Sans', sans-serif;
+            font-size: 16px;
+            color: #3d3d3d;
+            line-height: 1.7;
+            margin: 0 0 24px 0;
+          }
+          .article-container strong {
+            font-weight: 600;
+            color: #1a1a1a;
+          }
+          .article-container a {
+            color: #0194e2 !important;
+            text-decoration: none;
+            transition: all 0.2s ease;
+          }
+          .article-container a:hover {
+            color: #0072b0 !important;
+            text-decoration: underline;
+          }
+          .info-box a {
+            color: #0194e2 !important;
+            font-weight: 500;
+          }
+          .info-box a:hover {
+            color: #0072b0 !important;
+          }
+          .article-container ul {
+            list-style-type: disc;
+            margin: 20px 0;
+            padding-left: 24px;
+            list-style-position: outside;
+          }
+          .article-container li {
+            font-family: 'DM Sans', sans-serif;
+            font-size: 16px;
+            color: #3d3d3d;
+            line-height: 1.7;
+            margin-bottom: 20px;
+            padding-left: 8px;
+            text-wrap: pretty;
+          }
+          .article-container li a {
+            font-weight: 600;
+            color: #0194e2 !important;
+          }
+          .grid-2 {
+            display: grid;
+            grid-template-columns: repeat(auto-fit, minmax(320px, 1fr));
+            gap: 24px;
+            margin: 40px 0 56px 0;
+          }
+          .card {
+            background: #ffffff;
+            border: 1px solid #e5e7eb;
+            border-radius: 4px;
+            padding: 32px;
+            box-shadow: 0 0 0 1px rgba(50, 50, 93, 0.05), 0 0 14px 5px rgba(50, 50, 93, 0.08), 0 0 10px 3px rgba(0, 0, 0, 0.05);
+            transition: all 0.3s ease;
+          }
+          .card:hover {
+            box-shadow: 0 10px 30px rgba(0, 0, 0, 0.1);
+            transform: translateY(-2px);
+          }
+          .card h3 {
+            font-family: 'DM Sans', sans-serif;
+            margin-top: 0 !important;
+            margin-bottom: 32px !important;
+            font-size: 1.3rem;
+            font-weight: 600;
+            color: #1a1a1a;
+            line-height: 1.2;
+          }
+          .card p {
+            font-family: 'DM Sans', sans-serif;
+            margin-bottom: 14px;
+            font-size: 14px;
+            line-height: 1.5;
+            color: #505050;
+          }
+          .card p:last-child {
+            margin-bottom: 0;
+          }
+          .faq-list {
+            margin: 32px 0;
+          }
+          .faq-item {
+            border: 1px solid #e5e7eb;
+            border-radius: 4px;
+            margin-bottom: 16px;
+            background: #ffffff;
+            transition: all 0.2s ease;
+          }
+          .faq-item:hover {
+            box-shadow: 0 2px 8px rgba(0, 0, 0, 0.08);
+          }
+          .faq-question {
+            font-family: 'DM Sans', sans-serif;
+            padding: 20px 24px;
+            font-size: 18px;
+            font-weight: 500;
+            color: #1a1a1a;
+            cursor: pointer;
+            background: transparent;
+            border: none;
+            width: 100%;
+            text-align: left;
+            display: flex;
+            justify-content: space-between;
+            align-items: center;
+            transition: background 0.2s ease;
+          }
+          .faq-question:hover {
+            background: #f9fafb;
+          }
+          .faq-answer {
+            font-family: 'DM Sans', sans-serif;
+            padding: 0 24px 20px;
+            font-size: 16px;
+            color: #3d3d3d;
+            line-height: 1.6;
+          }
+          .faq-chevron {
+            transition: transform 0.2s ease;
+            flex-shrink: 0;
+            margin-left: 16px;
+            color: #6b7280;
+            font-size: 12px;
+          }
+          .faq-chevron.open {
+            transform: rotate(180deg);
+          }
+          .info-box {
+            background: rgb(238, 249, 253);
+            border: 1px solid rgb(41, 120, 115);
+            padding: 20px 24px;
+            margin: 40px 0;
+            border-radius: 5.6px;
+          }
+          .info-box p {
+            font-family: 'DM Sans', sans-serif;
+            margin: 0;
+            font-size: 16px;
+            line-height: 1.6;
+            color: #1e293b;
+          }
+          .article-sidebar {
+            position: fixed;
+            top: 100px;
+            left: calc(50% + 900px / 2 + 48px);
+            width: 280px;
+            max-height: calc(100vh - 120px);
+            overflow-y: auto;
+          }
+          .article-sidebar .toc-title {
+            font-family: 'DM Sans', sans-serif;
+            font-size: 13px;
+            font-weight: 600;
+            text-transform: uppercase;
+            letter-spacing: 0.08em;
+            color: #9ca3af;
+            margin: 0 0 12px 0;
+          }
+          .article-sidebar ul {
+            margin: 0;
+            padding: 0;
+            list-style: none;
+            border-left: 1px solid #e5e7eb;
+          }
+          .article-sidebar li {
+            margin: 0;
+            padding: 0;
+          }
+          .article-sidebar a {
+            font-family: 'DM Sans', sans-serif;
+            display: block;
+            padding: 8px 0 8px 16px;
+            font-size: 16px;
+            color: #0194e2 !important;
+            text-decoration: none !important;
+            transition: all 0.15s ease;
+            line-height: 1.4;
+          }
+          .article-sidebar a:hover {
+            color: #0072b0 !important;
+          }
+          .article-sidebar .toc-divider {
+            border: none;
+            border-top: 1px solid #e5e7eb;
+            margin: 12px 0 12px 0;
+          }
+          @media (max-width: 1400px) {
+            .article-sidebar {
+              display: none;
+            }
+          }
+          @media (max-width: 768px) {
+            .article-container {
+              padding: 40px 20px 80px;
+            }
+            .article-container h1 {
+              font-size: 36px !important;
+              margin-bottom: 24px !important;
+            }
+            .article-container h2 {
+              font-size: 28px;
+              margin: 40px 0 20px 0;
+            }
+            .grid-2 {
+              grid-template-columns: 1fr;
+              gap: 20px;
+            }
+            .card {
+              padding: 24px;
+            }
+            .faq-question {
+              padding: 18px 20px;
+              font-size: 17px;
+            }
+            .faq-answer {
+              padding: 0 20px 20px;
+              font-size: 16px;
+            }
+          }
+        `}</style>
+      </Head>
+
+      <div className="article-page">
+        <Header />
+
+        <div className="article-container">
+          <h1>Responsible AI</h1>
+
+          <p>
+            Responsible AI is the discipline of building AI systems that are
+            safe, fair, transparent, accountable, and privacy-preserving. For
+            production{" "}
+            <Link href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/"}>
+              agents and LLM applications
+            </Link>
+            , responsible AI means systematically{" "}
+            <Link href="/llm-evaluation">evaluating safety</Link>, enforcing{" "}
+            <Link href="/ai-gateway">guardrails</Link> on inputs and outputs,
+            maintaining complete audit trails through{" "}
+            <Link href="/llm-tracing">tracing</Link>, and enabling governance
+            and human oversight throughout the AI lifecycle.
+          </p>
+
+          <p>
+            As AI moves from prototypes to customer-facing production systems,
+            the stakes increase dramatically. Agents make autonomous decisions,
+            LLMs generate content at scale, and failures — harmful outputs,
+            bias, PII leaks, hallucinations — have real consequences including
+            legal liability, regulatory penalties, and loss of user trust.
+            Responsible AI practices are no longer optional for organizations
+            deploying AI in production.
+          </p>
+
+          <p>
+            <Link href="/genai">MLflow</Link> provides an integrated responsible
+            AI toolkit: safety evaluation with{" "}
+            <Link href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/scorers/"}>
+              built-in and custom scorers
+            </Link>
+            , AI Gateway guardrails for runtime protection, tracing for
+            transparency and auditability, and governance for centralized policy
+            enforcement. All open source under Apache 2.0 with no vendor
+            lock-in.
+          </p>
+
+          <div
+            style={{
+              background: "#f9fafb",
+              border: "1px solid #e5e7eb",
+              borderRadius: "8px",
+              padding: "20px 24px",
+              margin: "40px 0",
+            }}
+          >
+            <p style={{ marginBottom: "12px" }}>
+              <strong>Quick Navigation:</strong>
+            </p>
+            <ul style={{ margin: 0, paddingLeft: "24px" }}>
+              <li style={{ marginBottom: "8px" }}>
+                <a href="#why-responsible-ai">Why Responsible AI Matters</a>
+              </li>
+              <li style={{ marginBottom: "8px" }}>
+                <a href="#what-is-responsible-ai">What is Responsible AI</a>
+              </li>
+              <li style={{ marginBottom: "8px" }}>
+                <a href="#responsible-ai-genai">
+                  Responsible AI for Agents and LLMs
+                </a>
+              </li>
+              <li style={{ marginBottom: "8px" }}>
+                <a href="#key-pillars">
+                  Key Pillars of a Responsible AI Framework
+                </a>
+              </li>
+              <li style={{ marginBottom: "8px" }}>
+                <a href="#how-to-implement">
+                  How to Implement Responsible AI with MLflow
+                </a>
+              </li>
+              <li style={{ marginBottom: "0" }}>
+                <a href="#faq">FAQ</a>
+              </li>
+            </ul>
+          </div>
+
+          <h2 id="why-responsible-ai">Why Responsible AI Matters</h2>
+
+          <p>
+            AI systems introduce unique risks that traditional software
+            practices cannot address. Without systematic responsible AI
+            practices, organizations face safety incidents, regulatory
+            violations, and erosion of user trust:
+          </p>
+
+          <div className="grid-2">
+            <div className="card">
+              <h3>Safety Risks</h3>
+              <p>
+                <strong>Problem:</strong> LLMs can generate harmful, toxic, or
+                misleading content. Agents can take unsafe autonomous actions
+                like deleting data or making unauthorized API calls. Without
+                systematic testing, these failures reach users.
+              </p>
+              <p>
+                <strong>Solution:</strong> Evaluate every response with{" "}
+                <Link href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/scorers/"}>
+                  safety scorers
+                </Link>
+                . MLflow's built-in Safety and ConversationalSafety judges
+                detect harmful content before deployment and in production.
+              </p>
+            </div>
+
+            <div className="card">
+              <h3>Compliance Requirements</h3>
+              <p>
+                <strong>Problem:</strong> Regulations like the EU AI Act, NIST
+                AI RMF, and industry-specific standards require organizations to
+                demonstrate AI governance, risk management, and auditability.
+              </p>
+              <p>
+                <strong>Solution:</strong> Maintain complete audit trails with{" "}
+                <Link href={MLFLOW_GENAI_DOCS_URL + "tracing/"}>tracing</Link>,
+                enforce policies at the{" "}
+                <Link href="/ai-gateway">gateway level</Link>, and continuously
+                monitor compliance metrics with automated judges.
+              </p>
+            </div>
+
+            <div className="card">
+              <h3>Bias and Fairness</h3>
+              <p>
+                <strong>Problem:</strong> AI systems can amplify biases from
+                training data, producing unfair outcomes across demographic
+                groups. Without evaluation, bias goes undetected until it causes
+                harm.
+              </p>
+              <p>
+                <strong>Solution:</strong> Create custom judges to evaluate bias
+                across protected attributes. Run evaluations across diverse test
+                cases and{" "}
+                <Link href="/ai-monitoring">monitor production behavior</Link>{" "}
+                for emerging bias patterns.
+              </p>
+            </div>
+
+            <div className="card">
+              <h3>Trust and Accountability</h3>
+              <p>
+                <strong>Problem:</strong> Users and stakeholders need confidence
+                that AI systems behave predictably and that failures can be
+                investigated, explained, and corrected.
+              </p>
+              <p>
+                <strong>Solution:</strong> Full{" "}
+                <Link href="/ai-observability">tracing</Link> creates
+                transparency into every AI decision. Governance controls enforce
+                accountability. Human-in-the-loop review provides oversight for
+                high-stakes decisions.
+              </p>
+            </div>
+          </div>
+
+          <h2 id="what-is-responsible-ai">What is Responsible AI</h2>
+
+          <p>
+            Responsible AI is a framework of principles and practices for
+            developing, deploying, and governing AI systems ethically and
+            safely. It encompasses five core pillars: <strong>safety</strong>{" "}
+            (preventing harmful outputs), <strong>fairness</strong> (avoiding
+            bias and discrimination), <strong>transparency</strong> (making AI
+            decisions explainable), <strong>accountability</strong> (maintaining
+            audit trails and governance), and <strong>privacy</strong>{" "}
+            (protecting personal data).
+          </p>
+
+          <p>
+            Responsible AI is not a single tool or checkbox — it's a
+            comprehensive approach spanning the entire AI lifecycle. During
+            development, it means evaluating safety and fairness before
+            deployment. At deployment, it means enforcing guardrails and access
+            controls. In production, it means continuously monitoring for safety
+            regressions, bias drift, and policy violations. At every stage,
+            human oversight ensures that automated systems remain aligned with
+            organizational values and regulatory requirements.
+          </p>
+
+          <p>
+            For traditional ML, responsible AI focused primarily on model
+            fairness metrics and explainability. For generative AI — LLMs and
+            autonomous agents — the scope expands dramatically to include
+            content safety, policy compliance, PII protection, prompt injection
+            defense, hallucination detection, and controlling unpredictable
+            agent behavior. This broader scope requires new tooling built
+            specifically for the generative AI era.
+          </p>
+
+          <h2 id="responsible-ai-genai">Responsible AI for Agents and LLMs</h2>
+
+          <p>
+            Generative AI introduces responsible AI challenges that are
+            fundamentally different from traditional ML. LLMs generate free-form
+            text, making output validation far more complex than checking
+            classification accuracy. Autonomous agents compound these challenges
+            by taking multi-step actions with real-world consequences.
+          </p>
+
+          <p>Key risks specific to agents and LLM applications include:</p>
+
+          <ul>
+            <li>
+              <strong>Harmful content generation:</strong> Toxicity, violence,
+              misinformation, or content that violates organizational policies
+            </li>
+            <li>
+              <strong>Hallucination:</strong> Presenting fabricated information
+              as fact, particularly dangerous in medical, legal, and financial
+              domains
+            </li>
+            <li>
+              <strong>PII exposure:</strong> Leaking personally identifiable
+              information in inputs, outputs, or agent tool calls
+            </li>
+            <li>
+              <strong>Prompt injection:</strong> Adversarial inputs that bypass
+              safety controls and manipulate agent behavior
+            </li>
+            <li>
+              <strong>Uncontrolled agent behavior:</strong> Tool misuse,
+              infinite loops, unauthorized actions, and runaway costs from
+              autonomous agents
+            </li>
+            <li>
+              <strong>Bias amplification:</strong> Reinforcing stereotypes or
+              producing unfair outcomes across demographic groups in
+              conversational responses
+            </li>
+            <li>
+              <strong>Compliance violations:</strong> Providing medical
+              diagnoses, financial advice, or legal counsel without appropriate
+              disclaimers or qualifications
+            </li>
+          </ul>
+
+          <p>
+            These risks require a multi-layered defense: pre-deployment{" "}
+            <Link href="/llm-evaluation">evaluation</Link> to catch issues
+            during development, runtime{" "}
+            <Link href="/ai-gateway">guardrails</Link> to prevent harmful
+            content from reaching users, continuous{" "}
+            <Link href="/ai-monitoring">monitoring</Link> to detect emerging
+            problems, and <Link href="/ai-observability">observability</Link> to
+            investigate and resolve incidents.
+          </p>
+
+          <h2 id="key-pillars">Key Pillars of a Responsible AI Framework</h2>
+
+          <p>
+            A comprehensive responsible AI implementation combines six
+            capabilities that work together across the AI lifecycle:
+          </p>
+
+          <ul>
+            <li>
+              <Link
+                href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/scorers/"}
+                style={{ color: "#007bff", fontWeight: "600" }}
+              >
+                Safety Evaluation
+              </Link>
+              : Built-in Safety and ConversationalSafety scorers evaluate every
+              output for harmful content. Custom LLM judges enforce
+              domain-specific safety policies tailored to your organization's
+              requirements.
+            </li>
+            <li>
+              <Link
+                href="/ai-gateway"
+                style={{ color: "#007bff", fontWeight: "600" }}
+              >
+                Guardrails
+              </Link>
+              : AI Gateway provides runtime input/output filtering — PII
+              redaction, toxicity detection, prompt injection prevention, and
+              content policy enforcement — acting as a safety net between your
+              AI system and end users.
+            </li>
+            <li>
+              <Link
+                href={MLFLOW_GENAI_DOCS_URL + "tracing/"}
+                style={{ color: "#007bff", fontWeight: "600" }}
+              >
+                Transparency and Observability
+              </Link>
+              : Full tracing captures every LLM call, tool use, and agent
+              reasoning step. Complete audit trails enable incident
+              investigation, compliance reporting, and bias auditing.
+            </li>
+            <li>
+              <Link
+                href="/ai-gateway"
+                style={{ color: "#007bff", fontWeight: "600" }}
+              >
+                Governance
+              </Link>
+              : Centralized credential management, access controls, rate
+              limiting, and cost budgets through the AI Gateway. Prevents API
+              key sprawl and ensures consistent policy enforcement across teams.
+            </li>
+            <li>
+              <Link
+                href={
+                  MLFLOW_GENAI_DOCS_URL +
+                  "eval-monitor/scorers/llm-judge/custom-judges/"
+                }
+                style={{ color: "#007bff", fontWeight: "600" }}
+              >
+                Guideline Adherence
+              </Link>
+              : Custom LLM judges that enforce natural-language business rules,
+              ethical guidelines, and regulatory requirements across every AI
+              response — scaling compliance without manual review.
+            </li>
+            <li>
+              <Link
+                href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/"}
+                style={{ color: "#007bff", fontWeight: "600" }}
+              >
+                Human Oversight
+              </Link>
+              : Review apps and feedback collection for human-in-the-loop
+              validation. Human feedback calibrates automated judges and turns
+              production failures into test cases that prevent regressions.
+            </li>
+          </ul>
+
+          <h2 id="how-to-implement">
+            How to Implement Responsible AI with MLflow
+          </h2>
+
+          <p>
+            <Link href="/genai">MLflow</Link> provides an integrated toolkit for
+            implementing responsible AI across the development lifecycle. With
+            just a few lines of code, you can evaluate safety, enforce
+            compliance policies, and detect bias in your agents and LLM
+            applications. Check out the{" "}
+            <Link href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/"}>
+              MLflow evaluation documentation
+            </Link>{" "}
+            for comprehensive guides and framework-specific examples.
+          </p>
+
+          <p style={{ marginTop: "32px", marginBottom: "0px" }}>
+            <strong>Safety Evaluation with Built-in Scorers</strong>
+          </p>
+
+          <p>
+            Use built-in Safety and ConversationalSafety scorers to detect
+            harmful content in single-turn and multi-turn interactions. Results
+            are tracked in the MLflow UI with pass rates, failure details, and
+            version comparison.
+          </p>
+
+          <div
+            className="rounded-lg border border-white/10 overflow-hidden"
+            style={{ backgroundColor: CODE_BG, margin: "8px 0" }}
+          >
+            <div className="flex items-center justify-between px-3 py-1.5 border-b border-white/10 bg-white/5">
+              <span className="text-xs text-white/50 font-mono">python</span>
+              <CopyButton code={SAFETY_EVAL_CODE} />
+            </div>
+            <div className="p-3 overflow-x-auto">
+              <Highlight
+                theme={customNightOwl}
+                code={SAFETY_EVAL_CODE}
+                language="python"
+              >
+                {({ style, tokens, getLineProps, getTokenProps }) => (
+                  <pre
+                    className="text-xs font-mono !m-0 !p-0 text-left"
+                    style={{
+                      ...style,
+                      backgroundColor: "transparent",
+                    }}
+                  >
+                    {tokens.map((line, i) => (
+                      <div key={i} {...getLineProps({ line })}>
+                        {line.map((token, key) => (
+                          <span key={key} {...getTokenProps({ token })} />
+                        ))}
+                      </div>
+                    ))}
+                  </pre>
+                )}
+              </Highlight>
+            </div>
+          </div>
+
+          <p style={{ marginTop: "32px", marginBottom: "0px" }}>
+            <strong>Custom Policy Compliance Judge</strong>
+          </p>
+
+          <p>
+            For organization-specific regulatory requirements, content policies,
+            or brand guidelines, create custom judges that evaluate every
+            response against your rules. This scales compliance assessment
+            without manual review.
+          </p>
+
+          <div
+            className="rounded-lg border border-white/10 overflow-hidden"
+            style={{ backgroundColor: CODE_BG, margin: "8px 0" }}
+          >
+            <div className="flex items-center justify-between px-3 py-1.5 border-b border-white/10 bg-white/5">
+              <span className="text-xs text-white/50 font-mono">python</span>
+              <CopyButton code={POLICY_JUDGE_CODE} />
+            </div>
+            <div className="p-3 overflow-x-auto">
+              <Highlight
+                theme={customNightOwl}
+                code={POLICY_JUDGE_CODE}
+                language="python"
+              >
+                {({ style, tokens, getLineProps, getTokenProps }) => (
+                  <pre
+                    className="text-xs font-mono !m-0 !p-0 text-left"
+                    style={{
+                      ...style,
+                      backgroundColor: "transparent",
+                    }}
+                  >
+                    {tokens.map((line, i) => (
+                      <div key={i} {...getLineProps({ line })}>
+                        {line.map((token, key) => (
+                          <span key={key} {...getTokenProps({ token })} />
+                        ))}
+                      </div>
+                    ))}
+                  </pre>
+                )}
+              </Highlight>
+            </div>
+          </div>
+
+          <p style={{ marginTop: "32px", marginBottom: "0px" }}>
+            <strong>Bias Detection and Comprehensive Evaluation</strong>
+          </p>
+
+          <p>
+            Combine built-in safety evaluation with custom bias detection to run
+            comprehensive responsible AI assessments. Custom judges can evaluate
+            for stereotyping, unfair treatment, and demographic bias.
+          </p>
+
+          <div
+            className="rounded-lg border border-white/10 overflow-hidden"
+            style={{ backgroundColor: CODE_BG, margin: "8px 0" }}
+          >
+            <div className="flex items-center justify-between px-3 py-1.5 border-b border-white/10 bg-white/5">
+              <span className="text-xs text-white/50 font-mono">python</span>
+              <CopyButton code={BIAS_EVAL_CODE} />
+            </div>
+            <div className="p-3 overflow-x-auto">
+              <Highlight
+                theme={customNightOwl}
+                code={BIAS_EVAL_CODE}
+                language="python"
+              >
+                {({ style, tokens, getLineProps, getTokenProps }) => (
+                  <pre
+                    className="text-xs font-mono !m-0 !p-0 text-left"
+                    style={{
+                      ...style,
+                      backgroundColor: "transparent",
+                    }}
+                  >
+                    {tokens.map((line, i) => (
+                      <div key={i} {...getLineProps({ line })}>
+                        {line.map((token, key) => (
+                          <span key={key} {...getTokenProps({ token })} />
+                        ))}
+                      </div>
+                    ))}
+                  </pre>
+                )}
+              </Highlight>
+            </div>
+          </div>
+
+          <div className="info-box">
+            <p>
+              <Link href="/genai" style={{ color: "#007bff" }}>
+                <strong>MLflow</strong>
+              </Link>{" "}
+              is the largest open-source{" "}
+              <strong>
+                AI engineering platform for agents, LLMs, and ML models
+              </strong>
+              , with over 30 million monthly downloads. Thousands of
+              organizations use MLflow to evaluate safety, enforce guardrails,
+              monitor compliance, and govern production AI systems while
+              controlling costs and managing access to models and data. Backed
+              by the Linux Foundation and licensed under Apache 2.0, MLflow
+              provides a complete responsible AI toolkit with no vendor lock-in.{" "}
+              <Link href={MLFLOW_GENAI_DOCS_URL}>Get started →</Link>
+            </p>
+          </div>
+
+          <h2 id="faq">Frequently Asked Questions</h2>
+
+          <div className="faq-list">
+            {faqs.map((faq, index) => (
+              <div key={index} className="faq-item">
+                <button
+                  className="faq-question"
+                  onClick={() =>
+                    setOpenFaqIndex(openFaqIndex === index ? null : index)
+                  }
+                >
+                  <span>{faq.question}</span>
+                  <span
+                    className={`faq-chevron ${openFaqIndex === index ? "open" : ""}`}
+                  >
+                    ▼
+                  </span>
+                </button>
+                {openFaqIndex === index && (
+                  <div className="faq-answer">{faq.answer}</div>
+                )}
+              </div>
+            ))}
+          </div>
+
+          <h2>Related Resources</h2>
+
+          <ul>
+            <li>
+              <Link href={MLFLOW_GENAI_DOCS_URL + "eval-monitor/scorers/"}>
+                Safety Evaluation Documentation
+              </Link>
+            </li>
+            <li>
+              <Link
+                href={
+                  MLFLOW_GENAI_DOCS_URL +
+                  "eval-monitor/scorers/llm-judge/custom-judges/"
+                }
+              >
+                Custom Compliance Judges Documentation
+              </Link>
+            </li>
+            <li>
+              <Link href={MLFLOW_GENAI_DOCS_URL + "tracing/"}>
+                Tracing and Observability Documentation
+              </Link>
+            </li>
+            <li>
+              <Link href="/llm-evaluation">LLM and Agent Evaluation Guide</Link>
+            </li>
+            <li>
+              <Link href="/ai-gateway">AI Gateway and Guardrails Guide</Link>
+            </li>
+            <li>
+              <Link href="/ai-observability">AI Observability Guide</Link>
+            </li>
+            <li>
+              <Link href="/ai-monitoring">AI Monitoring Guide</Link>
+            </li>
+            <li>
+              <Link href="/llm-tracing">LLM Tracing Guide</Link>
+            </li>
+            <li>
+              <Link href="/genai">MLflow for Agents and LLMs Overview</Link>
+            </li>
+          </ul>
+        </div>
+
+        <ArticleSidebar />
+        <SocialLinksFooter />
+      </div>
+    </>
+  );
+}