feat: add dynamic robots.txt #1395
Changes from all commits: ad313b9, ff16126, 1345c34, 4690872, 2ca1a4c, ed5dfe1, cffc389
@@ -0,0 +1,3 @@

```js
import { getRobotsTxtContent } from "@/trustlab/lib/data";

export default getRobotsTxtContent;
```
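For orientation (the file path is not shown in this diff), if this module is an App Router `app/robots.js` metadata file, Next.js calls the default export and serializes its return value into the served `/robots.txt`. A minimal standalone sketch of the expected return shape, with example values that are not from the PR:

```js
// Hypothetical app/robots.js equivalent, for illustration only; values are invented.
// Next.js renders the returned object as the robots.txt response.
export default async function robots() {
  return {
    rules: { userAgent: "*", disallow: "/" }, // -> "User-agent: *\nDisallow: /"
    sitemap: "https://example.com/sitemap.xml", // optional; example URL
  };
}
```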
```diff
@@ -1,3 +1,8 @@
-export { getPageStaticPaths, getPageStaticProps } from "./local";
+export {
+  getPageStaticPaths,
+  getPageStaticProps,
+  getServerSideProps,
+  getRobotsTxtContent,
+} from "./local";
 
 export default undefined;
```
```diff
@@ -1,4 +1,5 @@
 import { getPageProps, getPagePaths } from "@/trustlab/lib/data/common";
+import { parseRobotsTxt } from "@/trustlab/lib/data/common/seo";
 import api from "@/trustlab/lib/payload";
 
 export async function getPageStaticPaths() {
@@ -15,3 +16,20 @@ export async function getPageStaticProps(context) {
     revalidate: 60,
   };
 }
+
+export async function getServerSideProps(context) {
+  const props = await getPageProps(api, context);
+  if (!props) {
+    return { notFound: true };
+  }
+  return {
+    props,
+  };
+}
+
+export async function getRobotsTxtContent() {
```
**Member:** Since we're parsing content to
```diff
+  const siteSettings = await api.findGlobal("site-settings");
+  return parseRobotsTxt(siteSettings?.robotsTxt);
+}
+
+export default undefined;
```
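To make the data flow concrete, here is a sketch of what `getRobotsTxtContent` would return for a hypothetical `site-settings` global, assuming `parseRobotsTxt` re-exports the `parseRobotsToMetadata` utility added later in this PR (the stored text and the resulting object below are illustrative):

```js
// Illustrative only: a site-settings global whose robotsTxt field holds raw robots.txt text.
const siteSettings = {
  robotsTxt: "User-agent: *\nDisallow: /admin\nSitemap: https://example.com/sitemap.xml",
};

// parseRobotsTxt(siteSettings.robotsTxt) would then yield roughly:
// {
//   rules: [{ userAgent: "*", disallow: "/admin" }],
//   sitemap: ["https://example.com/sitemap.xml"],
//   host: null,
//   cleanParams: [],
//   errors: undefined,
// }
```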
```diff
@@ -7,6 +7,26 @@ import {
   /* eslint-disable-next-line import/no-unresolved */
 } from "@payloadcms/plugin-seo/fields";
 
+import parseRobotsToMetadata from "@/trustlab/utils/parseRobotsTxt";
+
+const validateRobotsTxt = (value) => {
+  if (!value?.trim()) {
+    return true;
+  }
+  const result = parseRobotsToMetadata(value, { collectDiagnostics: true });
+  if (!result.errors?.length) {
+    return true;
+  }
+  const message = result.errors
+    .map(({ line, directive, reason }) =>
+      [`line ${line}`, directive ? `directive "${directive}"` : null, reason]
+        .filter(Boolean)
+        .join(" "),
+    )
+    .join("; ");
+  return `Invalid robots.txt: ${message}`;
+};
+
 const SeoTab = {
   label: "SEO",
   fields: [
@@ -46,6 +66,18 @@ const SeoTab = {
         }),
       ],
     },
+    {
+      name: "robotsTxt",
+      label: "robots.txt content",
```
```diff
+      type: "code",
+      defaultValue: "User-agent: *\nDisallow: /",
+      admin: {
+        language: "plaintext",
+        rows: 14,
+        description: "Paste the exact robots.txt text to serve.",
```
**Member:** Why paste?
```diff
+      },
+      validate: validateRobotsTxt,
+    },
   ],
 };
```
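As a quick illustration of how the validator behaves (inputs invented for this sketch):

```js
validateRobotsTxt("");                           // => true (empty values are accepted)
validateRobotsTxt("User-agent: *\nDisallow: /"); // => true (well-formed content passes)

// Unknown directives surface as a readable error string for the admin UI:
validateRobotsTxt("Foobar: nope");
// => 'Invalid robots.txt: line 1 directive "Foobar" Unknown directive'
```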
**Member:** Again, from the bots:

Looking at your code and the Next.js robots object interface, there's a mismatch. The Next.js type is:

```ts
type Robots = {
  rules: Rule | Rule[]
  sitemap?: string | string[]
  host?: string
}

type Rule = {
  userAgent?: string | string[]
  allow?: string | string[]
  disallow?: string | string[]
  crawlDelay?: number
}
```

Your parser is fairly close but has some unnecessary complexity for this use case. A few observations:

Here's a leaner version focused specifically on producing a Next.js-compatible robots object. Key improvements over your original:

```js
/**
 * Parses a robots.txt string into a Next.js-compatible robots metadata object.
 * @see https://nextjs.org/docs/app/api-reference/file-conventions/metadata/robots#robots-object
 *
 * @param {string} raw - robots.txt content
 * @returns {{ rules: Rule | Rule[], sitemap?: string | string[], host?: string }}
 */
export default function parseRobotsToNextJs(raw = "") {
  const lines = String(raw).replace(/\r\n?/g, "\n").split("\n");
  const groups = []; // { userAgent: string[], allow: string[], disallow: string[], crawlDelay?: number }
  const sitemaps = [];
  let host = null;
  let cur = null;
  let curHasDirectives = false;

  const ensureGroup = () => {
    if (!cur) {
      cur = { userAgent: ["*"], allow: [], disallow: [] };
      groups.push(cur);
      curHasDirectives = false;
    }
    return cur;
  };

  for (const rawLine of lines) {
    const line = rawLine.replace(/#.*$/, "").trim();
    if (!line) continue;
    const sep = line.indexOf(":");
    if (sep === -1) continue;
    const key = line.slice(0, sep).trim().toLowerCase();
    const val = line.slice(sep + 1).trim();

    switch (key) {
      case "sitemap":
        if (val) sitemaps.push(val);
        break;
      case "host":
        if (val) host = val;
        break;
      case "user-agent":
        if (!cur || curHasDirectives) {
          cur = { userAgent: [val || "*"], allow: [], disallow: [] };
          groups.push(cur);
          curHasDirectives = false;
        } else {
          cur.userAgent.push(val || "*");
        }
        break;
      case "allow":
        ensureGroup().allow.push(val);
        curHasDirectives = true;
        break;
      case "disallow":
        ensureGroup().disallow.push(val);
        curHasDirectives = true;
        break;
      case "crawl-delay": {
        const n = Number(val);
        if (Number.isFinite(n)) ensureGroup().crawlDelay = n;
        curHasDirectives = true;
        break;
      }
      // Ignore unknown directives silently
    }
  }

  // Collapse single-element arrays to plain values for Next.js compat
  const unwrap = (arr) => (arr.length === 1 ? arr[0] : arr.length ? arr : undefined);

  const rules = groups.map((g) => {
    const rule = { userAgent: unwrap(g.userAgent) };
    const allow = unwrap(g.allow);
    const disallow = unwrap(g.disallow);
    if (allow !== undefined) rule.allow = allow;
    if (disallow !== undefined) rule.disallow = disallow;
    if (g.crawlDelay !== undefined) rule.crawlDelay = g.crawlDelay;
    return rule;
  });

  const result = { rules: rules.length === 1 ? rules[0] : rules };
  const sm = unwrap(sitemaps);
  if (sm !== undefined) result.sitemap = sm;
  if (host) result.host = host;
  return result;
}
```

If you also need diagnostics for debugging malformed files, you could add that back as an opt-in, but for a "parse robots.txt → Next.js metadata" utility, this is all you need.
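To illustrate the shape difference being flagged, a hypothetical call to the suggested parser (input invented for this sketch):

```js
parseRobotsToNextJs(
  "User-agent: *\nAllow: /public\nDisallow: /\nSitemap: https://example.com/sitemap.xml",
);
// => {
//   rules: { userAgent: "*", allow: "/public", disallow: "/" },
//   sitemap: "https://example.com/sitemap.xml",
// }
// Single-entry groups collapse to plain values, matching the Next.js Robots type.
```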
@@ -0,0 +1,203 @@

```js
const USER_AGENT_REGEX = /^user-agent$/i;
const ALLOW_REGEX = /^allow$/i;
const DISALLOW_REGEX = /^disallow$/i;
const CRAWL_DELAY_REGEX = /^crawl-delay$/i;
const CACHE_DELAY_REGEX = /^cache-delay$/i;
const VISIT_TIME_REGEX = /^visit-time$/i;
const SITEMAP_REGEX = /^sitemap$/i;
const HOST_REGEX = /^host$/i;
const CLEAN_PARAM_REGEX = /^clean-param$/i;

const KNOWN_DIRECTIVES = new Set([
  "user-agent",
  "allow",
  "disallow",
  "crawl-delay",
  "cache-delay",
  "visit-time",
  "sitemap",
  "host",
  "clean-param",
]);

const normalizeString = (value) =>
  typeof value === "string" ? value : `${value ?? ""}`;

const appendDirectiveValue = (previous, value) => {
  if (previous === undefined || previous === null || previous === "") {
    return value;
  }
  if (Array.isArray(previous)) {
    return [...previous, value];
  }
  return [previous, value];
};

const appendUserAgent = (previous, value) => {
  const normalized = value || "*";
  if (!previous || previous === "") {
    return normalized;
  }
  if (Array.isArray(previous)) {
    return [...previous, normalized];
  }
  if (previous === normalized) {
    return previous;
  }
  return [previous, normalized];
};

const startRule = (rules, userAgent, meta = {}) => {
  const rule = { userAgent: userAgent || "*", ...meta };
  rules.push(rule);
  return rule;
};

const updateRule = (rule, next) => Object.assign(rule, next);

export default function parseRobotsToMetadata(rawContent = "", options = {}) {
  const { collectDiagnostics = false } = options;
  const diagnostics = collectDiagnostics ? [] : undefined;
  const content = normalizeString(rawContent);
  const rules = [];
  const sitemap = [];
  const cleanParams = [];
  let host = null;
  let current = null;
  let currentHasDirectives = false;

  const ensureRule = () => {
    if (!current) {
      current = startRule(rules, "*", { autoUserAgent: true });
      currentHasDirectives = false;
    }
    return current;
  };

  content
    .replace(/\r\n?/g, "\n")
    .split("\n")
    .forEach((rawLine, index) => {
      const line = rawLine.trim();
      if (!line || line.startsWith("#")) {
        return;
      }

      const separatorIndex = line.indexOf(":");
      if (separatorIndex === -1) {
        if (diagnostics) {
          diagnostics.push({
            line: index + 1,
            directive: line,
            reason: 'Missing ":" separator',
          });
        }
        return;
      }

      const key = line.slice(0, separatorIndex).trim();
      const keyLower = key.toLowerCase();
      const value = line.slice(separatorIndex + 1).trim();

      if (!KNOWN_DIRECTIVES.has(keyLower)) {
        if (diagnostics) {
          diagnostics.push({
            line: index + 1,
            directive: key,
            reason: "Unknown directive",
          });
        }
        return;
      }

      if (SITEMAP_REGEX.test(key)) {
        if (value) {
          sitemap.push(value);
        }
        return;
      }

      if (HOST_REGEX.test(key)) {
        if (value) {
          host = value;
        }
        return;
      }

      if (CLEAN_PARAM_REGEX.test(key)) {
        if (value) {
          cleanParams.push(value);
        }
        return;
      }

      if (USER_AGENT_REGEX.test(key)) {
        if (current && current.autoUserAgent) {
          updateRule(current, { userAgent: value || "*" });
          delete current.autoUserAgent;
        } else if (!current || currentHasDirectives) {
          current = startRule(rules, value || "*");
        } else {
          updateRule(current, {
            userAgent: appendUserAgent(current.userAgent, value || "*"),
          });
        }
        currentHasDirectives = false;
        return;
      }

      const rule = ensureRule();

      if (ALLOW_REGEX.test(key)) {
        updateRule(rule, { allow: appendDirectiveValue(rule.allow, value) });
        currentHasDirectives = true;
        return;
      }

      if (DISALLOW_REGEX.test(key)) {
        updateRule(rule, {
          disallow: appendDirectiveValue(rule.disallow, value),
        });
        currentHasDirectives = true;
        return;
      }

      if (CRAWL_DELAY_REGEX.test(key)) {
        const numeric = Number(value);
        updateRule(rule, {
          crawlDelay: Number.isFinite(numeric) ? numeric : value,
        });
        currentHasDirectives = true;
        return;
      }

      if (CACHE_DELAY_REGEX.test(key)) {
        const numeric = Number(value);
        updateRule(rule, {
          cacheDelay: Number.isFinite(numeric) ? numeric : value,
        });
        currentHasDirectives = true;
        return;
      }

      if (VISIT_TIME_REGEX.test(key)) {
        updateRule(rule, {
          visitTime: appendDirectiveValue(rule.visitTime, value),
        });
        currentHasDirectives = true;
      }
    });

  const sanitizedRules = rules.map((ruleEntry) => {
    const { autoUserAgent, ...cleanRule } = ruleEntry;
    return cleanRule;
  });

  return {
    rules: sanitizedRules,
    sitemap,
    host,
    cleanParams,
    errors: diagnostics,
  };
}
```
Is this being used anywhere?