Skip to content

Commit

Permalink
fix(sitemap): exclude pages with robots noindex from sitemap
Browse files Browse the repository at this point in the history
  • Loading branch information
Josh-Cena committed Apr 9, 2022
1 parent b50def3 commit 93bbc70
Show file tree
Hide file tree
Showing 12 changed files with 69 additions and 40 deletions.
16 changes: 7 additions & 9 deletions packages/docusaurus-plugin-debug/src/index.ts
Original file line number Diff line number Diff line change
Expand Up @@ -9,8 +9,6 @@ import type {LoadContext, Plugin} from '@docusaurus/types';
import {docuHash, normalizeUrl, posixPath} from '@docusaurus/utils';
import path from 'path';

export const routeBasePath = '__docusaurus/debug';

export default function pluginDebug({
siteConfig: {baseUrl},
generatedFilesDir,
Expand Down Expand Up @@ -42,37 +40,37 @@ export default function pluginDebug({

// Home is config (duplicate for now)
addRoute({
path: normalizeUrl([baseUrl, routeBasePath]),
path: normalizeUrl([baseUrl, '__docusaurus/debug']),
component: '@theme/DebugConfig',
exact: true,
});

addRoute({
path: normalizeUrl([baseUrl, routeBasePath, 'config']),
path: normalizeUrl([baseUrl, '__docusaurus/debug/config']),
component: '@theme/DebugConfig',
exact: true,
});

addRoute({
path: normalizeUrl([baseUrl, routeBasePath, 'metadata']),
path: normalizeUrl([baseUrl, '__docusaurus/debug/metadata']),
component: '@theme/DebugSiteMetadata',
exact: true,
});

addRoute({
path: normalizeUrl([baseUrl, routeBasePath, 'registry']),
path: normalizeUrl([baseUrl, '__docusaurus/debug/registry']),
component: '@theme/DebugRegistry',
exact: true,
});

addRoute({
path: normalizeUrl([baseUrl, routeBasePath, 'routes']),
path: normalizeUrl([baseUrl, '__docusaurus/debug/routes']),
component: '@theme/DebugRoutes',
exact: true,
});

addRoute({
path: normalizeUrl([baseUrl, routeBasePath, 'content']),
path: normalizeUrl([baseUrl, '__docusaurus/debug/content']),
component: '@theme/DebugContent',
exact: true,
modules: {
Expand All @@ -81,7 +79,7 @@ export default function pluginDebug({
});

addRoute({
path: normalizeUrl([baseUrl, routeBasePath, 'globalData']),
path: normalizeUrl([baseUrl, '__docusaurus/debug/globalData']),
component: '@theme/DebugGlobalData',
exact: true,
});
Expand Down
4 changes: 0 additions & 4 deletions packages/docusaurus-plugin-debug/src/plugin-debug.d.ts
Original file line number Diff line number Diff line change
Expand Up @@ -7,10 +7,6 @@

/// <reference types="@docusaurus/module-type-aliases" />

declare module '@docusaurus/plugin-debug' {
export const routeBasePath: string;
}

declare module '@theme/DebugConfig' {
export default function DebugMetadata(): JSX.Element;
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -35,6 +35,7 @@ export default function DebugLayout({
<Head>
<html lang="en" />
<title>Docusaurus debug panel</title>
<meta name="robots" content="noindex" />
</Head>

<div>
Expand Down
34 changes: 23 additions & 11 deletions packages/docusaurus-plugin-sitemap/src/createSitemap.ts
Original file line number Diff line number Diff line change
Expand Up @@ -10,10 +10,13 @@ import type {PluginOptions} from '@docusaurus/plugin-sitemap';
import type {DocusaurusConfig} from '@docusaurus/types';
import {applyTrailingSlash} from '@docusaurus/utils-common';
import {createMatcher} from '@docusaurus/utils';
import type {HelmetServerState} from 'react-helmet-async';
import type {ReactElement} from 'react';

export default async function createSitemap(
siteConfig: DocusaurusConfig,
routesPaths: string[],
helmet: {[location: string]: HelmetServerState},
options: PluginOptions,
): Promise<string> {
const {url: hostname} = siteConfig;
Expand All @@ -26,18 +29,27 @@ export default async function createSitemap(

const sitemapStream = new SitemapStream({hostname});

routesPaths
.filter((route) => !route.endsWith('404.html') && !ignoreMatcher(route))
.forEach((routePath) =>
sitemapStream.write({
url: applyTrailingSlash(routePath, {
trailingSlash: siteConfig.trailingSlash,
baseUrl: siteConfig.baseUrl,
}),
changefreq,
priority,
}),
function routeShouldBeIncluded(route: string) {
if (route.endsWith('404.html') || ignoreMatcher(route)) {
return false;
}
// https://github.com/staylor/react-helmet-async/pull/167
const meta = helmet[route]?.meta.toComponent() as unknown as ReactElement[];
return !meta.some(
(tag) => tag.props.name === 'robots' && tag.props.content === 'noindex',
);
}

routesPaths.filter(routeShouldBeIncluded).forEach((routePath) =>
sitemapStream.write({
url: applyTrailingSlash(routePath, {
trailingSlash: siteConfig.trailingSlash,
baseUrl: siteConfig.baseUrl,
}),
changefreq,
priority,
}),
);

sitemapStream.end();

Expand Down
3 changes: 2 additions & 1 deletion packages/docusaurus-plugin-sitemap/src/index.ts
Original file line number Diff line number Diff line change
Expand Up @@ -18,14 +18,15 @@ export default function pluginSitemap(
return {
name: 'docusaurus-plugin-sitemap',

async postBuild({siteConfig, routesPaths, outDir}) {
async postBuild({siteConfig, routesPaths, outDir, helmet}) {
if (siteConfig.noIndex) {
return;
}
// Generate sitemap.
const generatedSitemap = await createSitemap(
siteConfig,
routesPaths,
helmet,
options,
);

Expand Down
12 changes: 3 additions & 9 deletions packages/docusaurus-preset-classic/src/index.ts
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@
* LICENSE file in the root directory of this source tree.
*/

import {routeBasePath as debugPluginRouteBasePath} from '@docusaurus/plugin-debug';
import type {
Preset,
LoadContext,
Expand All @@ -29,21 +28,20 @@ export default function preset(
opts: Options = {},
): Preset {
const {siteConfig} = context;
const {themeConfig, baseUrl} = siteConfig;
const {themeConfig} = siteConfig;
const {algolia} = themeConfig as Partial<ThemeConfig>;
const isProd = process.env.NODE_ENV === 'production';
const {
debug,
docs,
blog,
pages,
sitemap = {},
sitemap,
theme,
googleAnalytics,
gtag,
...rest
} = opts;
const isDebugEnabled = debug || (debug === undefined && !isProd);

const themes: PluginConfig[] = [];
themes.push(makePluginConfig('@docusaurus/theme-classic', theme));
Expand Down Expand Up @@ -76,17 +74,13 @@ export default function preset(
makePluginConfig('@docusaurus/plugin-google-analytics', googleAnalytics),
);
}
if (isDebugEnabled) {
if (debug || (debug === undefined && !isProd)) {
plugins.push(require.resolve('@docusaurus/plugin-debug'));
}
if (gtag) {
plugins.push(makePluginConfig('@docusaurus/plugin-google-gtag', gtag));
}
if (isProd && sitemap !== false) {
if (isDebugEnabled) {
sitemap.ignorePatterns ??= [];
sitemap.ignorePatterns.push(`${baseUrl}${debugPluginRouteBasePath}/**`);
}
plugins.push(makePluginConfig('@docusaurus/plugin-sitemap', sitemap));
}
if (Object.keys(rest).length > 0) {
Expand Down
1 change: 1 addition & 0 deletions packages/docusaurus-types/package.json
Original file line number Diff line number Diff line change
Expand Up @@ -19,6 +19,7 @@
"commander": "^5.1.0",
"history": "^4.9.0",
"joi": "^17.6.0",
"react-helmet-async": "^1.2.3",
"utility-types": "^3.10.0",
"webpack": "^5.72.0",
"webpack-merge": "^5.8.0"
Expand Down
8 changes: 7 additions & 1 deletion packages/docusaurus-types/src/index.d.ts
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@ import type {CustomizeRuleString} from 'webpack-merge/dist/types';
import type {CommanderStatic} from 'commander';
import type {ParsedUrlQueryInput} from 'querystring';
import type Joi from 'joi';
import type {HelmetServerState} from 'react-helmet-async';
import type {
DeepRequired,
Required as RequireKeys,
Expand Down Expand Up @@ -319,7 +320,12 @@ export type Plugin<Content = unknown> = {
actions: PluginContentLoadedActions;
}) => Promise<void> | void;
routesLoaded?: (routes: RouteConfig[]) => void; // TODO remove soon, deprecated (alpha-60)
postBuild?: (props: Props & {content: Content}) => Promise<void> | void;
postBuild?: (
props: Props & {
content: Content;
helmet: {[location: string]: HelmetServerState};
},
) => Promise<void> | void;
// TODO refactor the configureWebpack API surface: use an object instead of
// multiple params (requires breaking change)
configureWebpack?: (
Expand Down
2 changes: 2 additions & 0 deletions packages/docusaurus/src/client/serverEntry.tsx
Original file line number Diff line number Diff line change
Expand Up @@ -70,6 +70,7 @@ async function doRender(locals: Locals & {path: string}) {
preBodyTags,
postBodyTags,
onLinksCollected,
onHeadTagsCollected,
baseUrl,
ssrTemplate,
noIndex,
Expand Down Expand Up @@ -105,6 +106,7 @@ async function doRender(locals: Locals & {path: string}) {
helmet.link.toString(),
helmet.script.toString(),
];
onHeadTagsCollected(location, helmet);
const metaAttributes = metaStrings.filter(Boolean);

const {generatedFilesDir} = locals;
Expand Down
11 changes: 10 additions & 1 deletion packages/docusaurus/src/commands/build.ts
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,7 @@ import {
import CleanWebpackPlugin from '../webpack/plugins/CleanWebpackPlugin';
import {loadI18n} from '../server/i18n';
import {mapAsyncSequential} from '@docusaurus/utils';
import type {HelmetServerState} from 'react-helmet-async';

export async function build(
siteDir: string,
Expand Down Expand Up @@ -149,12 +150,16 @@ async function buildLocale({
);

const allCollectedLinks: {[location: string]: string[]} = {};
const headTags: {[location: string]: HelmetServerState} = {};

let serverConfig: Configuration = await createServerConfig({
props,
onLinksCollected: (staticPagePath, links) => {
allCollectedLinks[staticPagePath] = links;
},
onHeadTagsCollected: (staticPagePath, tags) => {
headTags[staticPagePath] = tags;
},
});

if (staticDirectories.length > 0) {
Expand Down Expand Up @@ -224,7 +229,11 @@ async function buildLocale({
if (!plugin.postBuild) {
return;
}
await plugin.postBuild({...props, content: plugin.content});
await plugin.postBuild({
...props,
helmet: headTags,
content: plugin.content,
});
}),
);

Expand Down
6 changes: 6 additions & 0 deletions packages/docusaurus/src/deps.d.ts
Original file line number Diff line number Diff line change
Expand Up @@ -35,13 +35,19 @@ declare module 'react-loadable-ssr-addon-v5-slorber' {
}

declare module '@slorber/static-site-generator-webpack-plugin' {
import type {HelmetServerState} from 'react-helmet-async';

export type Locals = {
routesLocation: {[filePath: string]: string};
generatedFilesDir: string;
headTags: string;
preBodyTags: string;
postBodyTags: string;
onLinksCollected: (staticPagePath: string, links: string[]) => void;
onHeadTagsCollected: (
staticPagePath: string,
tags: HelmetServerState,
) => void;
baseUrl: string;
ssrTemplate: string;
noIndex: boolean;
Expand Down
11 changes: 7 additions & 4 deletions packages/docusaurus/src/webpack/server.ts
Original file line number Diff line number Diff line change
Expand Up @@ -17,14 +17,16 @@ import {NODE_MAJOR_VERSION, NODE_MINOR_VERSION} from '@docusaurus/utils';
import ssrDefaultTemplate from './templates/ssr.html.template';

// Forked for Docusaurus: https://github.com/slorber/static-site-generator-webpack-plugin
import StaticSiteGeneratorPlugin from '@slorber/static-site-generator-webpack-plugin';
import StaticSiteGeneratorPlugin, {
type Locals,
} from '@slorber/static-site-generator-webpack-plugin';

export default async function createServerConfig({
props,
onLinksCollected = () => {},
}: {
onLinksCollected,
onHeadTagsCollected,
}: Pick<Locals, 'onLinksCollected' | 'onHeadTagsCollected'> & {
props: Props;
onLinksCollected?: (staticPagePath: string, links: string[]) => void;
}): Promise<Configuration> {
const {
baseUrl,
Expand Down Expand Up @@ -73,6 +75,7 @@ export default async function createServerConfig({
preBodyTags,
postBodyTags,
onLinksCollected,
onHeadTagsCollected,
ssrTemplate: ssrTemplate ?? ssrDefaultTemplate,
noIndex,
},
Expand Down

0 comments on commit 93bbc70

Please sign in to comment.