2022-03-18 22:35:45 +00:00
|
|
|
import type { AstroConfig, AstroIntegration } from 'astro';
|
2022-06-20 19:31:39 +00:00
|
|
|
import {
|
|
|
|
EnumChangefreq,
|
|
|
|
simpleSitemapAndIndex,
|
2023-03-20 16:02:07 +00:00
|
|
|
type LinkItem as LinkItemBase,
|
|
|
|
type SitemapItemLoose,
|
2022-06-20 19:31:39 +00:00
|
|
|
} from 'sitemap';
|
2022-06-16 19:08:44 +00:00
|
|
|
import { fileURLToPath } from 'url';
|
2022-06-16 19:06:48 +00:00
|
|
|
import { ZodError } from 'zod';
|
2022-03-18 22:35:45 +00:00
|
|
|
|
2022-06-21 15:29:18 +00:00
|
|
|
import { generateSitemap } from './generate-sitemap.js';
|
|
|
|
import { Logger } from './utils/logger.js';
|
|
|
|
import { validateOptions } from './validate-options.js';
|
2022-06-16 19:06:48 +00:00
|
|
|
|
2023-05-25 09:15:26 +00:00
|
|
|
export { EnumChangefreq as ChangeFreqEnum } from 'sitemap';
|
2023-02-17 18:46:00 +00:00
|
|
|
export type ChangeFreq = `${EnumChangefreq}`;
|
2022-06-16 19:06:48 +00:00
|
|
|
export type SitemapItem = Pick<
|
|
|
|
SitemapItemLoose,
|
|
|
|
'url' | 'lastmod' | 'changefreq' | 'priority' | 'links'
|
|
|
|
>;
|
|
|
|
export type LinkItem = LinkItemBase;
|
|
|
|
|
|
|
|
export type SitemapOptions =
|
2022-04-02 18:29:59 +00:00
|
|
|
| {
|
2023-07-14 19:32:59 +00:00
|
|
|
filter?(page: string): boolean;
|
|
|
|
customPages?: string[];
|
|
|
|
|
|
|
|
i18n?: {
|
|
|
|
defaultLocale: string;
|
|
|
|
locales: Record<string, string>;
|
|
|
|
};
|
|
|
|
// number of entries per sitemap file
|
|
|
|
entryLimit?: number;
|
|
|
|
|
|
|
|
// sitemap specific
|
|
|
|
changefreq?: ChangeFreq;
|
|
|
|
lastmod?: Date;
|
|
|
|
priority?: number;
|
|
|
|
|
|
|
|
// called for each sitemap item just before to save them on disk, sync or async
|
|
|
|
serialize?(item: SitemapItem): SitemapItem | Promise<SitemapItem | undefined> | undefined;
|
|
|
|
}
|
2022-04-02 18:29:59 +00:00
|
|
|
| undefined;
|
|
|
|
|
2022-06-16 19:06:48 +00:00
|
|
|
function formatConfigErrorMessage(err: ZodError) {
|
|
|
|
const errorList = err.issues.map((issue) => ` ${issue.path.join('.')} ${issue.message + '.'}`);
|
|
|
|
return errorList.join('\n');
|
2022-03-18 22:35:45 +00:00
|
|
|
}
|
|
|
|
|
2022-06-16 19:06:48 +00:00
|
|
|
const PKG_NAME = '@astrojs/sitemap';
|
|
|
|
const OUTFILE = 'sitemap-index.xml';
|
2023-07-14 19:30:33 +00:00
|
|
|
const STATUS_CODE_PAGES = new Set(['/404', '/500']);
|
2022-06-16 19:06:48 +00:00
|
|
|
|
|
|
|
const createPlugin = (options?: SitemapOptions): AstroIntegration => {
|
2022-03-18 22:35:45 +00:00
|
|
|
let config: AstroConfig;
|
2023-05-03 16:19:45 +00:00
|
|
|
const logger = new Logger(PKG_NAME);
|
|
|
|
|
2022-03-18 22:35:45 +00:00
|
|
|
return {
|
2022-06-16 19:06:48 +00:00
|
|
|
name: PKG_NAME,
|
|
|
|
|
2022-03-18 22:35:45 +00:00
|
|
|
hooks: {
|
2022-06-16 19:06:48 +00:00
|
|
|
'astro:config:done': async ({ config: cfg }) => {
|
|
|
|
config = cfg;
|
2022-03-18 22:35:45 +00:00
|
|
|
},
|
2022-06-16 19:06:48 +00:00
|
|
|
|
2023-05-08 20:12:41 +00:00
|
|
|
'astro:build:done': async ({ dir, routes, pages }) => {
|
2022-06-16 19:06:48 +00:00
|
|
|
try {
|
2023-05-03 16:19:45 +00:00
|
|
|
if (!config.site) {
|
|
|
|
logger.warn(
|
|
|
|
'The Sitemap integration requires the `site` astro.config option. Skipping.'
|
|
|
|
);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2022-06-16 19:06:48 +00:00
|
|
|
const opts = validateOptions(config.site, options);
|
|
|
|
|
2022-06-30 16:02:39 +00:00
|
|
|
const { filter, customPages, serialize, entryLimit } = opts;
|
2022-06-16 19:06:48 +00:00
|
|
|
|
|
|
|
let finalSiteUrl: URL;
|
2022-06-30 16:02:39 +00:00
|
|
|
if (config.site) {
|
2022-06-16 19:06:48 +00:00
|
|
|
finalSiteUrl = new URL(config.base, config.site);
|
2022-06-30 16:02:39 +00:00
|
|
|
} else {
|
|
|
|
console.warn(
|
|
|
|
'The Sitemap integration requires the `site` astro.config option. Skipping.'
|
|
|
|
);
|
|
|
|
return;
|
2022-06-16 19:06:48 +00:00
|
|
|
}
|
|
|
|
|
2023-07-14 19:32:59 +00:00
|
|
|
let pageUrls = pages
|
|
|
|
.filter((p) => !STATUS_CODE_PAGES.has('/' + p.pathname.slice(0, -1)))
|
|
|
|
.map((p) => {
|
|
|
|
if (p.pathname !== '' && !finalSiteUrl.pathname.endsWith('/'))
|
|
|
|
finalSiteUrl.pathname += '/';
|
|
|
|
const path = finalSiteUrl.pathname + p.pathname;
|
|
|
|
return new URL(path, finalSiteUrl).href;
|
|
|
|
});
|
2023-05-08 20:12:41 +00:00
|
|
|
|
|
|
|
let routeUrls = routes.reduce<string[]>((urls, r) => {
|
2023-07-17 20:29:56 +00:00
|
|
|
// Only expose pages, not endpoints or redirects
|
|
|
|
if (r.type !== 'page') return urls;
|
|
|
|
|
2023-05-03 16:19:45 +00:00
|
|
|
/**
|
|
|
|
* Dynamic URLs have entries with `undefined` pathnames
|
|
|
|
*/
|
|
|
|
if (r.pathname) {
|
2023-07-14 19:30:33 +00:00
|
|
|
if (STATUS_CODE_PAGES.has(r.pathname)) return urls;
|
2023-05-03 16:19:45 +00:00
|
|
|
/**
|
|
|
|
* remove the initial slash from relative pathname
|
|
|
|
* because `finalSiteUrl` always has trailing slash
|
|
|
|
*/
|
|
|
|
const path = finalSiteUrl.pathname + r.generate(r.pathname).substring(1);
|
|
|
|
|
|
|
|
let newUrl = new URL(path, finalSiteUrl).href;
|
|
|
|
|
|
|
|
if (config.trailingSlash === 'never') {
|
|
|
|
urls.push(newUrl);
|
|
|
|
} else if (config.build.format === 'directory' && !newUrl.endsWith('/')) {
|
|
|
|
urls.push(newUrl + '/');
|
|
|
|
} else {
|
|
|
|
urls.push(newUrl);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return urls;
|
|
|
|
}, []);
|
2022-06-16 19:06:48 +00:00
|
|
|
|
2023-06-02 08:07:44 +00:00
|
|
|
pageUrls = Array.from(new Set([...pageUrls, ...routeUrls, ...(customPages ?? [])]));
|
|
|
|
|
2022-06-16 19:06:48 +00:00
|
|
|
try {
|
|
|
|
if (filter) {
|
|
|
|
pageUrls = pageUrls.filter(filter);
|
|
|
|
}
|
|
|
|
} catch (err) {
|
|
|
|
logger.error(`Error filtering pages\n${(err as any).toString()}`);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (pageUrls.length === 0) {
|
2023-05-03 16:19:45 +00:00
|
|
|
logger.warn(`No pages found!\n\`${OUTFILE}\` not created.`);
|
2022-06-16 19:06:48 +00:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
let urlData = generateSitemap(pageUrls, finalSiteUrl.href, opts);
|
|
|
|
|
|
|
|
if (serialize) {
|
|
|
|
try {
|
2022-06-20 19:29:53 +00:00
|
|
|
const serializedUrls: SitemapItem[] = [];
|
2022-06-16 19:06:48 +00:00
|
|
|
for (const item of urlData) {
|
|
|
|
const serialized = await Promise.resolve(serialize(item));
|
2022-06-27 18:12:43 +00:00
|
|
|
if (serialized) {
|
|
|
|
serializedUrls.push(serialized);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if (serializedUrls.length === 0) {
|
|
|
|
logger.warn('No pages found!');
|
|
|
|
return;
|
2022-06-16 19:06:48 +00:00
|
|
|
}
|
|
|
|
urlData = serializedUrls;
|
|
|
|
} catch (err) {
|
|
|
|
logger.error(`Error serializing pages\n${(err as any).toString()}`);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
await simpleSitemapAndIndex({
|
|
|
|
hostname: finalSiteUrl.href,
|
|
|
|
destinationDir: fileURLToPath(dir),
|
|
|
|
sourceData: urlData,
|
|
|
|
limit: entryLimit,
|
|
|
|
gzip: false,
|
|
|
|
});
|
|
|
|
logger.success(`\`${OUTFILE}\` is created.`);
|
|
|
|
} catch (err) {
|
|
|
|
if (err instanceof ZodError) {
|
|
|
|
logger.warn(formatConfigErrorMessage(err));
|
|
|
|
} else {
|
|
|
|
throw err;
|
|
|
|
}
|
2022-05-12 20:19:58 +00:00
|
|
|
}
|
2022-03-18 22:35:45 +00:00
|
|
|
},
|
|
|
|
},
|
|
|
|
};
|
2022-06-16 19:06:48 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
export default createPlugin;
|