sitemap.js 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249
  1. /**
  2. * 每天运行一次,生成站点地图
  3. */
  4. const fs = require('fs');
  5. const datefns = require('date-fns');
  6. const models = require('../../models');
  7. const categories = require('../../config/category');
  8. const tags = require('../../config/tag');
  9. const date = datefns.format(Date.now(), 'yyyy-MM-dd');
  10. const sitemapPath = __dirname + '/../../dist/sitemap.xml';
  11. const sitemapTempPath = __dirname + '/../../dist/sitemap.xml.temp';
  12. // 生成站点地图
  13. async function generateSitemap() {
  14. let commonXml = [
  15. '<?xml version="1.0" encoding="UTF-8"?>',
  16. // '<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">',
  17. '<urlset',
  18. ' xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"',
  19. ' xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd http://www.w3.org/1999/xhtml http://www.w3.org/2002/08/xhtml/xhtml1-strict.xsd"',
  20. ' xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"',
  21. ' xmlns:xhtml="http://www.w3.org/1999/xhtml"',
  22. '>',
  23. ' <url>',
  24. ' <loc>https://art.pcoloring.com</loc>',
  25. ' <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en" />',
  26. ' <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es" />',
  27. ' <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt" />',
  28. ' <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja" />',
  29. ' <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh" />',
  30. ` <lastmod>${date}</lastmod>`,
  31. ' </url>',
  32. ' <url>',
  33. ' <loc>https://art.pcoloring.com/en/category</loc>',
  34. ' <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/category" />',
  35. ' <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/category" />',
  36. ' <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/category" />',
  37. ' <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/category" />',
  38. ' <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/category" />',
  39. ` <lastmod>${date}</lastmod>`,
  40. ' </url>',
  41. ' <url>',
  42. ' <loc>https://art.pcoloring.com/en/tag</loc>',
  43. ' <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/tag" />',
  44. ' <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/tag" />',
  45. ' <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/tag" />',
  46. ' <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/tag" />',
  47. ' <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/tag" />',
  48. ` <lastmod>${date}</lastmod>`,
  49. ' </url>',
  50. ' <url>',
  51. ' <loc>https://art.pcoloring.com/en/albums</loc>',
  52. ' <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/albums" />',
  53. ' <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/albums" />',
  54. ' <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/albums" />',
  55. ' <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/albums" />',
  56. ' <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/albums" />',
  57. ` <lastmod>${date}</lastmod>`,
  58. ' </url>',
  59. ' <url>',
  60. ' <loc>https://art.pcoloring.com/en/special</loc>',
  61. ' <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/special" />',
  62. ' <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/special" />',
  63. ' <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/special" />',
  64. ' <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/special" />',
  65. ' <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/special" />',
  66. ` <lastmod>${date}</lastmod>`,
  67. ' </url>',
  68. ' <url>',
  69. ' <loc>https://art.pcoloring.com/en/designers</loc>',
  70. ' <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/designers" />',
  71. ' <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/designers" />',
  72. ' <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/designers" />',
  73. ' <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/designers" />',
  74. ' <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/designers" />',
  75. ` <lastmod>${date}</lastmod>`,
  76. ' </url>',
  77. ' <url>',
  78. ' <loc>https://art.pcoloring.com/en/info</loc>',
  79. ' <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/info" />',
  80. ' <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/info" />',
  81. ' <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/info" />',
  82. ' <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/info" />',
  83. ' <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/info" />',
  84. ` <lastmod>${date}</lastmod>`,
  85. ' </url>',
  86. ];
  87. // categories
  88. let categoriesXml = [];
  89. categories.forEach(e => {
  90. categoriesXml = categoriesXml.concat([
  91. ' <url>',
  92. ` <loc>https://art.pcoloring.com/en/category/${e.id}</loc>`,
  93. ` <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/category/${e.id}" />`,
  94. ` <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/category/${e.id}" />`,
  95. ` <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/category/${e.id}" />`,
  96. ` <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/category/${e.id}" />`,
  97. ` <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/category/${e.id}" />`,
  98. ` <lastmod>${date}</lastmod>`,
  99. ' </url>',
  100. ]
  101. );
  102. });
  103. console.log(categoriesXml);
  104. // tags
  105. let tagsXml = [];
  106. tags.forEach(e => {
  107. tagsXml = tagsXml.concat([
  108. ' <url>',
  109. ` <loc>https://art.pcoloring.com/en/tag/${e.tag}</loc>`,
  110. ` <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/tag/${e.tag}" />`,
  111. ` <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/tag/${e.tag}" />`,
  112. ` <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/tag/${e.tag}" />`,
  113. ` <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/tag/${e.tag}" />`,
  114. ` <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/tag/${e.tag}" />`,
  115. ` <lastmod>${date}</lastmod>`,
  116. ' </url>',
  117. ]);
  118. });
  119. console.log(tagsXml);
  120. // albums
  121. let albums = await models.ArtAlbum
  122. .find({ pid: 'art', enabled: true })
  123. .sort({ order: 'asc' })
  124. .select('_id')
  125. .lean()
  126. .exec();
  127. let albumsXml = [];
  128. albums.forEach(e => {
  129. albumsXml = albumsXml.concat([
  130. ' <url>',
  131. ` <loc>https://art.pcoloring.com/en/album/${e._id}</loc>`,
  132. ` <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/album/${e._id}" />`,
  133. ` <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/album/${e._id}" />`,
  134. ` <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/album/${e._id}" />`,
  135. ` <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/album/${e._id}" />`,
  136. ` <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/album/${e._id}" />`,
  137. ` <lastmod>${date}</lastmod>`,
  138. ' </url>',
  139. ])
  140. });
  141. console.log(albumsXml);
  142. // designers
  143. let designers = await models.Art.aggregate([
  144. // 首先,过滤出 status = 9000 的文档
  145. { $match: { open: true, status: 9000 } },
  146. // 首先,根据 user 字段进行分组,并计算每个 user 出现的次数
  147. { $group: { _id: '$user', count: { $sum: 1 } } },
  148. // 然后,按照 count 字段进行降序排列
  149. { $sort: { count: -1 } },
  150. // 接着,与 users 集合进行连接,以获取用户的详细信息
  151. {
  152. $lookup: {
  153. from: 'users', // 要连接的集合名称
  154. localField: '_id', // 本地字段(即上一步分组后的 _id 字段)
  155. foreignField: '_id', // 要连接的集合中的字段
  156. as: 'userDetails' // 连接后结果存储在新字段 userDetails 中
  157. }
  158. },
  159. // 展开 userDetails 数组,以便将用户信息提升到顶层
  160. { $unwind: '$userDetails' },
  161. // 调整输出格式,只保留需要的字段
  162. { $project: { _id: 1, user: '$_id', count: 1, username: '$userDetails.username', name: '$userDetails.name' } },
  163. // 限制返回的记录数量
  164. { $limit: 40 }
  165. ]);
  166. let designersXml = [];
  167. designers.forEach(e => {
  168. designersXml = designersXml.concat([
  169. ' <url>',
  170. ` <loc>https://art.pcoloring.com/en/designer/${e._id}</loc>`,
  171. ` <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/designer/${e._id}" />`,
  172. ` <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/designer/${e._id}" />`,
  173. ` <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/designer/${e._id}" />`,
  174. ` <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/designer/${e._id}" />`,
  175. ` <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/designer/${e._id}" />`,
  176. ` <lastmod>${date}</lastmod>`,
  177. ' </url>',
  178. ])
  179. });
  180. console.log(designersXml);
  181. // details
  182. let detailsXml = [];
  183. const cursor = await models.Art
  184. .find({ open: true, status: 9000 })
  185. .select('name title')
  186. .sort({ publishTime: -1 }).cursor(); // 使用cursor,避免一次查询太多记录内存受不了
  187. // 遍历游标中的每个文档
  188. for await (const doc of cursor) {
  189. let uriTitle = doc.name;
  190. if (doc.title) {
  191. try {
  192. let titleJson = JSON.parse(doc.title);
  193. if (titleJson.en) uriTitle = titleJson.en; // URL 里还是尽量用英文title
  194. } catch (e) {
  195. console.error(e.message);
  196. }
  197. }
  198. let utf8name = encodeURIComponent(uriTitle.replace(/[\s_]+/g, '-')).toLowerCase();
  199. detailsXml = detailsXml.concat([
  200. ' <url>',
  201. ` <loc>https://art.pcoloring.com/en/coloring-page/${utf8name}-${doc._id}</loc>`,
  202. ` <xhtml:link rel="alternate" hreflang="en" href="https://art.pcoloring.com/en/coloring-page/${utf8name}-${doc._id}" />`,
  203. ` <xhtml:link rel="alternate" hreflang="es" href="https://art.pcoloring.com/es/coloring-page/${utf8name}-${doc._id}" />`,
  204. ` <xhtml:link rel="alternate" hreflang="pt" href="https://art.pcoloring.com/pt/coloring-page/${utf8name}-${doc._id}" />`,
  205. ` <xhtml:link rel="alternate" hreflang="ja" href="https://art.pcoloring.com/ja/coloring-page/${utf8name}-${doc._id}" />`,
  206. ` <xhtml:link rel="alternate" hreflang="zh" href="https://art.pcoloring.com/zh/coloring-page/${utf8name}-${doc._id}" />`,
  207. ` <lastmod>${date}</lastmod>`,
  208. ' </url>',
  209. ]);
  210. console.log(`process detail ${doc._id} url done`);
  211. }
  212. let endXml = ['</urlset>'];
  213. let sitemapXml = [...commonXml, ...categoriesXml, ...tagsXml, ...albumsXml, ...designersXml, ...detailsXml, ...endXml];
  214. let sitemapXmlStr = sitemapXml.join('\n');
  215. fs.writeFileSync(sitemapTempPath, sitemapXmlStr); // 先写入临时文件
  216. fs.renameSync(sitemapTempPath, sitemapPath); // 再重命名
  217. console.log('生成sitemap成功');
  218. }
  219. function run() {
  220. generateSitemap();
  221. }
  222. module.exports = { run }
  223. if (require.main == module) {
  224. run();
  225. }