sitemap.js 6.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201
  1. /**
  2. * 每天运行一次,生成站点地图
  3. */
  4. const fs = require('fs');
  5. const datefns = require('date-fns');
  6. const models = require('../../models');
  7. const categories = require('../../config/category');
  8. const tags = require('../../config/tag');
  9. const date = datefns.format(Date.now(), 'yyyy-MM-dd');
  10. const sitemapPath = __dirname + '/../../dist/sitemap.xml';
  11. const sitemapTempPath = __dirname + '/../../dist/sitemap.xml.temp';
  12. // 生成站点地图
  13. async function generateSitemap() {
  14. let commonXml = [
  15. '<?xml version="1.0" encoding="UTF-8"?>',
  16. // '<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">',
  17. '<urlset',
  18. ' xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"',
  19. ' xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd http://www.w3.org/1999/xhtml http://www.w3.org/2002/08/xhtml/xhtml1-strict.xsd"',
  20. ' xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"',
  21. ' xmlns:xhtml="http://www.w3.org/1999/xhtml"',
  22. '>',
  23. ' <url>',
  24. ' <loc>https://art.pcoloring.com/en</loc>',
  25. ` <lastmod>${date}</lastmod>`,
  26. ' <changefreq>daily</changefreq>',
  27. ' <priority>1.0</priority>',
  28. ' </url>',
  29. ' <url>',
  30. ' <loc>https://art.pcoloring.com/en/category</loc>',
  31. ` <lastmod>${date}</lastmod>`,
  32. ' <changefreq>daily</changefreq>',
  33. ' <priority>0.8</priority>',
  34. ' </url>',
  35. ' <url>',
  36. ' <loc>https://art.pcoloring.com/en/tag</loc>',
  37. ` <lastmod>${date}</lastmod>`,
  38. ' <changefreq>daily</changefreq>',
  39. ' <priority>0.8</priority>',
  40. ' </url>',
  41. ' <url>',
  42. ' <loc>https://art.pcoloring.com/en/albums</loc>',
  43. ` <lastmod>${date}</lastmod>`,
  44. ' <changefreq>weekly</changefreq>',
  45. ' <priority>0.8</priority>',
  46. ' </url>',
  47. ' <url>',
  48. ' <loc>https://art.pcoloring.com/en/special</loc>',
  49. ` <lastmod>${date}</lastmod>`,
  50. ' <changefreq>daily</changefreq>',
  51. ' <priority>0.8</priority>',
  52. ' </url>',
  53. ' <url>',
  54. ' <loc>https://art.pcoloring.com/en/artists</loc>',
  55. ` <lastmod>${date}</lastmod>`,
  56. ' <changefreq>monthly</changefreq>',
  57. ' <priority>0.8</priority>',
  58. ' </url>',
  59. ' <url>',
  60. ' <loc>https://art.pcoloring.com/en/info</loc>',
  61. ` <lastmod>${date}</lastmod>`,
  62. ' </url>',
  63. ];
  64. // categories
  65. let categoriesXml = [];
  66. categories.forEach(e => {
  67. categoriesXml = categoriesXml.concat([
  68. ' <url>',
  69. ` <loc>https://art.pcoloring.com/en/category/${e.id}</loc>`,
  70. ` <lastmod>${date}</lastmod>`,
  71. ' </url>',
  72. ]
  73. );
  74. });
  75. console.log(categoriesXml);
  76. // tags
  77. let tagsXml = [];
  78. tags.forEach(e => {
  79. tagsXml = tagsXml.concat([
  80. ' <url>',
  81. ` <loc>https://art.pcoloring.com/en/tag/${e.tag}</loc>`,
  82. ` <lastmod>${date}</lastmod>`,
  83. ' </url>',
  84. ]);
  85. });
  86. console.log(tagsXml);
  87. // albums
  88. let albums = await models.ArtAlbum
  89. .find({ pid: 'art', enabled: true })
  90. .sort({ order: 'asc' })
  91. .select('_id')
  92. .lean()
  93. .exec();
  94. let albumsXml = [];
  95. albums.forEach(e => {
  96. albumsXml = albumsXml.concat([
  97. ' <url>',
  98. ` <loc>https://art.pcoloring.com/en/coloring-page-album/${e._id}</loc>`,
  99. ` <lastmod>${date}</lastmod>`,
  100. ' </url>',
  101. ])
  102. });
  103. console.log(albumsXml);
  104. // designers
  105. let designers = await models.Art.aggregate([
  106. // 首先,过滤出 status = 9000 的文档
  107. { $match: { open: true, status: 9000 } },
  108. // 首先,根据 user 字段进行分组,并计算每个 user 出现的次数
  109. { $group: { _id: '$user', count: { $sum: 1 } } },
  110. // 然后,按照 count 字段进行降序排列
  111. { $sort: { count: -1 } },
  112. // 接着,与 users 集合进行连接,以获取用户的详细信息
  113. {
  114. $lookup: {
  115. from: 'users', // 要连接的集合名称
  116. localField: '_id', // 本地字段(即上一步分组后的 _id 字段)
  117. foreignField: '_id', // 要连接的集合中的字段
  118. as: 'userDetails' // 连接后结果存储在新字段 userDetails 中
  119. }
  120. },
  121. // 展开 userDetails 数组,以便将用户信息提升到顶层
  122. { $unwind: '$userDetails' },
  123. // 调整输出格式,只保留需要的字段
  124. { $project: { _id: 1, user: '$_id', count: 1, username: '$userDetails.username', name: '$userDetails.name' } },
  125. // 限制返回的记录数量
  126. { $limit: 40 }
  127. ]);
  128. let designersXml = [];
  129. designers.forEach(e => {
  130. designersXml = designersXml.concat([
  131. ' <url>',
  132. ` <loc>https://art.pcoloring.com/en/artist/${e._id}</loc>`,
  133. ` <lastmod>${date}</lastmod>`,
  134. ' </url>',
  135. ])
  136. });
  137. console.log(designersXml);
  138. // details
  139. let detailsXml = [];
  140. const cursor = await models.Art
  141. .find({ open: true, status: 9000 })
  142. .select('name title')
  143. .sort({ publishTime: -1 }).cursor(); // 使用cursor,避免一次查询太多记录内存受不了
  144. // 遍历游标中的每个文档
  145. for await (const doc of cursor) {
  146. let uriTitle = doc.name;
  147. if (doc.title) {
  148. try {
  149. let titleJson = JSON.parse(doc.title);
  150. if (titleJson.en) uriTitle = titleJson.en; // URL 里还是尽量用英文title
  151. } catch (e) {
  152. console.error(e.message);
  153. }
  154. }
  155. let utf8name = encodeURIComponent(uriTitle.replace(/[\s_]+/g, '-')).toLowerCase();
  156. detailsXml = detailsXml.concat([
  157. ' <url>',
  158. ` <loc>https://art.pcoloring.com/en/coloring-page/${utf8name}-${doc._id}</loc>`,
  159. ` <lastmod>${date}</lastmod>`,
  160. ' </url>',
  161. ]);
  162. console.log(`process detail ${doc._id} url done`);
  163. }
  164. let endXml = ['</urlset>'];
  165. let sitemapXml = [...commonXml, ...categoriesXml, ...tagsXml, ...albumsXml, ...designersXml, ...detailsXml, ...endXml];
  166. let sitemapXmlStr = sitemapXml.join('\n');
  167. fs.writeFileSync(sitemapTempPath, sitemapXmlStr); // 先写入临时文件
  168. fs.renameSync(sitemapTempPath, sitemapPath); // 再重命名
  169. console.log('生成sitemap成功');
  170. }
  171. function run() {
  172. generateSitemap();
  173. }
  174. module.exports = { run }
  175. if (require.main == module) {
  176. run();
  177. }