feat: Add new source: freebuf (#260)

bruceblink · web-flow · commit 57cb70ecc9c5 · 2025-12-06T19:02:45.000+08:00
* feat: Add new source: freebuf

* fix: 修复freebuf新闻id为空字符串的问题，现在使用截取文章url的方式获取文章id
diff --git a/public/icons/freebuf.png b/public/icons/freebuf.png
diff --git a/server/glob.d.ts b/server/glob.d.ts
@@ -11,6 +11,7 @@ declare module 'glob:./sources/{*.ts,**/index.ts}' {
   export const douban: typeof import('./sources/douban')
   export const douyin: typeof import('./sources/douyin')
   export const fastbull: typeof import('./sources/fastbull')
+  export const freebuf: typeof import('./sources/freebuf')
   export const gelonghui: typeof import('./sources/gelonghui')
   export const ghxi: typeof import('./sources/ghxi')
   export const github: typeof import('./sources/github')
diff --git a/server/sources/freebuf.ts b/server/sources/freebuf.ts
@@ -0,0 +1,184 @@
+import * as cheerio from "cheerio"
+
+// Per-article counters (view count and collection count), filled in by extractStats
+interface ArticleStats {
+  views: number
+  collections: number
+}
+
+// Author details for an article; only `name` is required, avatar and profile URL are optional
+interface AuthorInfo {
+  name: string
+  avatar?: string
+  profileUrl?: string
+}
+
+// One parsed article entry; `album`, `image` and `category` are optional
+interface ArticleData {
+  title: string
+  url: string
+  description: string
+  publishTime: string
+  author: AuthorInfo
+  stats: ArticleStats
+  album?: string
+  image?: string
+  category?: string
+}
+
+// Helper: trimmed text of the first descendant of $element matching selector, or "" when that text is empty
+function safeExtract($element: cheerio.Cheerio<any>, selector: string): string {
+  const result = $element.find(selector).first().text().trim()
+  return result || ""
+}
+
+// Helper: value of `attribute` on the first descendant matching selector, or "" when it is missing or empty
+function safeExtractAttribute($element: cheerio.Cheerio<any>, selector: string, attribute: string): string {
+  return $element.find(selector).first().attr(attribute) || ""
+}
+
+// Helper: "" for a missing url; urls starting with "http" are returned unchanged; anything else is appended to baseUrl by plain concatenation (no "/" is inserted)
+function formatUrl(url: string | undefined, baseUrl: string = "https://www.freebuf.com"): string {
+  if (!url) return ""
+  return url.startsWith("http") ? url : `${baseUrl}${url}`
+}
+
+// Helper: reads the view and collection counters from an article element; each counter stays 0 when its link is absent or its text does not parse to a non-zero integer
+function extractStats($article: cheerio.Cheerio<any>): ArticleStats {
+  const stats: ArticleStats = { views: 0, collections: 0 }
+
+  // View count: integer parsed from the first <span> inside the link(s) whose text contains "围观"
+  const viewElement = $article.find("a:contains(\"围观\")")
+  if (viewElement.length) {
+    const viewText = viewElement.find("span").first().text()
+    stats.views = Number.parseInt(viewText) || 0
+  }
+
+  // Collection count: integer parsed from the first <span> inside the link(s) whose text contains "收藏"
+  const collectElement = $article.find("a:contains(\"收藏\")")
+  if (collectElement.length) {
+    const collectText = collectElement.find("span").first().text()
+    stats.collections = Number.parseInt(collectText) || 0
+  }
+
+  return stats
+}
+
+// Helper: builds the author info from the first link under .item-bottom (name from its last <span>, profile URL from its href, avatar from .ant-avatar img); name stays "" when no such link exists
+function extractAuthor($article: cheerio.Cheerio<any>): AuthorInfo {
+  const author: AuthorInfo = { name: "" }
+
+  const authorLink = $article.find(".item-bottom a").first()
+  if (authorLink.length) {
+    author.name = authorLink.find("span").last().text().trim()
+    author.profileUrl = formatUrl(authorLink.attr("href"))
+
+    const avatarImg = authorLink.find(".ant-avatar img")
+    if (avatarImg.length) {
+      author.avatar = avatarImg.attr("src")
+    }
+  }
+
+  return author
+}
+
+// Helper: maps the title link's href to a category label; returns "" when none of the known path segments is present
+function extractCategory($article: cheerio.Cheerio<any>): string {
+  // Infer the category from the URL path of the title link (the parent of ".title-left .title")
+  const articleUrl = $article.find(".title-left .title").parent().attr("href") || ""
+  if (articleUrl.includes("/articles/web/")) return "Web安全"
+  if (articleUrl.includes("/articles/database/")) return "数据安全"
+  if (articleUrl.includes("/articles/network/")) return "网络安全"
+  if (articleUrl.includes("/articles/mobile/")) return "移动安全"
+  if (articleUrl.includes("/articles/cloud/")) return "云安全"
+
+  return ""
+}
+
+// Derives the news id from a freebuf article url: the first run of digits after the last "/", or "" when there is none
+function extractIdFromUrl(url: string): string {
+  // Take everything after the last slash
+  const lastPart = url.slice(url.lastIndexOf("/") + 1) // "460614.html"
+  // Keep only the first run of digits, which drops the ".html" suffix
+  const match = lastPart.match(/\d+/)
+  return match ? match[0] : ""
+}
+
+export default defineSource(async () => {
+  const baseUrl = "https://www.freebuf.com"
+  const html = await myFetch<any>(baseUrl, {
+    headers: {
+      "User-Agent":
+                "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/121.0.0.0 Safari/537.36",
+      "Referer": "https://www.freebuf.com/",
+      "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7",
+    },
+  })
+  const $ = cheerio.load(html)
+  const articles: ArticleData[] = []
+  // Walk every .article-item element of the fetched home page and collect its fields
+  $(".article-item").each((index: number, articleElement) => {
+    const $article = $(articleElement)
+
+    try {
+      // Title and URL come from the link that wraps ".title-left .title"
+      const titleLink = $article.find(".title-left .title").parent()
+      const title = titleLink.find(".title").text().trim()
+      const url = formatUrl(titleLink.attr("href"), baseUrl)
+
+      // Skip this item when the title is empty
+      if (!title) return
+
+      // Article description
+      const description = safeExtract($article, ".item-right .text-line-2")
+
+      // Publish time, taken as displayed text from ".item-bottom span:last-child"
+      const publishTime = safeExtract($article, ".item-bottom span:last-child")
+
+      // Author info
+      const author = extractAuthor($article)
+
+      // View / collection counters
+      const stats = extractStats($article)
+
+      // Album (column) name
+      const album = safeExtract($article, ".from-column span")
+
+      // Cover image src
+      const image = safeExtractAttribute($article, ".img-view img", "src")
+
+      // Category inferred from the article URL
+      const category = extractCategory($article)
+
+      // Assemble the article record; empty album/image/category are stored as undefined
+      const article: ArticleData = {
+        title,
+        url,
+        description,
+        publishTime,
+        author,
+        stats,
+        album: album || undefined,
+        image: image || undefined,
+        category: category || undefined,
+      }
+
+      articles.push(article)
+    } catch (error) {
+      console.warn(`解析第${index + 1}篇文章时出错:`, error instanceof Error ? error.message : String(error))
+    }
+  })
+  // Convert to the returned item shape: id is cut from the url, description becomes the hover text; image and category are not included in the output
+  return articles.map(item => ({
+    id: extractIdFromUrl(item.url),
+    title: item.title,
+    url: item.url,
+    extra: {
+      hover: item.description,
+      time: item.publishTime,
+      author: item.author,
+      stats: item.stats,
+      album: item.album,
+    },
+  }))
+})
diff --git a/shared/pinyin.json b/shared/pinyin.json
@@ -44,5 +44,6 @@
   "chongbuluo-hot": "chongbuluo-zuire",
   "douban": "douban-remendianying",
   "steam": "Steam-zaixianrenshu",
-  "tencent-hot": "tengxunxinwen-zonghezaobao"
+  "tencent-hot": "tengxunxinwen-zonghezaobao",
+  "freebuf": "Freebuf-wangluoanquan"
 }
diff --git a/shared/pre-sources.ts b/shared/pre-sources.ts
@@ -443,6 +443,14 @@ export const originSources = {
       },
     },
   },
+  "freebuf": {
+    name: "Freebuf",
+    column: "china",
+    title: "网络安全",
+    color: "green",
+    type: "hottest",
+    home: "https://www.freebuf.com/",
+  },
 } as const satisfies Record<string, OriginSource>
 
 export function genSources() {
diff --git a/shared/sources.json b/shared/sources.json
@@ -509,5 +509,14 @@
     "color": "blue",
     "interval": 1800000,
     "title": "综合早报"
+  },
+  "freebuf": {
+    "title": "网络安全",
+    "name": "Freebuf",
+    "type": "hottest",
+    "column": "china",
+    "home": "https://www.freebuf.com/",
+    "color": "green",
+    "interval": 600000
   }
 }

Original file line number	Diff line number	Diff line change
`@@ -44,5 +44,6 @@`
`44`	`44`	`"chongbuluo-hot": "chongbuluo-zuire",`
`45`	`45`	`"douban": "douban-remendianying",`
`46`	`46`	`"steam": "Steam-zaixianrenshu",`
`47`		`- "tencent-hot": "tengxunxinwen-zonghezaobao"`
	`47`	`+ "tencent-hot": "tengxunxinwen-zonghezaobao",`
	`48`	`+ "freebuf": "Freebuf-wangluoanquan"`
`48`	`49`	`}`