25개 이상의 토픽을 선택하실 수 없습니다. Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 
 
 
 
 

23 lines
1.4 KiB

  -- Crawler: intermediate (staging) table for scraped news data.
  --
  -- Rows are unique per (`type`, `origin_id`), i.e. per source-site article
  -- within a source type. Both a processed and an original copy of the body
  -- and cover image are kept. The COMMENT '...' strings below are stored in
  -- the schema metadata and are intentionally left verbatim.
  CREATE TABLE IF NOT EXISTS `pap_spider_news` (
      `id` int(11) NOT NULL AUTO_INCREMENT,
      -- Article ID on the source site; forms the dedup key together with `type`.
      `origin_id` int(11) NOT NULL DEFAULT 0 COMMENT '原站文章ID',
      `type` varchar(20) NOT NULL DEFAULT 'news' COMMENT '来源类型 news/about',
      `title` varchar(500) NOT NULL DEFAULT '' COMMENT '文章标题',
      `category` varchar(100) DEFAULT '' COMMENT '原站栏目分类',
      `publish_time` datetime DEFAULT NULL COMMENT '原站发布时间',
      -- Processed body (images already re-hosted) vs. the raw source HTML.
      `content` longtext COMMENT '处理后的正文(图片已转存)',
      `content_original` longtext COMMENT '原始正文HTML(未处理图片)',
      -- Cover image after re-hosting vs. the original cover URL.
      `cover` varchar(500) DEFAULT '' COMMENT '封面图(转存后)',
      `cover_original` varchar(500) DEFAULT '' COMMENT '原始封面图URL',
      -- JSON text mapping original image URLs to their re-hosted counterparts.
      `images` text COMMENT '图片映射JSON [{original, new}]',
      -- Pipeline state code: 0 = pending crawl, 1 = detail crawled,
      -- 2 = images re-hosted, 3 = synced to the article table, -1 = failed.
      -- Declared as plain TINYINT instead of TINYINT(1): this is a multi-valued
      -- code, not a flag, and some connectors (e.g. MySQL Connector/J with
      -- tinyInt1isBit) map TINYINT(1) to a boolean. Storage and range are the same.
      `status` tinyint DEFAULT 0 COMMENT '0待爬取 1已爬取详情 2图片已转存 3已同步到article -1失败',
      -- ID of the row in the article table once synced; defaults to 0.
      `article_id` int(11) DEFAULT 0 COMMENT '同步到article表后的ID',
      `error_msg` varchar(1000) DEFAULT '' COMMENT '错误信息',
      -- Timestamps are maintained by the server: set on insert, and
      -- `update_time` is refreshed automatically on every row update.
      `create_time` datetime DEFAULT CURRENT_TIMESTAMP,
      `update_time` datetime DEFAULT CURRENT_TIMESTAMP ON UPDATE CURRENT_TIMESTAMP,
      PRIMARY KEY (`id`),
      -- Prevents the same source article from being stored twice for one type.
      UNIQUE KEY `uk_type_origin_id` (`type`, `origin_id`),
      -- Supports selecting rows by pipeline state.
      KEY `idx_status` (`status`)
  ) ENGINE=InnoDB DEFAULT CHARSET=utf8mb4 COMMENT='爬虫-新闻数据';