query.json 2.1 KB
Newer Older
Z
Zhou Rui 已提交
1 2
{
  "crawlWorkCompleted": {
Z
zhourui 已提交
3 4 5
    "enable": true,
    "cron": "50 50 21 * * ?",
    "count": 500.0,
Z
Zhou Rui 已提交
6 7 8 9 10
    "excludeAttachment": [],
    "excludeSite": [],
    "maxAttachmentSize": 5242880.0,
    "###enable": "是否启用###",
    "###cron": "定时cron表达式.###",
Z
zhourui 已提交
11
    "###count": "每次处理的数量,默认每小时处理所以默认为500,同时每次将重爬最旧的25%,按时间轮询25%.###",
Z
Zhou Rui 已提交
12 13 14 15 16
    "###excludeAttachment": "忽略附件名称.###",
    "###excludeSite": "忽略附件位置.###",
    "###maxAttachmentSize": "最大附件大小.###"
  },
  "crawlWork": {
Z
zhourui 已提交
17 18 19
    "enable": true,
    "cron": "40 40 10,12,14,16 * * ?",
    "count": 50.0,
Z
Zhou Rui 已提交
20 21 22 23 24
    "excludeAttachment": [],
    "excludeSite": [],
    "maxAttachmentSize": 5242880.0,
    "###enable": "是否启用###",
    "###cron": "定时cron表达式.###",
Z
zhourui 已提交
25
    "###count": "每次处理的数量,默认每小时处理所以默认为50,同时每次将重爬最旧的50%,按时间轮询50%.###",
Z
Zhou Rui 已提交
26 27 28 29 30
    "###excludeAttachment": "忽略附件名称.###",
    "###excludeSite": "忽略附件位置.###",
    "###maxAttachmentSize": "最大附件大小.###"
  },
  "crawlCms": {
Z
zhourui 已提交
31 32 33
    "enable": true,
    "cron": "30 30 9,12,15,18 * * ?",
    "count": 30.0,
Z
Zhou Rui 已提交
34 35 36 37
    "excludeAttachment": [],
    "maxAttachmentSize": 5242880.0,
    "###enable": "是否启用###",
    "###cron": "定时cron表达式.###",
Z
zhourui 已提交
38
    "###count": "每次处理的数量,默认每小时处理所以默认为30,同时每次将重爬最旧的50%,按时间轮询50%.###",
Z
Zhou Rui 已提交
39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55
    "###excludeAttachment": "忽略附件名称.###",
    "###maxAttachmentSize": "最大附件大小.###"
  },
  "extractOffice": true,
  "extractPdf": true,
  "extractText": true,
  "extractImage": false,
  "tessLanguage": "chi_sim",
  "###crawlWorkCompleted": "已完成工作收集器设置.###",
  "###crawlWork": "工作收集器设置.###",
  "###crawlCms": "内容管理收集器设置.###",
  "###extractOffice": "抽取office中的文本.###",
  "###extractPdf": "抽取pdf中的文本.###",
  "###extractText": "抽取文本中的文本.###",
  "###extractImage": "抽取图像中的文本.###",
  "###tessLanguage": "tess使用语言.###"
}