-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathconstants.js
66 lines (54 loc) · 1.45 KB
/
constants.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
const CRAWL_SITE = "gitee";
module.exports = {
/**
* 爬取的数据源站点 github | gitee
*/
CRAWL_SITE,
/**
* 需解析的语言类型
*/
SUPPORT_LANGUAGE: ["java", "js", "cpp", "py"],
/**
* 是否启用强制更新
* 如开启,会跳过读取本地缓存,拉取最新文件
*/
IS_FORCE_UPDATE_MODE: true,
/**
* 请求处理频率 ms
*/
REQUEST_RATE: 300,
/**
* markdown输出目录
*/
RAW_MARKDOWN_OUTPUT_DIR: "spider/raw-markdown",
/**
* 转化后的json输出目录
*/
DB_JSON_OUTPUT_DIR: "spider/yield-db-json",
/**
* 获取问题列表地址
*/
PROBLEMS_URL: CRAWL_SITE === "gitee"
? "https://gitee.com/golong/leetcode/tree/master/problems"
: "https://github.com/azl397985856/leetcode/tree/master/problems",
/**
* 抓取页面问题内容的dom元素选择器
*/
QUESTION_DOM_SELECTOR: CRAWL_SITE === "gitee"
? ".tree-item-file-name.tree-list-item a"
: ".position-relative.js-navigation-item .js-navigation-open",
/**
* markdwon下载地址
*/
BASE_MARKDWON_DOWNLOAD_URL: CRAWL_SITE === "gitee"
? "https://gitee.com/golong/leetcode/raw/master/problems/"
: "https://raw.githubusercontent.com/azl397985856/leetcode/master/problems/",
/**
* 过滤英文文档末尾标识
*/
CRAWL_IGNORE_SUFFIX: [".en.md", "-en.md"],
/**
* 爬虫抓取同一文件时的最大失败次数(多为网络原因导致, 切换到gitee源)
*/
MAX_CRAWL_RETRY_NUMBER: 100,
};