-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathutil.js
More file actions
233 lines (203 loc) · 6.51 KB
/
util.js
File metadata and controls
233 lines (203 loc) · 6.51 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
var cheerio = require("cheerio");
var mongoose = require("mongoose");
var fs = require("fs");
exports.saveApiCatalog = saveApiCatalog;
exports.getPage = getPage;
exports.sleep = sleep;
//做了一些修改
/**
 * Pause for a given amount of time.
 *
 * @param {number} time - Delay in milliseconds, passed straight to setTimeout.
 * @returns {Promise<undefined>} Settles with no value once the timer fires; it never rejects.
 */
async function sleep(time) {
  await new Promise((done) => {
    setTimeout(done, time);
  });
}
//保存所有大模块
exports.saveApi = async function (result) {
var $ = result.$;
var href = result.href;
var host = result.host;
var protocol = result.protocol;
var list = $("#column2 ul li");
list.each(function (index, item) {
var name = $(this).find("a").text();
var url = $(this).find("a").attr("href");
var ApiDocSchema = mongoose.model("apidoc");
ApiDocSchema.findOne({name: name}, (err, doc) => {
if (!doc) {
var id = mongoose.Types.ObjectId();
var api = new ApiDocSchema({name, url, href, id});
api.save((err, product) => {
if (err) Promise.reject(err);
})
}
})
})
}
/**
 * Load a URL in a fresh browser page and return its body parsed by cheerio.
 *
 * The page is always closed before this function settles, whether it
 * succeeds or fails, so repeated calls do not accumulate open tabs.
 *
 * @param {object} browser - Browser instance exposing `newPage()`
 *   (presumably a puppeteer Browser; confirm against the caller).
 * @param {string} url - Address to navigate to.
 * @returns {Promise<{$: Function, href: string}>} `$` is the cheerio root built
 *   from the body's innerHTML; `href` is `window.location.href` as seen by
 *   the page after navigation.
 */
async function getPage(browser, url) {
  const page = await browser.newPage();
  try {
    await page.goto(url);
    // Fixed one-second pause before reading the DOM; presumably gives
    // client-side scripts time to finish rendering (TODO confirm).
    await sleep(1000);
    // Runs inside the page: only serialisable data crosses back to Node.
    const result = await page.evaluate(() => ({
      html: document.body.innerHTML,
      href: window.location.href,
    }));
    return { $: cheerio.load(result.html), href: result.href };
  } finally {
    await page.close();
  }
}
/**
 * Build and store the catalog for every stored "apidoc" document.
 *
 * For each document the detail page address is formed by concatenating its
 * `href` and `url` fields, then handed to saveApiDetail together with the
 * document's name and `_id`.
 *
 * @param {object} browser - Browser instance forwarded to saveApiDetail.
 * @returns {Promise<void>} Resolves after every detail page has been processed.
 *   Rejects if the query fails or any saveApiDetail call rejects.
 */
async function saveApiCatalog(browser) {
  const ApiDocSchema = mongoose.model("apidoc");
  const docs = await ApiDocSchema.find({}).exec();

  // All detail pages are started together; awaiting them lets callers know
  // when the work is finished and lets failures reach them.
  await Promise.all(
    docs.map((doc) => {
      const url = `${doc.href}${doc.url}`;
      return saveApiDetail(browser, url, doc.name, doc._id);
    })
  );
}
/**
 * Scrape one API detail page and store its table of contents as a catalog tree.
 *
 * The first `#toc > ul` list on the page is walked by getChild, which fills a
 * new "catalog" document; that document is then saved.
 *
 * @param {object} browser - Browser instance forwarded to getPage.
 * @param {string} url - Address of the detail page.
 * @param {string} name - Module name; accepted for the caller's convenience but not used here.
 * @param {*} apidocid - Identifier of the owning "apidoc" document, forwarded to getChild.
 * @returns {Promise<void>} Resolves after the catalog document has been saved.
 *   Rejects if loading the page, building the tree or saving fails.
 */
async function saveApiDetail(browser, url, name, apidocid) {
  const { $ } = await getPage(browser, url);
  const toc = $("#toc > ul").first();

  const CatalogSchema = mongoose.model("catalog");
  const root = new CatalogSchema();
  getChild(toc, 1, $, root, null, apidocid);

  // Await the write so the success message is printed only when the save
  // actually succeeded; a failure now rejects instead of being ignored.
  await root.save();
  console.log("保存成功!");
}
/**
 * Recursively convert a table-of-contents `<ul>` into the catalog tree.
 *
 * The first `<li>` of the outermost list fills `root` itself. Every other
 * `<li>` becomes a plain node object, and version, parameter and detail
 * information is collected for each entry. Entries directly below the root
 * entry are pushed onto `root.children`; deeper entries are pushed onto their
 * parent node's `children`.
 *
 * NOTE(review): `root.level` is stored as the incremented level (2 for the
 * outermost list), while all other nodes store `level - 1`, so the root and
 * its direct children both carry level 2. Kept as-is; confirm whether intended.
 *
 * @param {object} child - Cheerio selection to inspect; anything that is not a `<ul>` ends the recursion.
 * @param {number} currentLevel - Depth of the enclosing list; the initial call passes 1.
 * @param {Function} $ - Cheerio root function for the page.
 * @param {object} root - Catalog document being populated; must expose a `children` array.
 * @param {?object} parent - Node that owns the entries of `child`; `null` for the outermost list.
 * @param {*} apidocid - Identifier of the owning "apidoc" document, stored on `root` as `docapiid`.
 * @returns {void}
 */
function getChild(child, currentLevel, $, root, parent, apidocid) {
  if (!child.is("ul")) {
    return;
  }
  const level = currentLevel + 1;

  child.children("li").each((index, element) => {
    const item = $(element);
    const span = item.find("span").first();
    const href = span.children("a").first().attr("href");
    if (!href) {
      // Without an anchor link there is no section to look up; skip the
      // entry instead of throwing on `undefined.replace`.
      return;
    }
    const anchorClass = "#" + href.replace("#", "");
    // The heading element the anchor belongs to (two levels above the anchor target).
    const anchor = $(anchorClass).parent().parent();

    let node;
    if (level - 1 === 1 && index === 0) {
      // The very first entry of the outermost list is the root node.
      root.name = span.text();
      root.level = level;
      root.leaf = true;
      root.anchorClass = anchorClass;
      root.docapiid = apidocid;
      getVersionInformation(root, anchorClass, $);
      getParameterInformation(root, anchor, $);
      getApiDetailInformation(root, anchor, $);
      node = root;
    } else {
      node = {
        name: span.text(),
        level: level - 1,
        leaf: true,
        anchorClass: anchorClass,
        children: [],
        versions: [],
        parameters: [],
      };
      getVersionInformation(node, anchorClass, $);
      getParameterInformation(node, anchor, $);
      getApiDetailInformation(node, anchor, $);
      // Entries directly under the root entry always go to the root. An
      // additional outermost entry has no parent, so it is attached to the
      // root as well rather than dereferencing null.
      const owner = level - 1 === 2 || !parent ? root : parent;
      owner.children.push(node);
    }

    // The nested list, if any, is the second child of the <li>.
    getChild(item.children().first().next(), level, $, root, node, apidocid);
  });
}
/**
 * Append version information for one section to `data.versions`.
 *
 * The metadata block is expected two siblings after the section heading
 * (the grandparent of the anchor target). Nothing is added when that element
 * lacks the `api_metadata` class. With a changelog table, every row except
 * the first contributes `{key: <first cell>, value: <second cell>}`. Without
 * one, a single entry keyed "当前版本" holds the text of the block's first child.
 *
 * @param {{versions: Array}} data - Node receiving the entries.
 * @param {string} anchorClass - Selector of the section's anchor target.
 * @param {Function} $ - Cheerio root function for the page.
 * @returns {void}
 */
function getVersionInformation(data, anchorClass, $) {
  const metaData = $(anchorClass).parent().parent().next().next();
  if (!metaData.hasClass("api_metadata")) {
    return;
  }

  const changelogBody = metaData.find(".changelog table tbody");
  if (changelogBody.length === 0) {
    const value = metaData.children().first().text();
    data.versions.push({ key: "当前版本", value });
    return;
  }

  changelogBody.children("tbody tr").each((rowIndex, row) => {
    // Row 0 is skipped (presumably the table's header row).
    if (rowIndex < 1) {
      return;
    }
    const cells = $(row).children();
    const key = cells.first().text();
    const value = cells.first().next().text();
    data.versions.push({ key, value });
  });
}
/**
 * Append the parameter descriptions of one section to `data.parameters`.
 *
 * The parameter list is expected three siblings after `element`; nothing is
 * added unless that sibling is a `<ul>`. Each `<li>` contributes its text,
 * trimmed and with every line break removed, so an entry is always one line.
 *
 * @param {{parameters: string[]}} data - Node receiving the entries.
 * @param {object} element - Cheerio selection of the section heading.
 * @param {Function} $ - Cheerio root function for the page.
 * @returns {void}
 */
function getParameterInformation(data, element, $) {
  const parameterList = element.next().next().next();
  if (!parameterList.is("ul")) {
    return;
  }
  parameterList.children("li").each((index, item) => {
    // A string pattern would replace only the first line break; the global
    // regex flattens multi-line entries (for example nested lists) completely.
    data.parameters.push($(item).text().trim().replace(/\r?\n/g, ""));
  });
}
/**
 * Store the descriptive text of one section on `data.content`.
 *
 * Starting three siblings after `element`, every following sibling up to
 * (not including) the next h1-h5 heading contributes its text followed by a
 * line break. `data.content` is the empty string when there are none.
 *
 * @param {object} data - Node receiving the `content` string.
 * @param {object} element - Cheerio selection of the section heading.
 * @param {Function} $ - Cheerio root function for the page.
 * @returns {void}
 */
function getApiDetailInformation(data, element, $) {
  const pieces = [];
  element
    .next()
    .next()
    .next()
    .nextUntil("h1,h2,h3,h4,h5")
    .each((position, node) => {
      pieces.push($(node).text() + "\n");
    });
  data.content = pieces.join("");
}