PKGG
http://www.zrrr.net#searchcon ul
采集机器人 (2)2023/04/01
数据采集
{
"bookSourceComment": "xpath;coolapk@芜恙;intro;nextUrl",
"bookSourceGroup": "",
"bookSourceName": "PKGG",
"bookSourceType": 0,
"bookSourceUrl": "http:\/\/www.zrrr.net#searchcon ul",
"bookUrlPattern": "http:\/\/www.zrrr.net\/book\/.+",
"customOrder": 0,
"enabled": true,
"enabledExplore": false,
"lastUpdateTime": 1600749854852,
"ruleBookInfo": {
"author": "\/\/*[@class=\"author\"]\/span[2]\/text()",
"coverUrl": "\/\/*[@class=\"fengmian\"]\/img\/@src",
"intro": "\/\/*[@class=\"intro\"]\/p",
"kind": "\/\/*[@class=\"author\"]\/span[1]\/text()&&\/\/p[@class=\"author\"]\/span[3]\/text()##.*:|中.*|已",
"lastChapter": "\/\/*[@class=\"lastchapter\"]\/a\/text()&&\/\/*[@class=\"author\"]\/span[4]\/text()##(.+)\\n.*\\d+-(\\d+-\\d+).*##$1▪$2",
"name": "\/\/h1\/text()"
},
"ruleContent": {
"content": "\/\/*[@id=\"TextContent\"]@js:result+'本章未完'",
"nextContentUrl": "@js:if(result.match(\/\\(1\\\/(\\d+)\\)分页\/)){\n page = result.match(\/\\(1\\\/(\\d+)\\)分页\/)[1];\n list = [];\n for (i = 2; i <= page; i++) {\n list.push(baseUrl.replace(\/\\.html\/g, '_' + i + '.html'))\n }\n list\n}",
"replaceRegex": "##\\s*本章未完\\s*|.*本章完.*"
},
"ruleExplore": {},
"ruleSearch": {
"author": "\/\/li[9]\/text()",
"bookList": "\/\/*[@class=\"searchcon\"]\/ul",
"bookUrl": "\/\/li[7]\/a\/@href",
"coverUrl": "\/\/li[7]\/a\/@href##.*\/((\\d+)\\d{3})\/##\/image\/$2\/$1\/$1s.jpg",
"kind": "\/\/li[12]\/text()",
"lastChapter": "\/\/li[8]\/a\/text()&&\/\/li[11]\/text()@js:var t = result.replace(\/.*\\n\/,'');\nvar n = result.replace(\/\\n.*\/,'');\nn+ '▪' +t;",
"name": "\/\/li[7]\/a\/text()",
"wordCount": "\/\/li[10]\/text()"
},
"ruleToc": {
"chapterList": "\/\/*[@class=\"chapters\"]\/li\/a",
"chapterName": "text",
"chapterUrl": "href"
},
"searchUrl": "\/modules\/article\/search.php,{\n \"charset\": \"gbk\",\n \"method\": \"POST\",\n \"body\": \"searchkey={{key}}\"\n}",
"weight": 0
}