|
|
@ -25,9 +25,7 @@ import kotlin.collections.HashMap |
|
|
|
@Keep |
|
|
|
@Keep |
|
|
|
@Suppress("unused", "RegExpRedundantEscape") |
|
|
|
@Suppress("unused", "RegExpRedundantEscape") |
|
|
|
class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
|
|
|
|
var book: BaseBook? = null |
|
|
|
var book = if (ruleData is BaseBook) ruleData else null |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
var chapter: BookChapter? = null |
|
|
|
var chapter: BookChapter? = null |
|
|
|
var nextChapterUrl: String? = null |
|
|
|
var nextChapterUrl: String? = null |
|
|
|
var content: Any? = null |
|
|
|
var content: Any? = null |
|
|
@ -44,12 +42,18 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
private var objectChangedJS = false |
|
|
|
private var objectChangedJS = false |
|
|
|
private var objectChangedJP = false |
|
|
|
private var objectChangedJP = false |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
init { |
|
|
|
|
|
|
|
if (ruleData is BaseBook) { |
|
|
|
|
|
|
|
book = ruleData |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
@JvmOverloads |
|
|
|
@JvmOverloads |
|
|
|
fun setContent(content: Any?, baseUrl: String? = null): AnalyzeRule { |
|
|
|
fun setContent(content: Any?, baseUrl: String? = null): AnalyzeRule { |
|
|
|
if (content == null) throw AssertionError("内容不可空(Content cannot be null)") |
|
|
|
if (content == null) throw AssertionError("Content cannot be null") |
|
|
|
this.content = content |
|
|
|
this.content = content |
|
|
|
isJSON = content.toString().isJson() |
|
|
|
|
|
|
|
setBaseUrl(baseUrl) |
|
|
|
setBaseUrl(baseUrl) |
|
|
|
|
|
|
|
isJSON = content.toString().isJson() |
|
|
|
objectChangedXP = true |
|
|
|
objectChangedXP = true |
|
|
|
objectChangedJS = true |
|
|
|
objectChangedJS = true |
|
|
|
objectChangedJP = true |
|
|
|
objectChangedJP = true |
|
|
@ -59,13 +63,15 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
fun setBaseUrl(baseUrl: String?): AnalyzeRule { |
|
|
|
fun setBaseUrl(baseUrl: String?): AnalyzeRule { |
|
|
|
baseUrl?.let { |
|
|
|
baseUrl?.let { |
|
|
|
this.baseUrl = baseUrl |
|
|
|
this.baseUrl = baseUrl |
|
|
|
|
|
|
|
val urlMatcher = AnalyzeUrl.paramPattern.matcher(baseUrl) |
|
|
|
|
|
|
|
if (urlMatcher.find()) this.baseUrl = baseUrl.substring(0, urlMatcher.start()) |
|
|
|
} |
|
|
|
} |
|
|
|
return this |
|
|
|
return this |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
fun setRedirectUrl(url: String): URL? { |
|
|
|
fun setRedirectUrl(url: String): URL? { |
|
|
|
kotlin.runCatching { |
|
|
|
kotlin.runCatching { |
|
|
|
val urlMatcher = AnalyzeUrl.paramPattern.matcher(url) |
|
|
|
val urlMatcher = AnalyzeUrl.paramPattern.matcher(baseUrl) |
|
|
|
redirectUrl = URL(if (urlMatcher.find()) url.substring(0, urlMatcher.start()) else url) |
|
|
|
redirectUrl = URL(if (urlMatcher.find()) url.substring(0, urlMatcher.start()) else url) |
|
|
|
} |
|
|
|
} |
|
|
|
return redirectUrl |
|
|
|
return redirectUrl |
|
|
@ -122,7 +128,7 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
@JvmOverloads |
|
|
|
@JvmOverloads |
|
|
|
fun getStringList(rule: String?, isUrl: Boolean = false): List<String>? { |
|
|
|
fun getStringList(rule: String?, isUrl: Boolean = false): List<String>? { |
|
|
|
if (rule.isNullOrEmpty()) return null |
|
|
|
if (rule.isNullOrEmpty()) return null |
|
|
|
val ruleList = splitSourceRule(rule, true) |
|
|
|
val ruleList = splitSourceRule(rule) |
|
|
|
return getStringList(ruleList, isUrl) |
|
|
|
return getStringList(ruleList, isUrl) |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
@ -282,7 +288,7 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
@Suppress("UNCHECKED_CAST") |
|
|
|
@Suppress("UNCHECKED_CAST") |
|
|
|
fun getElements(ruleStr: String): List<Any> { |
|
|
|
fun getElements(ruleStr: String): List<Any> { |
|
|
|
var result: Any? = null |
|
|
|
var result: Any? = null |
|
|
|
val ruleList = splitSourceRule(ruleStr, true) |
|
|
|
val ruleList = splitSourceRule(ruleStr) |
|
|
|
content?.let { o -> |
|
|
|
content?.let { o -> |
|
|
|
if (ruleList.isNotEmpty()) result = o |
|
|
|
if (ruleList.isNotEmpty()) result = o |
|
|
|
for (sourceRule in ruleList) { |
|
|
|
for (sourceRule in ruleList) { |
|
|
@ -357,44 +363,58 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
/** |
|
|
|
/** |
|
|
|
* 分解规则生成规则列表 |
|
|
|
* 分解规则生成规则列表 |
|
|
|
*/ |
|
|
|
*/ |
|
|
|
fun splitSourceRule(ruleStr: String?, isList: Boolean = false): List<SourceRule> { |
|
|
|
fun splitSourceRule(ruleStr: String?, mode: Mode = Mode.Default): List<SourceRule> { |
|
|
|
if (ruleStr.isNullOrEmpty()) return ArrayList<SourceRule>() |
|
|
|
var vRuleStr = ruleStr |
|
|
|
val ruleList = ArrayList<SourceRule>() |
|
|
|
val ruleList = ArrayList<SourceRule>() |
|
|
|
var mMode: Mode = Mode.Default |
|
|
|
if (vRuleStr.isNullOrEmpty()) return ruleList |
|
|
|
var start = 0 |
|
|
|
//检测Mode |
|
|
|
//仅首字符为:时为AllInOne,其实:与伪类选择器冲突,建议改成?更合理 |
|
|
|
var mMode: Mode = mode |
|
|
|
if (isList && ruleStr.startsWith(":")) { |
|
|
|
when { |
|
|
|
|
|
|
|
vRuleStr.startsWith("@@") -> { |
|
|
|
|
|
|
|
vRuleStr = vRuleStr.substring(2) |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
vRuleStr.startsWith("@XPath:", true) -> { |
|
|
|
|
|
|
|
mMode = Mode.XPath |
|
|
|
|
|
|
|
vRuleStr = vRuleStr.substring(7) |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
vRuleStr.startsWith("@Json:", true) -> { |
|
|
|
|
|
|
|
mMode = Mode.Json |
|
|
|
|
|
|
|
vRuleStr = vRuleStr.substring(6) |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
vRuleStr.startsWith(":") -> { |
|
|
|
mMode = Mode.Regex |
|
|
|
mMode = Mode.Regex |
|
|
|
isRegex = true |
|
|
|
isRegex = true |
|
|
|
start = 1 |
|
|
|
vRuleStr = vRuleStr.substring(1) |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
isRegex -> mMode = Mode.Regex |
|
|
|
|
|
|
|
isJSON -> mMode = Mode.Json |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
//拆分为规则列表 |
|
|
|
|
|
|
|
var start = 0 |
|
|
|
var tmp: String |
|
|
|
var tmp: String |
|
|
|
val jsMatcher = JS_PATTERN.matcher(ruleStr) |
|
|
|
val jsMatcher = JS_PATTERN.matcher(vRuleStr) |
|
|
|
while (jsMatcher.find()) { |
|
|
|
while (jsMatcher.find()) { |
|
|
|
if (jsMatcher.start() > start) { |
|
|
|
if (jsMatcher.start() > start) { |
|
|
|
tmp = ruleStr.substring(start, jsMatcher.start()).trim { it <= ' ' } |
|
|
|
tmp = vRuleStr.substring(start, jsMatcher.start()).trim { it <= ' ' } |
|
|
|
if (tmp.isNotEmpty()) { |
|
|
|
if (!TextUtils.isEmpty(tmp)) { |
|
|
|
ruleList.add(SourceRule(tmp, mMode)) |
|
|
|
ruleList.add(SourceRule(tmp, mMode)) |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
ruleList.add(SourceRule(jsMatcher.group(2) ?: jsMatcher.group(1), Mode.Js)) |
|
|
|
ruleList.add(SourceRule(jsMatcher.group(), Mode.Js)) |
|
|
|
start = jsMatcher.end() |
|
|
|
start = jsMatcher.end() |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
if (vRuleStr.length > start) { |
|
|
|
if (ruleStr.length > start) { |
|
|
|
tmp = vRuleStr.substring(start).trim { it <= ' ' } |
|
|
|
tmp = ruleStr.substring(start).trim { it <= ' ' } |
|
|
|
if (!TextUtils.isEmpty(tmp)) { |
|
|
|
if (tmp.isNotEmpty()) { |
|
|
|
|
|
|
|
ruleList.add(SourceRule(tmp, mMode)) |
|
|
|
ruleList.add(SourceRule(tmp, mMode)) |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
return ruleList |
|
|
|
return ruleList |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
/** |
|
|
|
/** |
|
|
|
* 规则类 |
|
|
|
* 规则类 |
|
|
|
*/ |
|
|
|
*/ |
|
|
|
|
|
|
|
|
|
|
|
inner class SourceRule internal constructor(ruleStr: String, mainMode: Mode = Mode.Default) { |
|
|
|
inner class SourceRule internal constructor(ruleStr: String, mainMode: Mode = Mode.Default) { |
|
|
|
internal var mode: Mode |
|
|
|
internal var mode: Mode |
|
|
|
internal var rule: String |
|
|
|
internal var rule: String |
|
|
@ -410,33 +430,39 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
|
|
|
|
|
|
|
|
init { |
|
|
|
init { |
|
|
|
this.mode = mainMode |
|
|
|
this.mode = mainMode |
|
|
|
rule = when { |
|
|
|
if (mode == Mode.Js) { |
|
|
|
|
|
|
|
rule = if (ruleStr.startsWith("<js>")) { |
|
|
|
|
|
|
|
ruleStr.substring(4, ruleStr.lastIndexOf("<")) |
|
|
|
|
|
|
|
} else { |
|
|
|
|
|
|
|
ruleStr.substring(4) |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
} else { |
|
|
|
|
|
|
|
when { |
|
|
|
ruleStr.startsWith("@CSS:", true) -> { |
|
|
|
ruleStr.startsWith("@CSS:", true) -> { |
|
|
|
mode = Mode.Default |
|
|
|
mode = Mode.Default |
|
|
|
ruleStr |
|
|
|
rule = ruleStr |
|
|
|
} |
|
|
|
} |
|
|
|
ruleStr.startsWith("@@") -> { |
|
|
|
ruleStr.startsWith("@@") -> { |
|
|
|
mode = Mode.Default |
|
|
|
mode = Mode.Default |
|
|
|
ruleStr.substring(2) |
|
|
|
rule = ruleStr.substring(2) |
|
|
|
} |
|
|
|
} |
|
|
|
ruleStr.startsWith("@XPath:", true) -> { |
|
|
|
ruleStr.startsWith("@XPath:", true) -> { |
|
|
|
mode = Mode.XPath |
|
|
|
mode = Mode.XPath |
|
|
|
ruleStr.substring(7) |
|
|
|
rule = ruleStr.substring(7) |
|
|
|
} |
|
|
|
} |
|
|
|
ruleStr.startsWith("/") -> {//XPath特征很明显,无需配置单独的识别标头 |
|
|
|
ruleStr.startsWith("//") -> {//XPath特征很明显,无需配置单独的识别标头 |
|
|
|
mode = Mode.XPath |
|
|
|
mode = Mode.XPath |
|
|
|
ruleStr |
|
|
|
rule = ruleStr |
|
|
|
} |
|
|
|
} |
|
|
|
ruleStr.startsWith("@Json:", true) -> { |
|
|
|
ruleStr.startsWith("@Json:", true) -> { |
|
|
|
mode = Mode.Json |
|
|
|
mode = Mode.Json |
|
|
|
ruleStr.substring(6) |
|
|
|
rule = ruleStr.substring(6) |
|
|
|
} |
|
|
|
} |
|
|
|
ruleStr.startsWith("$.") || isJSON -> { |
|
|
|
ruleStr.startsWith("$.") -> { |
|
|
|
mode = Mode.Json |
|
|
|
mode = Mode.Json |
|
|
|
ruleStr |
|
|
|
rule = ruleStr |
|
|
|
} |
|
|
|
} |
|
|
|
else -> { |
|
|
|
else -> rule = ruleStr |
|
|
|
ruleStr |
|
|
|
|
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
//分离put |
|
|
|
//分离put |
|
|
@ -445,14 +471,7 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
var start = 0 |
|
|
|
var start = 0 |
|
|
|
var tmp: String |
|
|
|
var tmp: String |
|
|
|
val evalMatcher = evalPattern.matcher(rule) |
|
|
|
val evalMatcher = evalPattern.matcher(rule) |
|
|
|
|
|
|
|
while (evalMatcher.find()) { |
|
|
|
if (evalMatcher.find()) { |
|
|
|
|
|
|
|
if (mode != Mode.Js && mode != Mode.Regex |
|
|
|
|
|
|
|
&& evalMatcher.start() == 0 |
|
|
|
|
|
|
|
) { |
|
|
|
|
|
|
|
mode = Mode.Regex |
|
|
|
|
|
|
|
} |
|
|
|
|
|
|
|
do { |
|
|
|
|
|
|
|
if (evalMatcher.start() > start) { |
|
|
|
if (evalMatcher.start() > start) { |
|
|
|
tmp = rule.substring(start, evalMatcher.start()) |
|
|
|
tmp = rule.substring(start, evalMatcher.start()) |
|
|
|
if (mode != Mode.Js && mode != Mode.Regex |
|
|
|
if (mode != Mode.Js && mode != Mode.Regex |
|
|
@ -461,6 +480,10 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
mode = Mode.Regex |
|
|
|
mode = Mode.Regex |
|
|
|
} |
|
|
|
} |
|
|
|
splitRegex(tmp) |
|
|
|
splitRegex(tmp) |
|
|
|
|
|
|
|
} else if (mode != Mode.Js && mode != Mode.Regex |
|
|
|
|
|
|
|
&& evalMatcher.start() == 0 |
|
|
|
|
|
|
|
) { |
|
|
|
|
|
|
|
mode = Mode.Regex |
|
|
|
} |
|
|
|
} |
|
|
|
tmp = evalMatcher.group() |
|
|
|
tmp = evalMatcher.group() |
|
|
|
when { |
|
|
|
when { |
|
|
@ -477,7 +500,6 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
start = evalMatcher.end() |
|
|
|
start = evalMatcher.end() |
|
|
|
} while (evalMatcher.find()) |
|
|
|
|
|
|
|
} |
|
|
|
} |
|
|
|
if (rule.length > start) { |
|
|
|
if (rule.length > start) { |
|
|
|
tmp = rule.substring(start) |
|
|
|
tmp = rule.substring(start) |
|
|
@ -493,12 +515,10 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
var tmp: String |
|
|
|
var tmp: String |
|
|
|
val ruleStrArray = ruleStr.split("##") |
|
|
|
val ruleStrArray = ruleStr.split("##") |
|
|
|
val regexMatcher = regexPattern.matcher(ruleStrArray[0]) |
|
|
|
val regexMatcher = regexPattern.matcher(ruleStrArray[0]) |
|
|
|
|
|
|
|
while (regexMatcher.find()) { |
|
|
|
if (regexMatcher.find()) { |
|
|
|
|
|
|
|
if (mode != Mode.Js && mode != Mode.Regex) { |
|
|
|
if (mode != Mode.Js && mode != Mode.Regex) { |
|
|
|
mode = Mode.Regex |
|
|
|
mode = Mode.Regex |
|
|
|
} |
|
|
|
} |
|
|
|
do { |
|
|
|
|
|
|
|
if (regexMatcher.start() > start) { |
|
|
|
if (regexMatcher.start() > start) { |
|
|
|
tmp = ruleStr.substring(start, regexMatcher.start()) |
|
|
|
tmp = ruleStr.substring(start, regexMatcher.start()) |
|
|
|
ruleType.add(defaultRuleType) |
|
|
|
ruleType.add(defaultRuleType) |
|
|
@ -508,7 +528,6 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
ruleType.add(tmp.substring(1).toInt()) |
|
|
|
ruleType.add(tmp.substring(1).toInt()) |
|
|
|
ruleParam.add(tmp) |
|
|
|
ruleParam.add(tmp) |
|
|
|
start = regexMatcher.end() |
|
|
|
start = regexMatcher.end() |
|
|
|
} while (regexMatcher.find()) |
|
|
|
|
|
|
|
} |
|
|
|
} |
|
|
|
if (ruleStr.length > start) { |
|
|
|
if (ruleStr.length > start) { |
|
|
|
tmp = ruleStr.substring(start) |
|
|
|
tmp = ruleStr.substring(start) |
|
|
@ -581,10 +600,15 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
private fun isRule(ruleStr: String): Boolean { |
|
|
|
private fun isRule(ruleStr: String): Boolean { |
|
|
|
return ruleStr.startsWith('@') //js首个字符不可能是@,除非是装饰器,所以@开头规定为规则 |
|
|
|
return when { |
|
|
|
|| ruleStr.startsWith("$.") |
|
|
|
ruleStr.startsWith("$.") -> true |
|
|
|
|| ruleStr.startsWith("$[") |
|
|
|
ruleStr.startsWith("@Json:", true) -> true |
|
|
|
|| ruleStr.startsWith("//") |
|
|
|
ruleStr.startsWith("//") -> true |
|
|
|
|
|
|
|
ruleStr.startsWith("@XPath:", true) -> true |
|
|
|
|
|
|
|
ruleStr.startsWith("@CSS:", true) -> true |
|
|
|
|
|
|
|
ruleStr.startsWith("@@") -> true |
|
|
|
|
|
|
|
else -> false |
|
|
|
|
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
@ -662,6 +686,7 @@ class AnalyzeRule(val ruleData: RuleDataInterface) : JsExtensions { |
|
|
|
|
|
|
|
|
|
|
|
companion object { |
|
|
|
companion object { |
|
|
|
private val putPattern = Pattern.compile("@put:(\\{[^}]+?\\})", Pattern.CASE_INSENSITIVE) |
|
|
|
private val putPattern = Pattern.compile("@put:(\\{[^}]+?\\})", Pattern.CASE_INSENSITIVE) |
|
|
|
|
|
|
|
private val getPattern = Pattern.compile("@get:\\{([^}]+?)\\}", Pattern.CASE_INSENSITIVE) |
|
|
|
private val evalPattern = |
|
|
|
private val evalPattern = |
|
|
|
Pattern.compile("@get:\\{[^}]+?\\}|\\{\\{[\\w\\W]*?\\}\\}", Pattern.CASE_INSENSITIVE) |
|
|
|
Pattern.compile("@get:\\{[^}]+?\\}|\\{\\{[\\w\\W]*?\\}\\}", Pattern.CASE_INSENSITIVE) |
|
|
|
private val regexPattern = Pattern.compile("\\$\\d{1,2}") |
|
|
|
private val regexPattern = Pattern.compile("\\$\\d{1,2}") |
|
|
|