|
这是翻页线索规则：
<?xml version="1.0" encoding="UTF-8"?>
<!--
  Clue-extraction rule for the theme named in <theme>.
  The single <scope> selects "next" links from the HTML page and names the
  same theme as its target, so the rule points back at itself; this looks
  like a pagination ("next page") rule.
  NOTE(review): the meaning of individual elements is inferred from their
  names and values only; confirm against the crawler's rule schema.
-->
<spider-clue-extraction>
<theme>阿里访客详情分析1</theme>
<scope>
<!-- Where the clue is read from, and the kind of node selected
     (presumably "a" means anchor elements; TODO confirm). -->
<from>HTML</from>
<path-type>a</path-type>
<!-- XPath: under the positional container below, any descendant <a> that
     has a descendant text node exactly equal to "next".
     NOTE(review): the absolute position()=N steps break as soon as the page
     layout shifts; consider anchoring on an id or class if the page has one.
     The text of <path> is kept verbatim, line breaks included, because
     whitespace inside a text element is data. -->
<path>
/html/body/div[position()=1]/div[position()=3]/div[position()=1]/div[position()=9]/div[position()=6]/div/div[position()=1]//a[.//text()="next"]
</path>
<!-- NOTE(review): "inthread" presumably marks a clue that stays within the
     current theme; confirm. -->
<clue-type>inthread</clue-type>
<!-- Target theme: same name as <theme> above.
     NOTE(review): prefix-position presumably says which parts of the current
     URL prefix a relative link; confirm. -->
<target-theme>
<name>阿里访客详情分析1</name>
<prefix-position>hostname+pathname</prefix-position>
</target-theme>
<!-- NOTE(review): presumably tells the crawler to simulate a click on the
     matched link instead of reading its href; confirm. -->
<simClick>true</simClick>
</scope>
</spider-clue-extraction> |
|