关关采集规则(杰奇纯文字小说版)

合集下载
  1. 下载文档前请自行甄别文档内容的完整性,平台不提供额外的编辑、内容补充、找答案等附加服务。
  2. "仅部分预览"的文档,不可在线预览部分如存在完整性等问题,可反馈申请退款(可完整预览的文档不适用该条件!)。
  3. 如文档侵犯您的权益,请联系客服反馈,我们会尽快为您处理(人工客服工作时间:9:00-18:30)。

<?xml version="1.0" encoding="UTF-8"?>
<!--
  Rule set for a single target site.

  Every child of RuleConfigInfo has the same shape:
    RegexName      repeats the element name
    Pattern        a literal value, a URL template with {Placeholders}, or a
                   regular expression with one capture group
    Method         "Match" everywhere except PubVolumeSplit
    Options        regex option names (None, Singleline, IgnoreCase Singleline)
    FilterPattern  a second expression; empty in most rules

  Pattern and FilterPattern text is data: do not re-wrap or indent inside those
  elements, because any added whitespace becomes part of the expression.
-->
<RuleConfigInfo xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:xsd="http://www.w3.org/2001/XMLSchema">

  <!-- Rule-file identity and site-level settings. -->
  <RuleVersion>
    <RegexName>RuleVersion</RegexName>
    <Pattern />
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </RuleVersion>
  <RuleID>
    <RegexName>RuleID</RegexName>
    <Pattern>3232</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </RuleID>
  <GetSiteName>
    <RegexName>GetSiteName</RegexName>
    <Pattern>相爱小说网</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </GetSiteName>
  <GetSiteCharset>
    <RegexName>GetSiteCharset</RegexName>
    <Pattern>gbk</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </GetSiteCharset>
  <!--
    NOTE(review): the pattern below is empty in this copy. The other rules use
    site-relative paths, so the site root URL presumably belongs here; confirm
    and fill in before use.
  -->
  <GetSiteUrl>
    <RegexName>GetSiteUrl</RegexName>
    <Pattern></Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </GetSiteUrl>

  <!-- Search request and extraction of the novel key from the result rows. -->
  <NovelSearchUrl>
    <RegexName>NovelSearchUrl</RegexName>
    <Pattern>/modules/article/search.php</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelSearchUrl>
  <NovelSearchData>
    <RegexName>NovelSearchData</RegexName>
    <Pattern>searchkey={SearchKey}</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelSearchData>
  <NovelSearch_GetNovelKey>
    <RegexName>NovelSearch_GetNovelKey</RegexName>
    <Pattern>&lt;td class="odd"&gt;&lt;a href="/files/article/info/\d*/(\d*).html"&gt;.+?&lt;/a&gt;&lt;/td&gt;</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelSearch_GetNovelKey>

  <!-- Listing page; uses the same row pattern as the search result rule. -->
  <NovelListUrl>
    <RegexName>NovelListUrl</RegexName>
    <Pattern>/files/article/toplastupdate/0/1.html</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelListUrl>
  <NovelList_GetNovelKey>
    <RegexName>NovelList_GetNovelKey</RegexName>
    <Pattern>&lt;td class="odd"&gt;&lt;a href="/files/article/info/\d*/(\d*).html"&gt;.+?&lt;/a&gt;&lt;/td&gt;</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelList_GetNovelKey>

  <!-- Novel information page: URL template, error marker and field patterns. -->
  <NovelUrl>
    <RegexName>NovelUrl</RegexName>
    <Pattern>/modules/article/articleinfo.php?id={NovelKey}</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelUrl>
  <NovelErr>
    <RegexName>NovelErr</RegexName>
    <Pattern>您要找的页面已被移动</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelErr>
  <NovelName>
    <RegexName>NovelName</RegexName>
    <Pattern>h1 class="articlename" style="display:inline"&gt;&lt;a href="/files/article/html/\d*/\d*/index.html"&gt;(.+?)&lt;/a&gt;&lt;/h1&gt;</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelName>
  <NovelAuthor>
    <RegexName>NovelAuthor</RegexName>
    <!-- Kept on one line: a line break here would become part of the regex. -->
    <Pattern>searchkey=.+?"&gt;(.+?)&lt;/a&gt;&lt;/td&gt;\s*&lt;td width="22%"&gt;&lt;strong&gt;管</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelAuthor>
  <!-- LagerSort and SmallSort use the same pattern, so both capture the same text. -->
  <LagerSort>
    <RegexName>LagerSort</RegexName>
    <Pattern>本书类别:&lt;/strong&gt;(.+?)&lt;/td&gt;\s*&lt;td width="22%"&gt;&lt;strong&gt;本书作者</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </LagerSort>
  <SmallSort>
    <RegexName>SmallSort</RegexName>
    <Pattern>本书类别:&lt;/strong&gt;(.+?)&lt;/td&gt;\s*&lt;td width="22%"&gt;&lt;strong&gt;本书作者</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </SmallSort>
  <NovelIntro>
    <RegexName>NovelIntro</RegexName>
    <!--
      The end marker is the literal text /*460*60 that opens the script block.
      Both asterisks are escaped so they are matched literally instead of
      acting as quantifiers. Singleline lets the capture span line breaks.
    -->
    <Pattern>内容详细简介介绍:(.+?)&lt;script type="text/javascript"&gt;/\*460\*60</Pattern>
    <Method>Match</Method>
    <Options>Singleline</Options>
    <FilterPattern>电脑站:|手机站:|[\w\sA-Za-z0-9:/]{0,60}(?:\.|.)[\w\sA-Za-z0-9:/][^\s&amp;;&lt;&gt;\u4e00-\u9fa5]{0,60}</FilterPattern>
  </NovelIntro>
  <!-- Same pattern as NovelName. -->
  <NovelKeyword>
    <RegexName>NovelKeyword</RegexName>
    <Pattern>h1 class="articlename" style="display:inline"&gt;&lt;a href="/files/article/html/\d*/\d*/index.html"&gt;(.+?)&lt;/a&gt;&lt;/h1&gt;</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelKeyword>
  <NovelDegree>
    <RegexName>NovelDegree</RegexName>
    <Pattern>文章状态:&lt;/strong&gt;(.+?)&lt;/td&gt;\s*&lt;td&gt;&lt;strong&gt;授权级别</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelDegree>
  <NovelCover>
    <RegexName>NovelCover</RegexName>
    <Pattern>img class="picborder" src="(.+?)" width="120px" height="150px"</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelCover>
  <NovelDefaultCoverUrl>
    <RegexName>NovelDefaultCoverUrl</RegexName>
    <Pattern />
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelDefaultCoverUrl>
  <NovelInfo_GetNovelPubKey>
    <RegexName>NovelInfo_GetNovelPubKey</RegexName>
    <Pattern>&lt;a href="(.+?)"&gt;&lt;img src="/themes/Images/dian.gif" border="0" /&gt;&lt;/a&gt;</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </NovelInfo_GetNovelPubKey>

  <!-- Chapter index page: URL template, error marker, volume and chapter patterns. -->
  <PubCookies>
    <RegexName>PubCookies</RegexName>
    <Pattern />
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubCookies>
  <PubIndexUrl>
    <RegexName>PubIndexUrl</RegexName>
    <Pattern>{NovelPubKey}</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubIndexUrl>
  <!--
    NOTE(review): the pattern text means "this must be filled in" and looks like
    an unreplaced placeholder; PubContentErr carries the same text. Confirm.
  -->
  <PubIndexErr>
    <RegexName>PubIndexErr</RegexName>
    <Pattern>这里必须填写</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubIndexErr>
  <PubVolumeContent>
    <RegexName>PubVolumeContent</RegexName>
    <Pattern />
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubVolumeContent>
  <PubVolumeSplit>
    <RegexName>PubVolumeSplit</RegexName>
    <Pattern>&lt;td colspan="4" class="vcss"&gt;</Pattern>
    <!--
      NOTE(review): "Spilt" is kept exactly as found. It may be the spelling the
      consuming tool expects, or a typo for "Split"; confirm before changing.
    -->
    <Method>Spilt</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubVolumeSplit>
  <PubVolumeName>
    <RegexName>PubVolumeName</RegexName>
    <Pattern>&lt;font color="#174973"&gt;&lt;strong class="title"&gt;(.+?)&lt;/strong&gt;&lt;/font&gt;</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubVolumeName>
  <!-- The two chapter rules match the same anchor; one captures the link text, the other the href. -->
  <PubChapterName>
    <RegexName>PubChapterName</RegexName>
    <Pattern>&lt;a href="\d*.html"&gt;(.+?)&lt;/a&gt;</Pattern>
    <Method>Match</Method>
    <Options>Singleline</Options>
    <FilterPattern />
  </PubChapterName>
  <PubChapter_GetChapterKey>
    <RegexName>PubChapter_GetChapterKey</RegexName>
    <Pattern>&lt;a href="(\d*.html)"&gt;.+?&lt;/a&gt;</Pattern>
    <Method>Match</Method>
    <Options>Singleline</Options>
    <FilterPattern />
  </PubChapter_GetChapterKey>

  <!-- Chapter content page: URL template, error marker, text and image patterns. -->
  <PubContentUrl>
    <RegexName>PubContentUrl</RegexName>
    <Pattern>{ChapterKey}</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubContentUrl>
  <!-- NOTE(review): same placeholder-looking text as PubIndexErr; confirm. -->
  <PubContentErr>
    <RegexName>PubContentErr</RegexName>
    <Pattern>这里必须填写</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubContentErr>
  <PubContent_GetTextKey>
    <RegexName>PubContent_GetTextKey</RegexName>
    <Pattern />
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubContent_GetTextKey>
  <PubTextUrl>
    <RegexName>PubTextUrl</RegexName>
    <Pattern />
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubTextUrl>
  <PubContentText>
    <RegexName>PubContentText</RegexName>
    <!-- Captures everything between the two literal marker phrases. -->
    <Pattern>享有更多权利&lt;/font&gt;&lt;/a&gt;(.+?)&lt;font color=#ff00ff&gt;喜欢本篇文章</Pattern>
    <Method>Match</Method>
    <Options>IgnoreCase Singleline</Options>
    <FilterPattern>复制</FilterPattern>
  </PubContentText>
  <PubContentReplace>
    <RegexName>PubContentReplace</RegexName>
    <Pattern />
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubContentReplace>
  <PubContentImages>
    <RegexName>PubContentImages</RegexName>
    <Pattern>&lt;div class="divimage"&gt;&lt;img src="(.+?)" border="0" class="imagecontent"&gt;&lt;/div&gt;</Pattern>
    <Method>Match</Method>
    <Options>None</Options>
    <FilterPattern />
  </PubContentImages>
</RuleConfigInfo>

相关文档
最新文档