杰奇小说CMS伪静态规则和关关采集器的编写代码参考

罗帆 草根站长 2017-11-15 1681 0

在此记录一些规则:之前的网站已经被我删除,留个备份,以便将来某天需要用到时可以参考。


杰奇cms的Windows服务器IIS的伪静态:

<?xml version="1.0" encoding="UTF-8"?>
<!--
	IIS URL Rewrite rules for the Jieqi novel CMS.
	The dot of every ".html" suffix is escaped (\.) so that it matches a
	literal dot only; an unescaped dot would match any character.
	All rules use appendQueryString="false", so the original query string
	is not appended to the rewritten URL.
-->
<rules>
	<!-- Book index page: {number}/{aid}/ ; only the second number is forwarded, as aid. -->
	<rule name="mulu_rewrite">
		<match url="^([0-9]+)/([0-9]+)/$" ignoreCase="false"/>
		<action type="Rewrite" url="/modules/article/reader.php?aid={R:2}" appendQueryString="false"/>
	</rule>
	<!-- Chapter page: {number}/{aid}/{cid}.html -->
	<rule name="zhangjie_rewrite">
		<match url="^([0-9]+)/([0-9]+)/([0-9]+)\.html$" ignoreCase="false"/>
		<action type="Rewrite" url="/modules/article/reader.php?aid={R:2}&amp;cid={R:3}" appendQueryString="false"/>
	</rule>
	<!-- Category landing page. -->
	<rule name="fenlei1_rewrite">
		<match url="^list/$" ignoreCase="false"/>
		<action type="Rewrite" url="/list.php" appendQueryString="false"/>
	</rule>
	<!-- Category listing: list/{class}.html -->
	<rule name="fenlei2_rewrite">
		<match url="^list/([0-9]+)\.html$" ignoreCase="false"/>
		<action type="Rewrite" url="/modules/article/articlelist.php?class={R:1}" appendQueryString="false"/>
	</rule>
	<!-- Paginated category listing: list/{class}/{page}.html -->
	<rule name="fenlei3_rewrite">
		<match url="^list/([0-9]+)/([0-9]+)\.html$" ignoreCase="false"/>
		<action type="Rewrite" url="/modules/article/articlelist.php?class={R:1}&amp;page={R:2}" appendQueryString="false"/>
	</rule>
	<!-- Ranking landing page. -->
	<rule name="paihang1_rewrite">
		<match url="^top/$" ignoreCase="false"/>
		<action type="Rewrite" url="/top.php" appendQueryString="false"/>
	</rule>
	<!-- Ranking list: top/{sort}/ (lower-case letters only, since ignoreCase is false). -->
	<rule name="paihang2_rewrite">
		<match url="^top/([a-z]+)/$" ignoreCase="false"/>
		<action type="Rewrite" url="/modules/article/toplist.php?sort={R:1}" appendQueryString="false"/>
	</rule>
	<!-- Paginated ranking list: top/{sort}/{page}.html -->
	<rule name="paihang3_rewrite">
		<match url="^top/([a-z]+)/([0-9]+)\.html$" ignoreCase="false"/>
		<action type="Rewrite" url="/modules/article/toplist.php?sort={R:1}&amp;page={R:2}" appendQueryString="false"/>
	</rule>
	<!-- "wanben" listing, rewritten with fullflag=1. -->
	<rule name="quan1_rewrite">
		<match url="^wanben/$" ignoreCase="false"/>
		<action type="Rewrite" url="/modules/article/book_full.php?fullflag=1" appendQueryString="false"/>
	</rule>
	<!-- Paginated "wanben" listing: wanben/{page} (no trailing slash or suffix). -->
	<rule name="quan2_rewrite">
		<match url="^wanben/([0-9]+)$" ignoreCase="false"/>
		<action type="Rewrite" url="/modules/article/book_full.php?fullflag=1&amp;page={R:1}" appendQueryString="false"/>
	</rule>
	<!-- Requests for .html files under templates/ are answered with /404.html. -->
	<rule name="muban1_rewrite">
		<match url="^templates/(.*)\.html$" ignoreCase="false"/>
		<action type="Rewrite" url="/404.html" appendQueryString="false"/>
	</rule>
	<!-- Requests for .html files under themes/book/ are answered with /404.html. -->
	<rule name="muban2_rewrite">
		<match url="^themes/book/(.*)\.html$" ignoreCase="false"/>
		<action type="Rewrite" url="/404.html" appendQueryString="false"/>
	</rule>
</rules>

这是对应的 Linux(Nginx)伪静态规则

# nginx rewrite rules for the Jieqi novel CMS.
# The dot of each ".html" suffix is escaped (\.) so it matches a literal dot
# only; an unescaped dot would match any character.

# Category and ranking landing pages.
rewrite ^/list/$ /list.php;
rewrite ^/top/$ /top.php;
# Category listing, without and with a page number.
rewrite ^/list/([0-9]+)\.html$ /modules/article/articlelist.php?class=$1;
rewrite ^/list/([0-9]+)/([0-9]+)\.html$ /modules/article/articlelist.php?class=$1&page=$2;
# Ranking list, without and with a page number.
rewrite ^/top/([a-z]+)/$ /modules/article/toplist.php?sort=$1;
rewrite ^/top/([a-z]+)/([0-9]+)\.html$ /modules/article/toplist.php?sort=$1&page=$2;
# "wanben" listing (fullflag=1), without and with a page number.
rewrite ^/wanben/$ /modules/article/book_full.php?fullflag=1;
rewrite ^/wanben/([0-9]+)$ /modules/article/book_full.php?fullflag=1&page=$1;
# Requests for .html files in the template directories are sent to /404.html.
rewrite ^/templates/(.*)\.html$ /404.html;
rewrite ^/themes/book/(.*)\.html$ /404.html;
# Book index and chapter pages. The first numeric path segment is matched but
# not captured, so $1 is the aid and $2 the cid.
rewrite ^/[0-9]+/([0-9]+)/$ /modules/article/reader.php?aid=$1;
rewrite ^/[0-9]+/([0-9]+)/([0-9]+)\.html$ /modules/article/reader.php?aid=$1&cid=$2;


上面这两套规则基本上可以满足所有需求。下面是以往记录的其他规则。


宝塔Linux系统规则:

location / {
	# $1 is whatever precedes the matched path (empty when the site is served
	# from the root). A "/" is required right after the prefix group:
	# without it the greedy (.*) keeps the slash, or the leading digits of the
	# first number, e.g. /12/345/ would be rewritten to /1/modules/... and
	# /list/1-2.html to //modules/...

	# Paginated category listing: <prefix>/list/<class>-<page>.html
	rewrite ^(.*)/list/([0-9]+)-([0-9]+)\.html$ $1/modules/article/articlelist.php?class=$2&page=$3;

	# Book index: <prefix>/<number>/<aid>/ ; only the second number is used.
	rewrite ^(.*)/([0-9]+)/([0-9]+)/$ $1/modules/article/reader.php?aid=$3;
}




常见的.htaccess规则

# Helicon ISAPI_Rewrite configuration file
# Version 3.1.0.104
#
# The dot of each ".html" suffix is escaped (\.) so it matches a literal dot
# only; an unescaped dot would match any character.

RewriteEngine On
# Paginated category listing: list/<class>-<page>.html
RewriteRule ^list/([0-9]+)-([0-9]+)\.html$ /modules/article/articlelist.php?class=$1&page=$2

# Book index addressed through an explicit index.html.
RewriteRule ^([0-9]+)/([0-9]+)/index\.html$ /modules/article/reader.php?aid=$2

# Paginated ranking list: book/<sort>-<page>.html
RewriteRule ^book/([a-z]+)-([0-9]+)\.html$ /modules/article/toplist.php?sort=$1&page=$2
# Everything after author/ is passed on as the author parameter.
RewriteRule ^author/(.*)$ /modules/article/authorarticle.php?author=$1

# Book index and chapter pages; the first number is matched but not forwarded.
RewriteRule ^([0-9]+)/([0-9]+)/$ /modules/article/reader.php?aid=$2
RewriteRule ^([0-9]+)/([0-9]+)/([0-9]+)\.html$ /modules/article/reader.php?aid=$2&cid=$3




常见的 IIS(web.config)伪静态规则

<!--
	IIS URL Rewrite rules for the Jieqi novel CMS.
	The dot of every ".html" suffix is escaped (\.) so that it matches a
	literal dot only; an unescaped dot would match any character.
-->
<rewrite>
	<rules>
		<!-- Paginated category listing: list/{class}-{page}.html -->
		<rule name="Imported Rule 1">
			<match url="^list/([0-9]+)-([0-9]+)\.html$" ignoreCase="false" />
			<action type="Rewrite" url="/modules/article/articlelist.php?class={R:1}&amp;page={R:2}" appendQueryString="false" />
		</rule>
		<!-- Book index: {number}/{aid}/ ; only the second number is forwarded. -->
		<rule name="Imported Rule 2">
			<match url="^([0-9]+)/([0-9]+)/$" ignoreCase="false" />
			<action type="Rewrite" url="/modules/article/reader.php?aid={R:2}" appendQueryString="false" />
		</rule>
		<!-- Book index addressed through an explicit index.html. -->
		<rule name="Imported Rule 3">
			<match url="^([0-9]+)/([0-9]+)/index\.html$" ignoreCase="false" />
			<action type="Rewrite" url="/modules/article/reader.php?aid={R:2}" appendQueryString="false" />
		</rule>
		<!-- Chapter page: {number}/{aid}/{cid}.html -->
		<rule name="Imported Rule 4">
			<match url="^([0-9]+)/([0-9]+)/([0-9]+)\.html$" ignoreCase="false" />
			<action type="Rewrite" url="/modules/article/reader.php?aid={R:2}&amp;cid={R:3}" appendQueryString="false" />
		</rule>
		<!-- Paginated ranking list: book/{sort}-{page}.html -->
		<rule name="Imported Rule 5">
			<match url="^book/([a-z]+)-([0-9]+)\.html$" ignoreCase="false" />
			<action type="Rewrite" url="/modules/article/toplist.php?sort={R:1}&amp;page={R:2}" appendQueryString="false" />
		</rule>
		<!-- Everything after author/ is passed on as the author parameter. -->
		<rule name="Imported Rule 6">
			<match url="^author/(.*)$" ignoreCase="false" />
			<action type="Rewrite" url="/modules/article/authorarticle.php?author={R:1}" appendQueryString="false" />
		</rule>
	</rules>
</rewrite>



httpd.ini

# ISAPI_Rewrite httpd.ini rules for the Jieqi novel CMS.
# In every rule $1 is the path prefix captured by the leading (.*) and is
# re-emitted in front of the target, so the remaining groups start at $2.
[ISAPI_Rewrite]
# 3600 = 1 hour
CacheClockRate 3600
RepeatLimit 32
# Protect httpd.ini and httpd.parse.errors files
# from accessing through HTTP
# NOTE(review): no rule below actually blocks those two files; the protective
# rule this comment refers to appears to be missing. Confirm and restore it.

# Paginated category listing: <prefix>/list/<class>-<page>.html
RewriteRule ^(.*)/list/([0-9]+)-([0-9]+)\.html$ $1/modules/article/articlelist\.php\?class=$2&page=$3
# Chapter page: <prefix>/<number>/<aid>/<cid>.html
RewriteRule ^(.*)/([0-9]+)/([0-9]+)/([0-9]+)\.html$ $1/modules/article/reader\.php\?aid=$3&cid=$4
# Book index, with and without an explicit index.html.
RewriteRule ^(.*)/([0-9]+)/([0-9]+)/index\.html$ $1/modules/article/reader\.php\?aid=$3
RewriteRule ^(.*)/([0-9]+)/([0-9]+)/$ $1/modules/article/reader\.php\?aid=$3
# Paginated ranking list: <prefix>/book/<sort>-<page>.html
RewriteRule ^(.*)/book/([a-z]+)-([0-9]+)\.html$ $1/modules/article/toplist\.php\?sort=$2&page=$3
# Everything after author/ is passed on as the author parameter.
RewriteRule ^(.*)/author/(.*)$ $1/modules/article/authorarticle\.php\?author=$2



nginx.conf

# nginx rewrite rules for the Jieqi novel CMS.
# The dot of each ".html" suffix is escaped (\.) so it matches a literal dot
# only; an unescaped dot would match any character.

# Paginated category listing: /list/<class>-<page>.html
rewrite ^/list/([0-9]+)-([0-9]+)\.html$ /modules/article/articlelist.php?class=$1&page=$2 last;
# Chapter page: /<number>/<aid>/<cid>.html
rewrite ^/([0-9]+)/([0-9]+)/([0-9]+)\.html$ /modules/article/reader.php?aid=$2&cid=$3 last;
# Book index, with and without an explicit index.html.
rewrite ^/([0-9]+)/([0-9]+)/index\.html$ /modules/article/reader.php?aid=$2 last;
rewrite ^/([0-9]+)/([0-9]+)/$ /modules/article/reader.php?aid=$2 last;
# Paginated ranking list: /book/<sort>-<page>.html
rewrite ^/book/([a-z]+)-([0-9]+)\.html$ /modules/article/toplist.php?sort=$1&page=$2 last;
# Everything after /author/ is passed on as the author parameter.
rewrite ^/author/(.*)$ /modules/article/authorarticle.php?author=$1 last;



备注下Windows系统的伪静态规则

# Apache-style rewrite rules for the Jieqi novel CMS.
# The dot of each ".html" suffix is escaped (\.) so it matches a literal dot
# only, and every target starts with "/" (the last four rules previously
# used a relative target, unlike the rest of this block).
RewriteEngine on
# Named category directories mapped to fixed class ids.
RewriteRule ^xuanhuan/$ /modules/article/articlelist.php?class=1
RewriteRule ^wuxia/$ /modules/article/articlelist.php?class=2
RewriteRule ^dushi/$ /modules/article/articlelist.php?class=3
RewriteRule ^lishi/$ /modules/article/articlelist.php?class=4
RewriteRule ^youxi/$ /modules/article/articlelist.php?class=5
RewriteRule ^kehuan/$ /modules/article/articlelist.php?class=6
RewriteRule ^qita/$ /modules/article/articlelist.php?class=7
# The same categories with a page number: <category>/<page>/
RewriteRule ^xuanhuan/([0-9]+)/$ /modules/article/articlelist.php?class=1&page=$1
RewriteRule ^wuxia/([0-9]+)/$ /modules/article/articlelist.php?class=2&page=$1
RewriteRule ^dushi/([0-9]+)/$ /modules/article/articlelist.php?class=3&page=$1
RewriteRule ^lishi/([0-9]+)/$ /modules/article/articlelist.php?class=4&page=$1
RewriteRule ^youxi/([0-9]+)/$ /modules/article/articlelist.php?class=5&page=$1
RewriteRule ^kehuan/([0-9]+)/$ /modules/article/articlelist.php?class=6&page=$1
RewriteRule ^qita/([0-9]+)/$ /modules/article/articlelist.php?class=7&page=$1
# Generic category and ranking listings: <class>_<page>/ and <sort>_<page>/
RewriteRule ^fenlei/([0-9]+)_([0-9]+)/$ /modules/article/articlelist.php?class=$1&page=$2
RewriteRule ^top/([a-z]+)_([0-9]+)/$ /modules/article/toplist.php?sort=$1&page=$2
# Fixed single-page entries.
RewriteRule ^gengxin\.html$ /modules/article/toplist.php?sort=lastupdate
RewriteRule ^paihang\.html$ /modules/article/52mb_paihang.php
RewriteRule ^all\.html$ /modules/article/52mb_quanbu.php
# Requests into the theme/template directories are answered with /404.html.
RewriteRule ^52mb/(.*)\.html$ /404.html
RewriteRule ^templates/(.*)\.html$ /404.html
RewriteRule ^themes/52mb/(.*)\.html$ /404.html
RewriteRule ^modules/article/templates/$ /404.html
RewriteRule ^modules/article/templates/(.*)\.html$ /404.html
# Book info page: book/<id>.html
RewriteRule ^book/([0-9]+)\.html$ /modules/article/articleinfo.php?id=$1
# Book index and chapter pages; the first number is matched but not forwarded.
RewriteRule ^([0-9]+)/([0-9]+)/$ /modules/article/reader.php?aid=$2
RewriteRule ^([0-9]+)/([0-9]+)/index\.html$ /modules/article/reader.php?aid=$2
RewriteRule ^([0-9]+)/([0-9]+)/([0-9]+)\.html$ /modules/article/reader.php?aid=$2&cid=$3



闲人笔趣阁主题伪静态

# nginx rewrite rules for the biquge theme of the Jieqi novel CMS.
# The dot of each ".html" suffix is escaped (\.) so it matches a literal dot
# only; an unescaped dot would match any character.

# Named category directories mapped to fixed class ids.
rewrite ^/xuanhuanxiaoshuo/$ /modules/article/articlelist.php?class=1 last;
rewrite ^/xiuzhenxiaoshuo/$ /modules/article/articlelist.php?class=2 last;
rewrite ^/dushixiaoshuo/$ /modules/article/articlelist.php?class=3 last;
rewrite ^/chuanyuexiaoshuo/$ /modules/article/articlelist.php?class=4 last;
rewrite ^/wangyouxiaoshuo/$ /modules/article/articlelist.php?class=5 last;
rewrite ^/kehuanxiaoshuo/$ /modules/article/articlelist.php?class=6 last;
rewrite ^/nvshengxiaoshuo/$ /modules/article/articlelist.php?class=7 last;
rewrite ^/qitaxiaoshuo/$ /modules/article/articlelist.php?class=8 last;
# The same categories with a page number. Each pattern has a single capture
# group, so the page number is $1; the previous $2 never held a value and
# left the page parameter empty.
rewrite ^/xuanhuanxiaoshuo/([0-9]+)/$ /modules/article/articlelist.php?class=1&page=$1 last;
rewrite ^/xiuzhenxiaoshuo/([0-9]+)/$ /modules/article/articlelist.php?class=2&page=$1 last;
rewrite ^/dushixiaoshuo/([0-9]+)/$ /modules/article/articlelist.php?class=3&page=$1 last;
rewrite ^/chuanyuexiaoshuo/([0-9]+)/$ /modules/article/articlelist.php?class=4&page=$1 last;
rewrite ^/wangyouxiaoshuo/([0-9]+)/$ /modules/article/articlelist.php?class=5&page=$1 last;
rewrite ^/kehuanxiaoshuo/([0-9]+)/$ /modules/article/articlelist.php?class=6&page=$1 last;
rewrite ^/nvshengxiaoshuo/([0-9]+)/$ /modules/article/articlelist.php?class=7&page=$1 last;
rewrite ^/qitaxiaoshuo/([0-9]+)/$ /modules/article/articlelist.php?class=8&page=$1 last;
# Paginated "wanben" listing (fullflag=1): /wanben/1_<page>; same single-group fix.
rewrite ^/wanben/1_([0-9]+)$ /modules/article/articlelist.php?fullflag=1&page=$1 last;
# Ranking pages; the directory root and allvote.html both select type1.
rewrite ^/paihangbang/$ /modules/article/paihang.php?type1=yes last;
rewrite ^/paihangbang/allvote\.html$ /modules/article/paihang.php?type1=yes last;
rewrite ^/paihangbang/goodnum\.html$ /modules/article/paihang.php?type2=yes last;
rewrite ^/paihangbang/newbook\.html$ /modules/article/paihang.php?type3=yes last;
rewrite ^/xiaoshuodaquan/$ /modules/article/xiaoshuodaquan.php last;
# Book index and chapter pages: /<number>_<aid>/ and /<number>_<aid>/<cid>.html
rewrite ^/([0-9]+)_([0-9]+)/$ /modules/article/reader.php?aid=$2 last;
rewrite ^/([0-9]+)_([0-9]+)/([0-9]+)\.html$ /modules/article/reader.php?aid=$2&cid=$3 last;
# Requests into the theme/template directories are sent to /1.html.
rewrite ^/52mb/(.*)\.html$ /1.html last;
rewrite ^/templates/(.*)\.html$ /1.html last;
rewrite ^/themes/52mb/(.*)\.html$ /1.html last;
rewrite ^/modules/article/templates/$ /1.html last;
rewrite ^/modules/article/templates/(.*)\.html$ /1.html last;


备注一些关关采集的编写参考,其中:


①最新列表获取小说编号

<a href="xxxxxxxxxxxxxx.com/\d*_(\d*)/" title=".+?">(.+?)</a>


②小说编号链接

xxxxxxxxx.com/{NovelKey/1000}_{NovelKey}/


③小说简介正则

<div id="intro">((.|\n)+?)</div>


④章节名和序号

<dd><a href="/\d*_\d*/\d*.html">(.+?)</a></dd>
<dd><a href="/\d*_\d*/(\d*.html)">.+?</a></dd>


⑤章节内容地址

{ChapterKey}


⑥章节内容获取和里面的替换(注意这两个放在一个选项里面)

<div id="content">((.|\n)+?)<br/>
http♂
.com♂
.net♂
.cc♂
.info♂
.biz♂
.xyz♂
bqg♂
biquge♂
5200♂
优读文学♂
www♂
精彩小说无弹窗免费阅读!♂
一秒记住♂
&lt;♂
&amp;♂
微信关注♂

另外涉及到一些编码兼容之类

推荐都市大神老施新书♂
看书的朋友,你可以搜搜♂
.com♂
.cc♂
.Com♂
</p>♂
.cOm♂
.coM♂
.COm♂
.COM♂
.cOM♂
微信公众号♂
最新全本:、、、、、、、、、♂
QВ⑤♂
qb5♂
qb5♂
QВ5♂
qb5♂
Qb5♂
Qb⑤♂
qΒ5♂
qΒ⑤♂
QΒ5♂
qΒ⑤♂
qВ⑤♂
qВ5♂
qb⑤♂
qВ5♂
QΒ5♂
qВ5♂
QΒ5♂
qb⑤♂
http♂
.com♂
.net♂
.cc♂
.info♂
.biz♂
.xyz♂
bqg♂
biquge♂
5200♂
优读文学♂
www♂
精彩小说无弹窗免费阅读!♂
一秒记住♂
&lt;♂
&amp;♂
微信关注♂
<p>♂
&#8704;♂∀
&#8706;♂∂
&#8707;♂∃
&#8709;♂∅
&#8711;♂∇
&#8712;♂∈
&#8713;♂∉
&#8715;♂∋
&#8719;♂∏
&#8721;♂∑
&#8722;♂−
&#8727;♂∗
&#8730;♂√
&#8733;♂∝
&#8734;♂∞
&#8736;♂∠
&#8743;♂∧
&#8744;♂∨
&#8745;♂∩
&#8746;♂∪
&#8747;♂∫
&#8756;♂∴
&#8764;♂∼
&#8773;♂≅
&#8776;♂≈
&#8800;♂≠
&#8801;♂≡
&#8804;♂≤
&#8805;♂≥
&#8834;♂⊂
&#8835;♂⊃
&#8836;♂⊄
&#8838;♂⊆
&#8839;♂⊇
&#8853;♂⊕
&#8855;♂⊗
&#8869;♂⊥
&#8901;♂⋅
&#402;♂ƒ
&#710;♂ˆ
&#732;♂˜
&#8211;♂–
&#8212;♂—
&#8216;♂‘
&#8217;♂’
&#8218;♂‚
&#8220;♂“
&#8221;♂”
&#8222;♂„
&#8224;♂†
&#8225;♂‡
&#8226;♂•
&#8230;♂…
&#8240;♂‰
&#8242;♂′
&#8243;♂″
&#8249;♂‹
&#8250;♂›
&#8254;♂‾
&#8364;♂€
&#8482;♂™
&#153;♂™
&#8592;♂←
&#8593;♂↑
&#8594;♂→
&#8595;♂↓
&#8596;♂↔
&#8629;♂↵
&#8968;♂⌈
&#8969;♂⌉
&#8970;♂⌊
&#8971;♂⌋
&#9674;♂◊


评论